From d62125c7aacb7a4eb444761dcb0e51d547c44e1c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 5 May 2023 10:04:38 -0700
Subject: [PATCH 001/161] fix: codegen for hashmaps with string keys (#3384)

this commit fixes a regression introduced in 3abe588, where the
codegen in parse_Subscript would handle string keys as non-bytestrings
(thus treating the value of the string as word loaded by the string
 pointer - its length value). it also cleans up the logic a little bit,
avoiding a redundant unwrap_location (since get_element_ptr calls
unwrap_location itself), and removing a dead argument from
keccak256_helper.
---
 tests/parser/features/test_string_map_keys.py | 25 +++++++++++++++++++
 vyper/builtins/functions.py                   |  2 +-
 vyper/codegen/events.py                       |  2 +-
 vyper/codegen/expr.py                         | 11 ++++----
 vyper/codegen/keccak256_helper.py             |  6 ++---
 5 files changed, 35 insertions(+), 11 deletions(-)
 create mode 100644 tests/parser/features/test_string_map_keys.py

diff --git a/tests/parser/features/test_string_map_keys.py b/tests/parser/features/test_string_map_keys.py
new file mode 100644
index 0000000000..c52bd72821
--- /dev/null
+++ b/tests/parser/features/test_string_map_keys.py
@@ -0,0 +1,25 @@
+def test_string_map_keys(get_contract):
+    code = """
+f:HashMap[String[1], bool]
+@external
+def test() -> bool:
+    a:String[1] = "a"
+    b:String[1] = "b"
+    self.f[a] = True
+    return self.f[b]  # should return False
+    """
+    c = get_contract(code)
+    c.test()
+    assert c.test() is False
+
+
+def test_string_map_keys_literals(get_contract):
+    code = """
+f:HashMap[String[1], bool]
+@external
+def test() -> bool:
+    self.f["a"] = True
+    return self.f["b"]  # should return False
+    """
+    c = get_contract(code)
+    assert c.test() is False
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 93dce54756..7733b3331f 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -611,7 +611,7 @@ def infer_arg_types(self, node):
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
         assert len(args) == 1
-        return keccak256_helper(expr, args[0], context)
+        return keccak256_helper(args[0], context)
 
 
 def _make_sha256_call(inp_start, inp_len, out_start, out_len):
diff --git a/vyper/codegen/events.py b/vyper/codegen/events.py
index 9508a869ea..30a1b1e591 100644
--- a/vyper/codegen/events.py
+++ b/vyper/codegen/events.py
@@ -15,7 +15,7 @@ def _encode_log_topics(expr, event_id, arg_nodes, context):
             value = unwrap_location(arg)
 
         elif isinstance(arg.typ, _BytestringT):
-            value = keccak256_helper(expr, arg, context=context)
+            value = keccak256_helper(arg, context=context)
         else:
             # TODO block at higher level
             raise TypeMismatch("Event indexes may only be value types", expr)
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index dfba469084..5f45f66f71 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -338,11 +338,10 @@ def parse_Subscript(self):
 
         if isinstance(sub.typ, HashMapT):
             # TODO sanity check we are in a self.my_map[i] situation
-            index = Expr.parse_value_expr(self.expr.slice.value, self.context)
-            if isinstance(index.typ, BytesT):
+            index = Expr(self.expr.slice.value, self.context).ir_node
+            if isinstance(index.typ, _BytestringT):
                 # we have to hash the key to get a storage location
-                assert len(index.args) == 1
-                index = keccak256_helper(self.expr.slice.value, index.args[0], self.context)
+                index = keccak256_helper(index, self.context)
 
         elif is_array_like(sub.typ):
             index = Expr.parse_value_expr(self.expr.slice.value, self.context)
@@ -528,8 +527,8 @@ def parse_Compare(self):
             left = Expr(self.expr.left, self.context).ir_node
             right = Expr(self.expr.right, self.context).ir_node
 
-            left_keccak = keccak256_helper(self.expr, left, self.context)
-            right_keccak = keccak256_helper(self.expr, right, self.context)
+            left_keccak = keccak256_helper(left, self.context)
+            right_keccak = keccak256_helper(right, self.context)
 
             if op not in ("eq", "ne"):
                 return  # raises
diff --git a/vyper/codegen/keccak256_helper.py b/vyper/codegen/keccak256_helper.py
index b22453761b..9c5f5eb1d0 100644
--- a/vyper/codegen/keccak256_helper.py
+++ b/vyper/codegen/keccak256_helper.py
@@ -8,7 +8,7 @@
 from vyper.utils import SHA3_BASE, SHA3_PER_WORD, MemoryPositions, bytes_to_int, keccak256
 
 
-def _check_byteslike(typ, _expr):
+def _check_byteslike(typ):
     if not isinstance(typ, _BytestringT) and typ != BYTES32_T:
         # NOTE this may be checked at a higher level, but just be safe
         raise CompilerPanic("keccak256 only accepts bytes-like objects")
@@ -18,8 +18,8 @@ def _gas_bound(num_words):
     return SHA3_BASE + num_words * SHA3_PER_WORD
 
 
-def keccak256_helper(expr, to_hash, context):
-    _check_byteslike(to_hash.typ, expr)
+def keccak256_helper(to_hash, context):
+    _check_byteslike(to_hash.typ)
 
     # Can hash literals
     # TODO this is dead code.

From 9cc56b618a54e6144829d6c056feb43e00c9c5fe Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sat, 6 May 2023 05:08:28 +0800
Subject: [PATCH 002/161] chore: improve error message for subscripted type
 validation (#3313)

type annotations like `Bytestring` with no length annotation would fail
with an unhelpful error message
---
 tests/parser/syntax/test_byte_string.py   | 26 -----------------------
 tests/parser/syntax/test_bytes.py         | 16 +++++++++++++-
 tests/parser/syntax/test_dynamic_array.py |  8 +++++++
 tests/parser/syntax/test_invalids.py      |  7 ++++++
 tests/parser/syntax/test_string.py        | 23 ++++++++++++++++++++
 vyper/semantics/types/utils.py            |  9 +++++++-
 6 files changed, 61 insertions(+), 28 deletions(-)
 delete mode 100644 tests/parser/syntax/test_byte_string.py

diff --git a/tests/parser/syntax/test_byte_string.py b/tests/parser/syntax/test_byte_string.py
deleted file mode 100644
index 90bbe197b0..0000000000
--- a/tests/parser/syntax/test_byte_string.py
+++ /dev/null
@@ -1,26 +0,0 @@
-import pytest
-
-from vyper import compiler
-
-valid_list = [
-    """
-@external
-def foo() -> String[10]:
-    return "badminton"
-    """,
-    """
-@external
-def foo():
-    x: String[11] = "¡très bien!"
-    """,
-    """
-@external
-def test() -> String[100]:
-    return "hello world!"
-    """,
-]
-
-
-@pytest.mark.parametrize("good_code", valid_list)
-def test_byte_string_success(good_code):
-    assert compiler.compile_code(good_code) is not None
diff --git a/tests/parser/syntax/test_bytes.py b/tests/parser/syntax/test_bytes.py
index d732ec3ea5..a7fb7e77ce 100644
--- a/tests/parser/syntax/test_bytes.py
+++ b/tests/parser/syntax/test_bytes.py
@@ -1,7 +1,13 @@
 import pytest
 
 from vyper import compiler
-from vyper.exceptions import InvalidOperation, InvalidType, SyntaxException, TypeMismatch
+from vyper.exceptions import (
+    InvalidOperation,
+    InvalidType,
+    StructureException,
+    SyntaxException,
+    TypeMismatch,
+)
 
 fail_list = [
     (
@@ -77,6 +83,14 @@ def test() -> Bytes[1]:
     """,
         SyntaxException,
     ),
+    (
+        """
+@external
+def foo():
+    a: Bytes = b"abc"
+    """,
+        StructureException,
+    ),
 ]
 
 
diff --git a/tests/parser/syntax/test_dynamic_array.py b/tests/parser/syntax/test_dynamic_array.py
index e7dc2d1183..0c23bf67da 100644
--- a/tests/parser/syntax/test_dynamic_array.py
+++ b/tests/parser/syntax/test_dynamic_array.py
@@ -16,6 +16,14 @@
     """,
         StructureException,
     ),
+    (
+        """
+@external
+def foo():
+    a: DynArray = [1, 2, 3]
+    """,
+        StructureException,
+    ),
 ]
 
 
diff --git a/tests/parser/syntax/test_invalids.py b/tests/parser/syntax/test_invalids.py
index 3c51075e60..33478fcff1 100644
--- a/tests/parser/syntax/test_invalids.py
+++ b/tests/parser/syntax/test_invalids.py
@@ -363,6 +363,13 @@ def a():
     UnknownAttribute,
 )
 
+must_fail(
+    """
+a: HashMap
+""",
+    StructureException,
+)
+
 
 @pytest.mark.parametrize("bad_code,exception_type", fail_list)
 def test_compilation_fails_with_exception(bad_code, exception_type):
diff --git a/tests/parser/syntax/test_string.py b/tests/parser/syntax/test_string.py
index 5b5b9e5bb5..6252011bd9 100644
--- a/tests/parser/syntax/test_string.py
+++ b/tests/parser/syntax/test_string.py
@@ -1,6 +1,7 @@
 import pytest
 
 from vyper import compiler
+from vyper.exceptions import StructureException
 
 valid_list = [
     """
@@ -27,9 +28,31 @@ def foo() -> bool:
     y: String[12] = "test"
     return x != y
     """,
+    """
+@external
+def test() -> String[100]:
+    return "hello world!"
+    """,
 ]
 
 
 @pytest.mark.parametrize("good_code", valid_list)
 def test_string_success(good_code):
     assert compiler.compile_code(good_code) is not None
+
+
+invalid_list = [
+    (
+        """
+@external
+def foo():
+    a: String = "abc"
+    """,
+        StructureException,
+    )
+]
+
+
+@pytest.mark.parametrize("bad_code,exc", invalid_list)
+def test_string_fail(assert_compile_failed, get_contract_with_gas_estimation, bad_code, exc):
+    assert_compile_failed(lambda: get_contract_with_gas_estimation(bad_code), exc)
diff --git a/vyper/semantics/types/utils.py b/vyper/semantics/types/utils.py
index 6ae677e451..1549684460 100644
--- a/vyper/semantics/types/utils.py
+++ b/vyper/semantics/types/utils.py
@@ -104,7 +104,14 @@ def _failwith(type_name):
     if node.id not in namespace:
         _failwith(node.node_source_code)
 
-    return namespace[node.id]
+    typ_ = namespace[node.id]
+    if hasattr(typ_, "from_annotation"):
+        # cases where the object in the namespace is an uninstantiated
+        # type object, ex. Bytestring or DynArray (with no length provided).
+        # call from_annotation to produce a better error message.
+        typ_.from_annotation(node)
+
+    return typ_
 
 
 def get_index_value(node: vy_ast.Index) -> int:

From c13f26d40831a467fb040739cd0755b9ee73b2e8 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sun, 7 May 2023 14:43:54 +0800
Subject: [PATCH 003/161] chore: update comments and docs (#3355)

* update interface comments

* update semantics README

* remove incorrect comment
---
 vyper/semantics/README.md          | 105 ++++++++---------------------
 vyper/semantics/analysis/module.py |   2 +-
 vyper/semantics/analysis/utils.py  |   2 -
 vyper/semantics/types/user.py      |   4 +-
 4 files changed, 32 insertions(+), 81 deletions(-)

diff --git a/vyper/semantics/README.md b/vyper/semantics/README.md
index 64be46c0e8..969f849838 100644
--- a/vyper/semantics/README.md
+++ b/vyper/semantics/README.md
@@ -10,47 +10,42 @@ Vyper abstract syntax tree (AST).
 `vyper.semantics` has the following structure:
 
 * [`types/`](types): Subpackage of classes and methods used to represent types
-  * [`types/indexable/`](types/indexable)
-    * [`mapping.py`](types/indexable/mapping.py): Mapping type
-    * [`sequence.py`](types/indexable/sequence.py): Array and Tuple types
-  * [`types/user/`](types/user)
-    * [`interface.py`](types/user/interface.py): Contract interface types and getter functions
-    * [`struct.py`](types/user/struct.py): Struct types and getter functions
-  * [`types/value/`](types/value)
-    * [`address.py`](types/value/address.py): Address type
-    * [`array_value.py`](types/value/array_value.py): Single-value subscript types (bytes, string)
-    * [`boolean.py`](types/value/boolean.py): Boolean type
-    * [`bytes_fixed.py`](types/value/bytes_fixed.py): Fixed length byte types
-    * [`numeric.py`](types/value/numeric.py): Integer and decimal types
-  * [`abstract.py`](types/abstract.py): Abstract data type classes
   * [`bases.py`](types/bases.py): Common base classes for all type objects
-  * [`event.py`](types/user/event.py): `Event` type class
-  * [`function.py`](types/function.py): `ContractFunction` type class
+  * [`bytestrings.py`](types/bytestrings.py): Single-value subscript types (bytes, string)
+  * [`function.py`](types/function.py): Contract function and member function types
+  * [`primitives.py`](types/primitives.py): Address, boolean, fixed length byte, integer and decimal types
+  * [`shortcuts.py`](types/shortcuts.py): Helper constants for commonly used types
+  * [`subscriptable.py`](types/subscriptable.py): Mapping, array and tuple types
+  * [`user.py`](types/user.py): Enum, event, interface and struct types
   * [`utils.py`](types/utils.py): Functions for generating and fetching type objects
-* [`validation/`](validation): Subpackage for type checking and syntax verification logic
-  * [`base.py`](validation/base.py): Base validation class
-  * [`local.py`](validation/local.py): Validates the local namespace of each function within a contract
-  * [`module.py`](validation/module.py): Validates the module namespace of a contract.
-  * [`utils.py`](validation/utils.py): Functions for comparing and validating types
+* [`analysis/`](analysis): Subpackage for type checking and syntax verification logic
+  * [`annotation.py`](analysis/annotation.py): Annotates statements and expressions with the appropriate type information
+  * [`base.py`](analysis/base.py): Base validation class
+  * [`common.py`](analysis/common.py): Base AST visitor class
+  * [`data_positions`](analysis/data_positions.py): Functions for tracking storage variables and allocating storage slots
+  * [`levenhtein_utils.py`](analysis/levenshtein_utils.py): Helper for better error messages
+  * [`local.py`](analysis/local.py): Validates the local namespace of each function within a contract
+  * [`module.py`](analysis/module.py): Validates the module namespace of a contract.
+  * [`utils.py`](analysis/utils.py): Functions for comparing and validating types
 * [`environment.py`](environment.py): Environment variables and builtin constants
 * [`namespace.py`](namespace.py): `Namespace` object, a `dict` subclass representing the namespace of a contract
 
 ## Control Flow
 
-The [`validation`](validation) subpackage contains the top-level `validate_semantics`
+The [`analysis`](analysis) subpackage contains the top-level `validate_semantics`
 function. This function is used to verify and type-check a contract. The process
 consists of three steps:
 
 1. Preparing the builtin namespace
 2. Validating the module-level scope
-3. Validating local scopes
+3. Annotating and validating local scopes
 
 ### 1. Preparing the builtin namespace
 
 The [`Namespace`](namespace.py) object represents the namespace for a contract.
 Builtins are added upon initialization of the object. This includes:
 
-* Adding primitive type classes from the [`types/`](types) subpackage
+* Adding type classes from the [`types/`](types) subpackage
 * Adding environment variables and builtin constants from [`environment.py`](environment.py)
 * Adding builtin functions from the [`functions`](../builtins/functions.py) package
 * Adding / resetting `self` and `log`
@@ -65,11 +60,11 @@ of a contract. This includes:
 and functions
 * Validating import statements and function signatures
 
-### 3. Validating the Local Scopes
+### 3. Annotating and validating the Local Scopes
 
 [`validation/local.py`](validation/local.py) validates the local scope within each
 function in a contract. `FunctionNodeVisitor` is used to iterate over the statement
-nodes in each function body and apply appropriate checks.
+nodes in each function body, annotate them and apply appropriate checks.
 
 To learn more about the checks on each node type, read the docstrings on the methods
 of `FunctionNodeVisitor`.
@@ -106,45 +101,6 @@ The array is given a type of `int128[2]`.
 
 All type classes are found within the [`semantics/types/`](types) subpackage.
 
-Type classes rely on inheritance to define their structure and functionlity.
-Vyper uses three broad categories to represent types within the compiler.
-
-#### Primitive Types
-
-A **primitive type** (or just primitive) defines the base attributes of a given type.
-There is only one primitive type object created for each Vyper type. All primitive
-classes are subclasses of `BasePrimitive`.
-
-Along with the builtin primitive types, user-defined ones may be created. These
-primitives are defined in the modules within [`semantics/types/user`](types/user).
-See the docstrings there for more information.
-
-#### Type Definitions
-
-A **type definition** (or just definition) is a type that has been assigned to a
-specific variable, literal, or other value. Definition objects are typically derived
-from primitives. They include additional information such as the constancy,
-visibility and scope of the associated value.
-
-A primitive type always has a corresponding type definition. However, not all
-type definitions have a primitive type, e.g. arrays and tuples.
-
-Comparing a definition to it's related primitive type will always evaluate `True`.
-Comparing two definitions of the same class can sometimes evaluate false depending
-on certain attributes. All definition classes are subclasses of `BaseTypeDefinition`.
-
-Additionally, literal values sometimes have multiple _potential type definitions_.
-In this case, a membership check determines if the literal is valid by comparing
-the list of potential types against a specific type.
-
-#### Abstract Types
-
-An **abstract type** is an inherited class shared by two or more definition
-classes. Abstract types do not implement any functionality and may not be directly
-assigned to any values. They are used for broad type checking, in cases where
-e.g. a function expects any numeric value, or any bytes value. All abstract type
-classes are subclasses of `AbstractDataType`.
-
 ### Namespace
 
 [`namespace.py`](namespace.py) contains the `Namespace` object. `Namespace` is a
@@ -190,12 +146,12 @@ namespace['foo']  # this raises an UndeclaredDefinition
 
 Validation is handled by calling methods within each type object. In general:
 
-* Primitive type objects include one or both of `from_annotation` and `from_literal`
-methods, which validate an AST node and a produce definition object
-* Definition objects include a variety of `get_<thing>` and `validate_<action>` methods,
+* Type objects include one or both of `from_annotation` and `from_literal`
+methods, which validate an AST node and produce a type object
+* Type objects include a variety of `get_<thing>` and `validate_<action>` methods,
 which are used to validate interactions and obtain new types based on AST nodes
 
-All possible methods for primitives and definitions are outlined within the base
+All possible methods for type objects are outlined within the base
 classes in [`types/bases.py`](types/bases.py). The functionality within the methods
 of the base classes is typically to raise and give a meaningful explanation
 for _why_ the syntax not valid.
@@ -208,9 +164,7 @@ Here are some examples:
 foo: int128
 ```
 
-1. We look up `int128` in `namespace`. We retrieve an `Int128Primitive` object.
-2. We call `Int128Primitive.from_annotation` with the AST node of the statement. This
-method validates the statement and returns an `Int128Definition` object.
+1. We look up `int128` in `namespace`. We retrieve an `IntegerT` object.
 3. We store the new definition under the key `foo` within `namespace`.
 
 #### 2. Modifying the value of a variable
@@ -219,15 +173,14 @@ method validates the statement and returns an `Int128Definition` object.
 foo += 6
 ```
 
-1. We look up `foo` in `namespace` and retrieve the `Int128Definition`.
+1. We look up `foo` in `namespace` and retrieve an `IntegerT` with `_is_signed=True` and `_bits=128`.
 2. We call `get_potential_types_from_node` with the target node
 and are returned a list of types that are valid for the literal `6`. In this
-case, the list includes `Int128Definition`. The type check for the statement
-passes.
+case, the list includes an `IntegerT` with `_is_signed=True` and `_bits=128`. The type check for the statement passes.
 3. We call the `validate_modification` method on the definition object
 for `foo` to confirm that it is a value that may be modified (not a constant).
 4. Because the statement involves a mathematical operator, we also call the
-`validate_numeric_operation` method on `foo` to confirm that the operation is
+`validate_numeric_op` method on `foo` to confirm that the operation is
 allowed.
 
 #### 3. Calling a builtin function
@@ -240,7 +193,7 @@ bar: bytes32 = sha256(b"hash me!")
 function.
 2. We call `fetch_call_return` on the function definition object, with the AST
 node representing the call. This method validates the input arguments, and returns
-a `Bytes32Definition`.
+a `BytesM_T` with `m=32`.
 3. We validation of the delcaration of `bar` in the same manner as the first
 example, and compare the generated type to that returned by `sha256`.
 
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index db9b9d7c91..209b63e989 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -87,7 +87,7 @@ def __init__(
             if count == len(module_nodes):
                 err_list.raise_if_not_empty()
 
-        # generate an `InterfacePrimitive` from the top-level node - used for building the ABI
+        # generate an `InterfaceT` from the top-level node - used for building the ABI
         interface = InterfaceT.from_ast(module_node)
         module_node._metadata["type"] = interface
         self.interface = interface  # this is useful downstream
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index 136012f9ea..7aaf9647c4 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -219,8 +219,6 @@ def types_from_BinOp(self, node):
             and isinstance(node.right, vy_ast.Num)
             and not node.right.value
         ):
-            # CMC 2022-07-20 this seems like unreachable code -
-            # should be handled in evaluate()
             raise ZeroDivisionException(f"{node.op.description} by zero", node)
 
         return _validate_op(node, types_list, "validate_numeric_op")
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index 536d482e75..89af9b99c0 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -396,7 +396,7 @@ def from_json_abi(cls, name: str, abi: dict) -> "InterfaceT":
     @classmethod
     def from_ast(cls, node: Union[vy_ast.InterfaceDef, vy_ast.Module]) -> "InterfaceT":
         """
-        Generate an `InterfacePrimitive` object from a Vyper ast node.
+        Generate an `InterfaceT` object from a Vyper ast node.
 
         Arguments
         ---------
@@ -404,7 +404,7 @@ def from_ast(cls, node: Union[vy_ast.InterfaceDef, vy_ast.Module]) -> "Interface
             Vyper ast node defining the interface
         Returns
         -------
-        InterfacePrimitive
+        InterfaceT
             primitive interface type
         """
         if isinstance(node, vy_ast.Module):

From cf00f418768cec3ede9eee69d702d5f6161b2fd9 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 7 May 2023 09:57:57 -0700
Subject: [PATCH 004/161] docs: clarify `skip_contract_check=True` can result
 in undefined behavior (#3386)

---
 docs/interfaces.rst | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/docs/interfaces.rst b/docs/interfaces.rst
index 00db584443..b4182cced7 100644
--- a/docs/interfaces.rst
+++ b/docs/interfaces.rst
@@ -75,6 +75,10 @@ The ``default_return_value`` parameter can be used to handle ERC20 tokens affect
     ERC20(USDT).transfer(msg.sender, 1, default_return_value=True) # returns True
     ERC20(USDT).transfer(msg.sender, 1) # reverts because nothing returned
 
+.. warning::
+
+   When ``skip_contract_check=True`` is used and the called function returns data (ex.: ``x: uint256 = SomeContract.foo(skip_contract_check=True)``, no guarantees are provided by the compiler as to the validity of the returned value. In other words, it is undefined behavior what happens if the called contract did not exist. In particular, the returned value might point to garbage memory. It is therefore recommended to only use ``skip_contract_check=True`` to call contracts which have been manually ensured to exist at the time of the call.
+
 Importing Interfaces
 ====================
 

From 895fbf240af5dd42742f803847aee0f20fce7437 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 7 May 2023 11:59:10 -0700
Subject: [PATCH 005/161] chore: update published build to python 3.11 (#3385)

and also update the rest of the CI to use 3.11. two reasons for doing
this, even though 3.11 is a relatively new release:
- python 3.11 is about 10% faster based on local benchmarks
- universal2 images for darwin (on github actions) are only available
  for python builds starting with 3.11. cf.
  https://github.com/actions/setup-python/issues/439#issuecomment-1247646682
---
 .github/workflows/build.yml   | 12 ++++++------
 .github/workflows/publish.yml |  2 +-
 .github/workflows/test.yml    | 32 ++++++++++++++++----------------
 Dockerfile                    |  2 +-
 4 files changed, 24 insertions(+), 24 deletions(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 872d8366e1..a3e9a195f6 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -31,9 +31,9 @@ jobs:
             fetch-depth: 0
 
       - name: Python
-        uses: actions/setup-python@v2
+        uses: actions/setup-python@v4
         with:
-          python-version: "3.10"
+          python-version: "3.11"
 
       - name: Generate Binary
         run: >-
@@ -42,7 +42,7 @@ jobs:
           make freeze
 
       - name: Upload Artifact
-        uses: actions/upload-artifact@v2
+        uses: actions/upload-artifact@v3
         with:
           path: dist/vyper.*
 
@@ -58,9 +58,9 @@ jobs:
             fetch-depth: 0
 
       - name: Python
-        uses: actions/setup-python@v2
+        uses: actions/setup-python@v4
         with:
-          python-version: "3.10"
+          python-version: "3.11"
 
       - name: Generate Binary
         run: >-
@@ -69,6 +69,6 @@ jobs:
           ./make.cmd freeze
 
       - name: Upload Artifact
-        uses: actions/upload-artifact@v2
+        uses: actions/upload-artifact@v3
         with:
           path: dist/vyper.*
diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index ecc2fa5e1f..5a8d989038 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -16,7 +16,7 @@ jobs:
     - uses: actions/checkout@v2
 
     - name: Python
-      uses: actions/setup-python@v2
+      uses: actions/setup-python@v4
       with:
         python-version: '3.x'
 
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index f8fcb54f7d..4a09914d59 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -17,10 +17,10 @@ jobs:
     steps:
     - uses: actions/checkout@v1
 
-    - name: Set up Python 3.10
-      uses: actions/setup-python@v1
+    - name: Set up Python 3.11
+      uses: actions/setup-python@v4
       with:
-        python-version: "3.10"
+        python-version: "3.11"
 
     - name: Install Dependencies
       run: pip install .[lint]
@@ -42,10 +42,10 @@ jobs:
     steps:
       - uses: actions/checkout@v1
 
-      - name: Set up Python 3.10
-        uses: actions/setup-python@v1
+      - name: Set up Python 3.11
+        uses: actions/setup-python@v4
         with:
-          python-version: "3.10"
+          python-version: "3.11"
 
       - name: Install Tox
         run: pip install tox
@@ -59,10 +59,10 @@ jobs:
     steps:
     - uses: actions/checkout@v1
 
-    - name: Set up Python 3.10
-      uses: actions/setup-python@v1
+    - name: Set up Python 3.11
+      uses: actions/setup-python@v4
       with:
-        python-version: "3.10"
+        python-version: "3.11"
 
     - name: Install Tox
       run: pip install tox
@@ -75,7 +75,7 @@ jobs:
     runs-on: ubuntu-latest
     strategy:
       matrix:
-        python-version: [["3.10", "310", ["3.11", "311"]]]
+        python-version: [["3.10", "310"], ["3.11", "311"]]
         # run in default (optimized) and --no-optimize mode
         flag: ["core", "no-opt"]
 
@@ -126,10 +126,10 @@ jobs:
     steps:
     - uses: actions/checkout@v1
 
-    - name: Set up Python 3.10
-      uses: actions/setup-python@v1
+    - name: Set up Python 3.11
+      uses: actions/setup-python@v4
       with:
-        python-version: "3.10"
+        python-version: "3.11"
 
     - name: Install Tox
       run: pip install tox
@@ -167,10 +167,10 @@ jobs:
     steps:
     - uses: actions/checkout@v1
 
-    - name: Set up Python 3.10
-      uses: actions/setup-python@v1
+    - name: Set up Python 3.11
+      uses: actions/setup-python@v4
       with:
-        python-version: "3.10"
+        python-version: "3.11"
 
     - name: Install Tox
       run: pip install tox
diff --git a/Dockerfile b/Dockerfile
index c2245ee981..bc5bb607d6 100644
--- a/Dockerfile
+++ b/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.10-slim
+FROM python:3.11-slim
 
 # Specify label-schema specific arguments and labels.
 ARG BUILD_DATE

From 3c83947223e19a526e27bbeed69141021b82e060 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Mon, 8 May 2023 04:36:40 +0800
Subject: [PATCH 006/161] fix: guard against instantiation of events and
 hashmaps (#3341)

fix: guard against instantiation of events and hashmaps

this commit fixes a regression introduced in 046ea166d93. as a result of
removing the location kwarg from `type_from_annotation()`, events could
be instantiated in the type system (althought attempts to use them would
fail during codegen). this commit reintroduces the location kwarg, and
also streamlines some logic so that HashMaps and events can all be
handled in the same code paths.

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 .../types/test_type_from_annotation.py        | 23 ++++--
 .../test_instantiation_exception.py           | 81 +++++++++++++++++++
 tests/parser/functions/test_empty.py          |  4 +-
 tests/parser/syntax/test_structs.py           | 13 ++-
 vyper/builtins/functions.py                   |  2 +-
 vyper/codegen/abi_encoder.py                  |  2 +-
 vyper/codegen/context.py                      |  2 +-
 vyper/codegen/core.py                         |  2 +-
 vyper/codegen/expr.py                         |  2 +-
 vyper/codegen/external_call.py                |  2 +-
 .../function_definitions/external_function.py |  2 +-
 vyper/codegen/ir_node.py                      |  2 +-
 vyper/codegen/return_.py                      |  2 +-
 vyper/codegen/self_call.py                    |  2 +-
 vyper/codegen/stmt.py                         |  2 +-
 vyper/{ => evm}/address_space.py              |  0
 vyper/exceptions.py                           |  4 +
 vyper/semantics/README.md                     |  1 +
 vyper/semantics/analysis/base.py              | 10 +--
 vyper/semantics/analysis/local.py             |  5 +-
 vyper/semantics/analysis/module.py            |  5 +-
 vyper/semantics/data_locations.py             |  9 +++
 vyper/semantics/types/base.py                 |  3 +
 vyper/semantics/types/function.py             | 15 ++--
 vyper/semantics/types/subscriptable.py        | 26 ++++--
 vyper/semantics/types/user.py                 |  7 +-
 vyper/semantics/types/utils.py                | 26 +++++-
 27 files changed, 196 insertions(+), 58 deletions(-)
 create mode 100644 tests/parser/exceptions/test_instantiation_exception.py
 rename vyper/{ => evm}/address_space.py (100%)
 create mode 100644 vyper/semantics/data_locations.py

diff --git a/tests/functional/semantics/types/test_type_from_annotation.py b/tests/functional/semantics/types/test_type_from_annotation.py
index 200d2bbcfc..16a31cc651 100644
--- a/tests/functional/semantics/types/test_type_from_annotation.py
+++ b/tests/functional/semantics/types/test_type_from_annotation.py
@@ -6,6 +6,7 @@
     StructureException,
     UndeclaredDefinition,
 )
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.types import PRIMITIVE_TYPES, HashMapT, SArrayT
 from vyper.semantics.types.utils import type_from_annotation
 
@@ -14,7 +15,8 @@
 
 
 @pytest.mark.parametrize("type_str", BASE_TYPES)
-def test_base_types(build_node, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_base_types(build_node, type_str, location):
     node = build_node(type_str)
     base_t = PRIMITIVE_TYPES[type_str]
 
@@ -24,7 +26,8 @@ def test_base_types(build_node, type_str):
 
 
 @pytest.mark.parametrize("type_str", BYTESTRING_TYPES)
-def test_array_value_types(build_node, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_array_value_types(build_node, type_str, location):
     node = build_node(f"{type_str}[1]")
     base_t = PRIMITIVE_TYPES[type_str](1)
 
@@ -34,7 +37,8 @@ def test_array_value_types(build_node, type_str):
 
 
 @pytest.mark.parametrize("type_str", BASE_TYPES)
-def test_base_types_as_arrays(build_node, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_base_types_as_arrays(build_node, type_str, location):
     node = build_node(f"{type_str}[3]")
     base_t = PRIMITIVE_TYPES[type_str]
 
@@ -44,7 +48,8 @@ def test_base_types_as_arrays(build_node, type_str):
 
 
 @pytest.mark.parametrize("type_str", BYTESTRING_TYPES)
-def test_array_value_types_as_arrays(build_node, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_array_value_types_as_arrays(build_node, type_str, location):
     node = build_node(f"{type_str}[1][1]")
 
     with pytest.raises(StructureException):
@@ -52,7 +57,8 @@ def test_array_value_types_as_arrays(build_node, type_str):
 
 
 @pytest.mark.parametrize("type_str", BASE_TYPES)
-def test_base_types_as_multidimensional_arrays(build_node, namespace, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_base_types_as_multidimensional_arrays(build_node, namespace, type_str, location):
     node = build_node(f"{type_str}[3][5]")
     base_t = PRIMITIVE_TYPES[type_str]
 
@@ -63,7 +69,8 @@ def test_base_types_as_multidimensional_arrays(build_node, namespace, type_str):
 
 @pytest.mark.parametrize("type_str", ["int128", "String"])
 @pytest.mark.parametrize("idx", ["0", "-1", "0x00", "'1'", "foo", "[1]", "(1,)"])
-def test_invalid_index(build_node, idx, type_str):
+@pytest.mark.parametrize("location", iter(DataLocation))
+def test_invalid_index(build_node, idx, type_str, location):
     node = build_node(f"{type_str}[{idx}]")
     with pytest.raises(
         (ArrayIndexException, InvalidType, StructureException, UndeclaredDefinition)
@@ -77,7 +84,7 @@ def test_mapping(build_node, type_str, type_str2):
     node = build_node(f"HashMap[{type_str}, {type_str2}]")
     types = PRIMITIVE_TYPES
 
-    ann_t = type_from_annotation(node)
+    ann_t = type_from_annotation(node, DataLocation.STORAGE)
 
     k_t = types[type_str]
     v_t = types[type_str2]
@@ -91,7 +98,7 @@ def test_multidimensional_mapping(build_node, type_str, type_str2):
     node = build_node(f"HashMap[{type_str}, HashMap[{type_str}, {type_str2}]]")
     types = PRIMITIVE_TYPES
 
-    ann_t = type_from_annotation(node)
+    ann_t = type_from_annotation(node, DataLocation.STORAGE)
 
     k_t = types[type_str]
     v_t = types[type_str2]
diff --git a/tests/parser/exceptions/test_instantiation_exception.py b/tests/parser/exceptions/test_instantiation_exception.py
new file mode 100644
index 0000000000..0d641f154a
--- /dev/null
+++ b/tests/parser/exceptions/test_instantiation_exception.py
@@ -0,0 +1,81 @@
+import pytest
+
+from vyper.exceptions import InstantiationException
+
+invalid_list = [
+    """
+event Foo:
+    a: uint256
+
+@external
+def foo() -> Foo:
+    return Foo(2)
+    """,
+    """
+event Foo:
+    a: uint256
+
+@external
+def foo() -> (uint256, Foo):
+    return 1, Foo(2)
+    """,
+    """
+a: HashMap[uint256, uint256]
+
+@external
+def foo() -> HashMap[uint256, uint256]:
+    return self.a
+    """,
+    """
+event Foo:
+    a: uint256
+
+@external
+def foo(x: Foo):
+    pass
+    """,
+    """
+@external
+def foo(x: HashMap[uint256, uint256]):
+    pass
+    """,
+    """
+event Foo:
+    a: uint256
+
+foo: Foo
+    """,
+    """
+event Foo:
+    a: uint256
+
+@external
+def foo():
+    f: Foo = Foo(1)
+    pass
+    """,
+    """
+event Foo:
+    a: uint256
+
+b: HashMap[uint256, Foo]
+    """,
+    """
+event Foo:
+    a: uint256
+
+b: HashMap[Foo, uint256]
+    """,
+    """
+b: immutable(HashMap[uint256, uint256])
+
+@external
+def __init__():
+    b = empty(HashMap[uint256, uint256])
+    """,
+]
+
+
+@pytest.mark.parametrize("bad_code", invalid_list)
+def test_instantiation_exception(bad_code, get_contract, assert_compile_failed):
+    assert_compile_failed(lambda: get_contract(bad_code), InstantiationException)
diff --git a/tests/parser/functions/test_empty.py b/tests/parser/functions/test_empty.py
index 20fd98f543..c10d03550a 100644
--- a/tests/parser/functions/test_empty.py
+++ b/tests/parser/functions/test_empty.py
@@ -1,6 +1,6 @@
 import pytest
 
-from vyper.exceptions import TypeMismatch
+from vyper.exceptions import InstantiationException, TypeMismatch
 
 
 @pytest.mark.parametrize(
@@ -711,4 +711,4 @@ def test():
     ],
 )
 def test_invalid_types(contract, get_contract, assert_compile_failed):
-    assert_compile_failed(lambda: get_contract(contract), TypeMismatch)
+    assert_compile_failed(lambda: get_contract(contract), InstantiationException)
diff --git a/tests/parser/syntax/test_structs.py b/tests/parser/syntax/test_structs.py
index 757c46c4b3..b30f7e6098 100644
--- a/tests/parser/syntax/test_structs.py
+++ b/tests/parser/syntax/test_structs.py
@@ -2,6 +2,7 @@
 
 from vyper import compiler
 from vyper.exceptions import (
+    InstantiationException,
     InvalidType,
     StructureException,
     TypeMismatch,
@@ -297,7 +298,7 @@ def foo():
     a: HashMap[int128, C]
     b: int128
     """,
-        StructureException,
+        InstantiationException,
     ),
     """
 struct C1:
@@ -429,6 +430,16 @@ def foo():
     """,
         StructureException,
     ),
+    (
+        """
+event Foo:
+    a: uint256
+
+struct Bar:
+    a: Foo
+    """,
+        InstantiationException,
+    ),
 ]
 
 
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 7733b3331f..bfe90bb669 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -5,7 +5,6 @@
 
 from vyper import ast as vy_ast
 from vyper.abi_types import ABI_Tuple
-from vyper.address_space import MEMORY, STORAGE
 from vyper.ast.validation import validate_call_args
 from vyper.codegen.abi_encoder import abi_encode
 from vyper.codegen.context import Context, VariableRecord
@@ -39,6 +38,7 @@
 from vyper.codegen.expr import Expr
 from vyper.codegen.ir_node import Encoding
 from vyper.codegen.keccak256_helper import keccak256_helper
+from vyper.evm.address_space import MEMORY, STORAGE
 from vyper.exceptions import (
     ArgumentException,
     CompilerPanic,
diff --git a/vyper/codegen/abi_encoder.py b/vyper/codegen/abi_encoder.py
index e76fbf2f64..66d61a9c16 100644
--- a/vyper/codegen/abi_encoder.py
+++ b/vyper/codegen/abi_encoder.py
@@ -1,4 +1,3 @@
-from vyper.address_space import MEMORY
 from vyper.codegen.core import (
     STORE,
     add_ofst,
@@ -9,6 +8,7 @@
     zero_pad,
 )
 from vyper.codegen.ir_node import IRnode
+from vyper.evm.address_space import MEMORY
 from vyper.exceptions import CompilerPanic
 from vyper.semantics.types import DArrayT, SArrayT, _BytestringT
 from vyper.semantics.types.shortcuts import UINT256_T
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index 2efba960de..cc9f9744f0 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -3,8 +3,8 @@
 from dataclasses import dataclass
 from typing import Any, Optional
 
-from vyper.address_space import MEMORY, AddrSpace
 from vyper.codegen.ir_node import Encoding
+from vyper.evm.address_space import MEMORY, AddrSpace
 from vyper.exceptions import CompilerPanic, StateAccessViolation
 from vyper.semantics.types import VyperType
 
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 1cc601413c..86fe19818c 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -1,6 +1,6 @@
 from vyper import ast as vy_ast
-from vyper.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE
 from vyper.codegen.ir_node import Encoding, IRnode
+from vyper.evm.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE
 from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StructureException, TypeCheckFailure, TypeMismatch
 from vyper.semantics.types import (
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 5f45f66f71..87293a4794 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -3,7 +3,6 @@
 
 import vyper.codegen.arithmetic as arithmetic
 from vyper import ast as vy_ast
-from vyper.address_space import DATA, IMMUTABLES, MEMORY, STORAGE
 from vyper.codegen import external_call, self_call
 from vyper.codegen.core import (
     clamp,
@@ -24,6 +23,7 @@
 )
 from vyper.codegen.ir_node import IRnode
 from vyper.codegen.keccak256_helper import keccak256_helper
+from vyper.evm.address_space import DATA, IMMUTABLES, MEMORY, STORAGE
 from vyper.evm.opcodes import version_check
 from vyper.exceptions import (
     CompilerPanic,
diff --git a/vyper/codegen/external_call.py b/vyper/codegen/external_call.py
index f99723f16d..88ea4b098e 100644
--- a/vyper/codegen/external_call.py
+++ b/vyper/codegen/external_call.py
@@ -1,7 +1,6 @@
 from dataclasses import dataclass
 
 import vyper.utils as util
-from vyper.address_space import MEMORY
 from vyper.codegen.abi_encoder import abi_encode
 from vyper.codegen.core import (
     _freshname,
@@ -17,6 +16,7 @@
     wrap_value_for_external_return,
 )
 from vyper.codegen.ir_node import Encoding, IRnode
+from vyper.evm.address_space import MEMORY
 from vyper.exceptions import TypeCheckFailure
 from vyper.semantics.types import InterfaceT, TupleT
 from vyper.semantics.types.function import StateMutability
diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index feb2973e2a..42ea11a035 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -1,7 +1,6 @@
 from typing import Any, List
 
 import vyper.utils as util
-from vyper.address_space import CALLDATA, DATA, MEMORY
 from vyper.ast.signatures.function_signature import FunctionSignature
 from vyper.codegen.abi_encoder import abi_encoding_matches_vyper
 from vyper.codegen.context import Context, VariableRecord
@@ -10,6 +9,7 @@
 from vyper.codegen.function_definitions.utils import get_nonreentrant_lock
 from vyper.codegen.ir_node import Encoding, IRnode
 from vyper.codegen.stmt import parse_body
+from vyper.evm.address_space import CALLDATA, DATA, MEMORY
 from vyper.semantics.types import TupleT
 
 
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index c2c127b9d5..1ba4122c66 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -3,8 +3,8 @@
 from functools import cached_property
 from typing import Any, List, Optional, Tuple, Union
 
-from vyper.address_space import AddrSpace
 from vyper.compiler.settings import VYPER_COLOR_OUTPUT
+from vyper.evm.address_space import AddrSpace
 from vyper.evm.opcodes import get_ir_opcodes
 from vyper.exceptions import CodegenPanic, CompilerPanic
 from vyper.semantics.types import VyperType
diff --git a/vyper/codegen/return_.py b/vyper/codegen/return_.py
index 1cd50075a1..4a39127a14 100644
--- a/vyper/codegen/return_.py
+++ b/vyper/codegen/return_.py
@@ -1,6 +1,5 @@
 from typing import Any, Optional
 
-from vyper.address_space import MEMORY
 from vyper.codegen.abi_encoder import abi_encode, abi_encoding_matches_vyper
 from vyper.codegen.context import Context
 from vyper.codegen.core import (
@@ -13,6 +12,7 @@
     wrap_value_for_external_return,
 )
 from vyper.codegen.ir_node import IRnode
+from vyper.evm.address_space import MEMORY
 
 Stmt = Any  # mypy kludge
 
diff --git a/vyper/codegen/self_call.py b/vyper/codegen/self_call.py
index 2669f99192..b5429ca255 100644
--- a/vyper/codegen/self_call.py
+++ b/vyper/codegen/self_call.py
@@ -1,6 +1,6 @@
-from vyper.address_space import MEMORY
 from vyper.codegen.core import _freshname, eval_once_check, make_setter
 from vyper.codegen.ir_node import IRnode, push_label_to_stack
+from vyper.evm.address_space import MEMORY
 from vyper.exceptions import StateAccessViolation, StructureException
 from vyper.semantics.types.subscriptable import TupleT
 
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index de9801a740..204e861184 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -1,7 +1,6 @@
 import vyper.codegen.events as events
 import vyper.utils as util
 from vyper import ast as vy_ast
-from vyper.address_space import MEMORY, STORAGE
 from vyper.builtins.functions import STMT_DISPATCH_TABLE
 from vyper.codegen import external_call, self_call
 from vyper.codegen.context import Constancy, Context
@@ -23,6 +22,7 @@
 )
 from vyper.codegen.expr import Expr
 from vyper.codegen.return_ import make_return_stmt
+from vyper.evm.address_space import MEMORY, STORAGE
 from vyper.exceptions import CompilerPanic, StructureException, TypeCheckFailure
 from vyper.semantics.types import DArrayT, MemberFunctionT
 from vyper.semantics.types.shortcuts import INT256_T, UINT256_T
diff --git a/vyper/address_space.py b/vyper/evm/address_space.py
similarity index 100%
rename from vyper/address_space.py
rename to vyper/evm/address_space.py
diff --git a/vyper/exceptions.py b/vyper/exceptions.py
index 9c4358a9ad..07d972c343 100644
--- a/vyper/exceptions.py
+++ b/vyper/exceptions.py
@@ -151,6 +151,10 @@ class StructureException(VyperException):
     """Invalid structure for parsable syntax."""
 
 
+class InstantiationException(StructureException):
+    """Variable or expression cannot be instantiated"""
+
+
 class VersionException(VyperException):
     """Version string is malformed or incompatible with this compiler version."""
 
diff --git a/vyper/semantics/README.md b/vyper/semantics/README.md
index 969f849838..1d81a0979b 100644
--- a/vyper/semantics/README.md
+++ b/vyper/semantics/README.md
@@ -27,6 +27,7 @@ Vyper abstract syntax tree (AST).
   * [`local.py`](analysis/local.py): Validates the local namespace of each function within a contract
   * [`module.py`](analysis/module.py): Validates the module namespace of a contract.
   * [`utils.py`](analysis/utils.py): Functions for comparing and validating types
+* [`data_locations.py`](data_locations.py): `DataLocation` object for type location information
 * [`environment.py`](environment.py): Environment variables and builtin constants
 * [`namespace.py`](namespace.py): `Namespace` object, a `dict` subclass representing the namespace of a contract
 
diff --git a/vyper/semantics/analysis/base.py b/vyper/semantics/analysis/base.py
index 27f04577af..5919c96686 100644
--- a/vyper/semantics/analysis/base.py
+++ b/vyper/semantics/analysis/base.py
@@ -9,6 +9,7 @@
     StateAccessViolation,
     VyperInternalException,
 )
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.types.base import VyperType
 
 
@@ -92,15 +93,6 @@ def from_abi(cls, abi_dict: Dict) -> "StateMutability":
         #       specifying a state mutability modifier at all. Do the same here.
 
 
-# TODO: move me to locations.py?
-class DataLocation(enum.Enum):
-    UNSET = 0
-    MEMORY = 1
-    STORAGE = 2
-    CALLDATA = 3
-    CODE = 4
-
-
 class DataPosition:
     _location: DataLocation
 
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index f9bd0db297..5de03d611b 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -19,7 +19,7 @@
     VyperException,
 )
 from vyper.semantics.analysis.annotation import StatementAnnotationVisitor
-from vyper.semantics.analysis.base import DataLocation, VarInfo
+from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.common import VyperNodeVisitorBase
 from vyper.semantics.analysis.utils import (
     get_common_types,
@@ -28,6 +28,7 @@
     get_possible_types_from_node,
     validate_expected_type,
 )
+from vyper.semantics.data_locations import DataLocation
 
 # TODO consolidate some of these imports
 from vyper.semantics.environment import CONSTANT_ENVIRONMENT_VARS, MUTABLE_ENVIRONMENT_VARS
@@ -232,7 +233,7 @@ def visit_AnnAssign(self, node):
                 "Memory variables must be declared with an initial value", node
             )
 
-        type_ = type_from_annotation(node.annotation)
+        type_ = type_from_annotation(node.annotation, DataLocation.MEMORY)
         validate_expected_type(node.value, type_)
 
         try:
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index 209b63e989..22ac8cecaf 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -18,7 +18,7 @@
     VariableDeclarationException,
     VyperException,
 )
-from vyper.semantics.analysis.base import DataLocation, VarInfo
+from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.common import VyperNodeVisitorBase
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
 from vyper.semantics.analysis.utils import (
@@ -26,6 +26,7 @@
     validate_expected_type,
     validate_unique_method_ids,
 )
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import Namespace, get_namespace
 from vyper.semantics.types import EnumT, EventT, InterfaceT, StructT
 from vyper.semantics.types.function import ContractFunctionT
@@ -196,7 +197,7 @@ def visit_VariableDecl(self, node):
             else DataLocation.STORAGE
         )
 
-        type_ = type_from_annotation(node.annotation)
+        type_ = type_from_annotation(node.annotation, data_loc)
         var_info = VarInfo(
             type_,
             decl_node=node,
diff --git a/vyper/semantics/data_locations.py b/vyper/semantics/data_locations.py
new file mode 100644
index 0000000000..0ec374e42f
--- /dev/null
+++ b/vyper/semantics/data_locations.py
@@ -0,0 +1,9 @@
+import enum
+
+
+class DataLocation(enum.Enum):
+    UNSET = 0
+    MEMORY = 1
+    STORAGE = 2
+    CALLDATA = 3
+    CODE = 4
diff --git a/vyper/semantics/types/base.py b/vyper/semantics/types/base.py
index 0ac4f7b06d..8a174566eb 100644
--- a/vyper/semantics/types/base.py
+++ b/vyper/semantics/types/base.py
@@ -40,6 +40,8 @@ class VyperType:
         If `True`, this type can be used as the base member for an array.
     _valid_literal : Tuple
         A tuple of Vyper ast classes that may be assigned this type.
+    _invalid_locations : Tuple
+        A tuple of invalid `DataLocation`s for this type
     _is_prim_word: bool, optional
         This is a word type like uint256, int8, bytesM or address
     """
@@ -47,6 +49,7 @@ class VyperType:
     _id: str
     _type_members: Optional[Dict] = None
     _valid_literal: Tuple = ()
+    _invalid_locations: Tuple = ()
     _is_prim_word: bool = False
     _equality_attrs: Optional[Tuple] = None
     _is_array_type: bool = False
diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index 75fa3a1214..9ec4506632 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -15,13 +15,9 @@
     StateAccessViolation,
     StructureException,
 )
-from vyper.semantics.analysis.base import (
-    DataLocation,
-    FunctionVisibility,
-    StateMutability,
-    StorageSlot,
-)
+from vyper.semantics.analysis.base import FunctionVisibility, StateMutability, StorageSlot
 from vyper.semantics.analysis.utils import check_kwargable, validate_expected_type
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import get_namespace
 from vyper.semantics.types.base import KwargSettings, VyperType
 from vyper.semantics.types.primitives import BoolT
@@ -297,7 +293,7 @@ def from_FunctionDef(
             if arg.annotation is None:
                 raise ArgumentException(f"Function argument '{arg.arg}' is missing a type", arg)
 
-            type_ = type_from_annotation(arg.annotation)
+            type_ = type_from_annotation(arg.annotation, DataLocation.CALLDATA)
 
             if value is not None:
                 if not check_kwargable(value):
@@ -316,7 +312,8 @@ def from_FunctionDef(
                 "Constructor may not have a return type", node.returns
             )
         elif isinstance(node.returns, (vy_ast.Name, vy_ast.Subscript, vy_ast.Tuple)):
-            return_type = type_from_annotation(node.returns)
+            # note: consider, for cleanliness, adding DataLocation.RETURN_VALUE
+            return_type = type_from_annotation(node.returns, DataLocation.MEMORY)
         else:
             raise InvalidType("Function return value must be a type name or tuple", node.returns)
 
@@ -350,7 +347,7 @@ def getter_from_VariableDecl(cls, node: vy_ast.VariableDecl) -> "ContractFunctio
         """
         if not node.is_public:
             raise CompilerPanic("getter generated for non-public function")
-        type_ = type_from_annotation(node.annotation)
+        type_ = type_from_annotation(node.annotation, DataLocation.STORAGE)
         arguments, return_type = type_.getter_signature
         args_dict: OrderedDict = OrderedDict()
         for item in arguments:
diff --git a/vyper/semantics/types/subscriptable.py b/vyper/semantics/types/subscriptable.py
index 85aa0b9064..6a2d3aae73 100644
--- a/vyper/semantics/types/subscriptable.py
+++ b/vyper/semantics/types/subscriptable.py
@@ -4,6 +4,7 @@
 from vyper import ast as vy_ast
 from vyper.abi_types import ABI_DynamicArray, ABI_StaticArray, ABI_Tuple, ABIType
 from vyper.exceptions import ArrayIndexException, InvalidType, StructureException
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.types.base import VyperType
 from vyper.semantics.types.primitives import IntegerT
 from vyper.semantics.types.shortcuts import UINT256_T
@@ -44,6 +45,14 @@ class HashMapT(_SubscriptableT):
 
     _equality_attrs = ("key_type", "value_type")
 
+    # disallow everything but storage
+    _invalid_locations = (
+        DataLocation.UNSET,
+        DataLocation.CALLDATA,
+        DataLocation.CODE,
+        DataLocation.MEMORY,
+    )
+
     def __repr__(self):
         return f"HashMap[{self.key_type}, {self.value_type}]"
 
@@ -73,15 +82,13 @@ def from_annotation(cls, node: Union[vy_ast.Name, vy_ast.Call, vy_ast.Subscript]
                 ),
                 node,
             )
-        # if location != DataLocation.STORAGE or is_immutable:
-        #    raise StructureException("HashMap can only be declared as a storage variable", node)
 
         k_ast, v_ast = node.slice.value.elements
-        key_type = type_from_annotation(k_ast)
+        key_type = type_from_annotation(k_ast, DataLocation.STORAGE)
         if not key_type._as_hashmap_key:
             raise InvalidType("can only use primitive types as HashMap key!", k_ast)
 
-        value_type = type_from_annotation(v_ast)
+        value_type = type_from_annotation(v_ast, DataLocation.STORAGE)
 
         return cls(key_type, value_type)
 
@@ -291,12 +298,19 @@ class TupleT(VyperType):
     """
     Tuple type definition.
 
-    This class is used to represent multiple return values from
-    functions.
+    This class is used to represent multiple return values from functions.
     """
 
     _equality_attrs = ("members",)
 
+    # note: docs say that tuples are not instantiable but they
+    # are in fact instantiable and the codegen works. if we
+    # wanted to be stricter in the typechecker, we could
+    # add _invalid_locations = everything but UNSET and RETURN_VALUE.
+    # (we would need to add a DataLocation.RETURN_VALUE in order for
+    # tuples to be instantiable as return values but not in memory).
+    # _invalid_locations = ...
+
     def __init__(self, member_types: Tuple[VyperType, ...]) -> None:
         super().__init__()
         self.member_types = member_types
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index 89af9b99c0..444f9256e7 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -17,6 +17,7 @@
 from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
 from vyper.semantics.analysis.utils import validate_expected_type, validate_unique_method_ids
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import get_namespace
 from vyper.semantics.types.base import VyperType
 from vyper.semantics.types.function import ContractFunctionT
@@ -153,6 +154,8 @@ class EventT(_UserType):
         Name of the event.
     """
 
+    _invalid_locations = tuple(iter(DataLocation))  # not instantiable in any location
+
     def __init__(self, name: str, arguments: dict, indexed: list) -> None:
         super().__init__(members=arguments)
         self.name = name
@@ -471,10 +474,6 @@ def __init__(self, _id, members, ast_def=None):
 
         self.ast_def = ast_def
 
-        for n, t in self.members.items():
-            if isinstance(t, HashMapT):
-                raise StructureException(f"Struct contains a mapping '{n}'", ast_def)
-
     @cached_property
     def name(self) -> str:
         # Alias for API compatibility with codegen
diff --git a/vyper/semantics/types/utils.py b/vyper/semantics/types/utils.py
index 1549684460..1187080ca9 100644
--- a/vyper/semantics/types/utils.py
+++ b/vyper/semantics/types/utils.py
@@ -1,8 +1,15 @@
 from typing import Dict
 
 from vyper import ast as vy_ast
-from vyper.exceptions import ArrayIndexException, InvalidType, StructureException, UnknownType
+from vyper.exceptions import (
+    ArrayIndexException,
+    InstantiationException,
+    InvalidType,
+    StructureException,
+    UnknownType,
+)
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
+from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import get_namespace
 from vyper.semantics.types.base import VyperType
 
@@ -60,9 +67,11 @@ def type_from_abi(abi_type: Dict) -> VyperType:
             raise UnknownType(f"ABI contains unknown type: {type_string}") from None
 
 
-def type_from_annotation(node: vy_ast.VyperNode) -> VyperType:
+def type_from_annotation(
+    node: vy_ast.VyperNode, location: DataLocation = DataLocation.UNSET
+) -> VyperType:
     """
-    Return a type object for the given AST node.
+    Return a type object for the given AST node after validating its location.
 
     Arguments
     ---------
@@ -74,6 +83,16 @@ def type_from_annotation(node: vy_ast.VyperNode) -> VyperType:
     VyperType
         Type definition object.
     """
+    typ_ = _type_from_annotation(node)
+
+    if location in typ_._invalid_locations:
+        location_str = "" if location is DataLocation.UNSET else f"in {location.name.lower()}"
+        raise InstantiationException(f"{typ_} is not instantiable {location_str}", node)
+
+    return typ_
+
+
+def _type_from_annotation(node: vy_ast.VyperNode) -> VyperType:
     namespace = get_namespace()
 
     def _failwith(type_name):
@@ -84,7 +103,6 @@ def _failwith(type_name):
 
     if isinstance(node, vy_ast.Tuple):
         tuple_t = namespace["$TupleT"]
-
         return tuple_t.from_annotation(node)
 
     if isinstance(node, vy_ast.Subscript):

From d9e376ca49977d39bf549201e0f7db42ddaa6358 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Mon, 8 May 2023 23:22:20 +0800
Subject: [PATCH 007/161] fix: string to bool conversion (#3391)

* add StringT to cases in _convert.py
* add tests
---
 tests/parser/functions/test_convert.py | 15 ++++++++++++++-
 vyper/builtins/_convert.py             |  2 +-
 2 files changed, 15 insertions(+), 2 deletions(-)

diff --git a/tests/parser/functions/test_convert.py b/tests/parser/functions/test_convert.py
index d6a72c66af..eb8449447c 100644
--- a/tests/parser/functions/test_convert.py
+++ b/tests/parser/functions/test_convert.py
@@ -22,7 +22,7 @@
 
 BASE_TYPES = set(IntegerT.all()) | set(BytesM_T.all()) | {DecimalT(), AddressT(), BoolT()}
 
-TEST_TYPES = BASE_TYPES | {BytesT(32)}
+TEST_TYPES = BASE_TYPES | {BytesT(32)} | {StringT(32)}
 
 ZERO_ADDRESS = "0x0000000000000000000000000000000000000000"
 
@@ -163,6 +163,17 @@ def _cases_for_Bytes(typ):
     # would not need this if we tested all Bytes[1]...Bytes[32] types.
     for i in range(32):
         ret.extend(_cases_for_bytes(BytesM_T(i + 1)))
+
+    ret.append(b"")
+    return uniq(ret)
+
+
+def _cases_for_String(typ):
+    ret = []
+    # would not need this if we tested all Bytes[1]...Bytes[32] types.
+    for i in range(32):
+        ret.extend([str(c, "utf-8") for c in _cases_for_bytes(BytesM_T(i + 1))])
+    ret.append("")
     return uniq(ret)
 
 
@@ -176,6 +187,8 @@ def interesting_cases_for_type(typ):
         return _cases_for_bytes(typ)
     if isinstance(typ, BytesT):
         return _cases_for_Bytes(typ)
+    if isinstance(typ, StringT):
+        return _cases_for_String(typ)
     if isinstance(typ, BoolT):
         return _cases_for_bool(typ)
     if isinstance(typ, AddressT):
diff --git a/vyper/builtins/_convert.py b/vyper/builtins/_convert.py
index 407a32f3e9..546207072a 100644
--- a/vyper/builtins/_convert.py
+++ b/vyper/builtins/_convert.py
@@ -267,7 +267,7 @@ def _literal_decimal(expr, arg_typ, out_typ):
 def to_bool(expr, arg, out_typ):
     _check_bytes(expr, arg, out_typ, 32)  # should we restrict to Bytes[1]?
 
-    if isinstance(arg.typ, BytesT):
+    if isinstance(arg.typ, _BytestringT):
         # no clamp. checks for any nonzero bytes.
         arg = _bytes_to_num(arg, out_typ, signed=False)
 

From eeccea9ce794f1c2183aed8ec5e7d6d43b58811e Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 9 May 2023 09:45:17 -0700
Subject: [PATCH 008/161] fix: metadata output (#3393)

`-f metadata` output was not working for some functions. this fixes the
issue and also checks that metadata output is successfully produced in
the `get_contract` fixture to avoid this in the future.
---
 tests/base_conftest.py   | 3 ++-
 vyper/compiler/output.py | 3 +--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index 4c3d0136bb..2b29a4a384 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -112,7 +112,8 @@ def w3(tester):
 def _get_contract(w3, source_code, no_optimize, *args, **kwargs):
     out = compiler.compile_code(
         source_code,
-        ["abi", "bytecode"],
+        # test that metadata gets generated
+        ["abi", "bytecode", "metadata"],
         interface_codes=kwargs.pop("interface_codes", None),
         no_optimize=no_optimize,
         evm_version=kwargs.pop("evm_version", None),
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 82e583c160..408cb9d239 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -130,8 +130,7 @@ def _to_dict(sig):
             # e.g. {"x": vy_ast.Int(..)} -> {"x": 1}
             ret["default_values"][k] = ret["default_values"][k].node_source_code
         ret["frame_info"] = vars(ret["frame_info"])
-        for k in ret["frame_info"]["frame_vars"].keys():
-            ret["frame_info"]["frame_vars"][k] = _var_rec_dict(ret["frame_info"]["frame_vars"][k])
+        del ret["frame_info"]["frame_vars"]  # frame_var.pos might be IR, cannot serialize
         return ret
 
     return {"function_info": {name: _to_dict(sig) for (name, sig) in sigs.items()}}

From 51e1316aef95e1567f5454ffb5f5ddb9e65b0b91 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 12:39:32 -0700
Subject: [PATCH 009/161] feat: add ternary operator (#3398)

add python's ternary `a if test else b` operator to vyper
---
 tests/parser/features/test_ternary.py  | 280 +++++++++++++++++++++++++
 tests/parser/syntax/test_ternary.py    | 138 ++++++++++++
 vyper/ast/grammar.lark                 |   3 +
 vyper/ast/nodes.py                     |   4 +
 vyper/ast/nodes.pyi                    |   5 +
 vyper/codegen/expr.py                  |  23 ++
 vyper/semantics/analysis/annotation.py |  13 +-
 vyper/semantics/analysis/local.py      |   5 +
 vyper/semantics/analysis/utils.py      |  11 +
 9 files changed, 481 insertions(+), 1 deletion(-)
 create mode 100644 tests/parser/features/test_ternary.py
 create mode 100644 tests/parser/syntax/test_ternary.py

diff --git a/tests/parser/features/test_ternary.py b/tests/parser/features/test_ternary.py
new file mode 100644
index 0000000000..c5480286c8
--- /dev/null
+++ b/tests/parser/features/test_ternary.py
@@ -0,0 +1,280 @@
+import pytest
+
+simple_cases = [
+    (
+        """
+@external
+def foo(t: bool, x: uint256, y: uint256) -> uint256:
+    return x if t else y
+    """,
+        (1, 2),
+    ),
+    (  # literal test
+        """
+@external
+def foo(_t: bool, x: uint256, y: uint256) -> uint256:
+    return x if {test} else y
+    """,
+        (1, 2),
+    ),
+    (  # literal body
+        """
+@external
+def foo(t: bool, _x: uint256, y: uint256) -> uint256:
+    return {x} if t else y
+    """,
+        (1, 2),
+    ),
+    (  # literal orelse
+        """
+@external
+def foo(t: bool, x: uint256, _y: uint256) -> uint256:
+    return x if t else {y}
+    """,
+        (1, 2),
+    ),
+    (  # literal body/orelse
+        """
+@external
+def foo(t: bool, _x: uint256, _y: uint256) -> uint256:
+    return {x} if t else {y}
+    """,
+        (1, 2),
+    ),
+    (  # literal everything
+        """
+@external
+def foo(_t: bool, _x: uint256, _y: uint256) -> uint256:
+    return {x} if {test} else {y}
+    """,
+        (1, 2),
+    ),
+    (  # body/orelse in storage and memory
+        """
+s: uint256
+@external
+def foo(t: bool, x: uint256, y: uint256) -> uint256:
+    self.s = x
+    return self.s if t else y
+    """,
+        (1, 2),
+    ),
+    (  # body/orelse in memory and storage
+        """
+s: uint256
+@external
+def foo(t: bool, x: uint256, y: uint256) -> uint256:
+    self.s = x
+    return self.s if t else y
+    """,
+        (1, 2),
+    ),
+    (  # body/orelse in memory and constant
+        """
+S: constant(uint256) = {y}
+@external
+def foo(t: bool, x: uint256, _y: uint256) -> uint256:
+    return x if t else S
+    """,
+        (1, 2),
+    ),
+    (  # dynarray
+        """
+@external
+def foo(t: bool, x: DynArray[uint256, 3], y: DynArray[uint256, 3]) -> DynArray[uint256, 3]:
+    return x if t else y
+    """,
+        ([], [1]),
+    ),
+    (  # variable + literal dynarray
+        """
+@external
+def foo(t: bool, x: DynArray[uint256, 3], _y: DynArray[uint256, 3]) -> DynArray[uint256, 3]:
+    return x if t else {y}
+    """,
+        ([], [1]),
+    ),
+    (  # literal + variable dynarray
+        """
+@external
+def foo(t: bool, _x: DynArray[uint256, 3], y: DynArray[uint256, 3]) -> DynArray[uint256, 3]:
+    return {x} if t else y
+    """,
+        ([], [1]),
+    ),
+    (  # storage dynarray
+        """
+s: DynArray[uint256, 3]
+@external
+def foo(t: bool, x: DynArray[uint256, 3], y: DynArray[uint256, 3]) -> DynArray[uint256, 3]:
+    self.s = y
+    return x if t else self.s
+    """,
+        ([], [1]),
+    ),
+    (  # static array
+        """
+@external
+def foo(t: bool, x: uint256[1], y: uint256[1]) -> uint256[1]:
+    return x if t else y
+    """,
+        ([2], [1]),
+    ),
+    (  # static array literal
+        """
+@external
+def foo(t: bool, x: uint256[1], _y: uint256[1]) -> uint256[1]:
+    return x if t else {y}
+    """,
+        ([2], [1]),
+    ),
+    (  # strings
+        """
+@external
+def foo(t: bool, x: String[10], y: String[10]) -> String[10]:
+    return x if t else y
+    """,
+        ("hello", "world"),
+    ),
+    (  # string literal
+        """
+@external
+def foo(t: bool, x: String[10], _y: String[10]) -> String[10]:
+    return x if t else {y}
+    """,
+        ("hello", "world"),
+    ),
+    (  # bytes
+        """
+@external
+def foo(t: bool, x: Bytes[10], y: Bytes[10]) -> Bytes[10]:
+    return x if t else y
+    """,
+        (b"hello", b"world"),
+    ),
+]
+
+
+@pytest.mark.parametrize("code,inputs", simple_cases)
+@pytest.mark.parametrize("test", [True, False])
+def test_ternary_simple(get_contract, code, test, inputs):
+    x, y = inputs
+    # note: repr to escape strings
+    code = code.format(test=test, x=repr(x), y=repr(y))
+    c = get_contract(code)
+    # careful with order of precedence of `assert` and `if/else` in python!
+    assert c.foo(test, x, y) == (x if test else y)
+
+
+tuple_codes = [
+    """
+@external
+def foo(t: bool, x: uint256, y: uint256) -> (uint256, uint256):
+    return (x, y) if t else (y, x)
+    """,
+    """
+s: uint256
+@external
+def foo(t: bool, x: uint256, y: uint256) -> (uint256, uint256):
+    self.s = x
+    return (self.s, y) if t else (y, self.s)
+    """,
+]
+
+
+@pytest.mark.parametrize("code", tuple_codes)
+@pytest.mark.parametrize("test", [True, False])
+def test_ternary_tuple(get_contract, code, test):
+    c = get_contract(code)
+
+    x, y = 1, 2
+    assert c.foo(test, x, y) == ([x, y] if test else [y, x])
+
+
+@pytest.mark.parametrize("test", [True, False])
+def test_ternary_immutable(get_contract, test):
+    code = """
+IMM: public(immutable(uint256))
+@external
+def __init__(test: bool):
+    IMM = 1 if test else 2
+    """
+    c = get_contract(code, test)
+
+    assert c.IMM() == (1 if test else 2)
+
+
+@pytest.mark.parametrize("test", [True, False])
+@pytest.mark.parametrize("x", list(range(8)))
+@pytest.mark.parametrize("y", list(range(8)))
+def test_complex_ternary_expression(get_contract, test, x, y):
+    code = """
+@external
+def foo(t: bool, x: uint256, y: uint256) -> uint256:
+    return (x * y) if (t and True) else (x + y + convert(t, uint256))
+    """
+    c = get_contract(code)
+
+    assert c.foo(test, x, y) == ((x * y) if (test and True) else (x + y + int(test)))
+
+
+@pytest.mark.parametrize("test", [True, False])
+@pytest.mark.parametrize("x", list(range(8)))
+@pytest.mark.parametrize("y", list(range(8)))
+def test_ternary_precedence(get_contract, test, x, y):
+    code = """
+@external
+def foo(t: bool, x: uint256, y: uint256) -> uint256:
+    return x * y if t else x + y + convert(t, uint256)
+    """
+    c = get_contract(code)
+
+    assert c.foo(test, x, y) == (x * y if test else x + y + int(test))
+
+
+@pytest.mark.parametrize("test1", [True, False])
+@pytest.mark.parametrize("test2", [True, False])
+def test_nested_ternary(get_contract, test1, test2):
+    code = """
+@external
+def foo(t1: bool, t2: bool, x: uint256, y: uint256, z: uint256) -> uint256:
+    return x if t1 else y if t2 else z
+    """
+    c = get_contract(code)
+
+    x, y, z = 1, 2, 3
+    assert c.foo(test1, test2, x, y, z) == (x if test1 else y if test2 else z)
+
+
+@pytest.mark.parametrize("test", [True, False])
+def test_ternary_side_effects(get_contract, test):
+    code = """
+track_taint_x: public(uint256)
+track_taint_y: public(uint256)
+foo_retval: public(uint256)
+
+@internal
+def x() -> uint256:
+    self.track_taint_x += 1
+    return 5
+
+@internal
+def y() -> uint256:
+    self.track_taint_y += 1
+    return 7
+
+@external
+def foo(t: bool):
+    self.foo_retval = self.x() if t else self.y()
+    """
+    c = get_contract(code)
+
+    c.foo(test, transact={})
+    assert c.foo_retval() == (5 if test else 7)
+
+    if test:
+        assert c.track_taint_x() == 1
+        assert c.track_taint_y() == 0
+    else:
+        assert c.track_taint_x() == 0
+        assert c.track_taint_y() == 1
diff --git a/tests/parser/syntax/test_ternary.py b/tests/parser/syntax/test_ternary.py
new file mode 100644
index 0000000000..11c06051d0
--- /dev/null
+++ b/tests/parser/syntax/test_ternary.py
@@ -0,0 +1,138 @@
+import pytest
+
+from vyper.compiler import compile_code
+from vyper.exceptions import InvalidType, TypeMismatch
+
+good_list = [
+    # basic test
+    """
+@external
+def foo(a: uint256, b: uint256) -> uint256:
+    return a if a > b else b
+    """,
+    # different locations:
+    """
+b: uint256
+
+@external
+def foo(x: uint256) -> uint256:
+    return x if x > self.b else self.b
+    """,
+    # different kinds of test exprs
+    """
+@external
+def foo(x: uint256, t: bool) -> uint256:
+    return x if t else 1
+    """,
+    """
+@external
+def foo(x: uint256) -> uint256:
+    return x if True else 1
+    """,
+    """
+@external
+def foo(x: uint256) -> uint256:
+    return x if False else 1
+    """,
+    # more complex types
+    """
+@external
+def foo(t: bool) -> DynArray[uint256, 1]:
+    return [2] if t else [1]
+    """,
+    # TODO: get this working, depends #3377
+    #    """
+    # @external
+    # def foo(t: bool) -> DynArray[uint256, 1]:
+    #    return [] if t else [1]
+    #    """,
+    """
+@external
+def foo(t: bool) -> (uint256, uint256):
+    a: uint256 = 0
+    b: uint256 = 1
+    return (a, b) if t else (b, a)
+    """,
+]
+
+
+@pytest.mark.parametrize("code", good_list)
+def test_ternary_good(code):
+    assert compile_code(code) is not None
+
+
+fail_list = [
+    (  # bad test type
+        """
+@external
+def foo() -> uint256:
+    return 1 if 1 else 2
+    """,
+        InvalidType,
+    ),
+    (  # bad test type: constant
+        """
+TEST: constant(uint256) = 1
+@external
+def foo() -> uint256:
+    return 1 if TEST else 2
+    """,
+        InvalidType,
+    ),
+    (  # bad test type: variable
+        """
+TEST: constant(uint256) = 1
+@external
+def foo(t: uint256) -> uint256:
+    return 1 if t else 2
+    """,
+        TypeMismatch,
+    ),
+    (  # mismatched body and orelse: literal
+        """
+@external
+def foo() -> uint256:
+    return 1 if True else 2.0
+    """,
+        TypeMismatch,
+    ),
+    (  # mismatched body and orelse: literal and known type
+        """
+T: constant(uint256) = 1
+@external
+def foo() -> uint256:
+    return T if True else 2.0
+    """,
+        TypeMismatch,
+    ),
+    (  # mismatched body and orelse: both variable
+        """
+@external
+def foo(x: uint256, y: uint8) -> uint256:
+    return x if True else y
+    """,
+        TypeMismatch,
+    ),
+    (  # mismatched tuple types
+        """
+@external
+def foo(a: uint256, b: uint256, c: uint256) -> (uint256, uint256):
+    return (a, b) if True else (a, b, c)
+    """,
+        TypeMismatch,
+    ),
+    (  # mismatched tuple types - other direction
+        """
+@external
+def foo(a: uint256, b: uint256, c: uint256) -> (uint256, uint256):
+    return (a, b, c) if True else (a, b)
+    """,
+        TypeMismatch,
+    ),
+]
+
+
+@pytest.mark.parametrize("code,exc", fail_list)
+def test_functions_call_fail(code, exc):
+    with pytest.raises(exc):
+        compile_code(code)
diff --git a/vyper/ast/grammar.lark b/vyper/ast/grammar.lark
index cf15e13a8c..046dcc1f1a 100644
--- a/vyper/ast/grammar.lark
+++ b/vyper/ast/grammar.lark
@@ -174,10 +174,13 @@ loop_variable: NAME [":" NAME]
 loop_iterator: _expr
 for_stmt: "for" loop_variable "in" loop_iterator ":" body
 
+// ternary operator
+ternary: _expr "if" _expr "else" _expr
 
 // Expressions
 _expr: operation
      | dict
+     | ternary
 
 get_item: variable_access "[" _expr "]"
 get_attr: variable_access "." NAME
diff --git a/vyper/ast/nodes.py b/vyper/ast/nodes.py
index 5e6f8473a0..7bb0a6274d 100644
--- a/vyper/ast/nodes.py
+++ b/vyper/ast/nodes.py
@@ -1430,6 +1430,10 @@ class If(Stmt):
     __slots__ = ("test", "body", "orelse")
 
 
+class IfExp(ExprNode):
+    __slots__ = ("test", "body", "orelse")
+
+
 class For(Stmt):
     __slots__ = ("iter", "target", "body")
     _only_empty_fields = ("orelse",)
diff --git a/vyper/ast/nodes.pyi b/vyper/ast/nodes.pyi
index 93563516f3..d47e420d66 100644
--- a/vyper/ast/nodes.pyi
+++ b/vyper/ast/nodes.pyi
@@ -238,6 +238,11 @@ class If(VyperNode):
     body: list = ...
     orelse: list = ...
 
+class IfExp(ExprNode):
+    test: ExprNode = ...
+    body: ExprNode = ...
+    orelse: ExprNode = ...
+
 class For(VyperNode): ...
 class Break(VyperNode): ...
 class Continue(VyperNode): ...
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 87293a4794..506a2694fb 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -701,6 +701,29 @@ def parse_Tuple(self):
         multi_ir = IRnode.from_list(["multi"] + tuple_elements, typ=typ)
         return multi_ir
 
+    def parse_IfExp(self):
+        test = Expr.parse_value_expr(self.expr.test, self.context)
+        assert test.typ == BoolT()  # sanity check
+
+        body = Expr(self.expr.body, self.context).ir_node
+        orelse = Expr(self.expr.orelse, self.context).ir_node
+
+        # if they are in the same location, we can skip copying
+        # into memory. also for the case where either body or orelse are
+        # literal `multi` values (ex. for tuple or arrays), copy to
+        # memory (to avoid crashing in make_setter, XXX fixme).
+        if body.location != orelse.location or body.value == "multi":
+            body = ensure_in_memory(body, self.context)
+            orelse = ensure_in_memory(orelse, self.context)
+
+        assert body.location == orelse.location
+        # check this once compare_type has no side effects:
+        # assert body.typ.compare_type(orelse.typ)
+
+        typ = self.expr._metadata["type"]
+        location = body.location
+        return IRnode.from_list(["if", test, body, orelse], typ=typ, location=location)
+
     @staticmethod
     def struct_literals(expr, name, context):
         member_subs = {}
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index 3d2397f30d..a14c0b9783 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -5,7 +5,7 @@
     get_exact_type_from_node,
     get_possible_types_from_node,
 )
-from vyper.semantics.types import TYPE_T, EnumT, EventT, SArrayT, StructT, is_type_t
+from vyper.semantics.types import TYPE_T, BoolT, EnumT, EventT, SArrayT, StructT, is_type_t
 from vyper.semantics.types.function import ContractFunctionT, MemberFunctionT
 
 
@@ -258,3 +258,14 @@ def visit_UnaryOp(self, node, type_):
                 type_ = type_.pop()
         node._metadata["type"] = type_
         self.visit(node.operand, type_)
+
+    def visit_IfExp(self, node, type_):
+        if type_ is None:
+            ts = get_common_types(node.body, node.orelse)
+            if len(type_) == 1:
+                type_ = ts.pop()
+
+        node._metadata["type"] = type_
+        self.visit(node.test, BoolT())
+        self.visit(node.body, type_)
+        self.visit(node.orelse, type_)
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index 5de03d611b..23ccc216a6 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -596,3 +596,8 @@ def visit_Tuple(self, node: vy_ast.Tuple) -> None:
 
     def visit_UnaryOp(self, node: vy_ast.UnaryOp) -> None:
         self.visit(node.operand)  # type: ignore[attr-defined]
+
+    def visit_IfExp(self, node: vy_ast.IfExp) -> None:
+        self.visit(node.test)
+        self.visit(node.body)
+        self.visit(node.orelse)
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index 7aaf9647c4..f50f3243c8 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -363,6 +363,17 @@ def types_from_UnaryOp(self, node):
         types_list = self.get_possible_types_from_node(node.operand)
         return _validate_op(node, types_list, "validate_numeric_op")
 
+    def types_from_IfExp(self, node):
+        validate_expected_type(node.test, BoolT())
+        types_list = get_common_types(node.body, node.orelse)
+
+        if not types_list:
+            a = get_possible_types_from_node(node.body)[0]
+            b = get_possible_types_from_node(node.orelse)[0]
+            raise TypeMismatch(f"Dislike types: {a} and {b}", node)
+
+        return types_list
+
 
 def _is_empty_list(node):
     # Checks if a node is a `List` node with an empty list for `elements`,

From 92c32f8e61677f7bbd6fd95ada0b7a45da594513 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 13:20:05 -0700
Subject: [PATCH 010/161] docs: `unique_symbol` in IR (#3399)

---
 vyper/ir/README.md | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/vyper/ir/README.md b/vyper/ir/README.md
index 50e61ce81f..ebcc381590 100644
--- a/vyper/ir/README.md
+++ b/vyper/ir/README.md
@@ -194,6 +194,10 @@ Could compile to:
 _sym_foo JUMPDEST
 ```
 
+### UNIQUE\_SYMBOL
+
+`(unique_symbol l)` defines a "unique symbol". These are generated to help catch front-end bugs involving multiple execution of side-effects (which should be only executed once). They can be ignored, or to be strict, any backend should enforce that each `unique_symbol` only appears one time in the code.
+
 ### IF\_STMT
 
 Branching statements. There are two forms, if with a single branch, and if with two branches.

From 4f8289a81206f767df1900ac48f485d90fc87edb Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 13:30:00 -0700
Subject: [PATCH 011/161] Merge pull request from GHSA-3p37-3636-q8wv

in dynarray_make_setter, the length is copied before the data. when the
dst and src arrays do not overlap, this is not a problem. however, when
the dst and src are the same dynarray, this can lead to a
store-before-load, leading any array bounds checks on the right hand
side to function incorrectly. here is an example:

```vyper
@external
def should_revert() -> DynArray[uint256,3]:
    a: DynArray[uint256, 3] = [1, 2, 3]
    a = empty(DynArray[uint256, 3])
    a = [self.a[0], self.a[1], self.a[2]]
    return a  # if bug: returns [1,2,3]
```

this commit moves the length store to after the data copy in
dynarray_make_setter. for hygiene, it also moves the length store to
after the data copy in several other routines. I left pop_dyn_array()
unchanged, because moving the routine does not actually perform any data
copy, it just writes the new length (and optionally returns a pointer to
the popped item).
---
 tests/parser/types/test_dynamic_array.py | 92 ++++++++++++++++++++++++
 vyper/codegen/core.py                    | 46 ++++++++----
 2 files changed, 123 insertions(+), 15 deletions(-)

diff --git a/tests/parser/types/test_dynamic_array.py b/tests/parser/types/test_dynamic_array.py
index 04c0688245..cb55c42870 100644
--- a/tests/parser/types/test_dynamic_array.py
+++ b/tests/parser/types/test_dynamic_array.py
@@ -1748,3 +1748,95 @@ def foo(i: uint256) -> {return_type}:
     return MY_CONSTANT[i]
     """
     assert_compile_failed(lambda: get_contract(code), TypeMismatch)
+
+
+dynarray_length_no_clobber_cases = [
+    # GHSA-3p37-3636-q8wv cases
+    """
+a: DynArray[uint256,3]
+
+@external
+def should_revert() -> DynArray[uint256,3]:
+    self.a = [1,2,3]
+    self.a = empty(DynArray[uint256,3])
+    self.a = [self.a[0], self.a[1], self.a[2]]
+
+    return self.a  # if bug: returns [1,2,3]
+    """,
+    """
+@external
+def should_revert() -> DynArray[uint256,3]:
+    self.a()
+    return self.b() # if bug: returns [1,2,3]
+
+@internal
+def a():
+    a: uint256 = 0
+    b: uint256 = 1
+    c: uint256 = 2
+    d: uint256 = 3
+
+@internal
+def b() -> DynArray[uint256,3]:
+    a: DynArray[uint256,3] = empty(DynArray[uint256,3])
+    a = [a[0],a[1],a[2]]
+    return a
+    """,
+    """
+a: DynArray[uint256,4]
+
+@external
+def should_revert() -> DynArray[uint256,4]:
+    self.a = [1,2,3]
+    self.a = empty(DynArray[uint256,4])
+    self.a = [4, self.a[0]]
+
+    return self.a  # if bug: return [4, 4]
+    """,
+    """
+@external
+def should_revert() -> DynArray[uint256,4]:
+    a: DynArray[uint256, 4] = [1,2,3]
+    a = []
+
+    a = [a.pop()]  # if bug: return [1]
+
+    return a
+    """,
+    """
+@external
+def should_revert():
+    c: DynArray[uint256, 1] = []
+    c.append(c[0])
+    """,
+    """
+@external
+def should_revert():
+    c: DynArray[uint256, 1] = [1]
+    c[0] = c.pop()
+    """,
+    """
+@external
+def should_revert():
+    c: DynArray[DynArray[uint256, 1], 2] = [[]]
+    c[0] = c.pop()
+    """,
+    """
+a: DynArray[String[65],2]
+
+@external
+def should_revert() -> DynArray[String[65], 2]:
+    self.a = ["hello", "world"]
+    self.a = []
+    self.a = [self.a[0], self.a[1]]
+
+    return self.a  # if bug: return ["hello", "world"]
+    """,
+]
+
+
+@pytest.mark.parametrize("code", dynarray_length_no_clobber_cases)
+def test_dynarray_length_no_clobber(get_contract, assert_tx_failed, code):
+    # check that length is not clobbered before dynarray data copy happens
+    c = get_contract(code)
+    assert_tx_failed(lambda: c.should_revert())
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 86fe19818c..a9a91ec9d8 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -117,13 +117,15 @@ def make_byte_array_copier(dst, src):
             max_bytes = src.typ.maxlen
 
             ret = ["seq"]
+
+            dst_ = bytes_data_ptr(dst)
+            src_ = bytes_data_ptr(src)
+
+            ret.append(copy_bytes(dst_, src_, len_, max_bytes))
+
             # store length
             ret.append(STORE(dst, len_))
 
-            dst = bytes_data_ptr(dst)
-            src = bytes_data_ptr(src)
-
-            ret.append(copy_bytes(dst, src, len_, max_bytes))
             return b1.resolve(b2.resolve(ret))
 
 
@@ -148,25 +150,34 @@ def _dynarray_make_setter(dst, src):
     if src.value == "~empty":
         return IRnode.from_list(STORE(dst, 0))
 
+    # copy contents of src dynarray to dst.
+    # note that in case src and dst refer to the same dynarray,
+    # in order for get_element_ptr oob checks on the src dynarray
+    # to work, we need to wait until after the data is copied
+    # before we clobber the length word.
+
     if src.value == "multi":
         ret = ["seq"]
         # handle literals
 
-        # write the length word
-        store_length = STORE(dst, len(src.args))
-        ann = None
-        if src.annotation is not None:
-            ann = f"len({src.annotation})"
-        store_length = IRnode.from_list(store_length, annotation=ann)
-        ret.append(store_length)
-
+        # copy each item
         n_items = len(src.args)
+
         for i in range(n_items):
             k = IRnode.from_list(i, typ=UINT256_T)
             dst_i = get_element_ptr(dst, k, array_bounds_check=False)
             src_i = get_element_ptr(src, k, array_bounds_check=False)
             ret.append(make_setter(dst_i, src_i))
 
+        # write the length word after data is copied
+        store_length = STORE(dst, n_items)
+        ann = None
+        if src.annotation is not None:
+            ann = f"len({src.annotation})"
+        store_length = IRnode.from_list(store_length, annotation=ann)
+
+        ret.append(store_length)
+
         return ret
 
     with src.cache_when_complex("darray_src") as (b1, src):
@@ -190,8 +201,6 @@ def _dynarray_make_setter(dst, src):
         with get_dyn_array_count(src).cache_when_complex("darray_count") as (b2, count):
             ret = ["seq"]
 
-            ret.append(STORE(dst, count))
-
             if should_loop:
                 i = IRnode.from_list(_freshname("copy_darray_ix"), typ=UINT256_T)
 
@@ -213,6 +222,9 @@ def _dynarray_make_setter(dst, src):
                 dst_ = dynarray_data_ptr(dst)
                 ret.append(copy_bytes(dst_, src_, n_bytes, max_bytes))
 
+            # write the length word after data is copied
+            ret.append(STORE(dst, count))
+
             return b1.resolve(b2.resolve(ret))
 
 
@@ -336,12 +348,14 @@ def append_dyn_array(darray_node, elem_node):
         with len_.cache_when_complex("old_darray_len") as (b2, len_):
             assertion = ["assert", ["lt", len_, darray_node.typ.count]]
             ret.append(IRnode.from_list(assertion, error_msg=f"{darray_node.typ} bounds check"))
-            ret.append(STORE(darray_node, ["add", len_, 1]))
             # NOTE: typechecks elem_node
             # NOTE skip array bounds check bc we already asserted len two lines up
             ret.append(
                 make_setter(get_element_ptr(darray_node, len_, array_bounds_check=False), elem_node)
             )
+
+            # store new length
+            ret.append(STORE(darray_node, ["add", len_, 1]))
             return IRnode.from_list(b1.resolve(b2.resolve(ret)))
 
 
@@ -354,6 +368,7 @@ def pop_dyn_array(darray_node, return_popped_item):
         new_len = IRnode.from_list(["sub", old_len, 1], typ=UINT256_T)
 
         with new_len.cache_when_complex("new_len") as (b2, new_len):
+            # store new length
             ret.append(STORE(darray_node, new_len))
 
             # NOTE skip array bounds check bc we already asserted len two lines up
@@ -364,6 +379,7 @@ def pop_dyn_array(darray_node, return_popped_item):
                 location = popped_item.location
             else:
                 typ, location = None, None
+
             return IRnode.from_list(b1.resolve(b2.resolve(ret)), typ=typ, location=location)
 
 

From 3de1415ee77a9244eb04bdb695e249d3ec9ed868 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 13:35:44 -0700
Subject: [PATCH 012/161] Merge pull request from GHSA-6r8q-pfpv-7cgj

for loops of the form `for i in range(x, x+N)`, the range of the
iterator is not checked, leading to potential overflow. the following
example demonstrates the potential for overflow:

```
@external
def test() -> uint16:
    x:uint8 = 255
    a:uint8 = 0
    for i in range(x, x+2):
        a = i
    return convert(a,uint16)  # returns 256
```

this commit fixes the issue by adding a range check before entering the
loop body.
---
 .../{test_repeater.py => test_for_range.py}   | 39 +++++++++++++++++++
 vyper/codegen/stmt.py                         |  3 ++
 2 files changed, 42 insertions(+)
 rename tests/parser/features/iteration/{test_repeater.py => test_for_range.py} (86%)

diff --git a/tests/parser/features/iteration/test_repeater.py b/tests/parser/features/iteration/test_for_range.py
similarity index 86%
rename from tests/parser/features/iteration/test_repeater.py
rename to tests/parser/features/iteration/test_for_range.py
index 3c95882d2d..30f4bb87e3 100644
--- a/tests/parser/features/iteration/test_repeater.py
+++ b/tests/parser/features/iteration/test_for_range.py
@@ -128,6 +128,45 @@ def foo(a: {typ}) -> {typ}:
     assert c.foo(100) == 31337
 
 
+# test that we can get to the upper range of an integer
+@pytest.mark.parametrize("typ", ["uint8", "int128", "uint256"])
+def test_for_range_edge(get_contract, typ):
+    code = f"""
+@external
+def test():
+    found: bool = False
+    x: {typ} = max_value({typ})
+    for i in range(x, x + 1):
+        if i == max_value({typ}):
+            found = True
+
+    assert found
+
+    found = False
+    x = max_value({typ}) - 1
+    for i in range(x, x + 2):
+        if i == max_value({typ}):
+            found = True
+
+    assert found
+    """
+    c = get_contract(code)
+    c.test()
+
+
+@pytest.mark.parametrize("typ", ["uint8", "int128", "uint256"])
+def test_for_range_oob_check(get_contract, assert_tx_failed, typ):
+    code = f"""
+@external
+def test():
+    x: {typ} = max_value({typ})
+    for i in range(x, x+2):
+        pass
+    """
+    c = get_contract(code)
+    assert_tx_failed(lambda: c.test())
+
+
 @pytest.mark.parametrize("typ", ["int128", "uint256"])
 def test_return_inside_nested_repeater(get_contract, typ):
     code = f"""
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 204e861184..01c1d5f121 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -10,6 +10,7 @@
     IRnode,
     append_dyn_array,
     check_assign,
+    clamp,
     dummy_node_for_type,
     get_dyn_array_count,
     get_element_ptr,
@@ -264,6 +265,8 @@ def _parse_For_range(self):
             arg1 = self.stmt.iter.args[1]
             rounds = self._get_range_const_value(arg1.right)
             start = Expr.parse_value_expr(arg0, self.context)
+            _, hi = start.typ.int_bounds
+            start = clamp("le", start, hi + 1 - rounds)
 
         r = rounds if isinstance(rounds, int) else rounds.value
         if r < 1:

From c3e68c302aa6e1429946473769dd1232145822ac Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 13:47:41 -0700
Subject: [PATCH 013/161] Merge pull request from GHSA-ph9x-4vc9-m39g

the routine for aligning call-site posargs and kwargs in
`vyper.codegen.context.lookup_internal_function` was incorrect in cases
where the internal function had more than one default argument - it
consumed default args at the call site from the end instead of the
beginning of the defaults list. this commit fixes and adds some tests
for the alignment routine.
---
 tests/parser/features/test_internal_call.py | 62 +++++++++++++++++++++
 vyper/codegen/context.py                    |  4 +-
 2 files changed, 63 insertions(+), 3 deletions(-)

diff --git a/tests/parser/features/test_internal_call.py b/tests/parser/features/test_internal_call.py
index f576dc5ee5..d7a41acbc0 100644
--- a/tests/parser/features/test_internal_call.py
+++ b/tests/parser/features/test_internal_call.py
@@ -1,6 +1,9 @@
+import string
 from decimal import Decimal
 
+import hypothesis.strategies as st
 import pytest
+from hypothesis import given, settings
 
 from vyper.compiler import compile_code
 from vyper.exceptions import ArgumentException, CallViolation
@@ -642,3 +645,62 @@ def bar() -> String[6]:
     c = get_contract_with_gas_estimation(contract)
 
     assert c.bar() == "hello"
+
+
+# TODO probably want to refactor these into general test utils
+st_uint256 = st.integers(min_value=0, max_value=2**256 - 1)
+st_string65 = st.text(max_size=65, alphabet=string.printable)
+st_bytes65 = st.binary(max_size=65)
+st_sarray3 = st.lists(st_uint256, min_size=3, max_size=3)
+st_darray3 = st.lists(st_uint256, max_size=3)
+
+internal_call_kwargs_cases = [
+    ("uint256", st_uint256),
+    ("String[65]", st_string65),
+    ("Bytes[65]", st_bytes65),
+    ("uint256[3]", st_sarray3),
+    ("DynArray[uint256, 3]", st_darray3),
+]
+
+
+@pytest.mark.parametrize("typ1,strategy1", internal_call_kwargs_cases)
+@pytest.mark.parametrize("typ2,strategy2", internal_call_kwargs_cases)
+def test_internal_call_kwargs(get_contract, typ1, strategy1, typ2, strategy2):
+    # GHSA-ph9x-4vc9-m39g
+
+    @given(kwarg1=strategy1, default1=strategy1, kwarg2=strategy2, default2=strategy2)
+    @settings(deadline=None, max_examples=5)  # len(cases) * len(cases) * 5 * 5
+    def fuzz(kwarg1, kwarg2, default1, default2):
+        code = f"""
+@internal
+def foo(a: {typ1} = {repr(default1)}, b: {typ2} = {repr(default2)}) -> ({typ1}, {typ2}):
+    return a, b
+
+@external
+def test0() -> ({typ1}, {typ2}):
+    return self.foo()
+
+@external
+def test1() -> ({typ1}, {typ2}):
+    return self.foo({repr(kwarg1)})
+
+@external
+def test2() -> ({typ1}, {typ2}):
+    return self.foo({repr(kwarg1)}, {repr(kwarg2)})
+
+@external
+def test3(x1: {typ1}) -> ({typ1}, {typ2}):
+    return self.foo(x1)
+
+@external
+def test4(x1: {typ1}, x2: {typ2}) -> ({typ1}, {typ2}):
+    return self.foo(x1, x2)
+        """
+        c = get_contract(code)
+        assert c.test0() == [default1, default2]
+        assert c.test1() == [kwarg1, default2]
+        assert c.test2() == [kwarg1, kwarg2]
+        assert c.test3(kwarg1) == [kwarg1, default2]
+        assert c.test4(kwarg1, kwarg2) == [kwarg1, kwarg2]
+
+    fuzz()
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index cc9f9744f0..9902cd0cf7 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -267,10 +267,8 @@ def _check(cond, s="Unreachable"):
         # _check(all(l.typ == r.typ for (l, r) in zip(args_ir, sig.args))
 
         num_provided_kwargs = len(args_ir) - len(sig.base_args)
-        num_kwargs = len(sig.default_args)
-        kwargs_needed = num_kwargs - num_provided_kwargs
 
-        kw_vals = list(sig.default_values.values())[:kwargs_needed]
+        kw_vals = list(sig.default_values.values())[num_provided_kwargs:]
 
         return sig, kw_vals
 

From 1703d8fcd652534c17aecd71e1d9d149c81ecffb Mon Sep 17 00:00:00 2001
From: Mikko Ohtamaa <mikko@redinnovation.com>
Date: Thu, 11 May 2023 22:58:16 +0200
Subject: [PATCH 014/161] docs: fix broken rst links (#3401)

---
 docs/resources.rst | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/docs/resources.rst b/docs/resources.rst
index 295a104fcf..7f0d0600a9 100644
--- a/docs/resources.rst
+++ b/docs/resources.rst
@@ -9,8 +9,8 @@ examples, courses and other learning material.
 General
 -------
 
--  `Ape Academy - Learn how to build vyper projects <https://academy.apeworx.io/> by ApeWorX`__
-- `More Vyper by Example <https://vyper-by-example.org/> by Smart Contract Engineer`__
+- `Ape Academy - Learn how to build vyper projects <https://academy.apeworx.io/>`__ by ApeWorX
+- `More Vyper by Example <https://vyper-by-example.org/>`__ by Smart Contract Engineer
 - `Vyper cheat Sheet <https://reference.auditless.com/cheatsheet>`__
 - `Vyper Hub for development <https://github.com/zcor/vyper-dev>`__
 - `Vyper greatest hits smart contract examples <https://github.com/pynchmeister/vyper-greatest-hits/tree/main/contracts>`__
@@ -44,4 +44,4 @@ Unmaintained
 These resources have not been updated for a while, but may still offer interesting content.
 
 - `Awesome Vyper curated resources <https://github.com/spadebuilders/awesome-vyper>`__
-- `Brownie - Python framework for developing smart contracts (deprecated) <https://eth-brownie.readthedocs.io/en/stable/>`__
\ No newline at end of file
+- `Brownie - Python framework for developing smart contracts (deprecated) <https://eth-brownie.readthedocs.io/en/stable/>`__

From 758d4282bb9f0c63333c7b6d07d8aada3d740b83 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 11 May 2023 16:53:10 -0700
Subject: [PATCH 015/161] chore: add `custom:` natspec tags (#3403)

per spec, `custom:my_custom_tag` is valid
---
 tests/ast/test_natspec.py | 2 ++
 vyper/ast/natspec.py      | 2 +-
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/tests/ast/test_natspec.py b/tests/ast/test_natspec.py
index 2e9980b8d7..c2133468aa 100644
--- a/tests/ast/test_natspec.py
+++ b/tests/ast/test_natspec.py
@@ -24,6 +24,7 @@ def doesEat(food: String[30], qty: uint256) -> bool:
     @param food The name of a food to evaluate (in English)
     @param qty The number of food items to evaluate
     @return True if Bugs will eat it, False otherwise
+    @custom:my-custom-tag hello, world!
     '''
     return True
 """
@@ -51,6 +52,7 @@ def doesEat(food: String[30], qty: uint256) -> bool:
                 "qty": "The number of food items to evaluate",
             },
             "returns": {"_0": "True if Bugs will eat it, False otherwise"},
+            "custom:my-custom-tag": "hello, world!",
         }
     },
     "title": "A simulator for Bug Bunny, the most famous Rabbit",
diff --git a/vyper/ast/natspec.py b/vyper/ast/natspec.py
index e6f0fcd00b..c25fc423f8 100644
--- a/vyper/ast/natspec.py
+++ b/vyper/ast/natspec.py
@@ -88,7 +88,7 @@ def _parse_docstring(
         tag, value = match.groups()
         err_args = (source, *line_no.offset_to_line(start + match.start(1)))
 
-        if tag not in SINGLE_FIELDS + PARAM_FIELDS:
+        if tag not in SINGLE_FIELDS + PARAM_FIELDS and not tag.startswith("custom:"):
             raise NatSpecSyntaxException(f"Unknown NatSpec field '@{tag}'", *err_args)
         if tag in invalid_fields:
             raise NatSpecSyntaxException(

From 99b65fb16f111f3044352c0a79814ea8bcd0d660 Mon Sep 17 00:00:00 2001
From: Pascal Marco Caversaccio <pcaversaccio@users.noreply.github.com>
Date: Fri, 12 May 2023 02:19:29 +0200
Subject: [PATCH 016/161] docs: add `custom` natspec tag to docs (#3404)

---
 docs/natspec.rst | 23 ++++++++++++-----------
 1 file changed, 12 insertions(+), 11 deletions(-)

diff --git a/docs/natspec.rst b/docs/natspec.rst
index b22650231a..a6c2d932e4 100644
--- a/docs/natspec.rst
+++ b/docs/natspec.rst
@@ -45,17 +45,18 @@ Tags
 
 All tags are optional. The following table explains the purpose of each NatSpec tag and where it may be used:
 
-============ ======================================== ==================
-Tag          Description                              Context
-============ ======================================== ==================
-``@title``   Title that describes the contract        contract
-``@license`` License of the contract                  contract
-``@author``  Name of the author                       contract, function
-``@notice``  Explain to an end user what this does    contract, function
-``@dev``     Explain to a developer any extra details contract, function
-``@param``   Documents a single parameter             function
-``@return``  Documents one or all return variable(s)  function
-============ ======================================== ==================
+=============== ============================================ ==================
+Tag             Description                                  Context
+=============== ============================================ ==================
+``@title``      Title that describes the contract            contract
+``@license``    License of the contract                      contract
+``@author``     Name of the author                           contract, function
+``@notice``     Explain to an end user what this does        contract, function
+``@dev``        Explain to a developer any extra details     contract, function
+``@param``      Documents a single parameter                 function
+``@return``     Documents one or all return variable(s)      function
+``@custom:...`` Custom tag, semantics is application-defined contract, function
+=============== ============================================ ==================
 
 Some rules / restrictions:
 

From c194ebf3c55b95593f9fa3ae8012495e754ae8a3 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sat, 13 May 2023 05:41:31 +0800
Subject: [PATCH 017/161] chore: add era compiler test suite to CI (#3394)

this commit adds the era compiler test suite to the CI, as they have
good test cases and coverage of our compiler through IR codegen.

this is intended as a diagnostic tool to help catch compiler regressions
and notify us when a change breaks downstream. as explained in the
comments in the workflow file, it is not intended as a CI blocker since
an update in our code could break downstream, and we do not want to wait
on downstream as a blocker.

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 .github/workflows/era-tester.yml | 97 ++++++++++++++++++++++++++++++++
 1 file changed, 97 insertions(+)
 create mode 100644 .github/workflows/era-tester.yml

diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
new file mode 100644
index 0000000000..ec0fee3bf1
--- /dev/null
+++ b/.github/workflows/era-tester.yml
@@ -0,0 +1,97 @@
+name: era compiler tester
+
+# run the matter labs compiler test to integrate their test cases
+# this is intended as a diagnostic / spot check to check that we
+# haven't seriously broken the compiler. but, it is not intended as
+# a requirement for merging since we may make changes to our IR
+# which break the downstream backend (at which point, downstream needs
+# to update, which we do not want to be blocked on).
+
+on: [push, pull_request]
+
+concurrency:
+  # cancel older, in-progress jobs from the same PR, same workflow.
+  # use run_id if the job is triggered by a push to ensure
+  # push-triggered jobs to not get canceled.
+  group: ${{ github.workflow }}-${{ github.head_ref || github.run_id }}
+  cancel-in-progress: true
+
+jobs:
+  era-compiler-tester:
+    runs-on: ubuntu-latest
+  
+    steps:
+    - name: Get latest commit hash
+      run: |
+        echo "ERA_HASH=$( curl -u "u:${{ github.token }}" https://api.github.com/repos/matter-labs/era-compiler-tester/git/ref/heads/main | jq .object.sha | tr -d '"' )" >> $GITHUB_ENV
+        echo "ERA_VYPER_HASH=$( curl -u "u:${{ github.token }}" https://api.github.com/repos/matter-labs/era-compiler-vyper/git/ref/heads/main | jq .object.sha | tr -d '"' )" >> $GITHUB_ENV
+
+    - name: Checkout
+      uses: actions/checkout@v1
+
+    - name: Rust setup
+      uses: actions-rs/toolchain@v1
+      with:
+        toolchain: nightly-2022-11-03
+
+    - name: Set up Python ${{ matrix.python-version[0] }}
+      uses: actions/setup-python@v4
+      with:
+        python-version: ${{ matrix.python-version[0] }}
+
+    - name: Get cache
+      id: cache
+      uses: actions/cache@v3
+      with:
+        path: |
+          ~/.cargo/bin/
+          ~/.cargo/registry/index/
+          ~/.cargo/registry/cache/
+          ~/.cargo/git/db/
+          **/target
+          **/target-llvm
+          **/compiler_tester
+          **/llvm
+          **/era-compiler-tester
+        key: ${{ runner.os }}-${{ env.ERA_HASH }}-${{ env.ERA_VYPER_HASH }}
+
+    - name: Initialize repository and install dependencies
+      if: steps.cache.outputs.cache-hit != 'true'
+      run: |
+        git clone --depth 1 https://github.com/matter-labs/era-compiler-tester.git
+        cd era-compiler-tester
+        sed -i 's/ssh:\/\/git@/https:\/\//g' .gitmodules
+        git submodule init
+        git submodule update
+        sudo apt install cmake ninja-build clang-13 lld-13 parallel pkg-config lld
+        cargo install compiler-llvm-builder
+        zkevm-llvm clone && zkevm-llvm build
+        cargo build --release
+
+    - name: Save cache
+      uses: actions/cache/save@v3
+      if: always()
+      with:
+        path: |
+          ~/.cargo/bin/
+          ~/.cargo/registry/index/
+          ~/.cargo/registry/cache/
+          ~/.cargo/git/db/
+          **/target
+          **/target-llvm
+          **/compiler_tester
+          **/llvm
+          **/era-compiler-tester
+        key: ${{ runner.os }}-${{ env.ERA_HASH }}-${{ env.ERA_VYPER_HASH }}
+
+    - name: Install Vyper
+      run: |
+        pip install .
+        mkdir era-compiler-tester/vyper-bin
+        echo $(which vyper)
+        cp $(which vyper) era-compiler-tester/vyper-bin/vyper-0.3.8
+
+    - name: Run tester
+      run: |
+        cd era-compiler-tester
+        cargo run --release --bin compiler-tester -- -v --path='tests/vyper/' --mode='M*B* 0.3.8'

From 89e3cdee6d2c8e646c1c506260fab6c37750faec Mon Sep 17 00:00:00 2001
From: Pascal Marco Caversaccio <pcaversaccio@users.noreply.github.com>
Date: Sat, 13 May 2023 00:24:30 +0200
Subject: [PATCH 018/161] docs: add docs for default parameters (#3405)

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 docs/control-structures.rst | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/docs/control-structures.rst b/docs/control-structures.rst
index a89f36f7cc..fc8a472ff6 100644
--- a/docs/control-structures.rst
+++ b/docs/control-structures.rst
@@ -36,8 +36,15 @@ External functions (marked with the ``@external`` decorator) are a part of the c
     def add_seven(a: int128) -> int128:
         return a + 7
 
+    @external
+    def add_seven_with_overloading(a: uint256, b: uint256 = 3):
+        return a + b
+
 A Vyper contract cannot call directly between two external functions. If you must do this, you can use an :ref:`interface <interfaces>`.
 
+.. note::
+    For external functions with default arguments like ``def my_function(x: uint256, b: uint256 = 1)`` the Vyper compiler will generate ``N+1`` overloaded function selectors based on ``N`` default arguments.
+
 .. _structure-functions-internal:
 
 Internal Functions
@@ -48,13 +55,15 @@ Internal functions (marked with the ``@internal`` decorator) are only accessible
 .. code-block:: python
 
     @internal
-    def _times_two(amount: uint256) -> uint256:
-        return amount * 2
+    def _times_two(amount: uint256, two: uint256 = 2) -> uint256:
+        return amount * two
 
     @external
     def calculate(amount: uint256) -> uint256:
         return self._times_two(amount)
 
+.. note::
+    Since calling an ``internal`` function is realized by jumping to its entry label, the internal function dispatcher ensures the correctness of the jumps. Please note that for ``internal`` functions which use more than one default parameter, Vyper versions ``>=0.3.8`` are strongly recommended due to the security advisory `GHSA-ph9x-4vc9-m39g <https://github.com/vyperlang/vyper/security/advisories/GHSA-ph9x-4vc9-m39g>`_.
 
 Mutability
 ----------

From e7ea7029f3c13f19020e7be68db21a8db24000b2 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sat, 13 May 2023 23:53:02 +0800
Subject: [PATCH 019/161] fix: relax namespace check for interface member
 arguments (#3351)

The first contract compiles but not the second. Both should compile
since interface functions are namespaced anyways.

```
a: constant(uint256)

interface A:
    def f(a: uint128): view
```
```
interface A:
    def f(a: uint256): view

a: constant(uint128) = 1
```
---
 tests/parser/syntax/test_interfaces.py | 14 ++++++++++++++
 vyper/semantics/types/function.py      |  5 -----
 2 files changed, 14 insertions(+), 5 deletions(-)

diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index c0afec5504..225c8945b2 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -248,6 +248,20 @@ def foo() -> uint256: view
 def __init__(x: uint256):
     foo = x
     """,
+    # no namespace collision of interface after storage variable
+    """
+a: constant(uint256) = 1
+
+interface A:
+    def f(a: uint128): view
+    """,
+    # no namespace collision of storage variable after interface
+    """
+interface A:
+    def f(a: uint256): view
+
+a: constant(uint128) = 1
+    """,
 ]
 
 
diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index 9ec4506632..bfcdf6349a 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -11,14 +11,12 @@
     CompilerPanic,
     FunctionDeclarationException,
     InvalidType,
-    NamespaceCollision,
     StateAccessViolation,
     StructureException,
 )
 from vyper.semantics.analysis.base import FunctionVisibility, StateMutability, StorageSlot
 from vyper.semantics.analysis.utils import check_kwargable, validate_expected_type
 from vyper.semantics.data_locations import DataLocation
-from vyper.semantics.namespace import get_namespace
 from vyper.semantics.types.base import KwargSettings, VyperType
 from vyper.semantics.types.primitives import BoolT
 from vyper.semantics.types.shortcuts import UINT256_T
@@ -279,7 +277,6 @@ def from_FunctionDef(
         min_arg_count = max_arg_count - len(node.args.defaults)
         defaults = [None] * min_arg_count + node.args.defaults
 
-        namespace = get_namespace()
         for arg, value in zip(node.args.args, defaults):
             if arg.arg in ("gas", "value", "skip_contract_check", "default_return_value"):
                 raise ArgumentException(
@@ -287,8 +284,6 @@ def from_FunctionDef(
                 )
             if arg.arg in arguments:
                 raise ArgumentException(f"Function contains multiple inputs named {arg.arg}", arg)
-            if arg.arg in namespace:
-                raise NamespaceCollision(arg.arg, arg)
 
             if arg.annotation is None:
                 raise ArgumentException(f"Function argument '{arg.arg}' is missing a type", arg)

From 5453a7fac74825d0997ab4ee15e3c53c7da213b4 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sun, 14 May 2023 00:38:59 +0800
Subject: [PATCH 020/161] fix: type inference for empty lists (#3377)

prior to this commit, this contract should compile but would throw:

```
@external
def foo():
    for i in [[], []]:
        pass
```

```
TypeError: _BytestringT.compare_type() missing 1 required positional argument: 'other'
```

the issue is that the possible types produced by `types_from_List` for
an empty list include type class objects (e.g. `BytesT`, `StringT`).
this would cause `get_common_types` to throw the above error in
downstream code when calling `compare_type()`. this commit fixes the
issue by providing the correct generic type acceptors instead of
uninstantiated class objects.

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/parser/syntax/test_list.py  |  6 ++++++
 vyper/semantics/analysis/utils.py | 16 +++++++++++++---
 2 files changed, 19 insertions(+), 3 deletions(-)

diff --git a/tests/parser/syntax/test_list.py b/tests/parser/syntax/test_list.py
index 6d941fa2df..3f81b911c8 100644
--- a/tests/parser/syntax/test_list.py
+++ b/tests/parser/syntax/test_list.py
@@ -302,6 +302,12 @@ def foo():
 def foo():
     self.b[0] = 7.0
     """,
+    """
+@external
+def foo():
+    for i in [[], []]:
+        pass
+    """,
 ]
 
 
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index f50f3243c8..368f590fe0 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -3,6 +3,7 @@
 
 from vyper import ast as vy_ast
 from vyper.exceptions import (
+    CompilerPanic,
     InvalidLiteral,
     InvalidOperation,
     InvalidReference,
@@ -306,11 +307,20 @@ def types_from_List(self, node):
         # literal array
         if _is_empty_list(node):
             # empty list literal `[]`
+            ret = []
             # subtype can be anything
-            types_list = types.PRIMITIVE_TYPES
-            # 1 is minimum possible length for dynarray, assignable to anything
-            ret = [DArrayT(t, 1) for t in types_list.values()]
+            for t in types.PRIMITIVE_TYPES.values():
+                # 1 is minimum possible length for dynarray,
+                # can be assigned to anything
+                if isinstance(t, VyperType):
+                    ret.append(DArrayT(t, 1))
+                elif isinstance(t, type) and issubclass(t, VyperType):
+                    # for typeclasses like bytestrings, use a generic type acceptor
+                    ret.append(DArrayT(t.any(), 1))
+                else:
+                    raise CompilerPanic("busted type {t}", node)
             return ret
+
         types_list = get_common_types(*node.elements)
 
         if len(types_list) > 0:

From 8c8124b4b9a513f10df7c996159ee0ee24c7a5f9 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sat, 13 May 2023 09:46:29 -0700
Subject: [PATCH 021/161] fix: type annotation of Subscript nodes (#3406)

the index type was being incorrectly annotated in the frontend in the
case where the index type was not uint256. this would lead to a panic
during codegen. an example which would lead to this bug is:

```vyper
@external
def foo(xs: uint256[5], ix: uint8):
    return xs[ix + 1]  # <-- panics with uint8 != uint256
```

this commit also improves the `VyperInternalException` class so it can
include a node for prettier traceback
---
 tests/base_conftest.py                 |  2 +-
 tests/parser/types/test_lists.py       | 17 +++++++++++++++++
 vyper/codegen/expr.py                  |  7 ++++---
 vyper/exceptions.py                    | 11 ++++++-----
 vyper/semantics/analysis/annotation.py |  7 ++++++-
 5 files changed, 34 insertions(+), 10 deletions(-)

diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index 2b29a4a384..febe8f74d3 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -31,7 +31,7 @@ def __prepared_function(self, *args, **kwargs):
                 if x.get("name") == self._function.function_identifier
             ].pop()
             # To make tests faster just supply some high gas value.
-            modifier_dict.update({"gas": fn_abi.get("gas", 0) + 50000})
+            modifier_dict.update({"gas": fn_abi.get("gas", 0) + 500000})
         elif len(kwargs) == 1:
             modifier, modifier_dict = kwargs.popitem()
             if modifier not in self.ALLOWED_MODIFIERS:
diff --git a/tests/parser/types/test_lists.py b/tests/parser/types/test_lists.py
index 0715eb3870..6819815959 100644
--- a/tests/parser/types/test_lists.py
+++ b/tests/parser/types/test_lists.py
@@ -745,6 +745,23 @@ def ix(i: uint256) -> address:
     assert_tx_failed(lambda: c.ix(len(some_good_address) + 1))
 
 
+def test_list_index_complex_expr(get_contract, assert_tx_failed):
+    # test subscripts where the index is not a literal
+    code = """
+@external
+def foo(xs: uint256[257], i: uint8) -> uint256:
+    return xs[i + 1]
+    """
+    c = get_contract(code)
+    xs = [i + 1 for i in range(257)]
+
+    for ix in range(255):
+        assert c.foo(xs, ix) == xs[ix + 1]
+
+    # safemath should fail for uint8: 255 + 1.
+    assert_tx_failed(lambda: c.foo(xs, 255))
+
+
 @pytest.mark.parametrize(
     "type,value",
     [
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 506a2694fb..dd764fbe20 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -75,11 +75,11 @@ def __init__(self, node, context):
 
         fn = getattr(self, f"parse_{type(node).__name__}", None)
         if fn is None:
-            raise TypeCheckFailure(f"Invalid statement node: {type(node).__name__}")
+            raise TypeCheckFailure(f"Invalid statement node: {type(node).__name__}", node)
 
         self.ir_node = fn()
         if self.ir_node is None:
-            raise TypeCheckFailure(f"{type(node).__name__} node did not produce IR. {self.expr}")
+            raise TypeCheckFailure(f"{type(node).__name__} node did not produce IR.", node)
 
         self.ir_node.annotation = self.expr.get("node_source_code")
         self.ir_node.source_pos = getpos(self.expr)
@@ -365,7 +365,8 @@ def parse_BinOp(self):
         if not isinstance(self.expr.op, (vy_ast.LShift, vy_ast.RShift)):
             # Sanity check - ensure that we aren't dealing with different types
             # This should be unreachable due to the type check pass
-            assert left.typ == right.typ, f"unreachable, {left.typ} != {right.typ}"
+            if left.typ != right.typ:
+                raise TypeCheckFailure(f"unreachable, {left.typ} != {right.typ}", self.expr)
 
         assert is_numeric_type(left.typ) or is_enum_type(left.typ)
 
diff --git a/vyper/exceptions.py b/vyper/exceptions.py
index 07d972c343..aa23614e85 100644
--- a/vyper/exceptions.py
+++ b/vyper/exceptions.py
@@ -22,7 +22,7 @@ def raise_if_not_empty(self):
             raise VyperException("\n\n".join(err_msg))
 
 
-class VyperException(Exception):
+class _BaseVyperException(Exception):
     """
     Base Vyper exception class.
 
@@ -125,6 +125,10 @@ def __str__(self):
         return f"{self.message}\n{annotation_msg}"
 
 
+class VyperException(_BaseVyperException):
+    pass
+
+
 class SyntaxException(VyperException):
 
     """Invalid syntax."""
@@ -285,7 +289,7 @@ class StaticAssertionException(VyperException):
     """An assertion is proven to fail at compile-time."""
 
 
-class VyperInternalException(Exception):
+class VyperInternalException(_BaseVyperException):
     """
     Base Vyper internal exception class.
 
@@ -296,9 +300,6 @@ class VyperInternalException(Exception):
     compiler has panicked, and that filing a bug report would be appropriate.
     """
 
-    def __init__(self, message=""):
-        self.message = message
-
     def __str__(self):
         return (
             f"{self.message}\n\nThis is an unhandled internal compiler error. "
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index a14c0b9783..2563c88ab4 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -238,7 +238,12 @@ def visit_Subscript(self, node, type_):
         else:
             base_type = get_exact_type_from_node(node.value)
 
-        self.visit(node.slice, base_type.key_type)
+        # get the correct type for the index, it might
+        # not be base_type.key_type
+        index_types = get_possible_types_from_node(node.slice.value)
+        index_type = index_types.pop()
+
+        self.visit(node.slice, index_type)
         self.visit(node.value, base_type)
 
     def visit_Tuple(self, node, type_):

From 97ff017c5e8d1aa5b0bcefbc93cc5cf9c131f71c Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sun, 14 May 2023 00:58:29 +0800
Subject: [PATCH 022/161] fix: indexing into literal list (#3378)

a regression was introduced in 046ea166d whereby the following contract
used to compile but now panics:
```
@external
def foo():
    f: uint256 = 1
    a:bool = 1 == [1,2,4][f] + -1
```
```
AssertionError: unreachable, uint256 != int8
```

the issue was that, previously, different integer types in vyper were
represented by different types in python. however, now all integer types
inherit from `IntegerT`. this commit fixes the issue by using the
correct (and hygienically appropriate) `type.compare_type(other)`,
instead of checking python-level type equality.

the lark grammar also needed to be changed to enable accessing a literal
list directly.

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/parser/types/test_lists.py       | 12 ++++++++++++
 vyper/ast/grammar.lark                 |  2 +-
 vyper/semantics/analysis/annotation.py |  8 ++++++--
 3 files changed, 19 insertions(+), 3 deletions(-)

diff --git a/tests/parser/types/test_lists.py b/tests/parser/types/test_lists.py
index 6819815959..832b679e5e 100644
--- a/tests/parser/types/test_lists.py
+++ b/tests/parser/types/test_lists.py
@@ -676,6 +676,18 @@ def ix(i: uint256) -> {type}:
     assert_tx_failed(lambda: c.ix(len(value) + 1))
 
 
+def test_nested_constant_list_accessor(get_contract):
+    code = """
+@external
+def foo() -> bool:
+    f: uint256 = 1
+    a: bool = 1 == [1,2,4][f] + -1
+    return a
+    """
+    c = get_contract(code)
+    assert c.foo() is True
+
+
 # Would be nice to put this somewhere accessible, like in vyper.types or something
 integer_types = ["uint8", "int128", "int256", "uint256"]
 
diff --git a/vyper/ast/grammar.lark b/vyper/ast/grammar.lark
index 046dcc1f1a..77806d734c 100644
--- a/vyper/ast/grammar.lark
+++ b/vyper/ast/grammar.lark
@@ -182,7 +182,7 @@ _expr: operation
      | dict
      | ternary
 
-get_item: variable_access "[" _expr "]"
+get_item: (variable_access | list) "[" _expr "]"
 get_attr: variable_access "." NAME
 call: variable_access "(" [arguments] ")"
 ?variable_access: NAME -> get_var
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index 2563c88ab4..4bbd77fdd4 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -1,5 +1,5 @@
 from vyper import ast as vy_ast
-from vyper.exceptions import StructureException
+from vyper.exceptions import StructureException, TypeCheckFailure
 from vyper.semantics.analysis.utils import (
     get_common_types,
     get_exact_type_from_node,
@@ -231,9 +231,13 @@ def visit_Subscript(self, node, type_):
 
             elif type_ is not None and len(possible_base_types) > 1:
                 for possible_type in possible_base_types:
-                    if isinstance(possible_type.value_type, type(type_)):
+                    if type_.compare_type(possible_type.value_type):
                         base_type = possible_type
                         break
+                else:
+                    # this should have been caught in
+                    # `get_possible_types_from_node` but wasn't.
+                    raise TypeCheckFailure(f"Expected {type_} but it is not a possible type", node)
 
         else:
             base_type = get_exact_type_from_node(node.value)

From 061219022c4b9e2deecc66cce3a842da425585b2 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Tue, 16 May 2023 01:40:53 +0800
Subject: [PATCH 023/161] fix: enforce namespace collisions between globals
 (#3352)

collisions between constants, immutables and storage variables were
dependent on declaration order; this commit fixes that.
---
 tests/parser/syntax/test_constants.py | 40 +++++++++++++++++++++++++++
 vyper/semantics/analysis/module.py    | 27 +++++++++---------
 2 files changed, 53 insertions(+), 14 deletions(-)

diff --git a/tests/parser/syntax/test_constants.py b/tests/parser/syntax/test_constants.py
index 15546672c6..ffd2f1faa0 100644
--- a/tests/parser/syntax/test_constants.py
+++ b/tests/parser/syntax/test_constants.py
@@ -69,6 +69,46 @@
         """
 VAL: constant(Bytes[4]) = b"t"
 VAL: uint256
+    """,
+        NamespaceCollision,
+    ),
+    # global with same type and name
+    (
+        """
+VAL: constant(uint256) = 1
+VAL: uint256
+    """,
+        NamespaceCollision,
+    ),
+    # global with same type and name, different order
+    (
+        """
+VAL: uint256
+VAL: constant(uint256) = 1
+    """,
+        NamespaceCollision,
+    ),
+    # global with same type and name
+    (
+        """
+VAL: immutable(uint256)
+VAL: uint256
+
+@external
+def __init__():
+    VAL = 1
+    """,
+        NamespaceCollision,
+    ),
+    # global with same type and name, different order
+    (
+        """
+VAL: uint256
+VAL: immutable(uint256)
+
+@external
+def __init__():
+    VAL = 1
     """,
         NamespaceCollision,
     ),
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index 22ac8cecaf..3907882e7a 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -226,6 +226,17 @@ def _finalize():
             except VyperException as exc:
                 raise exc.with_annotation(node) from None
 
+        def _validate_self_namespace():
+            # block globals if storage variable already exists
+            try:
+                if name in self.namespace["self"].typ.members:
+                    raise NamespaceCollision(
+                        f"Value '{name}' has already been declared", node
+                    ) from None
+                self.namespace[name] = var_info
+            except VyperException as exc:
+                raise exc.with_annotation(node) from None
+
         if node.is_constant:
             if not node.value:
                 raise VariableDeclarationException("Constant must be declared with a value", node)
@@ -233,10 +244,7 @@ def _finalize():
                 raise StateAccessViolation("Value must be a literal", node.value)
 
             validate_expected_type(node.value, type_)
-            try:
-                self.namespace[name] = var_info
-            except VyperException as exc:
-                raise exc.with_annotation(node) from None
+            _validate_self_namespace()
 
             return _finalize()
 
@@ -247,16 +255,7 @@ def _finalize():
             )
 
         if node.is_immutable:
-            try:
-                # block immutable if storage variable already exists
-                if name in self.namespace["self"].typ.members:
-                    raise NamespaceCollision(
-                        f"Value '{name}' has already been declared", node
-                    ) from None
-                self.namespace[name] = var_info
-            except VyperException as exc:
-                raise exc.with_annotation(node) from None
-
+            _validate_self_namespace()
             return _finalize()
 
         try:

From 8310f4a252a91d7631b2bdd200b55c9cf7be2205 Mon Sep 17 00:00:00 2001
From: Benny <benoitb@tutanota.de>
Date: Tue, 16 May 2023 04:07:43 +1000
Subject: [PATCH 024/161] chore: fix error message for undeclared variables in
 type annotation (#3215)

The exception is raised when trying to check whether the variable is a
storage variable by checking if its name is in
`self.namespace["self"].typ.members`. However this check can happen
before `self` is added to the namespace. When the constant variable is
referenced in a type annotation, the check will happen during folding
and before validation, so there will be no `self` key in namespace,
leading to the previous exception being raised.

A simple check on whether the key is present suffices to prevent this
exception from being raised and to instead raise another detailed
`UndeclaredDefinition` exception containing the undeclared variable's
name and line number of the error.

After this commit, compiling the following contract:
```vyper
PRECISIONS: constant(uint256[N_COINS]) = [
    1000000000000,
    10000000000,
    1,
]
N_COINS: constant(int128) = 3
```
Now raises the following exception:
```
vyper.exceptions.UndeclaredDefinition: 'N_COINS' has not been declared.
  contract "***.vy:1", line 1:29
  ---> 1 PRECISIONS: constant(uint256[N_COINS]) = [
  ------------------------------------^
       2     1000000000000,
```
---
 vyper/semantics/analysis/utils.py | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index 368f590fe0..26f3fd1827 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -334,7 +334,11 @@ def types_from_List(self, node):
     def types_from_Name(self, node):
         # variable name, e.g. `foo`
         name = node.id
-        if name not in self.namespace and name in self.namespace["self"].typ.members:
+        if (
+            name not in self.namespace
+            and "self" in self.namespace
+            and name in self.namespace["self"].typ.members
+        ):
             raise InvalidReference(
                 f"'{name}' is a storage variable, access it as self.{name}", node
             )

From 1c8349e867b2b3186c106b275d38f30cdb0ef342 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 15 May 2023 15:04:00 -0400
Subject: [PATCH 025/161] fix: assignment when rhs is complex type and
 references lhs (#3410)

prior to this commit, the following code would produce a
load-after-store bug:

```vyper
@external
def foo(xs: uint256[2]) -> uint256[2]:
    ys: uint256[2] = xs
    ys = [ys[1], ys[0]]  # <-- ys[1] gets written to ys[0] before ys[0] is read
    return ys  # returns [xs[1], xs[1]]
```

this commit checks that rhs and lhs do not overlap in `parse_Assign`. if
they do, copy rhs to a temporary buffer, then copy to the lhs. this
might not be the most efficient approach, but it is safe (and it's
relatively rare to see this case in user code).

note that this commit doesn't touch `make_setter` directly because it
would need access to the memory allocator (to allocate the temporary
buffer). this could result in the fix not working in other cases where
the arguments to `make_setter` overlap. i don't think there are any
cases of those, but if there were, they would need to be fixed on a case
by case basis.
---
 tests/parser/features/test_assignment.py | 60 ++++++++++++++++++++++++
 vyper/codegen/context.py                 |  3 ++
 vyper/codegen/expr.py                    | 14 ++++--
 vyper/codegen/ir_node.py                 | 10 ++++
 vyper/codegen/stmt.py                    | 23 +++++++--
 vyper/semantics/analysis/base.py         |  3 ++
 6 files changed, 106 insertions(+), 7 deletions(-)

diff --git a/tests/parser/features/test_assignment.py b/tests/parser/features/test_assignment.py
index 65fb3a7a0e..0dd63a0d09 100644
--- a/tests/parser/features/test_assignment.py
+++ b/tests/parser/features/test_assignment.py
@@ -255,3 +255,63 @@ def foo():
     ret : bool = self.bar()
 """
     assert_compile_failed(lambda: get_contract_with_gas_estimation(code), InvalidType)
+
+
+def test_assign_rhs_lhs_overlap(get_contract):
+    # GH issue 2418
+    code = """
+@external
+def bug(xs: uint256[2]) -> uint256[2]:
+    # Initial value
+    ys: uint256[2] = xs
+    ys = [ys[1], ys[0]]
+    return ys
+    """
+    c = get_contract(code)
+
+    assert c.bug([1, 2]) == [2, 1]
+
+
+def test_assign_rhs_lhs_partial_overlap(get_contract):
+    # GH issue 2418, generalize when lhs is not only dependency of rhs.
+    code = """
+@external
+def bug(xs: uint256[2]) -> uint256[2]:
+    # Initial value
+    ys: uint256[2] = xs
+    ys = [xs[1], ys[0]]
+    return ys
+    """
+    c = get_contract(code)
+
+    assert c.bug([1, 2]) == [2, 1]
+
+
+def test_assign_rhs_lhs_overlap_dynarray(get_contract):
+    # GH issue 2418, generalize to dynarrays
+    code = """
+@external
+def bug(xs: DynArray[uint256, 2]) -> DynArray[uint256, 2]:
+    ys: DynArray[uint256, 2] = xs
+    ys = [ys[1], ys[0]]
+    return ys
+    """
+    c = get_contract(code)
+    assert c.bug([1, 2]) == [2, 1]
+
+
+def test_assign_rhs_lhs_overlap_struct(get_contract):
+    # GH issue 2418, generalize to structs
+    code = """
+struct Point:
+    x: uint256
+    y: uint256
+
+@external
+def bug(p: Point) -> Point:
+    t: Point = p
+    t = Point({x: t.y, y: t.x})
+    return t
+    """
+    c = get_contract(code)
+    assert c.bug((1, 2)) == (2, 1)
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index 9902cd0cf7..696b81d124 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -30,6 +30,9 @@ class VariableRecord:
     is_immutable: bool = False
     data_offset: Optional[int] = None
 
+    def __hash__(self):
+        return hash(id(self))
+
     def __post_init__(self):
         if self.blockscopes is None:
             self.blockscopes = []
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index dd764fbe20..6da3d9501b 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -166,7 +166,7 @@ def parse_Name(self):
             return IRnode.from_list(["address"], typ=AddressT())
         elif self.expr.id in self.context.vars:
             var = self.context.vars[self.expr.id]
-            return IRnode.from_list(
+            ret = IRnode.from_list(
                 var.pos,
                 typ=var.typ,
                 location=var.location,  # either 'memory' or 'calldata' storage is handled above.
@@ -174,6 +174,8 @@ def parse_Name(self):
                 annotation=self.expr.id,
                 mutable=var.mutable,
             )
+            ret._referenced_variables = {var}
+            return ret
 
         # TODO: use self.expr._expr_info
         elif self.expr.id in self.context.globals:
@@ -189,9 +191,11 @@ def parse_Name(self):
                 mutable = False
                 location = DATA
 
-            return IRnode.from_list(
+            ret = IRnode.from_list(
                 ofst, typ=varinfo.typ, location=location, annotation=self.expr.id, mutable=mutable
             )
+            ret._referenced_variables = {varinfo}
+            return ret
 
     # x.y or x[5]
     def parse_Attribute(self):
@@ -255,12 +259,16 @@ def parse_Attribute(self):
         # self.x: global attribute
         elif isinstance(self.expr.value, vy_ast.Name) and self.expr.value.id == "self":
             varinfo = self.context.globals[self.expr.attr]
-            return IRnode.from_list(
+            ret = IRnode.from_list(
                 varinfo.position.position,
                 typ=varinfo.typ,
                 location=STORAGE,
                 annotation="self." + self.expr.attr,
             )
+            ret._referenced_variables = {varinfo}
+
+            return ret
+
         # Reserved keywords
         elif (
             isinstance(self.expr.value, vy_ast.Name) and self.expr.value.id in ENVIRONMENT_VARIABLES
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index 1ba4122c66..d36a18ec66 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -397,6 +397,16 @@ def cache_when_complex(self, name):
 
         return _WithBuilder(self, name, should_inline)
 
+    @cached_property
+    def referenced_variables(self):
+        ret = set()
+        for arg in self.args:
+            ret |= arg.referenced_variables
+
+        ret |= getattr(self, "_referenced_variables", set())
+
+        return ret
+
     @cached_property
     def contains_self_call(self):
         return getattr(self, "is_self_call", False) or any(x.contains_self_call for x in self.args)
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 01c1d5f121..e24c429638 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -73,11 +73,22 @@ def parse_AnnAssign(self):
 
     def parse_Assign(self):
         # Assignment (e.g. x[4] = y)
-        sub = Expr(self.stmt.value, self.context).ir_node
-        target = self._get_target(self.stmt.target)
+        src = Expr(self.stmt.value, self.context).ir_node
+        dst = self._get_target(self.stmt.target)
 
-        ir_node = make_setter(target, sub)
-        return ir_node
+        ret = ["seq"]
+        overlap = len(dst.referenced_variables & src.referenced_variables) > 0
+        if overlap and not dst.typ._is_prim_word:
+            # there is overlap between the lhs and rhs, and the type is
+            # complex - i.e., it spans multiple words. for safety, we
+            # copy to a temporary buffer before copying to the destination.
+            tmp = self.context.new_internal_variable(src.typ)
+            tmp = IRnode.from_list(tmp, typ=src.typ, location=MEMORY)
+            ret.append(make_setter(tmp, src))
+            src = tmp
+
+        ret.append(make_setter(dst, src))
+        return IRnode.from_list(ret)
 
     def parse_If(self):
         if self.stmt.orelse:
@@ -336,8 +347,12 @@ def _parse_For_list(self):
 
     def parse_AugAssign(self):
         target = self._get_target(self.stmt.target)
+
         sub = Expr.parse_value_expr(self.stmt.value, self.context)
         if not target.typ._is_prim_word:
+            # because of this check, we do not need to check for
+            # make_setter references lhs<->rhs as in parse_Assign -
+            # single word load/stores are atomic.
             return
 
         with target.cache_when_complex("_loc") as (b, target):
diff --git a/vyper/semantics/analysis/base.py b/vyper/semantics/analysis/base.py
index 5919c96686..5065131f29 100644
--- a/vyper/semantics/analysis/base.py
+++ b/vyper/semantics/analysis/base.py
@@ -165,6 +165,9 @@ class VarInfo:
     is_local_var: bool = False
     decl_node: Optional[vy_ast.VyperNode] = None
 
+    def __hash__(self):
+        return hash(id(self))
+
     def __post_init__(self):
         self._modification_count = 0
 

From c202c4e3ec884c6ddb28f738e45e8b9aa3d209b4 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 15 May 2023 15:06:20 -0400
Subject: [PATCH 026/161] fix: constructor context for internal functions
 (#3388)

this commit fixes two related issues with initcode generation:

- nested internal functions called from the constructor would cause a
  compiler panic
- internal functions called from the constructor would not read/write
  from the correct immutables space

the relevant examples reproducing each issue are in the tests. this
commit fixes the issue by

- not trying to traverse the call graph to figure out which internal
  functions to include in the initcode. instead, all internal functions
  are included, and we rely on the dead code eliminator to remove unused
  functions
- adding a "constructor" flag to the codegen, so we can distinguish
  between internal calls which are being generated to include in
  initcode or runtime code.
---
 tests/compiler/asm/test_asm_optimizer.py      | 49 +++++++++++
 .../semantics/analysis/test_for_loop.py       |  8 +-
 tests/parser/features/test_comparison.py      |  2 +-
 tests/parser/features/test_immutable.py       | 87 +++++++++++++++++++
 tests/parser/features/test_init.py            | 26 ++++++
 vyper/codegen/context.py                      |  4 +
 vyper/codegen/expr.py                         |  2 +-
 vyper/codegen/function_definitions/common.py  | 10 ++-
 vyper/codegen/module.py                       | 34 +++++---
 9 files changed, 203 insertions(+), 19 deletions(-)
 create mode 100644 tests/compiler/asm/test_asm_optimizer.py

diff --git a/tests/compiler/asm/test_asm_optimizer.py b/tests/compiler/asm/test_asm_optimizer.py
new file mode 100644
index 0000000000..524b8df064
--- /dev/null
+++ b/tests/compiler/asm/test_asm_optimizer.py
@@ -0,0 +1,49 @@
+from vyper.compiler.phases import CompilerData
+
+
+def test_dead_code_eliminator():
+    code = """
+s: uint256
+
+@internal
+def foo():
+    self.s = 1
+
+@internal
+def qux():
+    self.s = 2
+
+@external
+def bar():
+    self.foo()
+
+@external
+def __init__():
+    self.qux()
+    """
+
+    c = CompilerData(code, no_optimize=True)
+    initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
+    runtime_asm = c.assembly_runtime
+
+    foo_label = "_sym_internal_foo___"
+    qux_label = "_sym_internal_qux___"
+
+    # all the labels should be in all the unoptimized asms
+    for s in (foo_label, qux_label):
+        assert s in initcode_asm
+        assert s in runtime_asm
+
+    c = CompilerData(code, no_optimize=False)
+    initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
+    runtime_asm = c.assembly_runtime
+
+    # qux should not be in runtime code
+    for instr in runtime_asm:
+        if isinstance(instr, str):
+            assert not instr.startswith(qux_label), instr
+
+    # foo should not be in initcode asm
+    for instr in initcode_asm:
+        if isinstance(instr, str):
+            assert not instr.startswith(foo_label), instr
diff --git a/tests/functional/semantics/analysis/test_for_loop.py b/tests/functional/semantics/analysis/test_for_loop.py
index 71e38d253c..8707b4c326 100644
--- a/tests/functional/semantics/analysis/test_for_loop.py
+++ b/tests/functional/semantics/analysis/test_for_loop.py
@@ -108,14 +108,14 @@ def main():
     for j in range(3):
         x: uint256 = j
         y: uint16 = j
-    """,  # issue 3212
+    """,  # GH issue 3212
     """
 @external
 def foo():
     for i in [1]:
         a:uint256 = i
         b:uint16 = i
-    """,  # issue 3374
+    """,  # GH issue 3374
     """
 @external
 def foo():
@@ -123,7 +123,7 @@ def foo():
         for j in [1]:
             a:uint256 = i
         b:uint16 = i
-    """,  # issue 3374
+    """,  # GH issue 3374
     """
 @external
 def foo():
@@ -131,7 +131,7 @@ def foo():
         for j in [1,2,3]:
             b:uint256 = j + i
         c:uint16 = i
-    """,  # issue 3374
+    """,  # GH issue 3374
 ]
 
 
diff --git a/tests/parser/features/test_comparison.py b/tests/parser/features/test_comparison.py
index 1c2f287c10..5a86ffb4b8 100644
--- a/tests/parser/features/test_comparison.py
+++ b/tests/parser/features/test_comparison.py
@@ -4,7 +4,7 @@
 
 
 def test_3034_verbatim(get_contract):
-    # test issue #3034 exactly
+    # test GH issue 3034 exactly
     code = """
 @view
 @external
diff --git a/tests/parser/features/test_immutable.py b/tests/parser/features/test_immutable.py
index bb01b3fc07..488943f784 100644
--- a/tests/parser/features/test_immutable.py
+++ b/tests/parser/features/test_immutable.py
@@ -239,3 +239,90 @@ def get_immutable() -> uint256:
 
     c = get_contract(code, n)
     assert c.get_immutable() == n + 2
+
+
+# GH issue 3292
+def test_internal_functions_called_by_ctor_location(get_contract):
+    code = """
+d: uint256
+x: immutable(uint256)
+
+@external
+def __init__():
+    self.d = 1
+    x = 2
+    self.a()
+
+@external
+def test() -> uint256:
+    return self.d
+
+@internal
+def a():
+    self.d = x
+    """
+    c = get_contract(code)
+    assert c.test() == 2
+
+
+# GH issue 3292, extended to nested internal functions
+def test_nested_internal_function_immutables(get_contract):
+    code = """
+d: public(uint256)
+x: public(immutable(uint256))
+
+@external
+def __init__():
+    self.d = 1
+    x = 2
+    self.a()
+
+@internal
+def a():
+    self.b()
+
+@internal
+def b():
+    self.d = x
+    """
+    c = get_contract(code)
+    assert c.x() == 2
+    assert c.d() == 2
+
+
+# GH issue 3292, test immutable read from both ctor and runtime
+def test_immutable_read_ctor_and_runtime(get_contract):
+    code = """
+d: public(uint256)
+x: public(immutable(uint256))
+
+@external
+def __init__():
+    self.d = 1
+    x = 2
+    self.a()
+
+@internal
+def a():
+    self.d = x
+
+@external
+def thrash():
+    self.d += 5
+
+@external
+def fix():
+    self.a()
+    """
+    c = get_contract(code)
+    assert c.x() == 2
+    assert c.d() == 2
+
+    c.thrash(transact={})
+
+    assert c.x() == 2
+    assert c.d() == 2 + 5
+
+    c.fix(transact={})
+    assert c.x() == 2
+    assert c.d() == 2
diff --git a/tests/parser/features/test_init.py b/tests/parser/features/test_init.py
index feeabe311a..83bcbc95ea 100644
--- a/tests/parser/features/test_init.py
+++ b/tests/parser/features/test_init.py
@@ -53,3 +53,29 @@ def baz() -> uint8:
 
     n = 256
     assert_compile_failed(lambda: get_contract(code, n))
+
+
+# GH issue 3206
+def test_nested_internal_call_from_ctor(get_contract):
+    code = """
+x: uint256
+
+@external
+def __init__():
+    self.a()
+
+@internal
+def a():
+    self.x += 1
+    self.b()
+
+@internal
+def b():
+    self.x += 2
+
+@external
+def test() -> uint256:
+    return self.x
+    """
+    c = get_contract(code)
+    assert c.test() == 3
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index 696b81d124..34c409e16c 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -54,6 +54,7 @@ def __init__(
         forvars=None,
         constancy=Constancy.Mutable,
         sig=None,
+        is_ctor_context=False,
     ):
         # In-memory variables, in the form (name, memory location, type)
         self.vars = vars_ or {}
@@ -92,6 +93,9 @@ def __init__(
         self._internal_var_iter = 0
         self._scope_id_iter = 0
 
+        # either the constructor, or called from the constructor
+        self.is_ctor_context = is_ctor_context
+
     def is_constant(self):
         return self.constancy is Constancy.Constant or self.in_assertion or self.in_range_expr
 
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 6da3d9501b..9ed80b86f9 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -184,7 +184,7 @@ def parse_Name(self):
 
             ofst = varinfo.position.offset
 
-            if self.context.sig.is_init_func:
+            if self.context.is_ctor_context:
                 mutable = True
                 location = IMMUTABLES
             else:
diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index 6dece865fa..cd467a152e 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -18,6 +18,7 @@ def generate_ir_for_function(
     sigs: Dict[str, Dict[str, FunctionSignature]],  # all signatures in all namespaces
     global_ctx: GlobalContext,
     skip_nonpayable_check: bool,
+    is_ctor_context: bool = False,
 ) -> IRnode:
     """
     Parse a function and produce IR code for the function, includes:
@@ -51,6 +52,7 @@ def generate_ir_for_function(
         memory_allocator=memory_allocator,
         constancy=Constancy.Constant if sig.mutability in ("view", "pure") else Constancy.Mutable,
         sig=sig,
+        is_ctor_context=is_ctor_context,
     )
 
     if sig.internal:
@@ -65,13 +67,19 @@ def generate_ir_for_function(
 
     frame_size = context.memory_allocator.size_of_mem - MemoryPositions.RESERVED_MEMORY
 
-    sig.set_frame_info(FrameInfo(allocate_start, frame_size, context.vars))
+    frame_info = FrameInfo(allocate_start, frame_size, context.vars)
+
+    if sig.frame_info is None:
+        sig.set_frame_info(frame_info)
+    else:
+        assert frame_info == sig.frame_info
 
     if not sig.internal:
         # adjust gas estimate to include cost of mem expansion
         # frame_size of external function includes all private functions called
         # (note: internal functions do not need to adjust gas estimate since
         # it is already accounted for by the caller.)
+        assert sig.frame_info is not None  # mypy hint
         o.add_gas_estimate += calc_mem_gas(sig.frame_info.mem_used)
 
     sig.gas_estimate = o.gas
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 71f9ed552d..bdf8c067f7 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -67,19 +67,21 @@ def _runtime_ir(runtime_functions, all_sigs, global_ctx):
 
     # create a map of the IR functions since they might live in both
     # runtime and deploy code (if init function calls them)
-    internal_functions_map: Dict[str, IRnode] = {}
+    internal_functions_ir: list[IRnode] = []
 
     for func_ast in internal_functions:
         func_ir = generate_ir_for_function(func_ast, all_sigs, global_ctx, False)
-        internal_functions_map[func_ast.name] = func_ir
+        internal_functions_ir.append(func_ir)
 
     # for some reason, somebody may want to deploy a contract with no
     # external functions, or more likely, a "pure data" contract which
     # contains immutables
     if len(external_functions) == 0:
-        # TODO: prune internal functions in this case?
-        runtime = ["seq"] + list(internal_functions_map.values())
-        return runtime, internal_functions_map
+        # TODO: prune internal functions in this case? dead code eliminator
+        # might not eliminate them, since internal function jumpdest is at the
+        # first instruction in the contract.
+        runtime = ["seq"] + internal_functions_ir
+        return runtime
 
     # note: if the user does not provide one, the default fallback function
     # reverts anyway. so it does not hurt to batch the payable check.
@@ -125,10 +127,10 @@ def _runtime_ir(runtime_functions, all_sigs, global_ctx):
         ["label", "fallback", ["var_list"], fallback_ir],
     ]
 
-    # TODO: prune unreachable functions?
-    runtime.extend(internal_functions_map.values())
+    # note: dead code eliminator will clean dead functions
+    runtime.extend(internal_functions_ir)
 
-    return runtime, internal_functions_map
+    return runtime
 
 
 # take a GlobalContext, which is basically
@@ -159,12 +161,15 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> Tuple[IRnode, IRnode, F
     runtime_functions = [f for f in function_defs if not _is_init_func(f)]
     init_function = next((f for f in function_defs if _is_init_func(f)), None)
 
-    runtime, internal_functions = _runtime_ir(runtime_functions, all_sigs, global_ctx)
+    runtime = _runtime_ir(runtime_functions, all_sigs, global_ctx)
 
     deploy_code: List[Any] = ["seq"]
     immutables_len = global_ctx.immutable_section_bytes
     if init_function:
-        init_func_ir = generate_ir_for_function(init_function, all_sigs, global_ctx, False)
+        # TODO might be cleaner to separate this into an _init_ir helper func
+        init_func_ir = generate_ir_for_function(
+            init_function, all_sigs, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
+        )
         deploy_code.append(init_func_ir)
 
         # pass the amount of memory allocated for the init function
@@ -174,8 +179,13 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> Tuple[IRnode, IRnode, F
         deploy_code.append(["deploy", init_mem_used, runtime, immutables_len])
 
         # internal functions come after everything else
-        for f in init_function._metadata["type"].called_functions:
-            deploy_code.append(internal_functions[f.name])
+        internal_functions = [f for f in runtime_functions if _is_internal(f)]
+        for f in internal_functions:
+            func_ir = generate_ir_for_function(
+                f, all_sigs, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
+            )
+            # note: we depend on dead code eliminator to clean dead function defs
+            deploy_code.append(func_ir)
 
     else:
         if immutables_len != 0:

From f450cb1a729040e136204060152a608169ac70aa Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Tue, 16 May 2023 03:59:15 +0800
Subject: [PATCH 027/161] chore: remove duplicate check for a function call
 into itself (#3357)

A function that calls itself is already caught in `_find_cyclic_call`.
This PR removes a duplicate check.
---
 .../semantics/analysis/test_cyclic_function_calls.py | 12 ++++++++++++
 vyper/semantics/analysis/module.py                   |  5 -----
 2 files changed, 12 insertions(+), 5 deletions(-)

diff --git a/tests/functional/semantics/analysis/test_cyclic_function_calls.py b/tests/functional/semantics/analysis/test_cyclic_function_calls.py
index 086f8ed08c..2a09bd5ed5 100644
--- a/tests/functional/semantics/analysis/test_cyclic_function_calls.py
+++ b/tests/functional/semantics/analysis/test_cyclic_function_calls.py
@@ -6,6 +6,18 @@
 from vyper.semantics.analysis.module import ModuleAnalyzer
 
 
+def test_self_function_call(namespace):
+    code = """
+@internal
+def foo():
+    self.foo()
+    """
+    vyper_module = parse_to_ast(code)
+    with namespace.enter_scope():
+        with pytest.raises(CallViolation):
+            ModuleAnalyzer(vyper_module, {}, namespace)
+
+
 def test_cyclic_function_call(namespace):
     code = """
 @internal
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index 3907882e7a..188005e365 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -117,11 +117,6 @@ def __init__(
             # anything that is not a function call will get semantically checked later
             calls_to_self = calls_to_self.intersection(function_names)
             self_members[node.name].internal_calls = calls_to_self
-            if node.name in self_members[node.name].internal_calls:
-                self_node = node.get_descendants(
-                    vy_ast.Attribute, {"value.id": "self", "attr": node.name}
-                )[0]
-                raise CallViolation(f"Function '{node.name}' calls into itself", self_node)
 
         for fn_name in sorted(function_names):
             if fn_name not in self_members:

From 7ac2d7c882a54add77a3684b9555fcdd610fc9f2 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 15 May 2023 23:23:42 -0400
Subject: [PATCH 028/161] chore: update test durations file (#3413)

rebalance tests
---
 .github/workflows/test.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 4a09914d59..f90ff706ec 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -138,7 +138,7 @@ jobs:
     # NOTE: if the tests get poorly distributed, run this and commit the resulting `.test_durations` file to the `vyper-test-durations` repo.
     # `TOXENV=fuzzing tox -r -- --store-durations --reruns 10 --reruns-delay 1 -r aR tests/`
     - name: Fetch test-durations
-      run: curl --location "https://raw.githubusercontent.com/vyperlang/vyper-test-durations/ac71e77863d7f4e7e7cd19a93cf50a8c39de4845/test_durations" -o .test_durations
+      run: curl --location "https://raw.githubusercontent.com/vyperlang/vyper-test-durations/5982755ee8459f771f2e8622427c36494646e1dd/test_durations" -o .test_durations
 
     - name: Run Tox
       run: TOXENV=fuzzing tox -r -- --splits 60 --group ${{ matrix.group }} --splitting-algorithm least_duration --reruns 10 --reruns-delay 1 -r aR tests/

From 796a075ff37e22286ea70c78c2b0bbbb29403d3d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 16 May 2023 14:53:52 -0400
Subject: [PATCH 029/161] chore: fix call graph stability test (#3417)

there were some spurious grammatical errors due to not filtering out
reserved keywords for function names. this adds a hypothesis filter, and
also adds missing keywords to the list of reserved keywords in
`vyper.semantics.namespace`.
---
 tests/parser/test_call_graph_stability.py    |  7 ++-
 tests/parser/types/test_identifier_naming.py |  6 +--
 vyper/semantics/namespace.py                 | 50 +++++++++++++++++---
 3 files changed, 50 insertions(+), 13 deletions(-)

diff --git a/tests/parser/test_call_graph_stability.py b/tests/parser/test_call_graph_stability.py
index 6785169ba3..206256a22a 100644
--- a/tests/parser/test_call_graph_stability.py
+++ b/tests/parser/test_call_graph_stability.py
@@ -7,6 +7,11 @@
 
 import vyper.ast as vy_ast
 from vyper.compiler.phases import CompilerData
+from vyper.semantics.namespace import RESERVED_KEYWORDS
+
+
+def _valid_identifier(attr):
+    return attr not in RESERVED_KEYWORDS
 
 
 # random names for functions
@@ -15,7 +20,7 @@
     st.lists(
         st.tuples(
             st.sampled_from(["@pure", "@view", "@nonpayable", "@payable"]),
-            st.text(alphabet=string.ascii_lowercase, min_size=1),
+            st.text(alphabet=string.ascii_lowercase, min_size=1).filter(_valid_identifier),
         ),
         unique_by=lambda x: x[1],  # unique on function name
         min_size=1,
diff --git a/tests/parser/types/test_identifier_naming.py b/tests/parser/types/test_identifier_naming.py
index d0daa6dc05..f4f602f471 100755
--- a/tests/parser/types/test_identifier_naming.py
+++ b/tests/parser/types/test_identifier_naming.py
@@ -45,12 +45,8 @@ def test({constant}: int128):
     )
 
 
-PYTHON_KEYWORDS = {"if", "for", "while", "pass", "def", "assert", "continue", "raise"}
-
 SELF_NAMESPACE_MEMBERS = set(AddressT._type_members.keys())
-DISALLOWED_FN_NAMES = (
-    SELF_NAMESPACE_MEMBERS | PYTHON_KEYWORDS | RESERVED_KEYWORDS | BUILTIN_CONSTANTS
-)
+DISALLOWED_FN_NAMES = SELF_NAMESPACE_MEMBERS | RESERVED_KEYWORDS | BUILTIN_CONSTANTS
 ALLOWED_FN_NAMES = ALL_RESERVED_KEYWORDS - DISALLOWED_FN_NAMES
 
 
diff --git a/vyper/semantics/namespace.py b/vyper/semantics/namespace.py
index bb37c06cef..d760f66972 100644
--- a/vyper/semantics/namespace.py
+++ b/vyper/semantics/namespace.py
@@ -126,8 +126,50 @@ def validate_identifier(attr):
         raise StructureException(f"'{attr}' is a reserved keyword")
 
 
+# https://docs.python.org/3/reference/lexical_analysis.html#keywords
+# note we don't technically need to block all python reserved keywords,
+# but do it for hygiene
+_PYTHON_RESERVED_KEYWORDS = {
+    "False",
+    "None",
+    "True",
+    "and",
+    "as",
+    "assert",
+    "async",
+    "await",
+    "break",
+    "class",
+    "continue",
+    "def",
+    "del",
+    "elif",
+    "else",
+    "except",
+    "finally",
+    "for",
+    "from",
+    "global",
+    "if",
+    "import",
+    "in",
+    "is",
+    "lambda",
+    "nonlocal",
+    "not",
+    "or",
+    "pass",
+    "raise",
+    "return",
+    "try",
+    "while",
+    "with",
+    "yield",
+}
+_PYTHON_RESERVED_KEYWORDS = {s.lower() for s in _PYTHON_RESERVED_KEYWORDS}
+
 # Cannot be used for variable or member naming
-RESERVED_KEYWORDS = {
+RESERVED_KEYWORDS = _PYTHON_RESERVED_KEYWORDS | {
     # decorators
     "public",
     "external",
@@ -153,14 +195,8 @@ def validate_identifier(attr):
     "_default_",
     "___default___",
     "____default____",
-    # boolean literals
-    "true",
-    "false",
     # more control flow and special operations
-    "this",
     "range",
-    # None sentinal value
-    "none",
     # more special operations
     "indexed",
     # denominations

From 3f70dd2c8412001c6fa7ab4b2b0613d1c0a13fd1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 16 May 2023 15:36:46 -0400
Subject: [PATCH 030/161] fix: typechecking for user-defined types (#3418)

non-structs were not type checked correctly. this represents a
regression presumably in 046ea166d9.

this commit fixes the issue and adds some tests.
---
 tests/parser/syntax/test_enum.py       | 14 ++++++++++++++
 tests/parser/syntax/test_interfaces.py | 13 +++++++++++++
 vyper/semantics/types/user.py          |  8 ++++----
 3 files changed, 31 insertions(+), 4 deletions(-)

diff --git a/tests/parser/syntax/test_enum.py b/tests/parser/syntax/test_enum.py
index c13f27f497..9bb74fb675 100644
--- a/tests/parser/syntax/test_enum.py
+++ b/tests/parser/syntax/test_enum.py
@@ -110,6 +110,20 @@ def foo() -> Roles:
     """,
         UnknownAttribute,
     ),
+    (
+        """
+enum A:
+    a
+enum B:
+    a
+    b
+
+@internal
+def foo():
+    a: A = B.b
+    """,
+        TypeMismatch,
+    ),
 ]
 
 
diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index 225c8945b2..d964a17571 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -106,6 +106,19 @@ def foo(): nonpayable
     """,
         StructureException,
     ),
+    (
+        """
+from vyper.interfaces import ERC20
+
+interface A:
+    def f(): view
+
+@internal
+def foo():
+    a: ERC20 = A(empty(address))
+    """,
+        TypeMismatch,
+    ),
 ]
 
 
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index 444f9256e7..ad61da54d9 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -32,6 +32,10 @@ class _UserType(VyperType):
     def __eq__(self, other):
         return self is other
 
+    # TODO: revisit this once user types can be imported via modules
+    def compare_type(self, other):
+        return super().compare_type(other) and self._id == other._id
+
     def __hash__(self):
         return hash(id(self))
 
@@ -537,10 +541,6 @@ def from_ast_def(cls, base_node: vy_ast.StructDef) -> "StructT":
     def __repr__(self):
         return f"{self._id} declaration object"
 
-    # TODO check me
-    def compare_type(self, other):
-        return super().compare_type(other) and self._id == other._id
-
     @property
     def size_in_bytes(self):
         return sum(i.size_in_bytes for i in self.member_types.values())

From dcc230c3731d1d5fc2379b82b220be4fbf7e3c15 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 16 May 2023 16:18:55 -0400
Subject: [PATCH 031/161] chore: improve optimizer rules for comparison
 operators (#3412)

after this commit, safe add between anything and 0 results in a no-op.
---
 tests/compiler/ir/test_optimize_ir.py | 15 +++++++++++++++
 vyper/ir/optimizer.py                 | 15 ++++++++++++---
 2 files changed, 27 insertions(+), 3 deletions(-)

diff --git a/tests/compiler/ir/test_optimize_ir.py b/tests/compiler/ir/test_optimize_ir.py
index bac0e18d65..b679e55453 100644
--- a/tests/compiler/ir/test_optimize_ir.py
+++ b/tests/compiler/ir/test_optimize_ir.py
@@ -57,6 +57,14 @@
     (["le", 0, "x"], [1]),
     (["le", 0, ["sload", 0]], None),  # no-op
     (["ge", "x", 0], [1]),
+    (["le", "x", "x"], [1]),
+    (["ge", "x", "x"], [1]),
+    (["sle", "x", "x"], [1]),
+    (["sge", "x", "x"], [1]),
+    (["lt", "x", "x"], [0]),
+    (["gt", "x", "x"], [0]),
+    (["slt", "x", "x"], [0]),
+    (["sgt", "x", "x"], [0]),
     # boundary conditions
     (["slt", "x", -(2**255)], [0]),
     (["sle", "x", -(2**255)], ["eq", "x", -(2**255)]),
@@ -253,3 +261,10 @@ def test_ir_optimizer(ir):
 def test_static_assertions(ir, assert_compile_failed):
     ir = IRnode.from_list(ir)
     assert_compile_failed(lambda: optimizer.optimize(ir), StaticAssertionException)
+
+
+def test_operator_set_values():
+    # some sanity checks
+    assert optimizer.COMPARISON_OPS == {"lt", "gt", "le", "ge", "slt", "sgt", "sle", "sge"}
+    assert optimizer.STRICT_COMPARISON_OPS == {"lt", "gt", "slt", "sgt"}
+    assert optimizer.UNSTRICT_COMPARISON_OPS == {"le", "ge", "sle", "sge"}
diff --git a/vyper/ir/optimizer.py b/vyper/ir/optimizer.py
index f54b0e8115..fb10b515cc 100644
--- a/vyper/ir/optimizer.py
+++ b/vyper/ir/optimizer.py
@@ -78,6 +78,11 @@ def _deep_contains(node_or_list, node):
 
 COMMUTATIVE_OPS = {"add", "mul", "eq", "ne", "and", "or", "xor"}
 COMPARISON_OPS = {"gt", "sgt", "ge", "sge", "lt", "slt", "le", "sle"}
+STRICT_COMPARISON_OPS = {t for t in COMPARISON_OPS if t.endswith("t")}
+UNSTRICT_COMPARISON_OPS = {t for t in COMPARISON_OPS if t.endswith("e")}
+
+assert not (STRICT_COMPARISON_OPS & UNSTRICT_COMPARISON_OPS)
+assert STRICT_COMPARISON_OPS | UNSTRICT_COMPARISON_OPS == COMPARISON_OPS
 
 
 def _flip_comparison_op(opname):
@@ -256,11 +261,15 @@ def _conservative_eq(x, y):
         return finalize("seq", [args[0]])
 
     if binop in {"sub", "xor", "ne"} and _conservative_eq(args[0], args[1]):
-        # x - x == x ^ x == x != x == 0
+        # (x - x) == (x ^ x) == (x != x) == 0
+        return finalize(0, [])
+
+    if binop in STRICT_COMPARISON_OPS and _conservative_eq(args[0], args[1]):
+        # (x < x) == (x > x) == 0
         return finalize(0, [])
 
-    if binop == "eq" and _conservative_eq(args[0], args[1]):
-        # (x == x) == 1
+    if binop in {"eq"} | UNSTRICT_COMPARISON_OPS and _conservative_eq(args[0], args[1]):
+        # (x == x) == (x >= x) == (x <= x) == 1
         return finalize(1, [])
 
     # TODO associativity rules

From 9ecb97b4b6fcdc566361b3c4501888e3f19d9cac Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 12:41:17 -0400
Subject: [PATCH 032/161] fix: calldatasize < 4 reverting instead of going to
 fallback (#3408)

in the case that a selector matches calldata with less than 4 bytes, it
currently will revert instead of going to the fallback. this can happen
if the selector has trailing zeroes. this commit fixes the behavior for
selectors with trailing zeroes, and improves code size and gas for those
without trailing zeroes.
---
 .../parser/functions/test_default_function.py | 116 ++++++++++++++++--
 .../function_definitions/external_function.py |  41 ++++---
 2 files changed, 130 insertions(+), 27 deletions(-)

diff --git a/tests/parser/functions/test_default_function.py b/tests/parser/functions/test_default_function.py
index cd1f9f39af..4aa0b04a77 100644
--- a/tests/parser/functions/test_default_function.py
+++ b/tests/parser/functions/test_default_function.py
@@ -100,7 +100,9 @@ def __default__():
     assert_compile_failed(lambda: get_contract_with_gas_estimation(code))
 
 
-def test_zero_method_id(w3, get_logs, get_contract_with_gas_estimation):
+def test_zero_method_id(w3, get_logs, get_contract, assert_tx_failed):
+    # test a method with 0x00000000 selector,
+    # expects at least 36 bytes of calldata.
     code = """
 event Sent:
     sig: uint256
@@ -116,18 +118,108 @@ def blockHashAskewLimitary(v: uint256) -> uint256:
 def __default__():
     log Sent(1)
     """
-
-    c = get_contract_with_gas_estimation(code)
+    c = get_contract(code)
 
     assert c.blockHashAskewLimitary(0) == 7
 
-    logs = get_logs(w3.eth.send_transaction({"to": c.address, "value": 0}), c, "Sent")
-    assert 1 == logs[0].args.sig
+    def _call_with_bytes(hexstr):
+        # call our special contract and return the logged value
+        logs = get_logs(
+            w3.eth.send_transaction({"to": c.address, "value": 0, "data": hexstr}), c, "Sent"
+        )
+        return logs[0].args.sig
 
-    logs = get_logs(
-        # call blockHashAskewLimitary
-        w3.eth.send_transaction({"to": c.address, "value": 0, "data": "0x" + "00" * 36}),
-        c,
-        "Sent",
-    )
-    assert 2 == logs[0].args.sig
+    assert 1 == _call_with_bytes("0x")
+
+    # call blockHashAskewLimitary with proper calldata
+    assert 2 == _call_with_bytes("0x" + "00" * 36)
+
+    # call blockHashAskewLimitary with extra trailing bytes in calldata
+    assert 2 == _call_with_bytes("0x" + "00" * 37)
+
+    for i in range(4):
+        # less than 4 bytes of calldata doesn't match the 0 selector and goes to default
+        assert 1 == _call_with_bytes("0x" + "00" * i)
+
+    for i in range(4, 36):
+        # match the full 4 selector bytes, but revert due to malformed (short) calldata
+        assert_tx_failed(lambda: _call_with_bytes("0x" + "00" * i))
+
+
+def test_another_zero_method_id(w3, get_logs, get_contract, assert_tx_failed):
+    # test another zero method id but which only expects 4 bytes of calldata
+    code = """
+event Sent:
+    sig: uint256
+
+@external
+@payable
+# function selector: 0x00000000
+def wycpnbqcyf() -> uint256:
+    log Sent(2)
+    return 7
+
+@external
+def __default__():
+    log Sent(1)
+    """
+    c = get_contract(code)
+
+    assert c.wycpnbqcyf() == 7
+
+    def _call_with_bytes(hexstr):
+        # call our special contract and return the logged value
+        logs = get_logs(
+            w3.eth.send_transaction({"to": c.address, "value": 0, "data": hexstr}), c, "Sent"
+        )
+        return logs[0].args.sig
+
+    assert 1 == _call_with_bytes("0x")
+
+    # call wycpnbqcyf
+    assert 2 == _call_with_bytes("0x" + "00" * 4)
+
+    # too many bytes ok
+    assert 2 == _call_with_bytes("0x" + "00" * 5)
+
+    # "right" method id but by accident - not enough bytes.
+    for i in range(4):
+        assert 1 == _call_with_bytes("0x" + "00" * i)
+
+
+def test_partial_selector_match_trailing_zeroes(w3, get_logs, get_contract):
+    code = """
+event Sent:
+    sig: uint256
+
+@external
+@payable
+# function selector: 0xd88e0b00
+def fow() -> uint256:
+    log Sent(2)
+    return 7
+
+@external
+def __default__():
+    log Sent(1)
+    """
+    c = get_contract(code)
+
+    # sanity check - we can call c.fow()
+    assert c.fow() == 7
+
+    def _call_with_bytes(hexstr):
+        # call our special contract and return the logged value
+        logs = get_logs(
+            w3.eth.send_transaction({"to": c.address, "value": 0, "data": hexstr}), c, "Sent"
+        )
+        return logs[0].args.sig
+
+    # check we can call default function
+    assert 1 == _call_with_bytes("0x")
+
+    # check fow() selector is 0xd88e0b00
+    assert 2 == _call_with_bytes("0xd88e0b00")
+
+    # check calling d88e0b with no trailing zero goes to fallback instead of reverting
+    assert 1 == _call_with_bytes("0xd88e0b")
diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 42ea11a035..1ff2b6d012 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -88,7 +88,12 @@ def handler_for(calldata_kwargs, default_kwargs):
         # ensure calldata is at least of minimum length
         args_abi_t = calldata_args_t.abi_type
         calldata_min_size = args_abi_t.min_size() + 4
-        ret.append(["assert", ["ge", "calldatasize", calldata_min_size]])
+
+        # note we don't need the check if calldata_min_size == 4,
+        # because the selector checks later in this routine ensure
+        # that calldatasize >= 4.
+        if calldata_min_size > 4:
+            ret.append(["assert", ["ge", "calldatasize", calldata_min_size]])
 
         # TODO optimize make_setter by using
         # TupleT(list(arg.typ for arg in calldata_kwargs + default_kwargs))
@@ -124,20 +129,26 @@ def handler_for(calldata_kwargs, default_kwargs):
 
         method_id_check = ["eq", "_calldata_method_id", method_id]
 
-        # if there is a function whose selector is 0, it won't be distinguished
-        # from the case where nil calldata is supplied, b/c calldataload loads
-        # 0s past the end of physical calldata (cf. yellow paper).
-        # since supplying 0 calldata is expected to trigger the fallback fn,
-        # we check that calldatasize > 0, which distinguishes the 0 selector
-        # from the fallback function "selector"
-        # (equiv. to "all selectors not in the selector table").
-
-        # note: cases where not enough calldata is supplied (besides
-        # calldatasize==0) are not addressed here b/c a calldatasize
-        # well-formedness check is already present in the function body
-        # as part of abi validation
-        if method_id.value == 0:
-            method_id_check = ["and", ["gt", "calldatasize", 0], method_id_check]
+        # if there is a function whose selector is 0 or has trailing 0s, it
+        # might not be distinguished from the case where insufficient calldata
+        # is supplied, b/c calldataload loads 0s past the end of physical
+        # calldata (cf. yellow paper).
+        # since the expected behavior of supplying insufficient calldata
+        # is to trigger the fallback fn, we add to the selector check that
+        # calldatasize >= 4, which distinguishes any selector with trailing
+        # 0 bytes from the fallback function "selector" (equiv. to "all
+        # selectors not in the selector table").
+        #
+        # note that the inclusion of this check means that, we are always
+        # guaranteed that the calldata is at least 4 bytes - either we have
+        # the explicit `calldatasize >= 4` condition in the selector check,
+        # or there are no trailing zeroes in the selector, (so the selector
+        # is impossible to match without calldatasize being at least 4).
+        method_id_bytes = util.method_id(abi_sig)
+        assert len(method_id_bytes) == 4
+        has_trailing_zeroes = method_id_bytes.endswith(b"\x00")
+        if has_trailing_zeroes:
+            method_id_check = ["and", ["ge", "calldatasize", 4], method_id_check]
 
         ret = ["if", method_id_check, ret]
         return ret

From 288ee7766ad8909087f75e28204ed0ccd1addbb1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 12:46:17 -0400
Subject: [PATCH 033/161] chore: update black target to 3.11 (#3420)

update the linter.
---
 tox.ini | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tox.ini b/tox.ini
index 7fd09ff3f8..5ddd01d7d4 100644
--- a/tox.ini
+++ b/tox.ini
@@ -46,7 +46,7 @@ whitelist_externals = make
 basepython = python3
 extras = lint
 commands =
-    black -C -t py310 {toxinidir}/vyper {toxinidir}/tests {toxinidir}/setup.py
+    black -C -t py311 {toxinidir}/vyper {toxinidir}/tests {toxinidir}/setup.py
     flake8 {toxinidir}/vyper {toxinidir}/tests
     isort {toxinidir}/vyper {toxinidir}/tests {toxinidir}/setup.py
 

From 08f0ac59a90cc1bf1005520ffbc07ab96e152136 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Thu, 18 May 2023 01:27:44 +0800
Subject: [PATCH 034/161] refactor: remove `FunctionSignature` (#3390)

This commit merges the old `FunctionSignature` with the newer
`ContractFunctionT` class. The old functionality has been subsumed under
`ContractFunctionT`. `ContractFunctionT` has additionally been
refactored for clarity; the new main fields are `positional_args` and
`keyword_args`, which improves on the old terminology of
`base_args`/`default_args` vs `min_arg_count`/`max_arg_count` and
improves the readability of downstream code.

this commit also
- removes the old codegen `parse_type()` functions
- simplifies codegen by removing the sigs dictionary from
  `vyper/codegen/context.py`
- simplifies the `lookup_internal_function` routine (now renamed to
  `_align_kwargs`)
- simplifies `vyper/codegen/module.py` by removing the sigs dictionaries
  and now instead relying on type annotations

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/base_conftest.py                        |   3 +
 tests/parser/syntax/test_public.py            |  21 ++
 tests/parser/test_call_graph_stability.py     |   2 +-
 tests/parser/types/numbers/test_sqrt.py       |   8 +-
 vyper/ast/expansion.py                        |   5 +
 vyper/ast/nodes.py                            |  14 ++
 vyper/ast/nodes.pyi                           |   1 +
 vyper/ast/signatures/__init__.py              |   1 -
 vyper/ast/signatures/function_signature.py    | 194 ----------------
 vyper/builtins/_convert.py                    |   6 +-
 vyper/builtins/_utils.py                      |   2 +-
 vyper/codegen/context.py                      |  45 +---
 vyper/codegen/expr.py                         |  10 +-
 vyper/codegen/external_call.py                |   6 +-
 .../codegen/function_definitions/__init__.py  |   2 +-
 vyper/codegen/function_definitions/common.py  |  94 ++++++--
 .../function_definitions/external_function.py |  58 +++--
 .../function_definitions/internal_function.py |  18 +-
 vyper/codegen/global_context.py               |  12 -
 vyper/codegen/module.py                       |  69 +++---
 vyper/codegen/return_.py                      |   6 +-
 vyper/codegen/self_call.py                    |  52 +++--
 vyper/codegen/stmt.py                         |   2 +-
 vyper/compiler/output.py                      |  47 ++--
 vyper/compiler/phases.py                      |  24 +-
 vyper/compiler/utils.py                       |  13 +-
 vyper/semantics/analysis/annotation.py        |   8 +-
 vyper/semantics/analysis/local.py             |   6 +-
 vyper/semantics/types/function.py             | 217 +++++++++++-------
 29 files changed, 428 insertions(+), 518 deletions(-)
 delete mode 100644 vyper/ast/signatures/__init__.py
 delete mode 100644 vyper/ast/signatures/function_signature.py

diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index febe8f74d3..29809a074d 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -1,3 +1,5 @@
+import json
+
 import pytest
 import web3.exceptions
 from eth_tester import EthereumTester, PyEVMBackend
@@ -120,6 +122,7 @@ def _get_contract(w3, source_code, no_optimize, *args, **kwargs):
         show_gas_estimates=True,  # Enable gas estimates for testing
     )
     parse_vyper_source(source_code)  # Test grammar.
+    json.dumps(out["metadata"])  # test metadata is json serializable
     abi = out["abi"]
     bytecode = out["bytecode"]
     value = kwargs.pop("value_in_eth", 0) * 10**18  # Handle deploying with an eth value.
diff --git a/tests/parser/syntax/test_public.py b/tests/parser/syntax/test_public.py
index fd0058cab8..68575ebd41 100644
--- a/tests/parser/syntax/test_public.py
+++ b/tests/parser/syntax/test_public.py
@@ -23,6 +23,27 @@ def __init__():
 def foo() -> int128:
     return self.x / self.y / self.z
     """,
+    # expansion of public user-defined struct
+    """
+struct Foo:
+    a: uint256
+
+x: public(HashMap[uint256, Foo])
+    """,
+    # expansion of public user-defined enum
+    """
+enum Foo:
+    BAR
+
+x: public(HashMap[uint256, Foo])
+    """,
+    # expansion of public user-defined interface
+    """
+interface Foo:
+    def bar(): nonpayable
+
+x: public(HashMap[uint256, Foo])
+    """,
 ]
 
 
diff --git a/tests/parser/test_call_graph_stability.py b/tests/parser/test_call_graph_stability.py
index 206256a22a..6f78b50053 100644
--- a/tests/parser/test_call_graph_stability.py
+++ b/tests/parser/test_call_graph_stability.py
@@ -70,4 +70,4 @@ def foo():
                 r = d.args[0].args[0].value
                 if isinstance(r, str) and r.startswith("internal"):
                     ir_funcs.append(r)
-        assert ir_funcs == [f.internal_function_label for f in sigs.values()]
+        assert ir_funcs == [f._ir_info.internal_function_label for f in sigs.values()]
diff --git a/tests/parser/types/numbers/test_sqrt.py b/tests/parser/types/numbers/test_sqrt.py
index 025a3868e9..df1ed0539c 100644
--- a/tests/parser/types/numbers/test_sqrt.py
+++ b/tests/parser/types/numbers/test_sqrt.py
@@ -143,8 +143,8 @@ def test_sqrt_bounds(sqrt_contract, value):
         min_value=Decimal(0), max_value=Decimal(SizeLimits.MAX_INT128), places=DECIMAL_PLACES
     )
 )
-@hypothesis.example(Decimal(SizeLimits.MAX_INT128))
-@hypothesis.example(Decimal(0))
+@hypothesis.example(value=Decimal(SizeLimits.MAX_INT128))
+@hypothesis.example(value=Decimal(0))
 @hypothesis.settings(deadline=1000)
 def test_sqrt_valid_range(sqrt_contract, value):
     vyper_sqrt = sqrt_contract.test(value)
@@ -159,8 +159,8 @@ def test_sqrt_valid_range(sqrt_contract, value):
     )
 )
 @hypothesis.settings(deadline=400)
-@hypothesis.example(Decimal(SizeLimits.MIN_INT128))
-@hypothesis.example(Decimal("-1E10"))
+@hypothesis.example(value=Decimal(SizeLimits.MIN_INT128))
+@hypothesis.example(value=Decimal("-1E10"))
 def test_sqrt_invalid_range(sqrt_contract, value):
     with pytest.raises(TransactionFailed):
         sqrt_contract.test(value)
diff --git a/vyper/ast/expansion.py b/vyper/ast/expansion.py
index c5518be405..753f2687cd 100644
--- a/vyper/ast/expansion.py
+++ b/vyper/ast/expansion.py
@@ -2,6 +2,7 @@
 
 from vyper import ast as vy_ast
 from vyper.exceptions import CompilerPanic
+from vyper.semantics.types.function import ContractFunctionT
 
 
 def expand_annotated_ast(vyper_module: vy_ast.Module) -> None:
@@ -85,6 +86,10 @@ def generate_public_variable_getters(vyper_module: vy_ast.Module) -> None:
             decorator_list=[vy_ast.Name(id="external"), vy_ast.Name(id="view")],
             returns=return_node,
         )
+
+        with vyper_module.namespace():
+            func_type = ContractFunctionT.from_FunctionDef(expanded)
+
         expanded._metadata["type"] = func_type
         return_node.set_parent(expanded)
         vyper_module.add_to_body(expanded)
diff --git a/vyper/ast/nodes.py b/vyper/ast/nodes.py
index 7bb0a6274d..03f2d713c1 100644
--- a/vyper/ast/nodes.py
+++ b/vyper/ast/nodes.py
@@ -1,4 +1,5 @@
 import ast as python_ast
+import contextlib
 import copy
 import decimal
 import operator
@@ -664,6 +665,19 @@ def remove_from_body(self, node: VyperNode) -> None:
         self.body.remove(node)
         self._children.remove(node)
 
+    @contextlib.contextmanager
+    def namespace(self):
+        from vyper.semantics.namespace import get_namespace, override_global_namespace
+
+        # kludge implementation for backwards compatibility.
+        # TODO: replace with type_from_ast
+        try:
+            ns = self._metadata["namespace"]
+        except AttributeError:
+            ns = get_namespace()
+        with override_global_namespace(ns):
+            yield
+
 
 class FunctionDef(TopLevel):
     __slots__ = ("args", "returns", "decorator_list", "pos")
diff --git a/vyper/ast/nodes.pyi b/vyper/ast/nodes.pyi
index d47e420d66..3d83ae7506 100644
--- a/vyper/ast/nodes.pyi
+++ b/vyper/ast/nodes.pyi
@@ -61,6 +61,7 @@ class Module(TopLevel):
     def replace_in_tree(self, old_node: VyperNode, new_node: VyperNode) -> None: ...
     def add_to_body(self, node: VyperNode) -> None: ...
     def remove_from_body(self, node: VyperNode) -> None: ...
+    def namespace(self) -> Any: ...  # context manager
 
 class FunctionDef(TopLevel):
     args: arguments = ...
diff --git a/vyper/ast/signatures/__init__.py b/vyper/ast/signatures/__init__.py
deleted file mode 100644
index aa9a5c66c6..0000000000
--- a/vyper/ast/signatures/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-from .function_signature import FrameInfo, FunctionSignature
diff --git a/vyper/ast/signatures/function_signature.py b/vyper/ast/signatures/function_signature.py
deleted file mode 100644
index 3f59b95f97..0000000000
--- a/vyper/ast/signatures/function_signature.py
+++ /dev/null
@@ -1,194 +0,0 @@
-from dataclasses import dataclass
-from functools import cached_property
-from typing import Dict, Optional, Tuple
-
-from vyper import ast as vy_ast
-from vyper.exceptions import CompilerPanic, StructureException
-from vyper.semantics.types import VyperType
-from vyper.utils import MemoryPositions, mkalphanum
-
-# dict from function names to signatures
-FunctionSignatures = Dict[str, "FunctionSignature"]
-
-
-@dataclass
-class FunctionArg:
-    name: str
-    typ: VyperType
-    ast_source: vy_ast.VyperNode
-
-
-@dataclass
-class FrameInfo:
-    frame_start: int
-    frame_size: int
-    frame_vars: Dict[str, Tuple[int, VyperType]]
-
-    @property
-    def mem_used(self):
-        return self.frame_size + MemoryPositions.RESERVED_MEMORY
-
-
-# Function signature object
-# TODO: merge with ContractFunction type
-class FunctionSignature:
-    def __init__(
-        self,
-        name,
-        args,
-        return_type,
-        mutability,
-        internal,
-        nonreentrant_key,
-        func_ast_code,
-        is_from_json,
-    ):
-        self.name = name
-        self.args = args
-        self.return_type = return_type
-        self.mutability = mutability
-        self.internal = internal
-        self.gas_estimate = None
-        self.nonreentrant_key = nonreentrant_key
-        self.func_ast_code = func_ast_code
-        self.is_from_json = is_from_json
-
-        self.set_default_args()
-
-        # frame info is metadata that will be generated during codegen.
-        self.frame_info: Optional[FrameInfo] = None
-
-    def __str__(self):
-        input_name = "def " + self.name + "(" + ",".join([str(arg.typ) for arg in self.args]) + ")"
-        if self.return_type:
-            return input_name + " -> " + str(self.return_type) + ":"
-        return input_name + ":"
-
-    def set_frame_info(self, frame_info):
-        if self.frame_info is not None:
-            raise CompilerPanic("sig.frame_info already set!")
-        self.frame_info = frame_info
-
-    @cached_property
-    def _ir_identifier(self) -> str:
-        # we could do a bit better than this but it just needs to be unique
-        visibility = "internal" if self.internal else "external"
-        argz = ",".join([str(arg.typ) for arg in self.args])
-        ret = f"{visibility} {self.name} ({argz})"
-        return mkalphanum(ret)
-
-    # calculate the abi signature for a given set of kwargs
-    def abi_signature_for_kwargs(self, kwargs):
-        args = self.base_args + kwargs
-        return self.name + "(" + ",".join([arg.typ.abi_type.selector_name() for arg in args]) + ")"
-
-    @cached_property
-    def base_signature(self):
-        return self.abi_signature_for_kwargs([])
-
-    @property
-    # common entry point for external function with kwargs
-    def external_function_base_entry_label(self):
-        assert not self.internal
-
-        return self._ir_identifier + "_common"
-
-    @property
-    def internal_function_label(self):
-        assert self.internal, "why are you doing this"
-
-        return self._ir_identifier
-
-    @property
-    def exit_sequence_label(self):
-        return self._ir_identifier + "_cleanup"
-
-    def set_default_args(self):
-        """Split base from kwargs and set member data structures"""
-
-        args = self.func_ast_code.args
-
-        defaults = getattr(args, "defaults", [])
-        num_base_args = len(args.args) - len(defaults)
-
-        self.base_args = self.args[:num_base_args]
-        self.default_args = self.args[num_base_args:]
-
-        # Keep all the value to assign to default parameters.
-        self.default_values = dict(zip([arg.name for arg in self.default_args], defaults))
-
-    # Get a signature from a function definition
-    @classmethod
-    def from_definition(
-        cls,
-        func_ast,  # vy_ast.FunctionDef
-        global_ctx,
-        interface_def=False,
-        constant_override=False,  # CMC 20210907 what does this do?
-        is_from_json=False,
-    ):
-        name = func_ast.name
-
-        args = []
-        for arg in func_ast.args.args:
-            argname = arg.arg
-            argtyp = global_ctx.parse_type(arg.annotation)
-
-            args.append(FunctionArg(argname, argtyp, arg))
-
-        mutability = "nonpayable"  # Assume nonpayable by default
-        nonreentrant_key = None
-        is_internal = None
-
-        # Update function properties from decorators
-        # NOTE: Can't import enums here because of circular import
-        for dec in func_ast.decorator_list:
-            if isinstance(dec, vy_ast.Name) and dec.id in ("payable", "view", "pure"):
-                mutability = dec.id
-            elif isinstance(dec, vy_ast.Name) and dec.id == "internal":
-                is_internal = True
-            elif isinstance(dec, vy_ast.Name) and dec.id == "external":
-                is_internal = False
-            elif isinstance(dec, vy_ast.Call) and dec.func.id == "nonreentrant":
-                nonreentrant_key = dec.args[0].s
-
-        if constant_override:
-            # In case this override is abused, match previous behavior
-            if mutability == "payable":
-                raise StructureException(f"Function {name} cannot be both constant and payable.")
-            mutability = "view"
-
-        # Determine the return type and whether or not it's constant. Expects something
-        # of the form:
-        # def foo(): ...
-        # def foo() -> int128: ...
-        # If there is no return type, ie. it's of the form def foo(): ...
-        # and NOT def foo() -> type: ..., then it's null
-        return_type = None
-        if func_ast.returns:
-            return_type = global_ctx.parse_type(func_ast.returns)
-            # sanity check: Output type must be canonicalizable
-            assert return_type.abi_type.selector_name()
-
-        return cls(
-            name,
-            args,
-            return_type,
-            mutability,
-            is_internal,
-            nonreentrant_key,
-            func_ast,
-            is_from_json,
-        )
-
-    @property
-    def is_default_func(self):
-        return self.name == "__default__"
-
-    @property
-    def is_init_func(self):
-        return self.name == "__init__"
-
-    @property
-    def is_regular_function(self):
-        return not self.is_default_func and not self.is_init_func
diff --git a/vyper/builtins/_convert.py b/vyper/builtins/_convert.py
index 546207072a..e09f5f3174 100644
--- a/vyper/builtins/_convert.py
+++ b/vyper/builtins/_convert.py
@@ -453,13 +453,13 @@ def to_enum(expr, arg, out_typ):
 
 
 def convert(expr, context):
-    if len(expr.args) != 2:
-        raise StructureException("The convert function expects two parameters.", expr)
+    assert len(expr.args) == 2, "bad typecheck: convert"
 
     arg_ast = expr.args[0]
     arg = Expr(arg_ast, context).ir_node
     original_arg = arg
-    out_typ = context.parse_type(expr.args[1])
+
+    out_typ = expr.args[1]._metadata["type"].typedef
 
     if arg.typ._is_prim_word:
         arg = unwrap_location(arg)
diff --git a/vyper/builtins/_utils.py b/vyper/builtins/_utils.py
index 77185f6e53..afc0987b6d 100644
--- a/vyper/builtins/_utils.py
+++ b/vyper/builtins/_utils.py
@@ -23,7 +23,7 @@ def generate_inline_function(code, variables, variables_2, memory_allocator):
         # `ContractFunctionT` type to rely on the annotation visitors in semantics
         # module.
         ast_code.body[0]._metadata["type"] = ContractFunctionT(
-            "sqrt_builtin", {}, 0, 0, None, FunctionVisibility.INTERNAL, StateMutability.NONPAYABLE
+            "sqrt_builtin", [], [], None, FunctionVisibility.INTERNAL, StateMutability.NONPAYABLE
         )
         # The FunctionNodeVisitor's constructor performs semantic checks
         # annotate the AST as side effects.
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index 34c409e16c..6e8d02c9b3 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -50,10 +50,9 @@ def __init__(
         global_ctx,
         memory_allocator,
         vars_=None,
-        sigs=None,
         forvars=None,
         constancy=Constancy.Mutable,
-        sig=None,
+        func_t=None,
         is_ctor_context=False,
     ):
         # In-memory variables, in the form (name, memory location, type)
@@ -62,9 +61,6 @@ def __init__(
         # Global variables, in the form (name, storage location, type)
         self.globals = global_ctx.variables
 
-        # ABI objects, in the form {classname: ABI JSON}
-        self.sigs = sigs or {"self": {}}
-
         # Variables defined in for loops, e.g. for i in range(6): ...
         self.forvars = forvars or {}
 
@@ -80,8 +76,8 @@ def __init__(
         # store global context
         self.global_ctx = global_ctx
 
-        # full function signature
-        self.sig = sig
+        # full function type
+        self.func_t = func_t
         # Active scopes
         self._scopes = set()
 
@@ -106,15 +102,15 @@ def check_is_not_constant(self, err, expr):
     # convenience propreties
     @property
     def is_payable(self):
-        return self.sig.mutability == "payable"
+        return self.func_t.is_payable
 
     @property
     def is_internal(self):
-        return self.sig.internal
+        return self.func_t.is_internal
 
     @property
     def return_type(self):
-        return self.sig.return_type
+        return self.func_t.return_type
 
     #
     # Context Managers
@@ -247,38 +243,9 @@ def new_internal_variable(self, typ: VyperType) -> int:
         var_size = typ.memory_bytes_required
         return self._new_variable(name, typ, var_size, True)
 
-    def parse_type(self, ast_node):
-        return self.global_ctx.parse_type(ast_node)
-
     def lookup_var(self, varname):
         return self.vars[varname]
 
-    def lookup_internal_function(self, method_name, args_ir, ast_source):
-        # TODO is this the right module for me?
-        """
-        Using a list of args, find the internal method to use, and
-        the kwargs which need to be filled in by the compiler
-        """
-
-        sig = self.sigs["self"].get(method_name, None)
-
-        def _check(cond, s="Unreachable"):
-            if not cond:
-                raise CompilerPanic(s)
-
-        # these should have been caught during type checking; sanity check
-        _check(sig is not None)
-        _check(sig.internal)
-        _check(len(sig.base_args) <= len(args_ir) <= len(sig.args))
-        # more sanity check, that the types match
-        # _check(all(l.typ == r.typ for (l, r) in zip(args_ir, sig.args))
-
-        num_provided_kwargs = len(args_ir) - len(sig.base_args)
-
-        kw_vals = list(sig.default_values.values())[num_provided_kwargs:]
-
-        return sig, kw_vals
-
     # Pretty print constancy for error messages
     def pp_constancy(self):
         if self.in_assertion:
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 9ed80b86f9..4a18a16e1b 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -665,7 +665,9 @@ def parse_Call(self):
             elif isinstance(self.expr._metadata["type"], StructT):
                 args = self.expr.args
                 if len(args) == 1 and isinstance(args[0], vy_ast.Dict):
-                    return Expr.struct_literals(args[0], function_name, self.context)
+                    return Expr.struct_literals(
+                        args[0], function_name, self.context, self.expr._metadata["type"]
+                    )
 
             # Interface assignment. Bar(<address>).
             elif isinstance(self.expr._metadata["type"], InterfaceT):
@@ -734,7 +736,7 @@ def parse_IfExp(self):
         return IRnode.from_list(["if", test, body, orelse], typ=typ, location=location)
 
     @staticmethod
-    def struct_literals(expr, name, context):
+    def struct_literals(expr, name, context, typ):
         member_subs = {}
         member_typs = {}
         for key, value in zip(expr.keys, expr.values):
@@ -745,10 +747,8 @@ def struct_literals(expr, name, context):
             member_subs[key.id] = sub
             member_typs[key.id] = sub.typ
 
-        # TODO: get struct type from context.global_ctx.parse_type(name)
         return IRnode.from_list(
-            ["multi"] + [member_subs[key] for key in member_subs.keys()],
-            typ=StructT(name, member_typs),
+            ["multi"] + [member_subs[key] for key in member_subs.keys()], typ=typ
         )
 
     # Parse an expression that results in a value
diff --git a/vyper/codegen/external_call.py b/vyper/codegen/external_call.py
index 88ea4b098e..c4eb182eb1 100644
--- a/vyper/codegen/external_call.py
+++ b/vyper/codegen/external_call.py
@@ -37,7 +37,7 @@ def _pack_arguments(fn_type, args, context):
     args_abi_t = args_tuple_t.abi_type
 
     # sanity typecheck - make sure the arguments can be assigned
-    dst_tuple_t = TupleT(list(fn_type.arguments.values())[: len(args)])
+    dst_tuple_t = TupleT(fn_type.argument_types[: len(args)])
     check_assign(dummy_node_for_type(dst_tuple_t), args_as_tuple)
 
     if fn_type.return_type is not None:
@@ -171,12 +171,10 @@ def _extcodesize_check(address):
 
 
 def _external_call_helper(contract_address, args_ir, call_kwargs, call_expr, context):
-    # expr.func._metadata["type"].return_type is more accurate
-    # than fn_sig.return_type in the case of JSON interfaces.
     fn_type = call_expr.func._metadata["type"]
 
     # sanity check
-    assert fn_type.min_arg_count <= len(args_ir) <= fn_type.max_arg_count
+    assert fn_type.n_positional_args <= len(args_ir) <= fn_type.n_total_args
 
     ret = ["seq"]
 
diff --git a/vyper/codegen/function_definitions/__init__.py b/vyper/codegen/function_definitions/__init__.py
index 08bebbb4a5..b677a14579 100644
--- a/vyper/codegen/function_definitions/__init__.py
+++ b/vyper/codegen/function_definitions/__init__.py
@@ -1 +1 @@
-from .common import generate_ir_for_function  # noqa
+from .common import FuncIRInfo, generate_ir_for_function  # noqa
diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index cd467a152e..431693caaa 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -1,8 +1,8 @@
-# can't use from [module] import [object] because it breaks mocks in testing
-from typing import Dict
+from dataclasses import dataclass
+from functools import cached_property
+from typing import Optional
 
 import vyper.ast as vy_ast
-from vyper.ast.signatures import FrameInfo, FunctionSignature
 from vyper.codegen.context import Constancy, Context
 from vyper.codegen.core import check_single_exit, getpos
 from vyper.codegen.function_definitions.external_function import generate_ir_for_external_function
@@ -10,12 +10,61 @@
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
 from vyper.codegen.memory_allocator import MemoryAllocator
-from vyper.utils import MemoryPositions, calc_mem_gas
+from vyper.exceptions import CompilerPanic
+from vyper.semantics.types import VyperType
+from vyper.semantics.types.function import ContractFunctionT
+from vyper.utils import MemoryPositions, calc_mem_gas, mkalphanum
+
+
+@dataclass
+class FrameInfo:
+    frame_start: int
+    frame_size: int
+    frame_vars: dict[str, tuple[int, VyperType]]
+
+    @property
+    def mem_used(self):
+        return self.frame_size + MemoryPositions.RESERVED_MEMORY
+
+
+@dataclass
+class FuncIRInfo:
+    func_t: ContractFunctionT
+    gas_estimate: Optional[int] = None
+    frame_info: Optional[FrameInfo] = None
+
+    @property
+    def visibility(self):
+        return "internal" if self.func_t.is_internal else "external"
+
+    @property
+    def exit_sequence_label(self) -> str:
+        return self.ir_identifier + "_cleanup"
+
+    @cached_property
+    def ir_identifier(self) -> str:
+        argz = ",".join([str(argtyp) for argtyp in self.func_t.argument_types])
+        return mkalphanum(f"{self.visibility} {self.func_t.name} ({argz})")
+
+    def set_frame_info(self, frame_info: FrameInfo) -> None:
+        if self.frame_info is not None:
+            raise CompilerPanic(f"frame_info already set for {self.func_t}!")
+        self.frame_info = frame_info
+
+    @property
+    # common entry point for external function with kwargs
+    def external_function_base_entry_label(self) -> str:
+        assert not self.func_t.is_internal, "uh oh, should be external"
+        return self.ir_identifier + "_common"
+
+    @property
+    def internal_function_label(self) -> str:
+        assert self.func_t.is_internal, "uh oh, should be internal"
+        return self.ir_identifier
 
 
 def generate_ir_for_function(
     code: vy_ast.FunctionDef,
-    sigs: Dict[str, Dict[str, FunctionSignature]],  # all signatures in all namespaces
     global_ctx: GlobalContext,
     skip_nonpayable_check: bool,
     is_ctor_context: bool = False,
@@ -27,18 +76,17 @@ def generate_ir_for_function(
         - Clamping and copying of arguments
         - Function body
     """
-    sig = code._metadata["signature"]
+    func_t = code._metadata["type"]
 
     # Validate return statements.
     check_single_exit(code)
 
-    callees = code._metadata["type"].called_functions
+    callees = func_t.called_functions
 
     # we start our function frame from the largest callee frame
     max_callee_frame_size = 0
-    for c in callees:
-        frame_info = sigs["self"][c.name].frame_info
-        assert frame_info is not None  # make mypy happy
+    for c_func_t in callees:
+        frame_info = c_func_t._ir_info.frame_info
         max_callee_frame_size = max(max_callee_frame_size, frame_info.frame_size)
 
     allocate_start = max_callee_frame_size + MemoryPositions.RESERVED_MEMORY
@@ -48,20 +96,19 @@ def generate_ir_for_function(
     context = Context(
         vars_=None,
         global_ctx=global_ctx,
-        sigs=sigs,
         memory_allocator=memory_allocator,
-        constancy=Constancy.Constant if sig.mutability in ("view", "pure") else Constancy.Mutable,
-        sig=sig,
+        constancy=Constancy.Mutable if func_t.is_mutable else Constancy.Constant,
+        func_t=func_t,
         is_ctor_context=is_ctor_context,
     )
 
-    if sig.internal:
+    if func_t.is_internal:
         assert skip_nonpayable_check is False
-        o = generate_ir_for_internal_function(code, sig, context)
+        o = generate_ir_for_internal_function(code, func_t, context)
     else:
-        if sig.mutability == "payable":
+        if func_t.is_payable:
             assert skip_nonpayable_check is False  # nonsense
-        o = generate_ir_for_external_function(code, sig, context, skip_nonpayable_check)
+        o = generate_ir_for_external_function(code, func_t, context, skip_nonpayable_check)
 
     o.source_pos = getpos(code)
 
@@ -69,19 +116,18 @@ def generate_ir_for_function(
 
     frame_info = FrameInfo(allocate_start, frame_size, context.vars)
 
-    if sig.frame_info is None:
-        sig.set_frame_info(frame_info)
+    if func_t._ir_info.frame_info is None:
+        func_t._ir_info.set_frame_info(frame_info)
     else:
-        assert frame_info == sig.frame_info
+        assert frame_info == func_t._ir_info.frame_info
 
-    if not sig.internal:
+    if not func_t.is_internal:
         # adjust gas estimate to include cost of mem expansion
         # frame_size of external function includes all private functions called
         # (note: internal functions do not need to adjust gas estimate since
         # it is already accounted for by the caller.)
-        assert sig.frame_info is not None  # mypy hint
-        o.add_gas_estimate += calc_mem_gas(sig.frame_info.mem_used)
+        o.add_gas_estimate += calc_mem_gas(func_t._ir_info.frame_info.mem_used)  # type: ignore
 
-    sig.gas_estimate = o.gas
+    func_t._ir_info.gas_estimate = o.gas
 
     return o
diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 1ff2b6d012..6104a86c16 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -1,7 +1,6 @@
 from typing import Any, List
 
 import vyper.utils as util
-from vyper.ast.signatures.function_signature import FunctionSignature
 from vyper.codegen.abi_encoder import abi_encoding_matches_vyper
 from vyper.codegen.context import Context, VariableRecord
 from vyper.codegen.core import get_element_ptr, getpos, make_setter, needs_clamp
@@ -11,23 +10,23 @@
 from vyper.codegen.stmt import parse_body
 from vyper.evm.address_space import CALLDATA, DATA, MEMORY
 from vyper.semantics.types import TupleT
+from vyper.semantics.types.function import ContractFunctionT
 
 
 # register function args with the local calling context.
 # also allocate the ones that live in memory (i.e. kwargs)
-def _register_function_args(context: Context, sig: FunctionSignature) -> List[IRnode]:
+def _register_function_args(func_t: ContractFunctionT, context: Context) -> List[IRnode]:
     ret = []
-
     # the type of the calldata
-    base_args_t = TupleT(tuple(arg.typ for arg in sig.base_args))
+    base_args_t = TupleT(tuple(arg.typ for arg in func_t.positional_args))
 
     # tuple with the abi_encoded args
-    if sig.is_init_func:
+    if func_t.is_constructor:
         base_args_ofst = IRnode(0, location=DATA, typ=base_args_t, encoding=Encoding.ABI)
     else:
         base_args_ofst = IRnode(4, location=CALLDATA, typ=base_args_t, encoding=Encoding.ABI)
 
-    for i, arg in enumerate(sig.base_args):
+    for i, arg in enumerate(func_t.positional_args):
         arg_ir = get_element_ptr(base_args_ofst, i)
 
         if needs_clamp(arg.typ, Encoding.ABI):
@@ -59,11 +58,11 @@ def _annotated_method_id(abi_sig):
     return IRnode(method_id, annotation=annotation)
 
 
-def _generate_kwarg_handlers(context: Context, sig: FunctionSignature) -> List[Any]:
+def _generate_kwarg_handlers(func_t: ContractFunctionT, context: Context) -> List[Any]:
     # generate kwarg handlers.
     # since they might come in thru calldata or be default,
     # allocate them in memory and then fill it in based on calldata or default,
-    # depending on the signature
+    # depending on the ContractFunctionT
     # a kwarg handler looks like
     # (if (eq _method_id <method_id>)
     #    copy calldata args to memory
@@ -71,11 +70,11 @@ def _generate_kwarg_handlers(context: Context, sig: FunctionSignature) -> List[A
     #    goto external_function_common_ir
 
     def handler_for(calldata_kwargs, default_kwargs):
-        calldata_args = sig.base_args + calldata_kwargs
+        calldata_args = func_t.positional_args + calldata_kwargs
         # create a fake type so that get_element_ptr works
         calldata_args_t = TupleT(list(arg.typ for arg in calldata_args))
 
-        abi_sig = sig.abi_signature_for_kwargs(calldata_kwargs)
+        abi_sig = func_t.abi_signature_for_kwargs(calldata_kwargs)
         method_id = _annotated_method_id(abi_sig)
 
         calldata_kwargs_ofst = IRnode(
@@ -99,10 +98,8 @@ def handler_for(calldata_kwargs, default_kwargs):
         # TupleT(list(arg.typ for arg in calldata_kwargs + default_kwargs))
         # (must ensure memory area is contiguous)
 
-        n_base_args = len(sig.base_args)
-
         for i, arg_meta in enumerate(calldata_kwargs):
-            k = n_base_args + i
+            k = func_t.n_positional_args + i
 
             dst = context.lookup_var(arg_meta.name).pos
 
@@ -118,14 +115,14 @@ def handler_for(calldata_kwargs, default_kwargs):
             dst = context.lookup_var(x.name).pos
             lhs = IRnode(dst, location=MEMORY, typ=x.typ)
             lhs.source_pos = getpos(x.ast_source)
-            kw_ast_val = sig.default_values[x.name]  # e.g. `3` in x: int = 3
+            kw_ast_val = func_t.default_values[x.name]  # e.g. `3` in x: int = 3
             rhs = Expr(kw_ast_val, context).ir_node
 
             copy_arg = make_setter(lhs, rhs)
             copy_arg.source_pos = getpos(x.ast_source)
             ret.append(copy_arg)
 
-        ret.append(["goto", sig.external_function_base_entry_label])
+        ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
 
         method_id_check = ["eq", "_calldata_method_id", method_id]
 
@@ -155,7 +152,7 @@ def handler_for(calldata_kwargs, default_kwargs):
 
     ret = ["seq"]
 
-    keyword_args = sig.default_args
+    keyword_args = func_t.keyword_args
 
     # allocate variable slots in memory
     for arg in keyword_args:
@@ -175,31 +172,32 @@ def handler_for(calldata_kwargs, default_kwargs):
 # TODO it would be nice if this returned a data structure which were
 # amenable to generating a jump table instead of the linear search for
 # method_id we have now.
-def generate_ir_for_external_function(code, sig, context, skip_nonpayable_check):
+def generate_ir_for_external_function(code, func_t, context, skip_nonpayable_check):
     # TODO type hints:
     # def generate_ir_for_external_function(
-    #    code: vy_ast.FunctionDef, sig: FunctionSignature, context: Context, check_nonpayable: bool,
+    #    code: vy_ast.FunctionDef,
+    #    func_t: ContractFunctionT,
+    #    context: Context,
+    #    check_nonpayable: bool,
     # ) -> IRnode:
     """Return the IR for an external function. Includes code to inspect the method_id,
     enter the function (nonpayable and reentrancy checks), handle kwargs and exit
     the function (clean up reentrancy storage variables)
     """
-    func_type = code._metadata["type"]
-
-    nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_type)
+    nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_t)
 
     # generate handlers for base args and register the variable records
-    handle_base_args = _register_function_args(context, sig)
+    handle_base_args = _register_function_args(func_t, context)
 
     # generate handlers for kwargs and register the variable records
-    kwarg_handlers = _generate_kwarg_handlers(context, sig)
+    kwarg_handlers = _generate_kwarg_handlers(func_t, context)
 
     body = ["seq"]
     # once optional args have been handled,
     # generate the main body of the function
     body += handle_base_args
 
-    if sig.mutability != "payable" and not skip_nonpayable_check:
+    if not func_t.is_payable and not skip_nonpayable_check:
         # if the contract contains payable functions, but this is not one of them
         # add an assertion that the value of the call is zero
         body += [["assert", ["iszero", "callvalue"]]]
@@ -209,10 +207,10 @@ def generate_ir_for_external_function(code, sig, context, skip_nonpayable_check)
     body += [parse_body(code.body, context, ensure_terminated=True)]
 
     # wrap the body in labeled block
-    body = ["label", sig.external_function_base_entry_label, ["var_list"], body]
+    body = ["label", func_t._ir_info.external_function_base_entry_label, ["var_list"], body]
 
     exit_sequence = ["seq"] + nonreentrant_post
-    if sig.is_init_func:
+    if func_t.is_constructor:
         pass  # init func has special exit sequence generated by module.py
     elif context.return_type is None:
         exit_sequence += [["stop"]]
@@ -223,17 +221,17 @@ def generate_ir_for_external_function(code, sig, context, skip_nonpayable_check)
     if context.return_type is not None:
         exit_sequence_args += ["ret_ofst", "ret_len"]
     # wrap the exit in a labeled block
-    exit = ["label", sig.exit_sequence_label, exit_sequence_args, exit_sequence]
+    exit = ["label", func_t._ir_info.exit_sequence_label, exit_sequence_args, exit_sequence]
 
     # the ir which comprises the main body of the function,
     # besides any kwarg handling
     func_common_ir = ["seq", body, exit]
 
-    if sig.is_default_func or sig.is_init_func:
+    if func_t.is_fallback or func_t.is_constructor:
         ret = ["seq"]
         # add a goto to make the function entry look like other functions
         # (for zksync interpreter)
-        ret.append(["goto", sig.external_function_base_entry_label])
+        ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
         ret.append(func_common_ir)
     else:
         ret = kwarg_handlers
@@ -241,4 +239,4 @@ def generate_ir_for_external_function(code, sig, context, skip_nonpayable_check)
         # TODO rethink this / make it clearer
         ret[-1][-1].append(func_common_ir)
 
-    return IRnode.from_list(ret, source_pos=getpos(sig.func_ast_code))
+    return IRnode.from_list(ret, source_pos=getpos(code))
diff --git a/vyper/codegen/function_definitions/internal_function.py b/vyper/codegen/function_definitions/internal_function.py
index b0ca117b6b..d27d8e36e3 100644
--- a/vyper/codegen/function_definitions/internal_function.py
+++ b/vyper/codegen/function_definitions/internal_function.py
@@ -1,18 +1,18 @@
 from vyper import ast as vy_ast
-from vyper.ast.signatures import FunctionSignature
 from vyper.codegen.context import Context
 from vyper.codegen.function_definitions.utils import get_nonreentrant_lock
 from vyper.codegen.ir_node import IRnode
 from vyper.codegen.stmt import parse_body
+from vyper.semantics.types.function import ContractFunctionT
 
 
 def generate_ir_for_internal_function(
-    code: vy_ast.FunctionDef, sig: FunctionSignature, context: Context
+    code: vy_ast.FunctionDef, func_t: ContractFunctionT, context: Context
 ) -> IRnode:
     """
     Parse a internal function (FuncDef), and produce full function body.
 
-    :param sig: the FuntionSignature
+    :param func_t: the ContractFunctionT
     :param code: ast of function
     :param context: current calling context
     :return: function body in IR
@@ -37,22 +37,20 @@ def generate_ir_for_internal_function(
     # situation like the following is easy to bork:
     #   x: T[2] = [self.generate_T(), self.generate_T()]
 
-    func_type = code._metadata["type"]
-
     # Get nonreentrant lock
 
-    for arg in sig.args:
+    for arg in func_t.arguments:
         # allocate a variable for every arg, setting mutability
         # to False to comply with vyper semantics, function arguments are immutable
         context.new_variable(arg.name, arg.typ, is_mutable=False)
 
-    nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_type)
+    nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_t)
 
-    function_entry_label = sig.internal_function_label
-    cleanup_label = sig.exit_sequence_label
+    function_entry_label = func_t._ir_info.internal_function_label
+    cleanup_label = func_t._ir_info.exit_sequence_label
 
     stack_args = ["var_list"]
-    if func_type.return_type:
+    if func_t.return_type:
         stack_args += ["return_buffer"]
     stack_args += ["return_pc"]
 
diff --git a/vyper/codegen/global_context.py b/vyper/codegen/global_context.py
index 5de04d5127..1f6783f6f8 100644
--- a/vyper/codegen/global_context.py
+++ b/vyper/codegen/global_context.py
@@ -2,8 +2,6 @@
 from typing import Optional
 
 from vyper import ast as vy_ast
-from vyper.semantics.namespace import get_namespace, override_global_namespace
-from vyper.semantics.types.utils import type_from_annotation
 
 
 # Datatype to store all global context information.
@@ -25,16 +23,6 @@ def variables(self):
         variable_decls = self._module.get_children(vy_ast.VariableDecl)
         return {s.target.id: s.target._metadata["varinfo"] for s in variable_decls}
 
-    def parse_type(self, ast_node):
-        # kludge implementation for backwards compatibility.
-        # TODO: replace with type_from_ast
-        try:
-            ns = self._module._metadata["namespace"]
-        except AttributeError:
-            ns = get_namespace()
-        with override_global_namespace(ns):
-            return type_from_annotation(ast_node)
-
     @property
     def immutables(self):
         return [t for t in self.variables.values() if t.is_immutable]
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index bdf8c067f7..320cf43b55 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -1,15 +1,13 @@
 # a contract.vy -- all functions and constructor
 
-from typing import Any, Dict, List, Optional, Tuple
+from typing import Any, List, Optional
 
 from vyper import ast as vy_ast
-from vyper.ast.signatures.function_signature import FunctionSignature, FunctionSignatures
 from vyper.codegen.core import shr
-from vyper.codegen.function_definitions import generate_ir_for_function
+from vyper.codegen.function_definitions import FuncIRInfo, generate_ir_for_function
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
 from vyper.exceptions import CompilerPanic
-from vyper.semantics.types.function import StateMutability
 
 
 def _topsort_helper(functions, lookup):
@@ -34,12 +32,12 @@ def _topsort(functions):
     return list(dict.fromkeys(_topsort_helper(functions, lookup)))
 
 
-def _is_init_func(func_ast):
-    return func_ast._metadata["signature"].is_init_func
+def _is_constructor(func_ast):
+    return func_ast._metadata["type"].is_constructor
 
 
-def _is_default_func(func_ast):
-    return func_ast._metadata["signature"].is_default_func
+def _is_fallback(func_ast):
+    return func_ast._metadata["type"].is_fallback
 
 
 def _is_internal(func_ast):
@@ -47,21 +45,21 @@ def _is_internal(func_ast):
 
 
 def _is_payable(func_ast):
-    return func_ast._metadata["type"].mutability == StateMutability.PAYABLE
+    return func_ast._metadata["type"].is_payable
 
 
 # codegen for all runtime functions + callvalue/calldata checks + method selector routines
-def _runtime_ir(runtime_functions, all_sigs, global_ctx):
+def _runtime_ir(runtime_functions, global_ctx):
     # categorize the runtime functions because we will organize the runtime
     # code into the following sections:
     # payable functions, nonpayable functions, fallback function, internal_functions
     internal_functions = [f for f in runtime_functions if _is_internal(f)]
 
     external_functions = [f for f in runtime_functions if not _is_internal(f)]
-    default_function = next((f for f in external_functions if _is_default_func(f)), None)
+    default_function = next((f for f in external_functions if _is_fallback(f)), None)
 
     # functions that need to go exposed in the selector section
-    regular_functions = [f for f in external_functions if not _is_default_func(f)]
+    regular_functions = [f for f in external_functions if not _is_fallback(f)]
     payables = [f for f in regular_functions if _is_payable(f)]
     nonpayables = [f for f in regular_functions if not _is_payable(f)]
 
@@ -70,7 +68,7 @@ def _runtime_ir(runtime_functions, all_sigs, global_ctx):
     internal_functions_ir: list[IRnode] = []
 
     for func_ast in internal_functions:
-        func_ir = generate_ir_for_function(func_ast, all_sigs, global_ctx, False)
+        func_ir = generate_ir_for_function(func_ast, global_ctx, False)
         internal_functions_ir.append(func_ir)
 
     # for some reason, somebody may want to deploy a contract with no
@@ -95,20 +93,18 @@ def _runtime_ir(runtime_functions, all_sigs, global_ctx):
     selector_section = ["seq"]
 
     for func_ast in payables:
-        func_ir = generate_ir_for_function(func_ast, all_sigs, global_ctx, False)
+        func_ir = generate_ir_for_function(func_ast, global_ctx, False)
         selector_section.append(func_ir)
 
     if batch_payable_check:
         selector_section.append(["assert", ["iszero", "callvalue"]])
 
     for func_ast in nonpayables:
-        func_ir = generate_ir_for_function(func_ast, all_sigs, global_ctx, skip_nonpayable_check)
+        func_ir = generate_ir_for_function(func_ast, global_ctx, skip_nonpayable_check)
         selector_section.append(func_ir)
 
     if default_function:
-        fallback_ir = generate_ir_for_function(
-            default_function, all_sigs, global_ctx, skip_nonpayable_check
-        )
+        fallback_ir = generate_ir_for_function(default_function, global_ctx, skip_nonpayable_check)
     else:
         fallback_ir = IRnode.from_list(
             ["revert", 0, 0], annotation="Default function", error_msg="fallback function"
@@ -133,56 +129,43 @@ def _runtime_ir(runtime_functions, all_sigs, global_ctx):
     return runtime
 
 
-# take a GlobalContext, which is basically
-# and generate the runtime and deploy IR, also return the dict of all signatures
-def generate_ir_for_module(global_ctx: GlobalContext) -> Tuple[IRnode, IRnode, FunctionSignatures]:
+# take a GlobalContext, and generate the runtime and deploy IR
+def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
     # order functions so that each function comes after all of its callees
     function_defs = _topsort(global_ctx.functions)
 
-    # FunctionSignatures for all interfaces defined in this module
-    all_sigs: Dict[str, FunctionSignatures] = {}
-
     init_function: Optional[vy_ast.FunctionDef] = None
-    local_sigs: FunctionSignatures = {}  # internal/local functions
 
-    # generate all signatures
-    # TODO really this should live in GlobalContext
+    # generate all FuncIRInfos
     for f in function_defs:
-        sig = FunctionSignature.from_definition(f, global_ctx)
-        # add it to the global namespace.
-        local_sigs[sig.name] = sig
-        # a little hacky, eventually FunctionSignature should be
-        # merged with ContractFunction and we can remove this.
-        f._metadata["signature"] = sig
-
-    assert "self" not in all_sigs
-    all_sigs["self"] = local_sigs
+        func_t = f._metadata["type"]
+        func_t._ir_info = FuncIRInfo(func_t)
 
-    runtime_functions = [f for f in function_defs if not _is_init_func(f)]
-    init_function = next((f for f in function_defs if _is_init_func(f)), None)
+    runtime_functions = [f for f in function_defs if not _is_constructor(f)]
+    init_function = next((f for f in function_defs if _is_constructor(f)), None)
 
-    runtime = _runtime_ir(runtime_functions, all_sigs, global_ctx)
+    runtime = _runtime_ir(runtime_functions, global_ctx)
 
     deploy_code: List[Any] = ["seq"]
     immutables_len = global_ctx.immutable_section_bytes
     if init_function:
         # TODO might be cleaner to separate this into an _init_ir helper func
         init_func_ir = generate_ir_for_function(
-            init_function, all_sigs, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
+            init_function, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
         )
         deploy_code.append(init_func_ir)
 
         # pass the amount of memory allocated for the init function
         # so that deployment does not clobber while preparing immutables
         # note: (deploy mem_ofst, code, extra_padding)
-        init_mem_used = init_function._metadata["signature"].frame_info.mem_used
+        init_mem_used = init_function._metadata["type"]._ir_info.frame_info.mem_used
         deploy_code.append(["deploy", init_mem_used, runtime, immutables_len])
 
         # internal functions come after everything else
         internal_functions = [f for f in runtime_functions if _is_internal(f)]
         for f in internal_functions:
             func_ir = generate_ir_for_function(
-                f, all_sigs, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
+                f, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
             )
             # note: we depend on dead code eliminator to clean dead function defs
             deploy_code.append(func_ir)
@@ -192,4 +175,4 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> Tuple[IRnode, IRnode, F
             raise CompilerPanic("unreachable")
         deploy_code.append(["deploy", 0, runtime, 0])
 
-    return IRnode.from_list(deploy_code), IRnode.from_list(runtime), local_sigs
+    return IRnode.from_list(deploy_code), IRnode.from_list(runtime)
diff --git a/vyper/codegen/return_.py b/vyper/codegen/return_.py
index 4a39127a14..b8468f3eb1 100644
--- a/vyper/codegen/return_.py
+++ b/vyper/codegen/return_.py
@@ -19,9 +19,9 @@
 
 # Generate code for return stmt
 def make_return_stmt(ir_val: IRnode, stmt: Any, context: Context) -> Optional[IRnode]:
-    sig = context.sig
+    func_t = context.func_t
 
-    jump_to_exit = ["exit_to", f"_sym_{sig.exit_sequence_label}"]
+    jump_to_exit = ["exit_to", f"_sym_{func_t._ir_info.exit_sequence_label}"]
 
     if context.return_type is None:
         if stmt.value is not None:
@@ -35,7 +35,7 @@ def make_return_stmt(ir_val: IRnode, stmt: Any, context: Context) -> Optional[IR
     # do NOT bypass this. jump_to_exit may do important function cleanup.
     def finalize(fill_return_buffer):
         fill_return_buffer = IRnode.from_list(
-            fill_return_buffer, annotation=f"fill return buffer {sig._ir_identifier}"
+            fill_return_buffer, annotation=f"fill return buffer {func_t._ir_info.ir_identifier}"
         )
         cleanup_loops = "cleanup_repeat" if context.forvars else "seq"
         # NOTE: because stack analysis is incomplete, cleanup_repeat must
diff --git a/vyper/codegen/self_call.py b/vyper/codegen/self_call.py
index b5429ca255..42a9bf2f11 100644
--- a/vyper/codegen/self_call.py
+++ b/vyper/codegen/self_call.py
@@ -1,7 +1,7 @@
 from vyper.codegen.core import _freshname, eval_once_check, make_setter
 from vyper.codegen.ir_node import IRnode, push_label_to_stack
 from vyper.evm.address_space import MEMORY
-from vyper.exceptions import StateAccessViolation, StructureException
+from vyper.exceptions import StateAccessViolation
 from vyper.semantics.types.subscriptable import TupleT
 
 _label_counter = 0
@@ -14,6 +14,21 @@ def _generate_label(name: str) -> str:
     return f"label{_label_counter}"
 
 
+def _align_kwargs(func_t, args_ir):
+    """
+    Using a list of args, find the kwargs which need to be filled in by
+    the compiler
+    """
+
+    # sanity check
+    assert func_t.n_positional_args <= len(args_ir) <= func_t.n_total_args
+
+    num_provided_kwargs = len(args_ir) - func_t.n_positional_args
+
+    unprovided_kwargs = func_t.keyword_args[num_provided_kwargs:]
+    return [i.default_value for i in unprovided_kwargs]
+
+
 def ir_for_self_call(stmt_expr, context):
     from vyper.codegen.expr import Expr  # TODO rethink this circular import
 
@@ -24,45 +39,44 @@ def ir_for_self_call(stmt_expr, context):
     # - push jumpdest (callback ptr) and return buffer location
     # - jump to label
     # - (private function will fill return buffer and jump back)
-
     method_name = stmt_expr.func.attr
+    func_t = stmt_expr.func._metadata["type"]
 
     pos_args_ir = [Expr(x, context).ir_node for x in stmt_expr.args]
 
-    sig, kw_vals = context.lookup_internal_function(method_name, pos_args_ir, stmt_expr)
+    default_vals = _align_kwargs(func_t, pos_args_ir)
+    default_vals_ir = [Expr(x, context).ir_node for x in default_vals]
 
-    kw_args_ir = [Expr(x, context).ir_node for x in kw_vals]
-
-    args_ir = pos_args_ir + kw_args_ir
+    args_ir = pos_args_ir + default_vals_ir
+    assert len(args_ir) == len(func_t.arguments)
 
     args_tuple_t = TupleT([x.typ for x in args_ir])
     args_as_tuple = IRnode.from_list(["multi"] + [x for x in args_ir], typ=args_tuple_t)
 
-    if context.is_constant() and sig.mutability not in ("view", "pure"):
+    # CMC 2023-05-17 this seems like it is already caught in typechecker
+    if context.is_constant() and func_t.is_mutable:
         raise StateAccessViolation(
             f"May not call state modifying function "
             f"'{method_name}' within {context.pp_constancy()}.",
             stmt_expr,
         )
 
-    # TODO move me to type checker phase
-    if not sig.internal:
-        raise StructureException("Cannot call external functions via 'self'", stmt_expr)
-
-    return_label = _generate_label(f"{sig.internal_function_label}_call")
+    # note: internal_function_label asserts `func_t.is_internal`.
+    return_label = _generate_label(f"{func_t._ir_info.internal_function_label}_call")
 
     # allocate space for the return buffer
     # TODO allocate in stmt and/or expr.py
-    if sig.return_type is not None:
+    if func_t.return_type is not None:
         return_buffer = IRnode.from_list(
-            context.new_internal_variable(sig.return_type), annotation=f"{return_label}_return_buf"
+            context.new_internal_variable(func_t.return_type),
+            annotation=f"{return_label}_return_buf",
         )
     else:
         return_buffer = None
 
     # note: dst_tuple_t != args_tuple_t
-    dst_tuple_t = TupleT([arg.typ for arg in sig.args])
-    args_dst = IRnode(sig.frame_info.frame_start, typ=dst_tuple_t, location=MEMORY)
+    dst_tuple_t = TupleT(tuple(func_t.argument_types))
+    args_dst = IRnode(func_t._ir_info.frame_info.frame_start, typ=dst_tuple_t, location=MEMORY)
 
     # if one of the arguments is a self call, the argument
     # buffer could get borked. to prevent against that,
@@ -84,7 +98,7 @@ def ir_for_self_call(stmt_expr, context):
     else:
         copy_args = make_setter(args_dst, args_as_tuple)
 
-    goto_op = ["goto", sig.internal_function_label]
+    goto_op = ["goto", func_t._ir_info.internal_function_label]
     # pass return buffer to subroutine
     if return_buffer is not None:
         goto_op += [return_buffer]
@@ -100,10 +114,10 @@ def ir_for_self_call(stmt_expr, context):
 
     o = IRnode.from_list(
         call_sequence,
-        typ=sig.return_type,
+        typ=func_t.return_type,
         location=MEMORY,
         annotation=stmt_expr.get("node_source_code"),
-        add_gas_estimate=sig.gas_estimate,
+        add_gas_estimate=func_t._ir_info.gas_estimate,
     )
     o.is_self_call = True
     return o
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index e24c429638..91d45f4916 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -60,7 +60,7 @@ def parse_Name(self):
             raise StructureException(f"Unsupported statement type: {type(self.stmt)}", self.stmt)
 
     def parse_AnnAssign(self):
-        ltyp = self.context.parse_type(self.stmt.annotation)
+        ltyp = self.stmt.target._metadata["type"]
         varname = self.stmt.target.id
         alloced = self.context.new_variable(varname, ltyp)
 
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 408cb9d239..e30f021c6b 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -44,7 +44,7 @@ def build_external_interface_output(compiler_data: CompilerData) -> str:
     for func in interface.functions.values():
         if func.visibility == FunctionVisibility.INTERNAL or func.name == "__init__":
             continue
-        args = ", ".join([f"{name}: {typ}" for name, typ in func.arguments.items()])
+        args = ", ".join([f"{arg.name}: {arg.typ}" for arg in func.arguments])
         return_value = f" -> {func.return_type}" if func.return_type is not None else ""
         mutability = func.mutability.value
         out = f"{out}    def {func.name}({args}){return_value}: {mutability}\n"
@@ -69,7 +69,7 @@ def build_interface_output(compiler_data: CompilerData) -> str:
                 continue
             if func.mutability != StateMutability.NONPAYABLE:
                 out = f"{out}@{func.mutability.value}\n"
-            args = ", ".join([f"{name}: {typ}" for name, typ in func.arguments.items()])
+            args = ", ".join([f"{arg.name}: {arg.typ}" for arg in func.arguments])
             return_value = f" -> {func.return_type}" if func.return_type is not None else ""
             out = f"{out}@external\ndef {func.name}({args}){return_value}:\n    pass\n\n"
 
@@ -117,20 +117,39 @@ def _var_rec_dict(variable_record):
         ret["location"] = ret["location"].name
         return ret
 
-    def _to_dict(sig):
-        ret = vars(sig)
+    def _to_dict(func_t):
+        ret = vars(func_t)
         ret["return_type"] = str(ret["return_type"])
-        ret["_ir_identifier"] = sig._ir_identifier
-        for attr in ("gas_estimate", "func_ast_code"):
-            del ret[attr]
-        for attr in ("args", "base_args", "default_args"):
-            if attr in ret:
-                ret[attr] = {arg.name: str(arg.typ) for arg in ret[attr]}
-        for k in ret["default_values"]:
-            # e.g. {"x": vy_ast.Int(..)} -> {"x": 1}
-            ret["default_values"][k] = ret["default_values"][k].node_source_code
-        ret["frame_info"] = vars(ret["frame_info"])
+        ret["_ir_identifier"] = func_t._ir_info.ir_identifier
+
+        for attr in ("mutability", "visibility"):
+            ret[attr] = ret[attr].name.lower()
+
+        # e.g. {"x": vy_ast.Int(..)} -> {"x": 1}
+        ret["default_values"] = {
+            k: val.node_source_code for k, val in func_t.default_values.items()
+        }
+
+        for attr in ("positional_args", "keyword_args"):
+            args = ret[attr]
+            ret[attr] = {arg.name: str(arg.typ) for arg in args}
+
+        ret["frame_info"] = vars(func_t._ir_info.frame_info)
         del ret["frame_info"]["frame_vars"]  # frame_var.pos might be IR, cannot serialize
+
+        keep_keys = {
+            "name",
+            "return_type",
+            "positional_args",
+            "keyword_args",
+            "default_values",
+            "frame_info",
+            "mutability",
+            "visibility",
+            "_ir_identifier",
+            "nonreentrant_key",
+        }
+        ret = {k: v for k, v in ret.items() if k in keep_keys}
         return ret
 
     return {"function_info": {name: _to_dict(sig) for (name, sig) in sigs.items()}}
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 5d16517bc8..5156aa1bbd 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -4,12 +4,12 @@
 from typing import Optional, Tuple
 
 from vyper import ast as vy_ast
-from vyper.ast.signatures.function_signature import FunctionSignatures
 from vyper.codegen import module
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
 from vyper.ir import compile_ir, optimizer
 from vyper.semantics import set_data_positions, validate_semantics
+from vyper.semantics.types.function import ContractFunctionT
 from vyper.typing import InterfaceImports, StorageLayout
 
 
@@ -123,18 +123,22 @@ def _ir_output(self):
 
     @property
     def ir_nodes(self) -> IRnode:
-        ir, ir_runtime, sigs = self._ir_output
+        ir, ir_runtime = self._ir_output
         return ir
 
     @property
     def ir_runtime(self) -> IRnode:
-        ir, ir_runtime, sigs = self._ir_output
+        ir, ir_runtime = self._ir_output
         return ir_runtime
 
     @property
-    def function_signatures(self) -> FunctionSignatures:
-        ir, ir_runtime, sigs = self._ir_output
-        return sigs
+    def function_signatures(self) -> dict[str, ContractFunctionT]:
+        # some metadata gets calculated during codegen, so
+        # ensure codegen is run:
+        _ = self._ir_output
+
+        fs = self.vyper_module_folded.get_children(vy_ast.FunctionDef)
+        return {f.name: f._metadata["type"] for f in fs}
 
     @cached_property
     def assembly(self) -> list:
@@ -232,9 +236,7 @@ def generate_folded_ast(
     return vyper_module_folded, symbol_tables
 
 
-def generate_ir_nodes(
-    global_ctx: GlobalContext, no_optimize: bool
-) -> Tuple[IRnode, IRnode, FunctionSignatures]:
+def generate_ir_nodes(global_ctx: GlobalContext, no_optimize: bool) -> tuple[IRnode, IRnode]:
     """
     Generate the intermediate representation (IR) from the contextualized AST.
 
@@ -254,11 +256,11 @@ def generate_ir_nodes(
         IR to generate deployment bytecode
         IR to generate runtime bytecode
     """
-    ir_nodes, ir_runtime, function_sigs = module.generate_ir_for_module(global_ctx)
+    ir_nodes, ir_runtime = module.generate_ir_for_module(global_ctx)
     if not no_optimize:
         ir_nodes = optimizer.optimize(ir_nodes)
         ir_runtime = optimizer.optimize(ir_runtime)
-    return ir_nodes, ir_runtime, function_sigs
+    return ir_nodes, ir_runtime
 
 
 def generate_assembly(ir_nodes: IRnode, no_optimize: bool = False) -> list:
diff --git a/vyper/compiler/utils.py b/vyper/compiler/utils.py
index baa35ac93d..8de2589367 100644
--- a/vyper/compiler/utils.py
+++ b/vyper/compiler/utils.py
@@ -1,12 +1,15 @@
 from typing import Dict
 
-from vyper.ast.signatures import FunctionSignature
+from vyper.semantics.types.function import ContractFunctionT
 
 
-def build_gas_estimates(function_sigs: Dict[str, FunctionSignature]) -> dict:
-    # note: `.gas_estimate` is added to FunctionSignature
-    # in vyper/codegen/function_definitions/common.py
-    return {k: v.gas_estimate for (k, v) in function_sigs.items()}
+def build_gas_estimates(func_ts: Dict[str, ContractFunctionT]) -> dict:
+    # note: `.gas_estimate` is added to ContractFunctionT._ir_info
+    # in vyper/semantics/types/function.py
+    ret = {}
+    for k, v in func_ts.items():
+        ret[k] = v._ir_info.gas_estimate
+    return ret
 
 
 def expand_source_map(compressed_map: str) -> list:
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index 4bbd77fdd4..e501be5fdb 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -43,9 +43,9 @@ def __init__(self, fn_node: vy_ast.FunctionDef, namespace: dict) -> None:
         self.namespace = namespace
         self.expr_visitor = ExpressionAnnotationVisitor(self.func)
 
-        assert len(self.func.kwarg_keys) == len(fn_node.args.defaults)
-        for kw, val in zip(self.func.kwarg_keys, fn_node.args.defaults):
-            self.expr_visitor.visit(val, self.func.arguments[kw])
+        assert self.func.n_keyword_args == len(fn_node.args.defaults)
+        for kwarg in self.func.keyword_args:
+            self.expr_visitor.visit(kwarg.default_value, kwarg.typ)
 
     def visit(self, node):
         super().visit(node)
@@ -136,7 +136,7 @@ def visit_Call(self, node, type_):
             # function calls
             if call_type.is_internal:
                 self.func.called_functions.add(call_type)
-            for arg, typ in zip(node.args, list(call_type.arguments.values())):
+            for arg, typ in zip(node.args, call_type.argument_types):
                 self.visit(arg, typ)
             for kwarg in node.keywords:
                 # We should only see special kwargs
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index 23ccc216a6..a09a8476d6 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -173,8 +173,10 @@ def __init__(
         self.func = fn_node._metadata["type"]
         self.annotation_visitor = StatementAnnotationVisitor(fn_node, namespace)
         self.expr_visitor = _LocalExpressionVisitor()
-        for argname, argtype in self.func.arguments.items():
-            namespace[argname] = VarInfo(argtype, location=DataLocation.CALLDATA, is_immutable=True)
+        for arg in self.func.arguments:
+            namespace[arg.name] = VarInfo(
+                arg.typ, location=DataLocation.CALLDATA, is_immutable=True
+            )
 
         for node in fn_node.body:
             self.visit(node)
diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index bfcdf6349a..c184c44c5b 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -1,6 +1,7 @@
 import re
 import warnings
-from collections import OrderedDict
+from dataclasses import dataclass
+from functools import cached_property
 from typing import Any, Dict, List, Optional, Tuple
 
 from vyper import ast as vy_ast
@@ -25,32 +26,46 @@
 from vyper.utils import OrderedSet, keccak256
 
 
+@dataclass
+class _FunctionArg:
+    name: str
+    typ: VyperType
+
+
+@dataclass
+class PositionalArg(_FunctionArg):
+    ast_source: Optional[vy_ast.VyperNode] = None
+
+
+@dataclass
+class KeywordArg(_FunctionArg):
+    default_value: vy_ast.VyperNode
+    ast_source: Optional[vy_ast.VyperNode] = None
+
+
 class ContractFunctionT(VyperType):
     """
     Contract function type.
 
     Functions compare false against all types and so cannot be assigned without
     being called. Calls are validated by `fetch_call_return`, check the call
-    arguments against `arguments`, and return `return_type`.
+    arguments against `positional_args` and `keyword_arg`, and return `return_type`.
 
     Attributes
     ----------
     name : str
         The name of the function.
-    arguments : OrderedDict
-        Function input arguments as {'name': VyperType}
-    min_arg_count : int
-        The minimum number of required input arguments.
-    max_arg_count : int
-        The maximum number of required input arguments. When a function has no
-        default arguments, this value is the same as `min_arg_count`.
-    kwarg_keys : List
-        List of optional input argument keys.
+    positional_args: list[PositionalArg]
+        Positional args for this function
+    keyword_args: list[KeywordArg]
+        Keyword args for this function
+    return_type: Optional[VyperType]
+        Type of return value
     function_visibility : FunctionVisibility
         enum indicating the external visibility of a function.
     state_mutability : StateMutability
         enum indicating the authority a function has to mutate it's own state.
-    nonreentrant : str
+    nonreentrant : Optional[str]
         Re-entrancy lock name.
     """
 
@@ -59,10 +74,8 @@ class ContractFunctionT(VyperType):
     def __init__(
         self,
         name: str,
-        arguments: OrderedDict,
-        # TODO rename to something like positional_args, keyword_args
-        min_arg_count: int,
-        max_arg_count: int,
+        positional_args: list[PositionalArg],
+        keyword_args: list[KeywordArg],
         return_type: Optional[VyperType],
         function_visibility: FunctionVisibility,
         state_mutability: StateMutability,
@@ -71,13 +84,9 @@ def __init__(
         super().__init__()
 
         self.name = name
-        self.arguments = arguments
-        self.min_arg_count = min_arg_count
-        self.max_arg_count = max_arg_count
+        self.positional_args = positional_args
+        self.keyword_args = keyword_args
         self.return_type = return_type
-        self.kwarg_keys = []
-        if min_arg_count < max_arg_count:
-            self.kwarg_keys = list(self.arguments)[min_arg_count:]
         self.visibility = function_visibility
         self.mutability = state_mutability
         self.nonreentrant = nonreentrant
@@ -85,18 +94,28 @@ def __init__(
         # a list of internal functions this function calls
         self.called_functions = OrderedSet()
 
+        # to be populated during codegen
+        self._ir_info: Any = None
+
+    @cached_property
+    def call_site_kwargs(self):
         # special kwargs that are allowed in call site
-        self.call_site_kwargs = {
+        return {
             "gas": KwargSettings(UINT256_T, "gas"),
             "value": KwargSettings(UINT256_T, 0),
             "skip_contract_check": KwargSettings(BoolT(), False, require_literal=True),
-            "default_return_value": KwargSettings(return_type, None),
+            "default_return_value": KwargSettings(self.return_type, None),
         }
 
     def __repr__(self):
-        arg_types = ",".join(repr(a) for a in self.arguments.values())
+        arg_types = ",".join(repr(a) for a in self.argument_types)
         return f"contract function {self.name}({arg_types})"
 
+    def __str__(self):
+        ret_sig = "" if not self.return_type else f" -> {self.return_type}"
+        args_sig = ",".join([str(t) for t in self.argument_types])
+        return f"def {self.name} {args_sig}{ret_sig}:"
+
     # override parent implementation. function type equality does not
     # make too much sense.
     def __eq__(self, other):
@@ -119,10 +138,9 @@ def from_abi(cls, abi: Dict) -> "ContractFunctionT":
         -------
         ContractFunctionT object.
         """
-
-        arguments = OrderedDict()
+        positional_args = []
         for item in abi["inputs"]:
-            arguments[item["name"]] = type_from_abi(item)
+            positional_args.append(PositionalArg(item["name"], type_from_abi(item)))
         return_type = None
         if len(abi["outputs"]) == 1:
             return_type = type_from_abi(abi["outputs"][0])
@@ -130,9 +148,8 @@ def from_abi(cls, abi: Dict) -> "ContractFunctionT":
             return_type = TupleT(tuple(type_from_abi(i) for i in abi["outputs"]))
         return cls(
             abi["name"],
-            arguments,
-            len(arguments),
-            len(arguments),
+            positional_args,
+            [],
             return_type,
             function_visibility=FunctionVisibility.EXTERNAL,
             state_mutability=StateMutability.from_abi(abi),
@@ -272,32 +289,39 @@ def from_FunctionDef(
                     "Constructor may not use default arguments", node.args.defaults[0]
                 )
 
-        arguments = OrderedDict()
-        max_arg_count = len(node.args.args)
-        min_arg_count = max_arg_count - len(node.args.defaults)
-        defaults = [None] * min_arg_count + node.args.defaults
+        argnames = set()  # for checking uniqueness
+        n_total_args = len(node.args.args)
+        n_positional_args = n_total_args - len(node.args.defaults)
 
-        for arg, value in zip(node.args.args, defaults):
-            if arg.arg in ("gas", "value", "skip_contract_check", "default_return_value"):
+        positional_args: list[PositionalArg] = []
+        keyword_args: list[KeywordArg] = []
+
+        for i, arg in enumerate(node.args.args):
+            argname = arg.arg
+            if argname in ("gas", "value", "skip_contract_check", "default_return_value"):
                 raise ArgumentException(
-                    f"Cannot use '{arg.arg}' as a variable name in a function input", arg
+                    f"Cannot use '{argname}' as a variable name in a function input", arg
                 )
-            if arg.arg in arguments:
-                raise ArgumentException(f"Function contains multiple inputs named {arg.arg}", arg)
+            if argname in argnames:
+                raise ArgumentException(f"Function contains multiple inputs named {argname}", arg)
 
             if arg.annotation is None:
-                raise ArgumentException(f"Function argument '{arg.arg}' is missing a type", arg)
+                raise ArgumentException(f"Function argument '{argname}' is missing a type", arg)
 
             type_ = type_from_annotation(arg.annotation, DataLocation.CALLDATA)
 
-            if value is not None:
+            if i < n_positional_args:
+                positional_args.append(PositionalArg(argname, type_, ast_source=arg))
+            else:
+                value = node.args.defaults[i - n_positional_args]
                 if not check_kwargable(value):
                     raise StateAccessViolation(
                         "Value must be literal or environment variable", value
                     )
                 validate_expected_type(value, type_)
+                keyword_args.append(KeywordArg(argname, type_, value, ast_source=arg))
 
-            arguments[arg.arg] = type_
+            argnames.add(argname)
 
         # return types
         if node.returns is None:
@@ -312,7 +336,7 @@ def from_FunctionDef(
         else:
             raise InvalidType("Function return value must be a type name or tuple", node.returns)
 
-        return cls(node.name, arguments, min_arg_count, max_arg_count, return_type, **kwargs)
+        return cls(node.name, positional_args, keyword_args, return_type, **kwargs)
 
     def set_reentrancy_key_position(self, position: StorageSlot) -> None:
         if hasattr(self, "reentrancy_key_position"):
@@ -344,15 +368,14 @@ def getter_from_VariableDecl(cls, node: vy_ast.VariableDecl) -> "ContractFunctio
             raise CompilerPanic("getter generated for non-public function")
         type_ = type_from_annotation(node.annotation, DataLocation.STORAGE)
         arguments, return_type = type_.getter_signature
-        args_dict: OrderedDict = OrderedDict()
-        for item in arguments:
-            args_dict[f"arg{len(args_dict)}"] = item
+        args = []
+        for i, item in enumerate(arguments):
+            args.append(PositionalArg(f"arg{i}", item))
 
         return cls(
             node.target.id,
-            args_dict,
-            len(arguments),
-            len(arguments),
+            args,
+            [],
             return_type,
             function_visibility=FunctionVisibility.EXTERNAL,
             state_mutability=StateMutability.VIEW,
@@ -362,7 +385,7 @@ def getter_from_VariableDecl(cls, node: vy_ast.VariableDecl) -> "ContractFunctio
     # convenience property for compare_signature, as it would
     # appear in a public interface
     def _iface_sig(self) -> Tuple[Tuple, Optional[VyperType]]:
-        return tuple(self.arguments.values()), self.return_type
+        return tuple(self.argument_types), self.return_type
 
     def compare_signature(self, other: "ContractFunctionT") -> bool:
         """
@@ -388,6 +411,31 @@ def compare_signature(self, other: "ContractFunctionT") -> bool:
 
         return True
 
+    @cached_property
+    def default_values(self) -> dict[str, vy_ast.VyperNode]:
+        return {arg.name: arg.default_value for arg in self.keyword_args}
+
+    # for backwards compatibility
+    @cached_property
+    def arguments(self) -> list[_FunctionArg]:
+        return self.positional_args + self.keyword_args  # type: ignore
+
+    @cached_property
+    def argument_types(self) -> list[VyperType]:
+        return [arg.typ for arg in self.arguments]
+
+    @property
+    def n_positional_args(self) -> int:
+        return len(self.positional_args)
+
+    @property
+    def n_keyword_args(self) -> int:
+        return len(self.keyword_args)
+
+    @cached_property
+    def n_total_args(self) -> int:
+        return self.n_positional_args + self.n_keyword_args
+
     @property
     def is_external(self) -> bool:
         return self.visibility == FunctionVisibility.EXTERNAL
@@ -396,6 +444,22 @@ def is_external(self) -> bool:
     def is_internal(self) -> bool:
         return self.visibility == FunctionVisibility.INTERNAL
 
+    @property
+    def is_mutable(self) -> bool:
+        return self.mutability > StateMutability.VIEW
+
+    @property
+    def is_payable(self) -> bool:
+        return self.mutability == StateMutability.PAYABLE
+
+    @property
+    def is_constructor(self) -> bool:
+        return self.name == "__init__"
+
+    @property
+    def is_fallback(self) -> bool:
+        return self.name == "__default__"
+
     @property
     def method_ids(self) -> Dict[str, int]:
         """
@@ -405,58 +469,32 @@ def method_ids(self) -> Dict[str, int]:
         * For functions with default arguments, there is one key for each
           function signature.
         """
-        arg_types = [i.canonical_abi_type for i in self.arguments.values()]
+        arg_types = [i.canonical_abi_type for i in self.argument_types]
 
-        if not self.has_default_args:
+        if self.n_keyword_args == 0:
             return _generate_method_id(self.name, arg_types)
 
         method_ids = {}
-        for i in range(self.min_arg_count, self.max_arg_count + 1):
+        for i in range(self.n_positional_args, self.n_total_args + 1):
             method_ids.update(_generate_method_id(self.name, arg_types[:i]))
         return method_ids
 
-    # for caller-fills-args calling convention
-    def get_args_buffer_offset(self) -> int:
-        """
-        Get the location of the args buffer in the function frame (caller sets)
-        """
-        return 0
-
-    # TODO is this needed?
-    def get_args_buffer_len(self) -> int:
-        """
-        Get the length of the argument buffer in the function frame
-        """
-        return sum(arg_t.size_in_bytes() for arg_t in self.arguments.values())
-
-    @property
-    def is_constructor(self) -> bool:
-        return self.name == "__init__"
-
-    @property
-    def is_fallback(self) -> bool:
-        return self.name == "__default__"
-
-    @property
-    def has_default_args(self) -> bool:
-        return self.min_arg_count < self.max_arg_count
-
     def fetch_call_return(self, node: vy_ast.Call) -> Optional[VyperType]:
         if node.get("func.value.id") == "self" and self.visibility == FunctionVisibility.EXTERNAL:
             raise CallViolation("Cannot call external functions via 'self'", node)
 
         # for external calls, include gas and value as optional kwargs
-        kwarg_keys = self.kwarg_keys.copy()
-        if node.get("func.value.id") != "self":
+        kwarg_keys = [arg.name for arg in self.keyword_args]
+        if not self.is_internal:
             kwarg_keys += list(self.call_site_kwargs.keys())
-        validate_call_args(node, (self.min_arg_count, self.max_arg_count), kwarg_keys)
+        validate_call_args(node, (self.n_positional_args, self.n_total_args), kwarg_keys)
 
         if self.mutability < StateMutability.PAYABLE:
             kwarg_node = next((k for k in node.keywords if k.arg == "value"), None)
             if kwarg_node is not None:
                 raise CallViolation("Cannot send ether to nonpayable function", kwarg_node)
 
-        for arg, expected in zip(node.args, self.arguments.values()):
+        for arg, expected in zip(node.args, self.argument_types):
             validate_expected_type(arg, expected)
 
         # TODO this should be moved to validate_call_args
@@ -511,7 +549,7 @@ def to_toplevel_abi_dict(self):
             abi_dict["type"] = "function"
             abi_dict["name"] = self.name
 
-        abi_dict["inputs"] = [v.to_abi_arg(name=k) for k, v in self.arguments.items()]
+        abi_dict["inputs"] = [arg.typ.to_abi_arg(name=arg.name) for arg in self.arguments]
 
         typ = self.return_type
         if typ is None:
@@ -521,16 +559,21 @@ def to_toplevel_abi_dict(self):
         else:
             abi_dict["outputs"] = [typ.to_abi_arg()]
 
-        if self.has_default_args:
+        if self.n_keyword_args > 0:
             # for functions with default args, return a dict for each possible arg count
             result = []
-            for i in range(self.min_arg_count, self.max_arg_count + 1):
+            for i in range(self.n_positional_args, self.n_total_args + 1):
                 result.append(abi_dict.copy())
                 result[-1]["inputs"] = result[-1]["inputs"][:i]
             return result
         else:
             return [abi_dict]
 
+    # calculate the abi signature for a given set of kwargs
+    def abi_signature_for_kwargs(self, kwargs: list[KeywordArg]) -> str:
+        args = self.positional_args + kwargs  # type: ignore
+        return self.name + "(" + ",".join([arg.typ.abi_type.selector_name() for arg in args]) + ")"
+
 
 class MemberFunctionT(VyperType):
     """

From 9c324b4839080708477e333e1e6327def1485a3d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 14:49:13 -0400
Subject: [PATCH 035/161] chore: only save cache on cache miss (#3421)

in the era compiler tester workflow, we were always saving the cache,
which can lead to a race condition if another workflow is simultaneously
pulling the same cache.
---
 .github/workflows/era-tester.yml | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index ec0fee3bf1..6c15e6af07 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -40,7 +40,7 @@ jobs:
         python-version: ${{ matrix.python-version[0] }}
 
     - name: Get cache
-      id: cache
+      id: get-cache
       uses: actions/cache@v3
       with:
         path: |
@@ -56,7 +56,7 @@ jobs:
         key: ${{ runner.os }}-${{ env.ERA_HASH }}-${{ env.ERA_VYPER_HASH }}
 
     - name: Initialize repository and install dependencies
-      if: steps.cache.outputs.cache-hit != 'true'
+      if: steps.get-cache.outputs.cache-hit != 'true'
       run: |
         git clone --depth 1 https://github.com/matter-labs/era-compiler-tester.git
         cd era-compiler-tester
@@ -70,7 +70,7 @@ jobs:
 
     - name: Save cache
       uses: actions/cache/save@v3
-      if: always()
+      if: steps.get-cache.outputs.cache-hit != 'true'
       with:
         path: |
           ~/.cargo/bin/

From 3837ad39af55a42952a6266ea7eea37d0bada8a0 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 17:16:47 -0400
Subject: [PATCH 036/161] fix: visibility checks for interface implementation
 (#3422)

this commit fixes an issue with interface- implementing checks: function
mutability was not checked. this can cause issues in how functions are
called in the ABI if the mutability is different from the interface
specification.
---
 tests/parser/syntax/test_interfaces.py | 15 +++++++++++++++
 vyper/semantics/types/function.py      |  9 +++++++--
 vyper/semantics/types/user.py          |  5 ++++-
 3 files changed, 26 insertions(+), 3 deletions(-)

diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index d964a17571..acadaff20d 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -3,6 +3,7 @@
 from vyper import compiler
 from vyper.exceptions import (
     ArgumentException,
+    InterfaceViolation,
     InvalidReference,
     InvalidType,
     StructureException,
@@ -119,6 +120,20 @@ def foo():
     """,
         TypeMismatch,
     ),
+    (
+        """
+interface A:
+    def f(a: uint256): view
+
+implements: A
+
+@external
+@nonpayable
+def f(a: uint256): # visibility is nonpayable instead of view
+    pass
+    """,
+        InterfaceViolation,
+    ),
 ]
 
 
diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index c184c44c5b..10711edc8e 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -387,9 +387,10 @@ def getter_from_VariableDecl(cls, node: vy_ast.VariableDecl) -> "ContractFunctio
     def _iface_sig(self) -> Tuple[Tuple, Optional[VyperType]]:
         return tuple(self.argument_types), self.return_type
 
-    def compare_signature(self, other: "ContractFunctionT") -> bool:
+    def implements(self, other: "ContractFunctionT") -> bool:
         """
-        Compare the signature of this function with another function.
+        Checks if this function implements the signature of another
+        function.
 
         Used when determining if an interface has been implemented. This method
         should not be directly implemented by any inherited classes.
@@ -406,9 +407,13 @@ def compare_signature(self, other: "ContractFunctionT") -> bool:
         for atyp, btyp in zip(arguments, other_arguments):
             if not atyp.compare_type(btyp):
                 return False
+
         if return_type and not return_type.compare_type(other_return_type):  # type: ignore
             return False
 
+        if self.mutability > other.mutability:
+            return False
+
         return True
 
     @cached_property
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index ad61da54d9..a603691410 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -324,7 +324,7 @@ def _is_function_implemented(fn_name, fn_type):
             else:
                 return False
 
-            return to_compare.compare_signature(fn_type)
+            return to_compare.implements(fn_type)
 
         # check for missing functions
         for name, type_ in self.members.items():
@@ -345,6 +345,9 @@ def _is_function_implemented(fn_name, fn_type):
                 unimplemented.append(name)
 
         if len(unimplemented) > 0:
+            # TODO: improve the error message for cases where the
+            # mismatch is small (like mutability, or just one argument
+            # is off, etc).
             missing_str = ", ".join(sorted(unimplemented))
             raise InterfaceViolation(
                 f"Contract does not implement all interface functions or events: {missing_str}",

From de433bad8f2501429a2923bb34b9420c628d1728 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 19:02:21 -0400
Subject: [PATCH 037/161] fix: disallow logging from pure, view functions
 (#3424)

---
 .../parser/features/decorators/test_private.py |  2 +-
 tests/parser/syntax/test_logging.py            | 18 +++++++++++++++++-
 vyper/semantics/analysis/local.py              |  4 ++++
 3 files changed, 22 insertions(+), 2 deletions(-)

diff --git a/tests/parser/features/decorators/test_private.py b/tests/parser/features/decorators/test_private.py
index b984921835..7c92f72af9 100644
--- a/tests/parser/features/decorators/test_private.py
+++ b/tests/parser/features/decorators/test_private.py
@@ -433,7 +433,7 @@ def i_am_me() -> bool:
     return msg.sender == self._whoami()
 
 @external
-@view
+@nonpayable
 def whoami() -> address:
     log Addr(self._whoami())
     return self._whoami()
diff --git a/tests/parser/syntax/test_logging.py b/tests/parser/syntax/test_logging.py
index 39573642c0..2dd21e7a92 100644
--- a/tests/parser/syntax/test_logging.py
+++ b/tests/parser/syntax/test_logging.py
@@ -1,7 +1,7 @@
 import pytest
 
 from vyper import compiler
-from vyper.exceptions import InvalidType, TypeMismatch
+from vyper.exceptions import InvalidType, StructureException, TypeMismatch
 
 fail_list = [
     """
@@ -45,3 +45,19 @@ def test_logging_fail(bad_code):
     else:
         with pytest.raises(TypeMismatch):
             compiler.compile_code(bad_code)
+
+
+@pytest.mark.parametrize("mutability", ["@pure", "@view"])
+@pytest.mark.parametrize("visibility", ["@internal", "@external"])
+def test_logging_from_non_mutable(mutability, visibility):
+    code = f"""
+event Test:
+    n: uint256
+
+{visibility}
+{mutability}
+def test():
+    log Test(1)
+    """
+    with pytest.raises(StructureException):
+        compiler.compile_code(code)
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index a09a8476d6..790cee52d6 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -543,6 +543,10 @@ def visit_Log(self, node):
         f = get_exact_type_from_node(node.value.func)
         if not is_type_t(f, EventT):
             raise StructureException("Value is not an event", node.value)
+        if self.func.mutability <= StateMutability.VIEW:
+            raise StructureException(
+                f"Cannot emit logs from {self.func.mutability.value.lower()} functions", node
+            )
         f.fetch_call_return(node.value)
         self.expr_visitor.visit(node.value)
 

From 4f9f8133191c25841e309ad26f3124dbe2a46b21 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 17 May 2023 19:18:13 -0400
Subject: [PATCH 038/161] fix: generate separate function names depending on
 context (#3423)

for backends (like zksync) which only have a single compilation context
(i.e., they do not split initcode and runtime code like EVM), they need
separate names for the two different codes generated per-function as of
c202c4e3ec8. this is also hygienic - since the two functions actually
have different codes as of c202c4e3ec8, give them different names.
---
 tests/compiler/asm/test_asm_optimizer.py                | 4 ++--
 tests/parser/test_call_graph_stability.py               | 4 +++-
 vyper/codegen/function_definitions/common.py            | 6 +++---
 vyper/codegen/function_definitions/internal_function.py | 2 +-
 vyper/codegen/self_call.py                              | 5 +++--
 5 files changed, 12 insertions(+), 9 deletions(-)

diff --git a/tests/compiler/asm/test_asm_optimizer.py b/tests/compiler/asm/test_asm_optimizer.py
index 524b8df064..b82d568ff8 100644
--- a/tests/compiler/asm/test_asm_optimizer.py
+++ b/tests/compiler/asm/test_asm_optimizer.py
@@ -31,8 +31,8 @@ def __init__():
 
     # all the labels should be in all the unoptimized asms
     for s in (foo_label, qux_label):
-        assert s in initcode_asm
-        assert s in runtime_asm
+        assert s + "_deploy" in initcode_asm
+        assert s + "_runtime" in runtime_asm
 
     c = CompilerData(code, no_optimize=False)
     initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
diff --git a/tests/parser/test_call_graph_stability.py b/tests/parser/test_call_graph_stability.py
index 6f78b50053..b651092d16 100644
--- a/tests/parser/test_call_graph_stability.py
+++ b/tests/parser/test_call_graph_stability.py
@@ -70,4 +70,6 @@ def foo():
                 r = d.args[0].args[0].value
                 if isinstance(r, str) and r.startswith("internal"):
                     ir_funcs.append(r)
-        assert ir_funcs == [f._ir_info.internal_function_label for f in sigs.values()]
+        assert ir_funcs == [
+            f._ir_info.internal_function_label(is_ctor_context=False) for f in sigs.values()
+        ]
diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index 431693caaa..45b97831aa 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -57,10 +57,10 @@ def external_function_base_entry_label(self) -> str:
         assert not self.func_t.is_internal, "uh oh, should be external"
         return self.ir_identifier + "_common"
 
-    @property
-    def internal_function_label(self) -> str:
+    def internal_function_label(self, is_ctor_context: bool = False) -> str:
         assert self.func_t.is_internal, "uh oh, should be internal"
-        return self.ir_identifier
+        suffix = "_deploy" if is_ctor_context else "_runtime"
+        return self.ir_identifier + suffix
 
 
 def generate_ir_for_function(
diff --git a/vyper/codegen/function_definitions/internal_function.py b/vyper/codegen/function_definitions/internal_function.py
index d27d8e36e3..17479c4c07 100644
--- a/vyper/codegen/function_definitions/internal_function.py
+++ b/vyper/codegen/function_definitions/internal_function.py
@@ -46,7 +46,7 @@ def generate_ir_for_internal_function(
 
     nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_t)
 
-    function_entry_label = func_t._ir_info.internal_function_label
+    function_entry_label = func_t._ir_info.internal_function_label(context.is_ctor_context)
     cleanup_label = func_t._ir_info.exit_sequence_label
 
     stack_args = ["var_list"]
diff --git a/vyper/codegen/self_call.py b/vyper/codegen/self_call.py
index 42a9bf2f11..311576194b 100644
--- a/vyper/codegen/self_call.py
+++ b/vyper/codegen/self_call.py
@@ -62,7 +62,8 @@ def ir_for_self_call(stmt_expr, context):
         )
 
     # note: internal_function_label asserts `func_t.is_internal`.
-    return_label = _generate_label(f"{func_t._ir_info.internal_function_label}_call")
+    _label = func_t._ir_info.internal_function_label(context.is_ctor_context)
+    return_label = _generate_label(f"{_label}_call")
 
     # allocate space for the return buffer
     # TODO allocate in stmt and/or expr.py
@@ -98,7 +99,7 @@ def ir_for_self_call(stmt_expr, context):
     else:
         copy_args = make_setter(args_dst, args_as_tuple)
 
-    goto_op = ["goto", func_t._ir_info.internal_function_label]
+    goto_op = ["goto", func_t._ir_info.internal_function_label(context.is_ctor_context)]
     # pass return buffer to subroutine
     if return_buffer is not None:
         goto_op += [return_buffer]

From 1ac8362df0c9d501af241df63bc3798cab7f5f9c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 18 May 2023 09:49:12 -0400
Subject: [PATCH 039/161] feat: use new push0 opcode (#3361)

per the shanghai fork - during codegen, use the new `push0` opcode
instead of the `push1 0` sequence
---
 setup.py                             |  4 ++--
 tests/compiler/ir/test_compile_ir.py |  2 +-
 tests/compiler/test_opcodes.py       | 31 ++++++++++++++++------------
 tests/compiler/test_sha3_32.py       |  3 +++
 vyper/compiler/output.py             |  4 ++--
 vyper/evm/opcodes.py                 |  4 +++-
 vyper/ir/compile_ir.py               | 28 ++++++++++---------------
 7 files changed, 40 insertions(+), 36 deletions(-)

diff --git a/setup.py b/setup.py
index 0966a8e31a..05cb52259d 100644
--- a/setup.py
+++ b/setup.py
@@ -14,8 +14,8 @@
         "pytest-xdist>=2.5,<3.0",
         "pytest-split>=0.7.0,<1.0",
         "pytest-rerunfailures>=10.2,<11",
-        "eth-tester[py-evm]>=0.8.0b3,<0.9",
-        "py-evm>=0.6.1a2,<0.7",
+        "eth-tester[py-evm]>=0.9.0b1,<0.10",
+        "py-evm>=0.7.0a1,<0.8",
         "web3==6.0.0",
         "tox>=3.15,<4.0",
         "lark==1.1.2",
diff --git a/tests/compiler/ir/test_compile_ir.py b/tests/compiler/ir/test_compile_ir.py
index 91007da33a..706c31e0f2 100644
--- a/tests/compiler/ir/test_compile_ir.py
+++ b/tests/compiler/ir/test_compile_ir.py
@@ -68,4 +68,4 @@ def test_pc_debugger():
     debugger_ir = ["seq", ["mstore", 0, 32], ["pc_debugger"]]
     ir_nodes = IRnode.from_list(debugger_ir)
     _, line_number_map = compile_ir.assembly_to_evm(compile_ir.compile_to_assembly(ir_nodes))
-    assert line_number_map["pc_breakpoints"][0] == 5
+    assert line_number_map["pc_breakpoints"][0] == 4
diff --git a/tests/compiler/test_opcodes.py b/tests/compiler/test_opcodes.py
index 67ea10c311..f36fcfac6f 100644
--- a/tests/compiler/test_opcodes.py
+++ b/tests/compiler/test_opcodes.py
@@ -8,9 +8,11 @@
 @pytest.fixture(params=list(opcodes.EVM_VERSIONS))
 def evm_version(request):
     default = opcodes.active_evm_version
-    opcodes.active_evm_version = opcodes.EVM_VERSIONS[request.param]
-    yield request.param
-    opcodes.active_evm_version = default
+    try:
+        opcodes.active_evm_version = opcodes.EVM_VERSIONS[request.param]
+        yield request.param
+    finally:
+        opcodes.active_evm_version = default
 
 
 def test_opcodes():
@@ -42,17 +44,20 @@ def test_version_check(evm_version):
 
 
 def test_get_opcodes(evm_version):
-    op = opcodes.get_opcodes()
-    if evm_version in ("paris", "berlin"):
-        assert "CHAINID" in op
-        assert op["SLOAD"][-1] == 2100
+    ops = opcodes.get_opcodes()
+    if evm_version in ("paris", "berlin", "shanghai"):
+        assert "CHAINID" in ops
+        assert ops["SLOAD"][-1] == 2100
+        if evm_version in ("shanghai",):
+            assert "PUSH0" in ops
     elif evm_version == "istanbul":
-        assert "CHAINID" in op
-        assert op["SLOAD"][-1] == 800
+        assert "CHAINID" in ops
+        assert ops["SLOAD"][-1] == 800
     else:
-        assert "CHAINID" not in op
-        assert op["SLOAD"][-1] == 200
+        assert "CHAINID" not in ops
+        assert ops["SLOAD"][-1] == 200
+
     if evm_version in ("byzantium", "atlantis"):
-        assert "CREATE2" not in op
+        assert "CREATE2" not in ops
     else:
-        assert op["CREATE2"][-1] == 32000
+        assert ops["CREATE2"][-1] == 32000
diff --git a/tests/compiler/test_sha3_32.py b/tests/compiler/test_sha3_32.py
index 9fbdf6f000..e1cbf9c843 100644
--- a/tests/compiler/test_sha3_32.py
+++ b/tests/compiler/test_sha3_32.py
@@ -1,9 +1,12 @@
 from vyper.codegen.ir_node import IRnode
+from vyper.evm.opcodes import version_check
 from vyper.ir import compile_ir, optimizer
 
 
 def test_sha3_32():
     ir = ["sha3_32", 0]
     evm = ["PUSH1", 0, "PUSH1", 0, "MSTORE", "PUSH1", 32, "PUSH1", 0, "SHA3"]
+    if version_check(begin="shanghai"):
+        evm = ["PUSH0", "PUSH0", "MSTORE", "PUSH1", 32, "PUSH0", "SHA3"]
     assert compile_ir.compile_to_assembly(IRnode.from_list(ir)) == evm
     assert compile_ir.compile_to_assembly(optimizer.optimize(IRnode.from_list(ir))) == evm
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index e30f021c6b..f061bd8e18 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -208,7 +208,7 @@ def _build_asm(asm_list):
         else:
             output_string += str(node) + " "
 
-            if isinstance(node, str) and node.startswith("PUSH"):
+            if isinstance(node, str) and node.startswith("PUSH") and node != "PUSH0":
                 assert in_push == 0
                 in_push = int(node[4:])
                 output_string += "0x"
@@ -303,7 +303,7 @@ def _build_opcodes(bytecode: bytes) -> str:
     while bytecode_sequence:
         op = bytecode_sequence.popleft()
         opcode_output.append(opcode_map[op])
-        if "PUSH" in opcode_output[-1]:
+        if "PUSH" in opcode_output[-1] and opcode_output[-1] != "PUSH0":
             push_len = int(opcode_map[op][4:])
             push_values = [hex(bytecode_sequence.popleft())[2:] for i in range(push_len)]
             opcode_output.append(f"0x{''.join(push_values).upper()}")
diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index b9f1e77ca8..76529da14e 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -25,11 +25,12 @@
     "istanbul": 2,
     "berlin": 3,
     "paris": 4,
+    "shanghai": 5,
     # ETC Forks
     "atlantis": 0,
     "agharta": 1,
 }
-DEFAULT_EVM_VERSION: str = "paris"
+DEFAULT_EVM_VERSION: str = "shanghai"
 
 
 # opcode as hex value
@@ -102,6 +103,7 @@
     "MSIZE": (0x59, 0, 1, 2),
     "GAS": (0x5A, 0, 1, 2),
     "JUMPDEST": (0x5B, 0, 0, 1),
+    "PUSH0": (0x5F, 0, 1, 2),
     "PUSH1": (0x60, 0, 1, 3),
     "PUSH2": (0x61, 0, 1, 3),
     "PUSH3": (0x62, 0, 1, 3),
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index c24b3a67a2..57ea4ca7e7 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -3,7 +3,7 @@
 import math
 
 from vyper.codegen.ir_node import IRnode
-from vyper.evm.opcodes import get_opcodes
+from vyper.evm.opcodes import get_opcodes, version_check
 from vyper.exceptions import CodegenPanic, CompilerPanic
 from vyper.utils import MemoryPositions
 from vyper.version import version_tuple
@@ -23,7 +23,8 @@ def num_to_bytearray(x):
 
 def PUSH(x):
     bs = num_to_bytearray(x)
-    if len(bs) == 0:
+    # starting in shanghai, can do push0 directly with no immediates
+    if len(bs) == 0 and not version_check(begin="shanghai"):
         bs = [0]
     return [f"PUSH{len(bs)}"] + bs
 
@@ -149,7 +150,7 @@ def _add_postambles(asm_ops):
 
     global _revert_label
 
-    _revert_string = [_revert_label, "JUMPDEST", "PUSH1", 0, "DUP1", "REVERT"]
+    _revert_string = [_revert_label, "JUMPDEST", *PUSH(0), "DUP1", "REVERT"]
 
     if _revert_label in asm_ops:
         # shared failure block
@@ -555,13 +556,10 @@ def _height_of(witharg):
         o = _compile_to_assembly(code.args[0], withargs, existing_labels, break_dest, height)
         o.extend(
             [
-                "PUSH1",
-                MemoryPositions.FREE_VAR_SPACE,
+                *PUSH(MemoryPositions.FREE_VAR_SPACE),
                 "MSTORE",
-                "PUSH1",
-                32,
-                "PUSH1",
-                MemoryPositions.FREE_VAR_SPACE,
+                *PUSH(32),
+                *PUSH(MemoryPositions.FREE_VAR_SPACE),
                 "SHA3",
             ]
         )
@@ -572,16 +570,12 @@ def _height_of(witharg):
         o.extend(_compile_to_assembly(code.args[1], withargs, existing_labels, break_dest, height))
         o.extend(
             [
-                "PUSH1",
-                MemoryPositions.FREE_VAR_SPACE2,
+                *PUSH(MemoryPositions.FREE_VAR_SPACE2),
                 "MSTORE",
-                "PUSH1",
-                MemoryPositions.FREE_VAR_SPACE,
+                *PUSH(MemoryPositions.FREE_VAR_SPACE),
                 "MSTORE",
-                "PUSH1",
-                64,
-                "PUSH1",
-                MemoryPositions.FREE_VAR_SPACE,
+                *PUSH(64),
+                *PUSH(MemoryPositions.FREE_VAR_SPACE),
                 "SHA3",
             ]
         )

From 8aaaa9dbf64d537f57ae73d0db7f48682cecc5c2 Mon Sep 17 00:00:00 2001
From: Kelvin Fan <kelvinfan001@gmail.com>
Date: Thu, 18 May 2023 07:08:00 -0700
Subject: [PATCH 040/161] feat: build for aarch64 (#2687)

Use `universal2` as target arch in pyinstaller

To also build official binary releases for aarch64 machines.

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 Makefile | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/Makefile b/Makefile
index daa1c2bfc9..645b800e79 100644
--- a/Makefile
+++ b/Makefile
@@ -43,7 +43,7 @@ freeze: clean init
 	echo Generating binary...
 	export OS="$$(uname -s | tr A-Z a-z)" && \
 	export VERSION="$$(PYTHONPATH=. python vyper/cli/vyper_compile.py --version)" && \
-	pyinstaller --clean --onefile vyper/cli/vyper_compile.py --name "vyper.$${VERSION}.$${OS}" --add-data vyper:vyper
+	pyinstaller --target-architecture=universal2 --clean --onefile vyper/cli/vyper_compile.py --name "vyper.$${VERSION}.$${OS}" --add-data vyper:vyper
 
 clean: clean-build clean-docs clean-pyc clean-test
 

From a8382f53b70f185fc3035dbfea561ed0737d0463 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 18 May 2023 10:18:33 -0400
Subject: [PATCH 041/161] fix: uninitialized immutable values (#3409)

immutable variables can be read before assignment in constructor code,
and their memory location is accessed, but that memory might not yet
be initialized. prior to this commit, its value is not necessarily
`empty(type)` since memory could have been written to ephemerally. in
particular, `create_copy_of` (and its sister, `create_from_blueprint`)
use `msize` to determine a starting location for where to copy the
target bytecode into memory, while the immutables section start is
determined using the static memory allocator. in case that `msize` is
still less than the immutables section end, `create_copy_of` can write
to the immutables section, thereby resulting in reads from the
immutables section to return garbage.

this commit fixes the issue by issuing an `iload
<immutables_section_end> - 32` before executing any initcode, which
forces `msize` to be initialized past the end of the immutables section
(and therefore, accessing an immutable before it is initialized in the
constructor will produce the "expected" `empty()` value for the
immutable).

note that a corresponding `mload` is not required for runtime code,
because vyper requires all memory variables to be instantiated at the
declaration site, so there is no way that msize can produce a pointer to
an uninitialized memory variable.
---
 tests/parser/features/test_immutable.py | 50 +++++++++++++++++++++++++
 vyper/codegen/module.py                 | 21 ++++++++++-
 2 files changed, 70 insertions(+), 1 deletion(-)

diff --git a/tests/parser/features/test_immutable.py b/tests/parser/features/test_immutable.py
index 488943f784..7300d0f2d9 100644
--- a/tests/parser/features/test_immutable.py
+++ b/tests/parser/features/test_immutable.py
@@ -241,6 +241,56 @@ def get_immutable() -> uint256:
     assert c.get_immutable() == n + 2
 
 
+# GH issue 3101
+def test_immutables_initialized(get_contract):
+    dummy_code = """
+@external
+def foo() -> uint256:
+    return 1
+    """
+    dummy_contract = get_contract(dummy_code)
+
+    code = """
+a: public(immutable(uint256))
+b: public(uint256)
+
+@payable
+@external
+def __init__(to_copy: address):
+    c: address = create_copy_of(to_copy)
+    self.b = a
+    a = 12
+    """
+    c = get_contract(code, dummy_contract.address)
+
+    assert c.b() == 0
+
+
+# GH issue 3101, take 2
+def test_immutables_initialized2(get_contract, get_contract_from_ir):
+    dummy_contract = get_contract_from_ir(
+        ["deploy", 0, ["seq"] + ["invalid"] * 600, 0], no_optimize=True
+    )
+
+    # rekt because immutables section extends past allocated memory
+    code = """
+a0: immutable(uint256[10])
+a: public(immutable(uint256))
+b: public(uint256)
+
+@payable
+@external
+def __init__(to_copy: address):
+    c: address = create_copy_of(to_copy)
+    self.b = a
+    a = 12
+    a0 = empty(uint256[10])
+    """
+    c = get_contract(code, dummy_contract.address)
+
+    assert c.b() == 0
+
+
 # GH issue 3292
 def test_internal_functions_called_by_ctor_location(get_contract):
     code = """
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 320cf43b55..5d05c27e0b 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -153,12 +153,31 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
         init_func_ir = generate_ir_for_function(
             init_function, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
         )
-        deploy_code.append(init_func_ir)
 
         # pass the amount of memory allocated for the init function
         # so that deployment does not clobber while preparing immutables
         # note: (deploy mem_ofst, code, extra_padding)
         init_mem_used = init_function._metadata["type"]._ir_info.frame_info.mem_used
+
+        # force msize to be initialized past the end of immutables section
+        # so that builtins which use `msize` for "dynamic" memory
+        # allocation do not clobber uninitialized immutables.
+        # cf. GH issue 3101.
+        # note mload/iload X touches bytes from X to X+32, and msize rounds up
+        # to the nearest 32, so `iload`ing `immutables_len - 32` guarantees
+        # that `msize` will refer to a memory location of at least
+        # `<immutables_start> + immutables_len` (where <immutables_start> ==
+        # `_mem_deploy_end` as defined in the assembler).
+        # note:
+        #   mload 32 => msize == 64
+        #   mload 33 => msize == 96
+        # assumption in general: (mload X) => msize == ceil32(X + 32)
+        # see py-evm extend_memory: after_size = ceil32(start_position + size)
+        if immutables_len > 0:
+            deploy_code.append(["iload", max(0, immutables_len - 32)])
+
+        deploy_code.append(init_func_ir)
+
         deploy_code.append(["deploy", init_mem_used, runtime, immutables_len])
 
         # internal functions come after everything else

From 6ee74f5af58507029192732f828e13c431c273a3 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Fri, 19 May 2023 01:05:49 +0800
Subject: [PATCH 042/161] fix: complex arguments to builtin functions (#3167)

prior to this commit, some builtin functions including ceil, would panic
if their arguments were function calls (or otherwise determined to be
complex expressions by `is_complex_ir`). this commit fixes the relevant
builtin functions by using `cache_when_complex` where appropriate.

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/conftest.py                             |  35 ++++
 tests/parser/functions/test_addmod.py         |  57 ++++++
 tests/parser/functions/test_as_wei_value.py   |  31 ++++
 tests/parser/functions/test_ceil.py           |  34 ++++
 tests/parser/functions/test_ec.py             |  62 +++++++
 tests/parser/functions/test_floor.py          |  34 ++++
 tests/parser/functions/test_mulmod.py         |  75 ++++++++
 .../types/numbers/test_unsigned_ints.py       |  43 -----
 vyper/builtins/functions.py                   | 167 ++++++++++--------
 9 files changed, 422 insertions(+), 116 deletions(-)
 create mode 100644 tests/parser/functions/test_addmod.py
 create mode 100644 tests/parser/functions/test_as_wei_value.py
 create mode 100644 tests/parser/functions/test_mulmod.py

diff --git a/tests/conftest.py b/tests/conftest.py
index e1d0996767..1cc9e4e72e 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -192,3 +192,38 @@ def _f(_addr, _salt, _initcode):
         return keccak(prefix + addr + salt + keccak(initcode))[12:]
 
     return _f
+
+
+@pytest.fixture
+def side_effects_contract(get_contract):
+    def generate(ret_type):
+        """
+        Generates a Vyper contract with an external `foo()` function, which
+        returns the specified return value of the specified return type, for
+        testing side effects using the `assert_side_effects_invoked` fixture.
+        """
+        code = f"""
+counter: public(uint256)
+
+@external
+def foo(s: {ret_type}) -> {ret_type}:
+    self.counter += 1
+    return s
+    """
+        contract = get_contract(code)
+        return contract
+
+    return generate
+
+
+@pytest.fixture
+def assert_side_effects_invoked():
+    def assert_side_effects_invoked(side_effects_contract, side_effects_trigger, n=1):
+        start_value = side_effects_contract.counter()
+
+        side_effects_trigger()
+
+        end_value = side_effects_contract.counter()
+        assert end_value == start_value + n
+
+    return assert_side_effects_invoked
diff --git a/tests/parser/functions/test_addmod.py b/tests/parser/functions/test_addmod.py
new file mode 100644
index 0000000000..67a7e9b101
--- /dev/null
+++ b/tests/parser/functions/test_addmod.py
@@ -0,0 +1,57 @@
+def test_uint256_addmod(assert_tx_failed, get_contract_with_gas_estimation):
+    uint256_code = """
+@external
+def _uint256_addmod(x: uint256, y: uint256, z: uint256) -> uint256:
+    return uint256_addmod(x, y, z)
+    """
+
+    c = get_contract_with_gas_estimation(uint256_code)
+
+    assert c._uint256_addmod(1, 2, 2) == 1
+    assert c._uint256_addmod(32, 2, 32) == 2
+    assert c._uint256_addmod((2**256) - 1, 0, 2) == 1
+    assert c._uint256_addmod(2**255, 2**255, 6) == 4
+    assert_tx_failed(lambda: c._uint256_addmod(1, 2, 0))
+
+
+def test_uint256_addmod_ext_call(
+    w3, side_effects_contract, assert_side_effects_invoked, get_contract
+):
+    code = """
+@external
+def foo(f: Foo) -> uint256:
+    return uint256_addmod(32, 2, f.foo(32))
+
+interface Foo:
+    def foo(x: uint256) -> uint256: payable
+    """
+
+    c1 = side_effects_contract("uint256")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == 2
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_uint256_addmod_internal_call(get_contract_with_gas_estimation):
+    code = """
+@external
+def foo() -> uint256:
+    return uint256_addmod(self.a(), self.b(), self.c())
+
+@internal
+def a() -> uint256:
+    return 32
+
+@internal
+def b() -> uint256:
+    return 2
+
+@internal
+def c() -> uint256:
+    return 32
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo() == 2
diff --git a/tests/parser/functions/test_as_wei_value.py b/tests/parser/functions/test_as_wei_value.py
new file mode 100644
index 0000000000..bab0aed616
--- /dev/null
+++ b/tests/parser/functions/test_as_wei_value.py
@@ -0,0 +1,31 @@
+def test_ext_call(w3, side_effects_contract, assert_side_effects_invoked, get_contract):
+    code = """
+@external
+def foo(a: Foo) -> uint256:
+    return as_wei_value(a.foo(7), "ether")
+
+interface Foo:
+    def foo(x: uint8) -> uint8: nonpayable
+    """
+
+    c1 = side_effects_contract("uint8")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == w3.to_wei(7, "ether")
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_internal_call(w3, get_contract_with_gas_estimation):
+    code = """
+@external
+def foo() -> uint256:
+    return as_wei_value(self.bar(), "ether")
+
+@internal
+def bar() -> uint8:
+    return 7
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo() == w3.to_wei(7, "ether")
diff --git a/tests/parser/functions/test_ceil.py b/tests/parser/functions/test_ceil.py
index a9bcf62da2..daa9cb7c1b 100644
--- a/tests/parser/functions/test_ceil.py
+++ b/tests/parser/functions/test_ceil.py
@@ -104,3 +104,37 @@ def ceil_param(p: decimal) -> int256:
     assert c.fou() == -3
     assert c.ceil_param(Decimal("-0.5")) == 0
     assert c.ceil_param(Decimal("-7777777.7777777")) == -7777777
+
+
+def test_ceil_ext_call(w3, side_effects_contract, assert_side_effects_invoked, get_contract):
+    code = """
+@external
+def foo(a: Foo) -> int256:
+    return ceil(a.foo(2.5))
+
+interface Foo:
+    def foo(x: decimal) -> decimal: payable
+    """
+
+    c1 = side_effects_contract("decimal")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == 3
+
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_ceil_internal_call(get_contract_with_gas_estimation):
+    code = """
+@external
+def foo() -> int256:
+    return ceil(self.bar())
+
+@internal
+def bar() -> decimal:
+    return 2.5
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo() == 3
diff --git a/tests/parser/functions/test_ec.py b/tests/parser/functions/test_ec.py
index be0f6f7ed2..9ce37d0721 100644
--- a/tests/parser/functions/test_ec.py
+++ b/tests/parser/functions/test_ec.py
@@ -45,6 +45,37 @@ def _ecadd3(x: uint256[2], y: uint256[2]) -> uint256[2]:
     assert c._ecadd3(G1, negative_G1) == [0, 0]
 
 
+def test_ecadd_internal_call(get_contract_with_gas_estimation):
+    code = """
+@internal
+def a() -> uint256[2]:
+    return [1, 2]
+
+@external
+def foo() -> uint256[2]:
+    return ecadd([1, 2], self.a())
+    """
+    c = get_contract_with_gas_estimation(code)
+    assert c.foo() == G1_times_two
+
+
+def test_ecadd_ext_call(w3, side_effects_contract, assert_side_effects_invoked, get_contract):
+    code = """
+interface Foo:
+    def foo(x: uint256[2]) -> uint256[2]: payable
+
+@external
+def foo(a: Foo) -> uint256[2]:
+    return ecadd([1, 2], a.foo([1, 2]))
+    """
+    c1 = side_effects_contract("uint256[2]")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == G1_times_two
+
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
 def test_ecmul(get_contract_with_gas_estimation):
     ecmuller = """
 x3: uint256[2]
@@ -74,3 +105,34 @@ def _ecmul3(x: uint256[2], y: uint256) -> uint256[2]:
     assert c._ecmul(G1, 3) == G1_times_three
     assert c._ecmul(G1, curve_order - 1) == negative_G1
     assert c._ecmul(G1, curve_order) == [0, 0]
+
+
+def test_ecmul_internal_call(get_contract_with_gas_estimation):
+    code = """
+@internal
+def a() -> uint256:
+    return 3
+
+@external
+def foo() -> uint256[2]:
+    return ecmul([1, 2], self.a())
+    """
+    c = get_contract_with_gas_estimation(code)
+    assert c.foo() == G1_times_three
+
+
+def test_ecmul_ext_call(w3, side_effects_contract, assert_side_effects_invoked, get_contract):
+    code = """
+interface Foo:
+    def foo(x: uint256) -> uint256: payable
+
+@external
+def foo(a: Foo) -> uint256[2]:
+    return ecmul([1, 2], a.foo(3))
+    """
+    c1 = side_effects_contract("uint256")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == G1_times_three
+
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
diff --git a/tests/parser/functions/test_floor.py b/tests/parser/functions/test_floor.py
index dc53545ac3..d2fd993785 100644
--- a/tests/parser/functions/test_floor.py
+++ b/tests/parser/functions/test_floor.py
@@ -108,3 +108,37 @@ def floor_param(p: decimal) -> int256:
     assert c.fou() == -4
     assert c.floor_param(Decimal("-5.6")) == -6
     assert c.floor_param(Decimal("-0.0000000001")) == -1
+
+
+def test_floor_ext_call(w3, side_effects_contract, assert_side_effects_invoked, get_contract):
+    code = """
+@external
+def foo(a: Foo) -> int256:
+    return floor(a.foo(2.5))
+
+interface Foo:
+    def foo(x: decimal) -> decimal: nonpayable
+    """
+
+    c1 = side_effects_contract("decimal")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == 2
+
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_floor_internal_call(get_contract_with_gas_estimation):
+    code = """
+@external
+def foo() -> int256:
+    return floor(self.bar())
+
+@internal
+def bar() -> decimal:
+    return 2.5
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo() == 2
diff --git a/tests/parser/functions/test_mulmod.py b/tests/parser/functions/test_mulmod.py
new file mode 100644
index 0000000000..1ea7a3f8e8
--- /dev/null
+++ b/tests/parser/functions/test_mulmod.py
@@ -0,0 +1,75 @@
+def test_uint256_mulmod(assert_tx_failed, get_contract_with_gas_estimation):
+    uint256_code = """
+@external
+def _uint256_mulmod(x: uint256, y: uint256, z: uint256) -> uint256:
+    return uint256_mulmod(x, y, z)
+    """
+
+    c = get_contract_with_gas_estimation(uint256_code)
+
+    assert c._uint256_mulmod(3, 1, 2) == 1
+    assert c._uint256_mulmod(200, 3, 601) == 600
+    assert c._uint256_mulmod(2**255, 1, 3) == 2
+    assert c._uint256_mulmod(2**255, 2, 6) == 4
+    assert_tx_failed(lambda: c._uint256_mulmod(2, 2, 0))
+
+
+def test_uint256_mulmod_complex(get_contract_with_gas_estimation):
+    modexper = """
+@external
+def exponential(base: uint256, exponent: uint256, modulus: uint256) -> uint256:
+    o: uint256 = 1
+    for i in range(256):
+        o = uint256_mulmod(o, o, modulus)
+        if exponent & shift(1, 255 - i) != 0:
+            o = uint256_mulmod(o, base, modulus)
+    return o
+    """
+
+    c = get_contract_with_gas_estimation(modexper)
+    assert c.exponential(3, 5, 100) == 43
+    assert c.exponential(2, 997, 997) == 2
+
+
+def test_uint256_mulmod_ext_call(
+    w3, side_effects_contract, assert_side_effects_invoked, get_contract
+):
+    code = """
+@external
+def foo(f: Foo) -> uint256:
+    return uint256_mulmod(200, 3, f.foo(601))
+
+interface Foo:
+    def foo(x: uint256) -> uint256: nonpayable
+    """
+
+    c1 = side_effects_contract("uint256")
+    c2 = get_contract(code)
+
+    assert c2.foo(c1.address) == 600
+
+    assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_uint256_mulmod_internal_call(get_contract_with_gas_estimation):
+    code = """
+@external
+def foo() -> uint256:
+    return uint256_mulmod(self.a(), self.b(), self.c())
+
+@internal
+def a() -> uint256:
+    return 200
+
+@internal
+def b() -> uint256:
+    return 3
+
+@internal
+def c() -> uint256:
+    return 601
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo() == 600
diff --git a/tests/parser/types/numbers/test_unsigned_ints.py b/tests/parser/types/numbers/test_unsigned_ints.py
index 82c0f8484c..683684e6be 100644
--- a/tests/parser/types/numbers/test_unsigned_ints.py
+++ b/tests/parser/types/numbers/test_unsigned_ints.py
@@ -195,49 +195,6 @@ def foo(x: {typ}, y: {typ}) -> bool:
         assert c.foo(x, y) is expected
 
 
-# TODO move to tests/parser/functions/test_mulmod.py and test_addmod.py
-def test_uint256_mod(assert_tx_failed, get_contract_with_gas_estimation):
-    uint256_code = """
-@external
-def _uint256_addmod(x: uint256, y: uint256, z: uint256) -> uint256:
-    return uint256_addmod(x, y, z)
-
-@external
-def _uint256_mulmod(x: uint256, y: uint256, z: uint256) -> uint256:
-    return uint256_mulmod(x, y, z)
-    """
-
-    c = get_contract_with_gas_estimation(uint256_code)
-
-    assert c._uint256_addmod(1, 2, 2) == 1
-    assert c._uint256_addmod(32, 2, 32) == 2
-    assert c._uint256_addmod((2**256) - 1, 0, 2) == 1
-    assert c._uint256_addmod(2**255, 2**255, 6) == 4
-    assert_tx_failed(lambda: c._uint256_addmod(1, 2, 0))
-    assert c._uint256_mulmod(3, 1, 2) == 1
-    assert c._uint256_mulmod(200, 3, 601) == 600
-    assert c._uint256_mulmod(2**255, 1, 3) == 2
-    assert c._uint256_mulmod(2**255, 2, 6) == 4
-    assert_tx_failed(lambda: c._uint256_mulmod(2, 2, 0))
-
-
-def test_uint256_modmul(get_contract_with_gas_estimation):
-    modexper = """
-@external
-def exponential(base: uint256, exponent: uint256, modulus: uint256) -> uint256:
-    o: uint256 = 1
-    for i in range(256):
-        o = uint256_mulmod(o, o, modulus)
-        if exponent & (1 << (255 - i)) != 0:
-            o = uint256_mulmod(o, base, modulus)
-    return o
-    """
-
-    c = get_contract_with_gas_estimation(modexper)
-    assert c.exponential(3, 5, 100) == 43
-    assert c.exponential(2, 997, 997) == 2
-
-
 @pytest.mark.parametrize("typ", types)
 def test_uint_literal(get_contract, assert_compile_failed, typ):
     lo, hi = typ.ast_bounds
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index bfe90bb669..915f10ede3 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -148,15 +148,18 @@ def evaluate(self, node):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        return IRnode.from_list(
-            [
-                "if",
-                ["slt", args[0], 0],
-                ["sdiv", ["sub", args[0], DECIMAL_DIVISOR - 1], DECIMAL_DIVISOR],
-                ["sdiv", args[0], DECIMAL_DIVISOR],
-            ],
-            typ=INT256_T,
-        )
+        arg = args[0]
+        with arg.cache_when_complex("arg") as (b1, arg):
+            ret = IRnode.from_list(
+                [
+                    "if",
+                    ["slt", arg, 0],
+                    ["sdiv", ["sub", arg, DECIMAL_DIVISOR - 1], DECIMAL_DIVISOR],
+                    ["sdiv", arg, DECIMAL_DIVISOR],
+                ],
+                typ=INT256_T,
+            )
+            return b1.resolve(ret)
 
 
 class Ceil(BuiltinFunction):
@@ -175,15 +178,18 @@ def evaluate(self, node):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        return IRnode.from_list(
-            [
-                "if",
-                ["slt", args[0], 0],
-                ["sdiv", args[0], DECIMAL_DIVISOR],
-                ["sdiv", ["add", args[0], DECIMAL_DIVISOR - 1], DECIMAL_DIVISOR],
-            ],
-            typ=INT256_T,
-        )
+        arg = args[0]
+        with arg.cache_when_complex("arg") as (b1, arg):
+            ret = IRnode.from_list(
+                [
+                    "if",
+                    ["slt", arg, 0],
+                    ["sdiv", arg, DECIMAL_DIVISOR],
+                    ["sdiv", ["add", arg, DECIMAL_DIVISOR - 1], DECIMAL_DIVISOR],
+                ],
+                typ=INT256_T,
+            )
+            return b1.resolve(ret)
 
 
 class Convert(BuiltinFunction):
@@ -800,20 +806,25 @@ def build_IR(self, expr, args, kwargs, context):
         placeholder_node = IRnode.from_list(
             context.new_internal_variable(BytesT(128)), typ=BytesT(128), location=MEMORY
         )
-        o = IRnode.from_list(
-            [
-                "seq",
-                ["mstore", placeholder_node, _getelem(args[0], 0)],
-                ["mstore", ["add", placeholder_node, 32], _getelem(args[0], 1)],
-                ["mstore", ["add", placeholder_node, 64], _getelem(args[1], 0)],
-                ["mstore", ["add", placeholder_node, 96], _getelem(args[1], 1)],
-                ["assert", ["staticcall", ["gas"], 6, placeholder_node, 128, placeholder_node, 64]],
-                placeholder_node,
-            ],
-            typ=SArrayT(UINT256_T, 2),
-            location=MEMORY,
-        )
-        return o
+
+        with args[0].cache_when_complex("a") as (b1, a), args[1].cache_when_complex("b") as (b2, b):
+            o = IRnode.from_list(
+                [
+                    "seq",
+                    ["mstore", placeholder_node, _getelem(a, 0)],
+                    ["mstore", ["add", placeholder_node, 32], _getelem(a, 1)],
+                    ["mstore", ["add", placeholder_node, 64], _getelem(b, 0)],
+                    ["mstore", ["add", placeholder_node, 96], _getelem(b, 1)],
+                    [
+                        "assert",
+                        ["staticcall", ["gas"], 6, placeholder_node, 128, placeholder_node, 64],
+                    ],
+                    placeholder_node,
+                ],
+                typ=SArrayT(UINT256_T, 2),
+                location=MEMORY,
+            )
+            return b2.resolve(b1.resolve(o))
 
 
 class ECMul(BuiltinFunction):
@@ -826,19 +837,24 @@ def build_IR(self, expr, args, kwargs, context):
         placeholder_node = IRnode.from_list(
             context.new_internal_variable(BytesT(128)), typ=BytesT(128), location=MEMORY
         )
-        o = IRnode.from_list(
-            [
-                "seq",
-                ["mstore", placeholder_node, _getelem(args[0], 0)],
-                ["mstore", ["add", placeholder_node, 32], _getelem(args[0], 1)],
-                ["mstore", ["add", placeholder_node, 64], args[1]],
-                ["assert", ["staticcall", ["gas"], 7, placeholder_node, 96, placeholder_node, 64]],
-                placeholder_node,
-            ],
-            typ=SArrayT(UINT256_T, 2),
-            location=MEMORY,
-        )
-        return o
+
+        with args[0].cache_when_complex("a") as (b1, a), args[1].cache_when_complex("b") as (b2, b):
+            o = IRnode.from_list(
+                [
+                    "seq",
+                    ["mstore", placeholder_node, _getelem(a, 0)],
+                    ["mstore", ["add", placeholder_node, 32], _getelem(a, 1)],
+                    ["mstore", ["add", placeholder_node, 64], b],
+                    [
+                        "assert",
+                        ["staticcall", ["gas"], 7, placeholder_node, 96, placeholder_node, 64],
+                    ],
+                    placeholder_node,
+                ],
+                typ=SArrayT(UINT256_T, 2),
+                location=MEMORY,
+            )
+            return b2.resolve(b1.resolve(o))
 
 
 def _generic_element_getter(op):
@@ -1030,34 +1046,35 @@ def build_IR(self, expr, args, kwargs, context):
         value = args[0]
 
         denom_divisor = self.get_denomination(expr)
-        if value.typ in (UINT256_T, UINT8_T):
-            sub = [
-                "with",
-                "ans",
-                ["mul", value, denom_divisor],
-                [
-                    "seq",
+        with value.cache_when_complex("value") as (b1, value):
+            if value.typ in (UINT256_T, UINT8_T):
+                sub = [
+                    "with",
+                    "ans",
+                    ["mul", value, denom_divisor],
                     [
-                        "assert",
-                        ["or", ["eq", ["div", "ans", value], denom_divisor], ["iszero", value]],
+                        "seq",
+                        [
+                            "assert",
+                            ["or", ["eq", ["div", "ans", value], denom_divisor], ["iszero", value]],
+                        ],
+                        "ans",
                     ],
-                    "ans",
-                ],
-            ]
-        elif value.typ == INT128_T:
-            # signed types do not require bounds checks because the
-            # largest possible converted value will not overflow 2**256
-            sub = ["seq", ["assert", ["sgt", value, -1]], ["mul", value, denom_divisor]]
-        elif value.typ == DecimalT():
-            sub = [
-                "seq",
-                ["assert", ["sgt", value, -1]],
-                ["div", ["mul", value, denom_divisor], DECIMAL_DIVISOR],
-            ]
-        else:
-            raise CompilerPanic(f"Unexpected type: {value.typ}")
+                ]
+            elif value.typ == INT128_T:
+                # signed types do not require bounds checks because the
+                # largest possible converted value will not overflow 2**256
+                sub = ["seq", ["assert", ["sgt", value, -1]], ["mul", value, denom_divisor]]
+            elif value.typ == DecimalT():
+                sub = [
+                    "seq",
+                    ["assert", ["sgt", value, -1]],
+                    ["div", ["mul", value, denom_divisor], DECIMAL_DIVISOR],
+                ]
+            else:
+                raise CompilerPanic(f"Unexpected type: {value.typ}")
 
-        return IRnode.from_list(sub, typ=UINT256_T)
+            return IRnode.from_list(b1.resolve(sub), typ=UINT256_T)
 
 
 zero_value = IRnode.from_list(0, typ=UINT256_T)
@@ -1516,9 +1533,13 @@ def evaluate(self, node):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        return IRnode.from_list(
-            ["seq", ["assert", args[2]], [self._opcode, args[0], args[1], args[2]]], typ=UINT256_T
-        )
+        c = args[2]
+
+        with c.cache_when_complex("c") as (b1, c):
+            ret = IRnode.from_list(
+                ["seq", ["assert", c], [self._opcode, args[0], args[1], c]], typ=UINT256_T
+            )
+            return b1.resolve(ret)
 
 
 class AddMod(_AddMulMod):

From 27b6b893caad86c461c7980dd777abe42f716e19 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 18 May 2023 14:24:28 -0400
Subject: [PATCH 043/161] fix: calculate `active_evm_version` from
 `DEFAULT_EVM_VERSION` (#3427)

per 1ac8362df0c, the `DEFAULT_EVM_VERSION` is updated to shanghai, while
`active_evm_version` still points to paris. so entry points into the
compiler which don't use the @evm_wrapper wrapper might continue using
paris. this commit fixes the issue by calculating active_evm_version
from `DEFAULT_EVM_VERSION` so that only one value needs to be updated
going forward.
---
 vyper/evm/opcodes.py | 5 ++---
 1 file changed, 2 insertions(+), 3 deletions(-)

diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index 76529da14e..7ff56df772 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -3,8 +3,6 @@
 from vyper.exceptions import CompilerPanic
 from vyper.typing import OpcodeGasCost, OpcodeMap, OpcodeRulesetMap, OpcodeRulesetValue, OpcodeValue
 
-active_evm_version: int = 4
-
 # EVM version rules work as follows:
 # 1. Fork rules go from oldest (lowest value) to newest (highest value).
 # 2. Fork versions aren't actually tied to anything. They are not a part of our
@@ -17,7 +15,7 @@
 # 6. Yes, this will probably have to be rethought if there's ever conflicting support
 #    between multiple chains for a specific feature. Let's hope not.
 # 7. We support at a maximum 3 hard forks (for any given chain).
-EVM_VERSIONS: Dict[str, int] = {
+EVM_VERSIONS: dict[str, int] = {
     # ETH Forks
     "byzantium": 0,
     "constantinople": 1,
@@ -31,6 +29,7 @@
     "agharta": 1,
 }
 DEFAULT_EVM_VERSION: str = "shanghai"
+active_evm_version: int = EVM_VERSIONS[DEFAULT_EVM_VERSION]
 
 
 # opcode as hex value

From 5b9bca24e3ac82654ce78ba66d5932ab609b28a8 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 18 May 2023 18:07:40 -0400
Subject: [PATCH 044/161] chore: fix badges in README (#3428)

microbadger appears defunct, switch to shields.io
switch lgtm to codeql
---
 README.md | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/README.md b/README.md
index f17e693bf5..af987ffd4f 100644
--- a/README.md
+++ b/README.md
@@ -1,15 +1,15 @@
 
 <img src="https://raw.githubusercontent.com/vyperlang/vyper/master/logo/vyper-logo-transparent.svg?sanitize=true" alt="" width="110">
 
-[![Build Status](https://github.com/vyperlang/vyper/workflows/Test/badge.svg)](https://github.com/vyperlang/vyper/actions)
+[![Build Status](https://github.com/vyperlang/vyper/workflows/Test/badge.svg)](https://github.com/vyperlang/vyper/actions/workflows/test.yml)
 [![Documentation Status](https://readthedocs.org/projects/vyper/badge/?version=latest)](http://vyper.readthedocs.io/en/latest/?badge=latest "ReadTheDocs")
 [![Discord](https://img.shields.io/discord/969926564286459934.svg?label=%23vyper)](https://discord.gg/6tw7PTM7C2)
 
 [![PyPI](https://badge.fury.io/py/vyper.svg)](https://pypi.org/project/vyper "PyPI")
-[![Docker](https://images.microbadger.com/badges/version/vyperlang/vyper.svg)](https://hub.docker.com/r/vyperlang/vyper "DockerHub")
+[![Docker](https://img.shields.io/docker/cloud/build/vyperlang/vyper)](https://hub.docker.com/r/vyperlang/vyper "DockerHub")
 
 [![Coverage Status](https://codecov.io/gh/vyperlang/vyper/branch/master/graph/badge.svg)](https://codecov.io/gh/vyperlang/vyper "Codecov")
-[![Language grade: Python](https://img.shields.io/lgtm/grade/python/g/vyperlang/vyper.svg?logo=lgtm&logoWidth=18)](https://lgtm.com/projects/g/vyperlang/vyper/context:python)
+[![Language grade: Python](https://github.com/vyperlang/vyper/workflows/CodeQL/badge.svg)](https://github.com/vyperlang/vyper/actions/workflows/codeql.yml)
 
 # Getting Started
 See [Installing Vyper](http://vyper.readthedocs.io/en/latest/installing-vyper.html) to install vyper.

From ed0a654aa2f1069874c2c6d21b8932737aee3f6f Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 18 May 2023 18:27:38 -0400
Subject: [PATCH 045/161] transient storage keyword (#3373)

experimentally add support for transient storage via a new `transient`
keyword, which works like `immutable` or `constant`, ex.:

```vyper
my_transient_variable: transient(uint256)
```

this feature is considered experimental until py-evm adds support
(giving us the ability to actually test it). so this commit leaves the
default evm version as "shanghai" for now. it blocks the feature on
pre-cancun EVM versions, so users can't use it by accident - the only
way to use it is to explicitly enable it via `--evm-version=cancun`.
---
 tests/compiler/test_opcodes.py                |  7 ++-
 tests/parser/ast_utils/test_ast_dict.py       |  1 +
 .../features/decorators/test_nonreentrant.py  |  2 +
 tests/parser/features/test_transient.py       | 61 +++++++++++++++++++
 vyper/ast/nodes.py                            | 18 ++++--
 vyper/cli/vyper_compile.py                    |  3 +-
 vyper/codegen/context.py                      |  1 +
 vyper/codegen/core.py                         |  8 +--
 vyper/codegen/expr.py                         |  6 +-
 vyper/codegen/function_definitions/utils.py   | 10 ++-
 vyper/evm/address_space.py                    |  1 +
 vyper/evm/opcodes.py                          |  3 +
 vyper/semantics/analysis/base.py              |  1 +
 vyper/semantics/analysis/module.py            |  9 +++
 vyper/semantics/data_locations.py             |  2 +
 vyper/semantics/namespace.py                  |  1 +
 16 files changed, 118 insertions(+), 16 deletions(-)
 create mode 100644 tests/parser/features/test_transient.py

diff --git a/tests/compiler/test_opcodes.py b/tests/compiler/test_opcodes.py
index f36fcfac6f..3c595dee44 100644
--- a/tests/compiler/test_opcodes.py
+++ b/tests/compiler/test_opcodes.py
@@ -45,11 +45,14 @@ def test_version_check(evm_version):
 
 def test_get_opcodes(evm_version):
     ops = opcodes.get_opcodes()
-    if evm_version in ("paris", "berlin", "shanghai"):
+    if evm_version in ("paris", "berlin", "shanghai", "cancun"):
         assert "CHAINID" in ops
         assert ops["SLOAD"][-1] == 2100
-        if evm_version in ("shanghai",):
+        if evm_version in ("shanghai", "cancun"):
             assert "PUSH0" in ops
+        if evm_version in ("cancun",):
+            assert "TLOAD" in ops
+            assert "TSTORE" in ops
     elif evm_version == "istanbul":
         assert "CHAINID" in ops
         assert ops["SLOAD"][-1] == 800
diff --git a/tests/parser/ast_utils/test_ast_dict.py b/tests/parser/ast_utils/test_ast_dict.py
index 214af50f9f..f483d0cbe8 100644
--- a/tests/parser/ast_utils/test_ast_dict.py
+++ b/tests/parser/ast_utils/test_ast_dict.py
@@ -73,6 +73,7 @@ def test_basic_ast():
         "is_constant": False,
         "is_immutable": False,
         "is_public": False,
+        "is_transient": False,
     }
 
 
diff --git a/tests/parser/features/decorators/test_nonreentrant.py b/tests/parser/features/decorators/test_nonreentrant.py
index 0577313b88..ac73b35bec 100644
--- a/tests/parser/features/decorators/test_nonreentrant.py
+++ b/tests/parser/features/decorators/test_nonreentrant.py
@@ -3,6 +3,8 @@
 from vyper.exceptions import FunctionDeclarationException
 
 
+# TODO test functions in this module across all evm versions
+# once we have cancun support.
 def test_nonreentrant_decorator(get_contract, assert_tx_failed):
     calling_contract_code = """
 interface SpecialContract:
diff --git a/tests/parser/features/test_transient.py b/tests/parser/features/test_transient.py
new file mode 100644
index 0000000000..53354beca8
--- /dev/null
+++ b/tests/parser/features/test_transient.py
@@ -0,0 +1,61 @@
+import pytest
+
+from vyper.compiler import compile_code
+from vyper.evm.opcodes import EVM_VERSIONS
+from vyper.exceptions import StructureException
+
+post_cancun = {k: v for k, v in EVM_VERSIONS.items() if v >= EVM_VERSIONS["cancun"]}
+
+
+@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS.keys()))
+def test_transient_blocked(evm_version):
+    # test transient is blocked on pre-cancun and compiles post-cancun
+    code = """
+my_map: transient(HashMap[address, uint256])
+    """
+    if EVM_VERSIONS[evm_version] >= EVM_VERSIONS["cancun"]:
+        assert compile_code(code, evm_version=evm_version) is not None
+    else:
+        with pytest.raises(StructureException):
+            compile_code(code, evm_version=evm_version)
+
+
+@pytest.mark.parametrize("evm_version", list(post_cancun.keys()))
+def test_transient_compiles(evm_version):
+    # test transient keyword at least generates TLOAD/TSTORE opcodes
+    getter_code = """
+my_map: public(transient(HashMap[address, uint256]))
+    """
+    t = compile_code(getter_code, evm_version=evm_version, output_formats=["opcodes_runtime"])
+    t = t["opcodes_runtime"].split(" ")
+
+    assert "TLOAD" in t
+    assert "TSTORE" not in t
+
+    setter_code = """
+my_map: transient(HashMap[address, uint256])
+
+@external
+def setter(k: address, v: uint256):
+    self.my_map[k] = v
+    """
+    t = compile_code(setter_code, evm_version=evm_version, output_formats=["opcodes_runtime"])
+    t = t["opcodes_runtime"].split(" ")
+
+    assert "TLOAD" not in t
+    assert "TSTORE" in t
+
+    getter_setter_code = """
+my_map: public(transient(HashMap[address, uint256]))
+
+@external
+def setter(k: address, v: uint256):
+    self.my_map[k] = v
+    """
+    t = compile_code(
+        getter_setter_code, evm_version=evm_version, output_formats=["opcodes_runtime"]
+    )
+    t = t["opcodes_runtime"].split(" ")
+
+    assert "TLOAD" in t
+    assert "TSTORE" in t
diff --git a/vyper/ast/nodes.py b/vyper/ast/nodes.py
index 03f2d713c1..7c907b4d08 100644
--- a/vyper/ast/nodes.py
+++ b/vyper/ast/nodes.py
@@ -1344,7 +1344,15 @@ class VariableDecl(VyperNode):
         If true, indicates that the variable is an immutable variable.
     """
 
-    __slots__ = ("target", "annotation", "value", "is_constant", "is_public", "is_immutable")
+    __slots__ = (
+        "target",
+        "annotation",
+        "value",
+        "is_constant",
+        "is_public",
+        "is_immutable",
+        "is_transient",
+    )
 
     def __init__(self, *args, **kwargs):
         super().__init__(*args, **kwargs)
@@ -1352,6 +1360,7 @@ def __init__(self, *args, **kwargs):
         self.is_constant = False
         self.is_public = False
         self.is_immutable = False
+        self.is_transient = False
 
         def _check_args(annotation, call_name):
             # do the same thing as `validate_call_args`
@@ -1369,9 +1378,10 @@ def _check_args(annotation, call_name):
             # unwrap one layer
             self.annotation = self.annotation.args[0]
 
-        if self.annotation.get("func.id") in ("immutable", "constant"):
-            _check_args(self.annotation, self.annotation.func.id)
-            setattr(self, f"is_{self.annotation.func.id}", True)
+        func_id = self.annotation.get("func.id")
+        if func_id in ("immutable", "constant", "transient"):
+            _check_args(self.annotation, func_id)
+            setattr(self, f"is_{func_id}", True)
             # unwrap one layer
             self.annotation = self.annotation.args[0]
 
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 9ab884a6d0..4dfc87639a 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -101,7 +101,8 @@ def _parse_args(argv):
     )
     parser.add_argument(
         "--evm-version",
-        help=f"Select desired EVM version (default {DEFAULT_EVM_VERSION})",
+        help=f"Select desired EVM version (default {DEFAULT_EVM_VERSION}). "
+        " note: cancun support is EXPERIMENTAL",
         choices=list(EVM_VERSIONS),
         default=DEFAULT_EVM_VERSION,
         dest="evm_version",
diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index 6e8d02c9b3..e4b41adbc0 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -28,6 +28,7 @@ class VariableRecord:
     defined_at: Any = None
     is_internal: bool = False
     is_immutable: bool = False
+    is_transient: bool = False
     data_offset: Optional[int] = None
 
     def __hash__(self):
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index a9a91ec9d8..06140f3f52 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -1,6 +1,6 @@
 from vyper import ast as vy_ast
 from vyper.codegen.ir_node import Encoding, IRnode
-from vyper.evm.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE
+from vyper.evm.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE, TRANSIENT
 from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StructureException, TypeCheckFailure, TypeMismatch
 from vyper.semantics.types import (
@@ -562,10 +562,10 @@ def _get_element_ptr_mapping(parent, key):
     key = unwrap_location(key)
 
     # TODO when is key None?
-    if key is None or parent.location != STORAGE:
-        raise TypeCheckFailure(f"bad dereference on mapping {parent}[{key}]")
+    if key is None or parent.location not in (STORAGE, TRANSIENT):
+        raise TypeCheckFailure("bad dereference on mapping {parent}[{key}]")
 
-    return IRnode.from_list(["sha3_64", parent, key], typ=subtype, location=STORAGE)
+    return IRnode.from_list(["sha3_64", parent, key], typ=subtype, location=parent.location)
 
 
 # Take a value representing a memory or storage location, and descend down to
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index 4a18a16e1b..ac7290836b 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -23,7 +23,7 @@
 )
 from vyper.codegen.ir_node import IRnode
 from vyper.codegen.keccak256_helper import keccak256_helper
-from vyper.evm.address_space import DATA, IMMUTABLES, MEMORY, STORAGE
+from vyper.evm.address_space import DATA, IMMUTABLES, MEMORY, STORAGE, TRANSIENT
 from vyper.evm.opcodes import version_check
 from vyper.exceptions import (
     CompilerPanic,
@@ -259,10 +259,12 @@ def parse_Attribute(self):
         # self.x: global attribute
         elif isinstance(self.expr.value, vy_ast.Name) and self.expr.value.id == "self":
             varinfo = self.context.globals[self.expr.attr]
+            location = TRANSIENT if varinfo.is_transient else STORAGE
+
             ret = IRnode.from_list(
                 varinfo.position.position,
                 typ=varinfo.typ,
-                location=STORAGE,
+                location=location,
                 annotation="self." + self.expr.attr,
             )
             ret._referenced_variables = {varinfo}
diff --git a/vyper/codegen/function_definitions/utils.py b/vyper/codegen/function_definitions/utils.py
index 7129388c58..f524ec6e88 100644
--- a/vyper/codegen/function_definitions/utils.py
+++ b/vyper/codegen/function_definitions/utils.py
@@ -8,6 +8,10 @@ def get_nonreentrant_lock(func_type):
 
     nkey = func_type.reentrancy_key_position.position
 
+    LOAD, STORE = "sload", "sstore"
+    if version_check(begin="cancun"):
+        LOAD, STORE = "tload", "tstore"
+
     if version_check(begin="berlin"):
         # any nonzero values would work here (see pricing as of net gas
         # metering); these values are chosen so that downgrading to the
@@ -16,12 +20,12 @@ def get_nonreentrant_lock(func_type):
     else:
         final_value, temp_value = 0, 1
 
-    check_notset = ["assert", ["ne", temp_value, ["sload", nkey]]]
+    check_notset = ["assert", ["ne", temp_value, [LOAD, nkey]]]
 
     if func_type.mutability == StateMutability.VIEW:
         return [check_notset], [["seq"]]
 
     else:
-        pre = ["seq", check_notset, ["sstore", nkey, temp_value]]
-        post = ["sstore", nkey, final_value]
+        pre = ["seq", check_notset, [STORE, nkey, temp_value]]
+        post = [STORE, nkey, final_value]
         return [pre], [post]
diff --git a/vyper/evm/address_space.py b/vyper/evm/address_space.py
index 855e98b5c8..85a75c3c23 100644
--- a/vyper/evm/address_space.py
+++ b/vyper/evm/address_space.py
@@ -48,6 +48,7 @@ def byte_addressable(self) -> bool:
 
 MEMORY = AddrSpace("memory", 32, "mload", "mstore")
 STORAGE = AddrSpace("storage", 1, "sload", "sstore")
+TRANSIENT = AddrSpace("transient", 1, "tload", "tstore")
 CALLDATA = AddrSpace("calldata", 32, "calldataload")
 # immutables address space: "immutables" section of memory
 # which is read-write in deploy code but then gets turned into
diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index 7ff56df772..c447fd863c 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -24,6 +24,7 @@
     "berlin": 3,
     "paris": 4,
     "shanghai": 5,
+    "cancun": 6,
     # ETC Forks
     "atlantis": 0,
     "agharta": 1,
@@ -184,6 +185,8 @@
     "INVALID": (0xFE, 0, 0, 0),
     "DEBUG": (0xA5, 1, 0, 0),
     "BREAKPOINT": (0xA6, 0, 0, 0),
+    "TLOAD": (0xB3, 1, 1, 100),
+    "TSTORE": (0xB4, 2, 0, 100),
 }
 
 PSEUDO_OPCODES: OpcodeMap = {
diff --git a/vyper/semantics/analysis/base.py b/vyper/semantics/analysis/base.py
index 5065131f29..449e6ca338 100644
--- a/vyper/semantics/analysis/base.py
+++ b/vyper/semantics/analysis/base.py
@@ -162,6 +162,7 @@ class VarInfo:
     is_constant: bool = False
     is_public: bool = False
     is_immutable: bool = False
+    is_transient: bool = False
     is_local_var: bool = False
     decl_node: Optional[vy_ast.VyperNode] = None
 
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index 188005e365..cb8e93ff28 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -4,6 +4,7 @@
 
 import vyper.builtins.interfaces
 from vyper import ast as vy_ast
+from vyper.evm.opcodes import version_check
 from vyper.exceptions import (
     CallViolation,
     CompilerPanic,
@@ -189,10 +190,17 @@ def visit_VariableDecl(self, node):
             if node.is_immutable
             else DataLocation.UNSET
             if node.is_constant
+            # XXX: needed if we want separate transient allocator
+            # else DataLocation.TRANSIENT
+            # if node.is_transient
             else DataLocation.STORAGE
         )
 
         type_ = type_from_annotation(node.annotation, data_loc)
+
+        if node.is_transient and not version_check(begin="cancun"):
+            raise StructureException("`transient` is not available pre-cancun", node.annotation)
+
         var_info = VarInfo(
             type_,
             decl_node=node,
@@ -200,6 +208,7 @@ def visit_VariableDecl(self, node):
             is_constant=node.is_constant,
             is_public=node.is_public,
             is_immutable=node.is_immutable,
+            is_transient=node.is_transient,
         )
         node.target._metadata["varinfo"] = var_info  # TODO maybe put this in the global namespace
         node._metadata["type"] = type_
diff --git a/vyper/semantics/data_locations.py b/vyper/semantics/data_locations.py
index 0ec374e42f..2f259b1766 100644
--- a/vyper/semantics/data_locations.py
+++ b/vyper/semantics/data_locations.py
@@ -7,3 +7,5 @@ class DataLocation(enum.Enum):
     STORAGE = 2
     CALLDATA = 3
     CODE = 4
+    # XXX: needed for separate transient storage allocator
+    # TRANSIENT = 5
diff --git a/vyper/semantics/namespace.py b/vyper/semantics/namespace.py
index d760f66972..82a5d5cf3e 100644
--- a/vyper/semantics/namespace.py
+++ b/vyper/semantics/namespace.py
@@ -176,6 +176,7 @@ def validate_identifier(attr):
     "nonpayable",
     "constant",
     "immutable",
+    "transient",
     "internal",
     "payable",
     "nonreentrant",

From 903727006c1e5ebef99fa9fd5d51d62bd33d72a9 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 19 May 2023 10:17:11 -0400
Subject: [PATCH 046/161] Merge pull request from GHSA-vxmm-cwh2-q762

on <=0.3.7, the batch payable check was broken. this was fixed due to
the removal of the global calldatasize check in 02339dfda0. this commit
adds a test to prevent regression
---
 .../features/decorators/test_payable.py       | 21 +++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/tests/parser/features/decorators/test_payable.py b/tests/parser/features/decorators/test_payable.py
index 906ae330c0..55c60236f4 100644
--- a/tests/parser/features/decorators/test_payable.py
+++ b/tests/parser/features/decorators/test_payable.py
@@ -372,3 +372,24 @@ def __default__():
     assert_tx_failed(
         lambda: w3.eth.send_transaction({"to": c.address, "value": 100, "data": "0x12345678"})
     )
+
+
+def test_batch_nonpayable(get_contract, w3, assert_tx_failed):
+    code = """
+@external
+def foo() -> bool:
+    return True
+
+@external
+def __default__():
+    pass
+    """
+
+    c = get_contract(code)
+    w3.eth.send_transaction({"to": c.address, "value": 0, "data": "0x12345678"})
+    data = bytes([1, 2, 3, 4])
+    for i in range(5):
+        calldata = "0x" + data[:i].hex()
+        assert_tx_failed(
+            lambda: w3.eth.send_transaction({"to": c.address, "value": 100, "data": calldata})
+        )

From 32c9a3d70e066d9b4c31adb0a11c33ec1ee640bd Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Fri, 19 May 2023 23:04:47 +0800
Subject: [PATCH 047/161] chore: fix a comment (#3431)

fix comment on TYPE_T

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 vyper/semantics/types/base.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/vyper/semantics/types/base.py b/vyper/semantics/types/base.py
index 8a174566eb..af955f6071 100644
--- a/vyper/semantics/types/base.py
+++ b/vyper/semantics/types/base.py
@@ -314,7 +314,9 @@ def __init__(self, typ, default, require_literal=False):
         self.require_literal = require_literal
 
 
-# A type type. Only used internally for builtins
+# A type type. Used internally for types which can live in expression
+# position, ex. constructors (events, interfaces and structs), and also
+# certain builtins which take types as parameters
 class TYPE_T:
     def __init__(self, typedef):
         self.typedef = typedef

From 11e1ae9f8547632c4ecbed8565dccc082f12fd8f Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 19 May 2023 14:36:28 -0400
Subject: [PATCH 048/161] chore: cache pip in setup-python (#3436)

installing dependencies takes about 1min per job. pip caching should
speed it up. note that in theory, this caches "correctly" in that it
doesn't cache the dependency graph or install directories, just the
wheels. so if upstream packages are updated, they should get
reinstalled.
---
 .github/workflows/build.yml      | 2 ++
 .github/workflows/era-tester.yml | 1 +
 .github/workflows/publish.yml    | 2 +-
 .github/workflows/test.yml       | 6 ++++++
 4 files changed, 10 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index a3e9a195f6..43586c262a 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -34,6 +34,7 @@ jobs:
         uses: actions/setup-python@v4
         with:
           python-version: "3.11"
+          cache: "pip"
 
       - name: Generate Binary
         run: >-
@@ -61,6 +62,7 @@ jobs:
         uses: actions/setup-python@v4
         with:
           python-version: "3.11"
+          cache: "pip"
 
       - name: Generate Binary
         run: >-
diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index 6c15e6af07..8c7e355d26 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -38,6 +38,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: ${{ matrix.python-version[0] }}
+        cache: "pip"
 
     - name: Get cache
       id: get-cache
diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index 5a8d989038..e6e5f2a6f9 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -18,7 +18,7 @@ jobs:
     - name: Python
       uses: actions/setup-python@v4
       with:
-        python-version: '3.x'
+        python-version: "3.11"
 
     - name: Install dependencies
       run: |
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index f90ff706ec..94e8c7c8f6 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -21,6 +21,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: "3.11"
+        cache: "pip"
 
     - name: Install Dependencies
       run: pip install .[lint]
@@ -46,6 +47,7 @@ jobs:
         uses: actions/setup-python@v4
         with:
           python-version: "3.11"
+          cache: "pip"
 
       - name: Install Tox
         run: pip install tox
@@ -63,6 +65,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: "3.11"
+        cache: "pip"
 
     - name: Install Tox
       run: pip install tox
@@ -88,6 +91,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: ${{ matrix.python-version[0] }}
+        cache: "pip"
 
     - name: Install Tox
       run: pip install tox
@@ -130,6 +134,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: "3.11"
+        cache: "pip"
 
     - name: Install Tox
       run: pip install tox
@@ -171,6 +176,7 @@ jobs:
       uses: actions/setup-python@v4
       with:
         python-version: "3.11"
+        cache: "pip"
 
     - name: Install Tox
       run: pip install tox

From 8a28372f6d9f9e63dfa4c7ffcbf7fad4f8169117 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 19 May 2023 16:04:48 -0400
Subject: [PATCH 049/161] chore: make `FuncIRInfo` generation private (#3437)

this moves generation of `func_t._ir_info` to be closer to where it is
used (and where FuncIRInfo is defined!). since FuncIRInfo is no longer
imported anywhere, it can be changed to a private member of the
function_definitions/common.py module.
---
 vyper/codegen/function_definitions/__init__.py | 2 +-
 vyper/codegen/function_definitions/common.py   | 5 ++++-
 vyper/codegen/module.py                        | 7 +------
 3 files changed, 6 insertions(+), 8 deletions(-)

diff --git a/vyper/codegen/function_definitions/__init__.py b/vyper/codegen/function_definitions/__init__.py
index b677a14579..08bebbb4a5 100644
--- a/vyper/codegen/function_definitions/__init__.py
+++ b/vyper/codegen/function_definitions/__init__.py
@@ -1 +1 @@
-from .common import FuncIRInfo, generate_ir_for_function  # noqa
+from .common import generate_ir_for_function  # noqa
diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index 45b97831aa..fd65b12265 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -28,7 +28,7 @@ def mem_used(self):
 
 
 @dataclass
-class FuncIRInfo:
+class _FuncIRInfo:
     func_t: ContractFunctionT
     gas_estimate: Optional[int] = None
     frame_info: Optional[FrameInfo] = None
@@ -78,6 +78,9 @@ def generate_ir_for_function(
     """
     func_t = code._metadata["type"]
 
+    # generate _FuncIRInfo
+    func_t._ir_info = _FuncIRInfo(func_t)
+
     # Validate return statements.
     check_single_exit(code)
 
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 5d05c27e0b..9bc589d82f 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -4,7 +4,7 @@
 
 from vyper import ast as vy_ast
 from vyper.codegen.core import shr
-from vyper.codegen.function_definitions import FuncIRInfo, generate_ir_for_function
+from vyper.codegen.function_definitions import generate_ir_for_function
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
 from vyper.exceptions import CompilerPanic
@@ -136,11 +136,6 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
 
     init_function: Optional[vy_ast.FunctionDef] = None
 
-    # generate all FuncIRInfos
-    for f in function_defs:
-        func_t = f._metadata["type"]
-        func_t._ir_info = FuncIRInfo(func_t)
-
     runtime_functions = [f for f in function_defs if not _is_constructor(f)]
     init_function = next((f for f in function_defs if _is_constructor(f)), None)
 

From 870ad491c86be30c00c2404d85bae8368a7cf1d1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 19 May 2023 16:33:07 -0400
Subject: [PATCH 050/161] ci: deploy to ghcr on push (#3435)

publish and tag docker images continuously to ghcr.io. adds custom
tagging so we can retain every commit. it's technically possible to do
this on docker hub, but in order to have custom tags, you need to set up
a regular user and log in/push via that user. the authentication is much
cleaner in github actions for ghcr.

(note docker hub pulls for releases are still staying the same, this is
just an alternative form of retention going forward).
---
 .github/workflows/ghcr.yml | 73 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 73 insertions(+)
 create mode 100644 .github/workflows/ghcr.yml

diff --git a/.github/workflows/ghcr.yml b/.github/workflows/ghcr.yml
new file mode 100644
index 0000000000..d227d6caf0
--- /dev/null
+++ b/.github/workflows/ghcr.yml
@@ -0,0 +1,73 @@
+name: Deploy docker image to ghcr
+
+# Deploy docker image to ghcr on pushes to master and all releases/tags.
+# Note releases to docker hub are managed separately in another process
+# (github sends webhooks to docker hub which triggers the build there).
+# This workflow is an alternative form of retention for docker images
+# which also allows us to tag and retain every single commit to master.
+
+on:
+  push:
+    tags:
+      - '*'
+    branches:
+      - master
+  release:
+    types: [released]
+
+env:
+  REGISTRY: ghcr.io
+  IMAGE_NAME: ${{ github.repository }}
+
+jobs:
+  deploy-ghcr:
+
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      packages: write
+
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v3
+        with:
+            # need to fetch unshallow so that setuptools_scm can infer the version
+            fetch-depth: 0
+
+      - uses: actions/setup-python@v4
+        name: Install python
+        with:
+          python-version: "3.11"
+          cache: "pip"
+
+      - name: Generate vyper/version.py
+        run: |
+          pip install .
+          echo "VYPER_VERSION=$(PYTHONPATH=. python vyper/cli/vyper_compile.py --version)" >> "$GITHUB_ENV"
+
+      - name: Docker meta
+        id: meta
+        uses: docker/metadata-action@v4
+        with:
+          images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}
+          flavor: |
+            latest=true
+          tags: |
+            type=ref,event=branch
+            type=ref,event=tag
+            type=raw,value=${{ env.VYPER_VERSION }}
+
+      - name: Login to ghcr.io
+        uses: docker/login-action@v2
+        with:
+          registry: ${{ env.REGISTRY }}
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Build and push
+        uses: docker/build-push-action@v4
+        with:
+          context: .
+          push: true
+          tags: ${{ steps.meta.outputs.tags }}
+          labels: ${{ steps.meta.outputs.labels }}

From 95bf73f493dc8458a1d6981493275379197a4bdf Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sat, 20 May 2023 13:55:48 -0400
Subject: [PATCH 051/161] chore: fix up ghcr tags (#3438)

use `latest` for latest release, `dev` for continuous, and tag dev
builds with `-dev`. also remove the 'master' tag since that's redundant
with `dev`.
---
 .github/workflows/ghcr.yml | 12 ++++++++----
 1 file changed, 8 insertions(+), 4 deletions(-)

diff --git a/.github/workflows/ghcr.yml b/.github/workflows/ghcr.yml
index d227d6caf0..4bc2885bdb 100644
--- a/.github/workflows/ghcr.yml
+++ b/.github/workflows/ghcr.yml
@@ -45,17 +45,21 @@ jobs:
           pip install .
           echo "VYPER_VERSION=$(PYTHONPATH=. python vyper/cli/vyper_compile.py --version)" >> "$GITHUB_ENV"
 
+      - name: generate tag suffix
+        if: ${{ github.event_name != 'release' }}
+        run: echo "VERSION_SUFFIX=-dev" >> "$GITHUB_ENV"
+
       - name: Docker meta
         id: meta
         uses: docker/metadata-action@v4
         with:
           images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}
-          flavor: |
-            latest=true
           tags: |
-            type=ref,event=branch
             type=ref,event=tag
-            type=raw,value=${{ env.VYPER_VERSION }}
+            type=raw,value=${{ env.VYPER_VERSION }}${{ env.VERSION_SUFFIX }}
+            type=raw,value=dev,enable=${{ github.ref == 'refs/heads/master' }}
+            type=raw,value=latest,enable=${{ github.event_name == 'release' }}
+
 
       - name: Login to ghcr.io
         uses: docker/login-action@v2

From 0ed5c23ca43cd299f4e62c262df31038806ac164 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 23 May 2023 10:26:06 -0400
Subject: [PATCH 052/161] chore: add v0.3.8 release notes (#3439)

---
 docs/release-notes.rst | 107 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 107 insertions(+)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 89a528dc49..cf4d8d42f9 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -3,6 +3,113 @@
 Release Notes
 #############
 
+..
+    vim regexes:
+    first convert all single backticks to double backticks:
+    :'<,'>s/`/``/g
+    to convert links to nice rst links:
+    :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/pull\/)(\d+)/(`#\2 <\1\2>`_)/g
+    ex. in: https://github.com/vyperlang/vyper/pull/3373
+    ex. out: (`#3373 <https://github.com/vyperlang/vyper/pull/3373>`_)
+    for advisory links:
+    :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/security\/advisories\/)([-A-Za-z0-9]+)/(`\2 <\1\2>`_)/g
+
+v0.3.8
+******
+
+Date released: 2023-05-23
+
+Non-breaking changes and improvements:
+
+- ``transient`` storage keyword (`#3373 <https://github.com/vyperlang/vyper/pull/3373>`_)
+- ternary operators (`#3398 <https://github.com/vyperlang/vyper/pull/3398>`_)
+- ``raw_revert()`` builtin (`#3136 <https://github.com/vyperlang/vyper/pull/3136>`_)
+- shift operators (`#3019 <https://github.com/vyperlang/vyper/pull/3019>`_)
+- make ``send()`` gas stipend configurable (`#3158 <https://github.com/vyperlang/vyper/pull/3158>`_)
+- use new ``push0`` opcode (`#3361 <https://github.com/vyperlang/vyper/pull/3361>`_)
+- python 3.11 support (`#3129 <https://github.com/vyperlang/vyper/pull/3129>`_)
+- drop support for python 3.8 and 3.9 (`#3325 <https://github.com/vyperlang/vyper/pull/3325>`_)
+- build for ``aarch64`` (`#2687 <https://github.com/vyperlang/vyper/pull/2687>`_)
+
+Major refactoring PRs:
+
+- refactor front-end type system (`#2974 <https://github.com/vyperlang/vyper/pull/2974>`_)
+- merge front-end and codegen type systems (`#3182 <https://github.com/vyperlang/vyper/pull/3182>`_)
+- simplify ``GlobalContext`` (`#3209 <https://github.com/vyperlang/vyper/pull/3209>`_)
+- remove ``FunctionSignature`` (`#3390 <https://github.com/vyperlang/vyper/pull/3390>`_)
+
+Notable fixes:
+
+- assignment when rhs is complex type and references lhs (`#3410 <https://github.com/vyperlang/vyper/pull/3410>`_)
+- uninitialized immutable values (`#3409 <https://github.com/vyperlang/vyper/pull/3409>`_)
+- success value when mixing ``max_outsize=0`` and ``revert_on_failure=False`` (`GHSA-w9g2-3w7p-72g9 <https://github.com/vyperlang/vyper/security/advisories/GHSA-w9g2-3w7p-72g9>`_)
+- block certain kinds of storage allocator overflows (`GHSA-mgv8-gggw-mrg6 <https://github.com/vyperlang/vyper/security/advisories/GHSA-mgv8-gggw-mrg6>`_) 
+- store-before-load when a dynarray appears on both sides of an assignment (`GHSA-3p37-3636-q8wv <https://github.com/vyperlang/vyper/security/advisories/GHSA-3p37-3636-q8wv>`_)
+- bounds check for loops of the form ``for i in range(x, x+N)`` (`GHSA-6r8q-pfpv-7cgj <https://github.com/vyperlang/vyper/security/advisories/GHSA-6r8q-pfpv-7cgj>`_)
+- alignment of call-site posargs and kwargs for internal functions (`GHSA-ph9x-4vc9-m39g <https://github.com/vyperlang/vyper/security/advisories/GHSA-ph9x-4vc9-m39g>`_)
+- batch nonpayable check for default functions calldatasize < 4 (`#3104 <https://github.com/vyperlang/vyper/pull/3104>`_, `#3408 <https://github.com/vyperlang/vyper/pull/3408>`_, cf. `GHSA-vxmm-cwh2-q762 <https://github.com/vyperlang/vyper/security/advisories/GHSA-vxmm-cwh2-q762>`_)
+
+Other docs updates, chores and fixes:
+
+- call graph stability (`#3370 <https://github.com/vyperlang/vyper/pull/3370>`_)
+- fix ``vyper-serve`` output (`#3338 <https://github.com/vyperlang/vyper/pull/3338>`_)
+- add ``custom:`` natspec tags (`#3403 <https://github.com/vyperlang/vyper/pull/3403>`_)
+- add missing pc maps to ``vyper_json`` output (`#3333 <https://github.com/vyperlang/vyper/pull/3333>`_)
+- fix constructor context for internal functions (`#3388 <https://github.com/vyperlang/vyper/pull/3388>`_)
+- add deprecation warning for ``selfdestruct`` usage (`#3372 <https://github.com/vyperlang/vyper/pull/3372>`_)
+- add bytecode metadata option to vyper-json (`#3117 <https://github.com/vyperlang/vyper/pull/3117>`_)
+- fix compiler panic when a ``break`` is outside of a loop (`#3177 <https://github.com/vyperlang/vyper/pull/3177>`_)
+- fix complex arguments to builtin functions (`#3167 <https://github.com/vyperlang/vyper/pull/3167>`_)
+- add support for all types in ABI imports (`#3154 <https://github.com/vyperlang/vyper/pull/3154>`_)
+- disable uadd operator (`#3174 <https://github.com/vyperlang/vyper/pull/3174>`_)
+- block bitwise ops on decimals (`#3219 <https://github.com/vyperlang/vyper/pull/3219>`_)
+- raise ``UNREACHABLE`` (`#3194 <https://github.com/vyperlang/vyper/pull/3194>`_)
+- allow enum as mapping key (`#3256 <https://github.com/vyperlang/vyper/pull/3256>`_)
+- block boolean ``not`` operator on numeric types (`#3231 <https://github.com/vyperlang/vyper/pull/3231>`_)
+- enforce that loop's iterators are valid names (`#3242 <https://github.com/vyperlang/vyper/pull/3242>`_)
+- fix typechecker hotspot (`#3318 <https://github.com/vyperlang/vyper/pull/3318>`_)
+- rewrite typechecker journal to handle nested commits (`#3375 <https://github.com/vyperlang/vyper/pull/3375>`_)
+- fix missing pc map for empty functions (`#3202 <https://github.com/vyperlang/vyper/pull/3202>`_)
+- guard against iterating over empty list in for loop (`#3197 <https://github.com/vyperlang/vyper/pull/3197>`_)
+- skip enum members during constant folding (`#3235 <https://github.com/vyperlang/vyper/pull/3235>`_)
+- bitwise ``not`` constant folding (`#3222 <https://github.com/vyperlang/vyper/pull/3222>`_)
+- allow accessing members of constant address (`#3261 <https://github.com/vyperlang/vyper/pull/3261>`_)
+- guard against decorators in interface (`#3266 <https://github.com/vyperlang/vyper/pull/3266>`_)
+- fix bounds for decimals in some builtins (`#3283 <https://github.com/vyperlang/vyper/pull/3283>`_)
+- length of literal empty bytestrings (`#3276 <https://github.com/vyperlang/vyper/pull/3276>`_)
+- block ``empty()`` for HashMaps (`#3303 <https://github.com/vyperlang/vyper/pull/3303>`_)
+- fix type inference for empty lists (`#3377 <https://github.com/vyperlang/vyper/pull/3377>`_)
+- disallow logging from ``pure``, ``view`` functions (`#3424 <https://github.com/vyperlang/vyper/pull/3424>`_)
+- improve optimizer rules for comparison operators (`#3412 <https://github.com/vyperlang/vyper/pull/3412>`_)
+- deploy to ghcr on push (`#3435 <https://github.com/vyperlang/vyper/pull/3435>`_)
+- add note on return value bounds in interfaces (`#3205 <https://github.com/vyperlang/vyper/pull/3205>`_)
+- index ``id`` param in ``URI`` event of ``ERC1155ownable`` (`#3203 <https://github.com/vyperlang/vyper/pull/3203>`_)
+- add missing ``asset`` function to ``ERC4626`` built-in interface (`#3295 <https://github.com/vyperlang/vyper/pull/3295>`_)
+- clarify ``skip_contract_check=True`` can result in undefined behavior (`#3386 <https://github.com/vyperlang/vyper/pull/3386>`_)
+- add ``custom`` NatSpec tag to docs (`#3404 <https://github.com/vyperlang/vyper/pull/3404>`_)
+- fix ``uint256_addmod`` doc (`#3300 <https://github.com/vyperlang/vyper/pull/3300>`_)
+- document optional kwargs for external calls (`#3122 <https://github.com/vyperlang/vyper/pull/3122>`_)
+- remove ``slice()`` length documentation caveats (`#3152 <https://github.com/vyperlang/vyper/pull/3152>`_)
+- fix docs of ``blockhash`` to reflect revert behaviour (`#3168 <https://github.com/vyperlang/vyper/pull/3168>`_)
+- improvements to compiler error messages (`#3121 <https://github.com/vyperlang/vyper/pull/3121>`_, `#3134 <https://github.com/vyperlang/vyper/pull/3134>`_, `#3312 <https://github.com/vyperlang/vyper/pull/3312>`_, `#3304 <https://github.com/vyperlang/vyper/pull/3304>`_, `#3240 <https://github.com/vyperlang/vyper/pull/3240>`_, `#3264 <https://github.com/vyperlang/vyper/pull/3264>`_, `#3343 <https://github.com/vyperlang/vyper/pull/3343>`_, `#3307 <https://github.com/vyperlang/vyper/pull/3307>`_, `#3313 <https://github.com/vyperlang/vyper/pull/3313>`_ and `#3215 <https://github.com/vyperlang/vyper/pull/3215>`_)
+
+These are really just the highlights, as many other bugfixes, docs updates and refactoring (over 150 pull requests!) made it into this release! For the full list, please see the `changelog <https://github.com/vyperlang/vyper/compare/v0.3.7...v0.3.8>`_. Special thanks to contributions from @tserg, @trocher, @z80dev, @emc415 and @benber86 in this release!
+
+New Contributors:
+
+- @omahs made their first contribution in (`#3128 <https://github.com/vyperlang/vyper/pull/3128>`_)
+- @ObiajuluM made their first contribution in (`#3124 <https://github.com/vyperlang/vyper/pull/3124>`_)
+- @trocher made their first contribution in (`#3134 <https://github.com/vyperlang/vyper/pull/3134>`_)
+- @ozmium22 made their first contribution in (`#3149 <https://github.com/vyperlang/vyper/pull/3149>`_)
+- @ToonVanHove made their first contribution in (`#3168 <https://github.com/vyperlang/vyper/pull/3168>`_)
+- @emc415 made their first contribution in (`#3158 <https://github.com/vyperlang/vyper/pull/3158>`_)
+- @lgtm-com made their first contribution in (`#3147 <https://github.com/vyperlang/vyper/pull/3147>`_)
+- @tdurieux made their first contribution in (`#3224 <https://github.com/vyperlang/vyper/pull/3224>`_)
+- @victor-ego made their first contribution in (`#3263 <https://github.com/vyperlang/vyper/pull/3263>`_)
+- @miohtama made their first contribution in (`#3257 <https://github.com/vyperlang/vyper/pull/3257>`_)
+- @kelvinfan001 made their first contribution in (`#2687 <https://github.com/vyperlang/vyper/pull/2687>`_)
+
+
 v0.3.7
 ******
 

From 036f153683e0d55b890305eb4c77680a0872fcba Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 23 May 2023 10:48:21 -0400
Subject: [PATCH 053/161] chore: clean up 0.3.7 release notes formatting
 (#3444)

---
 docs/release-notes.rst | 18 +++++++++---------
 1 file changed, 9 insertions(+), 9 deletions(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index cf4d8d42f9..3e7bc02587 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -115,29 +115,29 @@ v0.3.7
 
 Date released: 2022-09-26
 
-## Breaking changes:
+Breaking changes:
 
 - chore: drop python 3.7 support (`#3071 <https://github.com/vyperlang/vyper/pull/3071>`_)
 - fix: relax check for statically sized calldata (`#3090 <https://github.com/vyperlang/vyper/pull/3090>`_)
 
-## Non-breaking changes and improvements:
+Non-breaking changes and improvements:
 
-- fix: assert description in Crowdfund.finalize() (`#3058 <https://github.com/vyperlang/vyper/pull/3058>`_)
+- fix: assert description in ``Crowdfund.finalize()`` (`#3058 <https://github.com/vyperlang/vyper/pull/3058>`_)
 - fix: change mutability of example ERC721 interface (`#3076 <https://github.com/vyperlang/vyper/pull/3076>`_)
 - chore: improve error message for non-checksummed address literal (`#3065 <https://github.com/vyperlang/vyper/pull/3065>`_)
-- feat: isqrt built-in (`#3074 <https://github.com/vyperlang/vyper/pull/3074>`_) (`#3069 <https://github.com/vyperlang/vyper/pull/3069>`_)
-- feat: add `block.prevrandao` as alias for `block.difficulty` (`#3085 <https://github.com/vyperlang/vyper/pull/3085>`_)
-- feat: epsilon builtin (`#3057 <https://github.com/vyperlang/vyper/pull/3057>`_)
+- feat: ``isqrt()`` builtin (`#3074 <https://github.com/vyperlang/vyper/pull/3074>`_) (`#3069 <https://github.com/vyperlang/vyper/pull/3069>`_)
+- feat: add ``block.prevrandao`` as alias for ``block.difficulty`` (`#3085 <https://github.com/vyperlang/vyper/pull/3085>`_)
+- feat: ``epsilon()`` builtin (`#3057 <https://github.com/vyperlang/vyper/pull/3057>`_)
 - feat: extend ecrecover signature to accept additional parameter types (`#3084 <https://github.com/vyperlang/vyper/pull/3084>`_)
 - feat: allow constant and immutable variables to be declared public (`#3024 <https://github.com/vyperlang/vyper/pull/3024>`_)
 - feat: optionally disable metadata in bytecode (`#3107 <https://github.com/vyperlang/vyper/pull/3107>`_)
     
-## Bugfixes:
+Bugfixes:
 
 - fix: empty nested dynamic arrays (`#3061 <https://github.com/vyperlang/vyper/pull/3061>`_)
 - fix: foldable builtin default args in imports (`#3079 <https://github.com/vyperlang/vyper/pull/3079>`_) (`#3077 <https://github.com/vyperlang/vyper/pull/3077>`_)
 
-## Additional changes and improvements:
+Additional changes and improvements:
 
 - doc: update broken links in SECURITY.md (`#3095 <https://github.com/vyperlang/vyper/pull/3095>`_)
 - chore: update discord link in docs (`#3031 <https://github.com/vyperlang/vyper/pull/3031>`_)
@@ -147,7 +147,7 @@ Date released: 2022-09-26
 - chore: migrate lark grammar (`#3082 <https://github.com/vyperlang/vyper/pull/3082>`_)
 - chore: loosen and upgrade semantic version (`#3106 <https://github.com/vyperlang/vyper/pull/3106>`_)
 
-# New Contributors
+New Contributors
 
 - @emilianobonassi made their first contribution in `#3107 <https://github.com/vyperlang/vyper/pull/3107>`_
 - @unparalleled-js made their first contribution in `#3106 <https://github.com/vyperlang/vyper/pull/3106>`_

From 71c8e55b7ca6b5cef02411c006c8cdc3f0b0a8e1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 23 May 2023 17:48:25 -0400
Subject: [PATCH 054/161] chore: build for old ubuntus (#3453)

python3.11 uses a new libc which is not compatible with ubuntu 20.04.
---
 .github/workflows/build.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 43586c262a..f2b63e9967 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -20,7 +20,7 @@ jobs:
     runs-on: ${{ matrix.os }}
     strategy:
       matrix:
-        os: [ubuntu-latest, macos-latest]
+        os: [ubuntu-20.04, macos-latest]
 
     steps:
       - uses: actions/checkout@v2

From 510125e0fce389fcc2b9993691696eb0836345b6 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 23 May 2023 17:53:31 -0400
Subject: [PATCH 055/161] fix: initcode codesize regression (#3450)

this commit fixes a regression in c202c4e3ec8. the commit message states
that we rely on the dead code eliminator to prune unused internal
functions in the initcode, but the dead code eliminator does not prune
dead code in all cases, including nested internal functions and loops.
this commit reintroduces the reachability analysis in
`vyper/codegen/module.py` as a stopgap until the dead code eliminator is
more robust.
---
 tests/compiler/asm/test_asm_optimizer.py      | 83 +++++++++++++++----
 .../parser/functions/test_create_functions.py | 24 ++++--
 vyper/codegen/module.py                       |  7 +-
 vyper/ir/compile_ir.py                        | 13 ++-
 4 files changed, 100 insertions(+), 27 deletions(-)

diff --git a/tests/compiler/asm/test_asm_optimizer.py b/tests/compiler/asm/test_asm_optimizer.py
index b82d568ff8..f4a245e168 100644
--- a/tests/compiler/asm/test_asm_optimizer.py
+++ b/tests/compiler/asm/test_asm_optimizer.py
@@ -1,49 +1,102 @@
-from vyper.compiler.phases import CompilerData
+import pytest
 
+from vyper.compiler.phases import CompilerData
 
-def test_dead_code_eliminator():
-    code = """
+codes = [
+    """
 s: uint256
 
 @internal
-def foo():
+def ctor_only():
     self.s = 1
 
 @internal
-def qux():
+def runtime_only():
     self.s = 2
 
+@external
+def bar():
+    self.runtime_only()
+
+@external
+def __init__():
+    self.ctor_only()
+    """,
+    # code with nested function in it
+    """
+s: uint256
+
+@internal
+def runtime_only():
+    self.s = 1
+
+@internal
+def foo():
+    self.runtime_only()
+
+@internal
+def ctor_only():
+    self.s += 1
+
 @external
 def bar():
     self.foo()
 
 @external
 def __init__():
-    self.qux()
+    self.ctor_only()
+    """,
+    # code with loop in it, these are harder for dead code eliminator
     """
+s: uint256
+
+@internal
+def ctor_only():
+    self.s = 1
+
+@internal
+def runtime_only():
+    for i in range(10):
+        self.s += 1
 
+@external
+def bar():
+    self.runtime_only()
+
+@external
+def __init__():
+    self.ctor_only()
+    """,
+]
+
+
+@pytest.mark.parametrize("code", codes)
+def test_dead_code_eliminator(code):
     c = CompilerData(code, no_optimize=True)
     initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
     runtime_asm = c.assembly_runtime
 
-    foo_label = "_sym_internal_foo___"
-    qux_label = "_sym_internal_qux___"
+    ctor_only_label = "_sym_internal_ctor_only___"
+    runtime_only_label = "_sym_internal_runtime_only___"
+
+    # qux reachable from unoptimized initcode, foo not reachable.
+    assert ctor_only_label + "_deploy" in initcode_asm
+    assert runtime_only_label + "_deploy" not in initcode_asm
 
-    # all the labels should be in all the unoptimized asms
-    for s in (foo_label, qux_label):
-        assert s + "_deploy" in initcode_asm
+    # all labels should be in unoptimized runtime asm
+    for s in (ctor_only_label, runtime_only_label):
         assert s + "_runtime" in runtime_asm
 
     c = CompilerData(code, no_optimize=False)
     initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
     runtime_asm = c.assembly_runtime
 
-    # qux should not be in runtime code
+    # ctor only label should not be in runtime code
     for instr in runtime_asm:
         if isinstance(instr, str):
-            assert not instr.startswith(qux_label), instr
+            assert not instr.startswith(ctor_only_label), instr
 
-    # foo should not be in initcode asm
+    # runtime only label should not be in initcode asm
     for instr in initcode_asm:
         if isinstance(instr, str):
-            assert not instr.startswith(foo_label), instr
+            assert not instr.startswith(runtime_only_label), instr
diff --git a/tests/parser/functions/test_create_functions.py b/tests/parser/functions/test_create_functions.py
index 857173df7e..64e0823146 100644
--- a/tests/parser/functions/test_create_functions.py
+++ b/tests/parser/functions/test_create_functions.py
@@ -3,6 +3,8 @@
 from eth.codecs import abi
 from hexbytes import HexBytes
 
+import vyper.ir.compile_ir as compile_ir
+from vyper.codegen.ir_node import IRnode
 from vyper.utils import EIP_170_LIMIT, checksum_encode, keccak256
 
 
@@ -224,15 +226,23 @@ def test(code_ofst: uint256) -> address:
     return create_from_blueprint(BLUEPRINT, code_offset=code_ofst)
     """
 
-    # use a bunch of JUMPDEST + STOP instructions as blueprint code
-    # (as any STOP instruction returns valid code, split up with
-    # jumpdests as optimization fence)
     initcode_len = 100
-    f = get_contract_from_ir(["deploy", 0, ["seq"] + ["jumpdest", "stop"] * (initcode_len // 2), 0])
-    blueprint_code = w3.eth.get_code(f.address)
-    print(blueprint_code)
 
-    d = get_contract(deployer_code, f.address)
+    # deploy a blueprint contract whose contained initcode contains only
+    # zeroes (so no matter which offset, create_from_blueprint will
+    # return empty code)
+    ir = IRnode.from_list(["deploy", 0, ["seq"] + ["stop"] * initcode_len, 0])
+    bytecode, _ = compile_ir.assembly_to_evm(compile_ir.compile_to_assembly(ir, no_optimize=True))
+    # manually deploy the bytecode
+    c = w3.eth.contract(abi=[], bytecode=bytecode)
+    deploy_transaction = c.constructor()
+    tx_info = {"from": w3.eth.accounts[0], "value": 0, "gasPrice": 0}
+    tx_hash = deploy_transaction.transact(tx_info)
+    blueprint_address = w3.eth.get_transaction_receipt(tx_hash)["contractAddress"]
+    blueprint_code = w3.eth.get_code(blueprint_address)
+    print("BLUEPRINT CODE:", blueprint_code)
+
+    d = get_contract(deployer_code, blueprint_address)
 
     # deploy with code_ofst=0 fine
     d.test(0)
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 9bc589d82f..2fece47a9e 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -123,7 +123,6 @@ def _runtime_ir(runtime_functions, global_ctx):
         ["label", "fallback", ["var_list"], fallback_ir],
     ]
 
-    # note: dead code eliminator will clean dead functions
     runtime.extend(internal_functions_ir)
 
     return runtime
@@ -178,10 +177,14 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
         # internal functions come after everything else
         internal_functions = [f for f in runtime_functions if _is_internal(f)]
         for f in internal_functions:
+            init_func_t = init_function._metadata["type"]
+            if f.name not in init_func_t.recursive_calls:
+                # unreachable
+                continue
+
             func_ir = generate_ir_for_function(
                 f, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
             )
-            # note: we depend on dead code eliminator to clean dead function defs
             deploy_code.append(func_ir)
 
     else:
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 57ea4ca7e7..b2a58fa8c9 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -758,6 +758,9 @@ def note_breakpoint(line_number_map, item, pos):
             line_number_map["breakpoints"].add(item.lineno + 1)
 
 
+_TERMINAL_OPS = ("JUMP", "RETURN", "REVERT", "STOP", "INVALID")
+
+
 def _prune_unreachable_code(assembly):
     # In converting IR to assembly we sometimes end up with unreachable
     # instructions - POPing to clear the stack or STOPing execution at the
@@ -766,9 +769,13 @@ def _prune_unreachable_code(assembly):
     # to avoid unnecessary bytecode bloat.
     changed = False
     i = 0
-    while i < len(assembly) - 1:
-        if assembly[i] in ("JUMP", "RETURN", "REVERT", "STOP") and not (
-            is_symbol(assembly[i + 1]) or assembly[i + 1] == "JUMPDEST"
+    while i < len(assembly) - 2:
+        instr = assembly[i]
+        if isinstance(instr, list):
+            instr = assembly[i][-1]
+
+        if assembly[i] in _TERMINAL_OPS and not (
+            is_symbol(assembly[i + 1]) and assembly[i + 2] in ("JUMPDEST", "BLANK")
         ):
             changed = True
             del assembly[i + 1]

From b3c7efa38eef63d9d979ad663a9ecfd77e343987 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 23 May 2023 18:31:18 -0400
Subject: [PATCH 056/161] add v0.3.9 release notes (#3452)

---
 docs/release-notes.rst | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 3e7bc02587..06bb29d839 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -14,6 +14,18 @@ Release Notes
     for advisory links:
     :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/security\/advisories\/)([-A-Za-z0-9]+)/(`\2 <\1\2>`_)/g
 
+v0.3.9
+******
+
+Date released: 2023-05-23
+
+This is a patch release fix for v0.3.8. @bout3fiddy discovered a codesize regression for blueprint contracts in v0.3.8 which is fixed in this release.
+
+Fixes:
+
+- initcode codesize blowup (`#3450 <https://github.com/vyperlang/vyper/pull/3450>`_)
+
+
 v0.3.8
 ******
 

From 19073dadb3c0d661f4bddfa7de7852d85835484e Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 24 May 2023 10:08:08 -0400
Subject: [PATCH 057/161] chore: update v0.3.9 release date (#3455)

---
 docs/release-notes.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 06bb29d839..a8bd309bf1 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -17,7 +17,7 @@ Release Notes
 v0.3.9
 ******
 
-Date released: 2023-05-23
+Date released: 2023-05-24
 
 This is a patch release fix for v0.3.8. @bout3fiddy discovered a codesize regression for blueprint contracts in v0.3.8 which is fixed in this release.
 

From 070b0cfba0bf32da66b8640740d54d9e2a850833 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 25 May 2023 10:29:27 -0400
Subject: [PATCH 058/161] fix: add error message for send() builtin (#3459)

---
 vyper/builtins/functions.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 915f10ede3..af965afe0a 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -1247,7 +1247,9 @@ def build_IR(self, expr, args, kwargs, context):
         to, value = args
         gas = kwargs["gas"]
         context.check_is_not_constant("send ether", expr)
-        return IRnode.from_list(["assert", ["call", gas, to, value, 0, 0, 0, 0]])
+        return IRnode.from_list(
+            ["assert", ["call", gas, to, value, 0, 0, 0, 0]], error_msg="send failed"
+        )
 
 
 class SelfDestruct(BuiltinFunction):

From 056dfd84878bf3892a42eea33415d792ac0d29c1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 25 May 2023 22:37:35 -0400
Subject: [PATCH 059/161] fix: `source_map_full` output in `vyper-json` (#3464)

source_map_full output fails with a KeyError when user requests
evm.sourceMapFull but not evm.sourceMap. this commit fixes.
---
 vyper/cli/vyper_json.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vyper/cli/vyper_json.py b/vyper/cli/vyper_json.py
index aa6cf1c2f5..2fbf58aec4 100755
--- a/vyper/cli/vyper_json.py
+++ b/vyper/cli/vyper_json.py
@@ -429,7 +429,7 @@ def format_to_output_dict(compiler_data: Dict) -> Dict:
             if "source_map" in data:
                 evm["sourceMap"] = data["source_map"]["pc_pos_map_compressed"]
             if "source_map_full" in data:
-                evm["sourceMapFull"] = data["source_map"]
+                evm["sourceMapFull"] = data["source_map_full"]
 
     return output_dict
 

From 64733b9d15935ecd2bfcfdfbb9606d5ab500d70c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 26 May 2023 11:36:30 -0400
Subject: [PATCH 060/161] fix: add error message for nonpayable check (#3466)

---
 vyper/codegen/function_definitions/external_function.py | 5 ++++-
 vyper/codegen/module.py                                 | 5 ++++-
 2 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 6104a86c16..312cb75cf8 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -200,7 +200,10 @@ def generate_ir_for_external_function(code, func_t, context, skip_nonpayable_che
     if not func_t.is_payable and not skip_nonpayable_check:
         # if the contract contains payable functions, but this is not one of them
         # add an assertion that the value of the call is zero
-        body += [["assert", ["iszero", "callvalue"]]]
+        nonpayable_check = IRnode.from_list(
+            ["assert", ["iszero", "callvalue"]], error_msg="nonpayable check"
+        )
+        body.append(nonpayable_check)
 
     body += nonreentrant_pre
 
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 2fece47a9e..2d498460be 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -97,7 +97,10 @@ def _runtime_ir(runtime_functions, global_ctx):
         selector_section.append(func_ir)
 
     if batch_payable_check:
-        selector_section.append(["assert", ["iszero", "callvalue"]])
+        nonpayable_check = IRnode.from_list(
+            ["assert", ["iszero", "callvalue"]], error_msg="nonpayable check"
+        )
+        selector_section.append(nonpayable_check)
 
     for func_ast in nonpayables:
         func_ir = generate_ir_for_function(func_ast, global_ctx, skip_nonpayable_check)

From 33c247151cfed13999289c08f3c35d70fa83394d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 28 May 2023 10:33:50 -0400
Subject: [PATCH 061/161] fix: add back global calldatasize check (#3463)

prevent a performance regression for sending eth to contracts with a
payable default function by (mostly) reverting the changes introduced in
9ecb97b4b6f and 02339dfda0. the `skip_nonpayable_check=False` for the
default function is introduced to address GHSA-vxmm-cwh2-q762 (which
02339dfda0 inadvertently fixed, and a test for which was added in
903727006c).
---
 .../function_definitions/external_function.py | 25 +------------------
 vyper/codegen/module.py                       |  7 +++++-
 2 files changed, 7 insertions(+), 25 deletions(-)

diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 312cb75cf8..207356860b 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -89,8 +89,7 @@ def handler_for(calldata_kwargs, default_kwargs):
         calldata_min_size = args_abi_t.min_size() + 4
 
         # note we don't need the check if calldata_min_size == 4,
-        # because the selector checks later in this routine ensure
-        # that calldatasize >= 4.
+        # because the global calldatasize check ensures that already.
         if calldata_min_size > 4:
             ret.append(["assert", ["ge", "calldatasize", calldata_min_size]])
 
@@ -125,28 +124,6 @@ def handler_for(calldata_kwargs, default_kwargs):
         ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
 
         method_id_check = ["eq", "_calldata_method_id", method_id]
-
-        # if there is a function whose selector is 0 or has trailing 0s, it
-        # might not be distinguished from the case where insufficient calldata
-        # is supplied, b/c calldataload loads 0s past the end of physical
-        # calldata (cf. yellow paper).
-        # since the expected behavior of supplying insufficient calldata
-        # is to trigger the fallback fn, we add to the selector check that
-        # calldatasize >= 4, which distinguishes any selector with trailing
-        # 0 bytes from the fallback function "selector" (equiv. to "all
-        # selectors not in the selector table").
-        #
-        # note that the inclusion of this check means that, we are always
-        # guaranteed that the calldata is at least 4 bytes - either we have
-        # the explicit `calldatasize >= 4` condition in the selector check,
-        # or there are no trailing zeroes in the selector, (so the selector
-        # is impossible to match without calldatasize being at least 4).
-        method_id_bytes = util.method_id(abi_sig)
-        assert len(method_id_bytes) == 4
-        has_trailing_zeroes = method_id_bytes.endswith(b"\x00")
-        if has_trailing_zeroes:
-            method_id_check = ["and", ["ge", "calldatasize", 4], method_id_check]
-
         ret = ["if", method_id_check, ret]
         return ret
 
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 2d498460be..64d5a8b70c 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -107,7 +107,9 @@ def _runtime_ir(runtime_functions, global_ctx):
         selector_section.append(func_ir)
 
     if default_function:
-        fallback_ir = generate_ir_for_function(default_function, global_ctx, skip_nonpayable_check)
+        fallback_ir = generate_ir_for_function(
+            default_function, global_ctx, skip_nonpayable_check=False
+        )
     else:
         fallback_ir = IRnode.from_list(
             ["revert", 0, 0], annotation="Default function", error_msg="fallback function"
@@ -119,8 +121,11 @@ def _runtime_ir(runtime_functions, global_ctx):
     # fallback label is the immediate next instruction,
     close_selector_section = ["goto", "fallback"]
 
+    global_calldatasize_check = ["if", ["lt", "calldatasize", 4], ["goto", "fallback"]]
+
     runtime = [
         "seq",
+        global_calldatasize_check,
         ["with", "_calldata_method_id", shr(224, ["calldataload", 0]), selector_section],
         close_selector_section,
         ["label", "fallback", ["var_list"], fallback_ir],

From 5c2892b2b4f6cdbc039b0f70ecd0e7058fed521c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 28 May 2023 10:36:16 -0400
Subject: [PATCH 062/161] chore: update v0.3.9 release notes (#3458)

---
 docs/release-notes.rst | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index a8bd309bf1..6d1d35b1e2 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -17,13 +17,14 @@ Release Notes
 v0.3.9
 ******
 
-Date released: 2023-05-24
+Date released: 2023-05-28
 
-This is a patch release fix for v0.3.8. @bout3fiddy discovered a codesize regression for blueprint contracts in v0.3.8 which is fixed in this release.
+This is a patch release fix for v0.3.8. @bout3fiddy discovered a codesize regression for blueprint contracts in v0.3.8 which is fixed in this release. @bout3fiddy also discovered a runtime performance (gas) regression for default functions in v0.3.8 which is fixed in this release.
 
 Fixes:
 
 - initcode codesize blowup (`#3450 <https://github.com/vyperlang/vyper/pull/3450>`_)
+- add back global calldatasize check for contracts with default fn (`#3463 <https://github.com/vyperlang/vyper/pull/3463>`_)
 
 
 v0.3.8

From 66b9670555cbb57a78b9113e1c2ad343111df1b3 Mon Sep 17 00:00:00 2001
From: ControlCplusControlV
 <44706811+ControlCplusControlV@users.noreply.github.com>
Date: Mon, 29 May 2023 08:50:34 -0600
Subject: [PATCH 063/161] docs: add name to 0.3.9 release (#3468)

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 docs/release-notes.rst | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 6d1d35b1e2..22d89614db 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -14,10 +14,10 @@ Release Notes
     for advisory links:
     :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/security\/advisories\/)([-A-Za-z0-9]+)/(`\2 <\1\2>`_)/g
 
-v0.3.9
+v0.3.9 ("Common Adder")
 ******
 
-Date released: 2023-05-28
+Date released: 2023-05-29
 
 This is a patch release fix for v0.3.8. @bout3fiddy discovered a codesize regression for blueprint contracts in v0.3.8 which is fixed in this release. @bout3fiddy also discovered a runtime performance (gas) regression for default functions in v0.3.8 which is fixed in this release.
 

From e97e9f2a2fd7c6c062574997b622a41539926930 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 30 May 2023 15:28:44 -0400
Subject: [PATCH 064/161] ci: auto-upload release assets on release event
 (#3469)

note: used download-artifact to upload the artifacts since we don't want
to learn how to write a windows script in the windows-build workflow

also:
* removed the ghcr build on tag events (since it's redundant with the
  release event and we end up with orphaned images, since two images get
  tagged with ex. v0.3.9)
* rename some workflows for clarity
---
 .github/workflows/build.yml      | 37 +++++++++++++++++++++++++++-----
 .github/workflows/era-tester.yml |  2 +-
 .github/workflows/ghcr.yml       |  2 --
 .github/workflows/publish.yml    |  4 ++--
 .github/workflows/test.yml       |  2 +-
 5 files changed, 36 insertions(+), 11 deletions(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index f2b63e9967..f891ff7e1d 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -1,4 +1,4 @@
-name: Artifacts
+name: Build and release artifacts
 
 on:
   workflow_dispatch:
@@ -6,10 +6,10 @@ on:
       tag:
         default: ''
   push:
-    tags:
-      - '*'
     branches:
       - master
+  release:
+    types: [released]
 
 defaults:
   run:
@@ -23,7 +23,7 @@ jobs:
         os: [ubuntu-20.04, macos-latest]
 
     steps:
-      - uses: actions/checkout@v2
+      - uses: actions/checkout@v3
         with:
             # grab the commit passed in via `tag`, if any
             ref: ${{ github.event.inputs.tag }}
@@ -51,7 +51,7 @@ jobs:
     runs-on: windows-latest
 
     steps:
-      - uses: actions/checkout@v2
+      - uses: actions/checkout@v3
         with:
             # grab the commit passed in via `tag`, if any
             ref: ${{ github.event.inputs.tag }}
@@ -74,3 +74,30 @@ jobs:
         uses: actions/upload-artifact@v3
         with:
           path: dist/vyper.*
+
+  publish-release-assets:
+    needs: [windows-build, unix-build]
+    if: ${{ github.event_name == 'release' }}
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v3
+      - uses: actions/download-artifact@v3
+        with:
+          path: artifacts/
+
+      - name: Upload assets
+        # fun - artifacts are downloaded into "artifact/".
+        working-directory: artifacts/artifact
+        run: |
+          set -Eeuxo pipefail
+          for BIN_NAME in $(ls)
+          do
+            curl -L \
+              --no-progress-meter \
+              -X POST \
+              -H "Authorization: Bearer ${{ secrets.GITHUB_TOKEN }}"\
+              -H "Content-Type: application/octet-stream" \
+              "https://uploads.github.com/repos/${{ github.repository }}/releases/${{ github.event.release.id }}/assets?name=${BIN_NAME}" \
+              --data-binary "@${BIN_NAME}"
+          done
diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index 8c7e355d26..a693d2c97d 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -1,4 +1,4 @@
-name: era compiler tester
+name: Era compiler tester
 
 # run the matter labs compiler test to integrate their test cases
 # this is intended as a diagnostic / spot check to check that we
diff --git a/.github/workflows/ghcr.yml b/.github/workflows/ghcr.yml
index 4bc2885bdb..a35a22e278 100644
--- a/.github/workflows/ghcr.yml
+++ b/.github/workflows/ghcr.yml
@@ -8,8 +8,6 @@ name: Deploy docker image to ghcr
 
 on:
   push:
-    tags:
-      - '*'
     branches:
       - master
   release:
diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index e6e5f2a6f9..44c6978295 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -1,7 +1,7 @@
-# This workflows will upload a Python Package using Twine when a release is created
+# This workflow will upload a Python Package using Twine when a release is created
 # For more information see: https://help.github.com/en/actions/language-and-framework-guides/using-python-with-github-actions#publishing-to-package-registries
 
-name: Publish
+name: Publish to PyPI
 
 on:
   release:
diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 94e8c7c8f6..42e0524b13 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -1,4 +1,4 @@
-name: Test
+name: Run test suite
 
 on: [push, pull_request]
 

From 981fcdabd66c5823c5a2f00e02b57413a7dd4ad3 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Thu, 1 Jun 2023 00:09:33 +0800
Subject: [PATCH 065/161] fix: type inference for ternary operator literals
 (#3460)

---
 tests/parser/syntax/test_ternary.py    | 5 +++++
 vyper/semantics/analysis/annotation.py | 2 +-
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/tests/parser/syntax/test_ternary.py b/tests/parser/syntax/test_ternary.py
index 11c06051d0..325be3e43b 100644
--- a/tests/parser/syntax/test_ternary.py
+++ b/tests/parser/syntax/test_ternary.py
@@ -10,6 +10,11 @@
 def foo(a: uint256, b: uint256) -> uint256:
     return a if a > b else b
     """,
+    """
+@external
+def foo():
+    a: bool = (True if True else True) or True
+    """,
     # different locations:
     """
 b: uint256
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index e501be5fdb..3ea0319b54 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -271,7 +271,7 @@ def visit_UnaryOp(self, node, type_):
     def visit_IfExp(self, node, type_):
         if type_ is None:
             ts = get_common_types(node.body, node.orelse)
-            if len(type_) == 1:
+            if len(ts) == 1:
                 type_ = ts.pop()
 
         node._metadata["type"] = type_

From 7f18aeee59abbf3f4657edc94a8b354731cce19b Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 31 May 2023 13:00:13 -0400
Subject: [PATCH 066/161] docs: shanghai is default compilation target (#3474)

in v0.3.9 release notes
---
 docs/release-notes.rst | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 22d89614db..dcdbcda74a 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -44,6 +44,8 @@ Non-breaking changes and improvements:
 - drop support for python 3.8 and 3.9 (`#3325 <https://github.com/vyperlang/vyper/pull/3325>`_)
 - build for ``aarch64`` (`#2687 <https://github.com/vyperlang/vyper/pull/2687>`_)
 
+Note that with the addition of ``push0`` opcode, ``shanghai`` is now the default compilation target for vyper. When deploying to a chain which does not support ``shanghai``, it is recommended to set ``--evm-version`` to ``paris``, otherwise it could result in hard-to-debug errors.
+
 Major refactoring PRs:
 
 - refactor front-end type system (`#2974 <https://github.com/vyperlang/vyper/pull/2974>`_)

From 07f3cb091a30d06d45e626f49e8189260153aaa6 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 1 Jun 2023 15:46:37 -0400
Subject: [PATCH 067/161] chore: drop evm versions through istanbul (#3470)

drop pre-istanbul versions. per VIP-3365, we could drop through paris,
but since this is the first time starting to enforce this policy, we
don't want to drop too many versions at once.
---
 docs/compiling-a-contract.rst                 | 29 +++++----
 tests/cli/vyper_compile/test_compile_files.py | 26 --------
 .../test_compile_from_input_dict.py           |  9 ---
 tests/cli/vyper_json/test_get_settings.py     | 14 ++++-
 tests/compiler/test_opcodes.py                | 33 +++++-----
 tests/parser/functions/test_bitwise.py        | 13 +---
 tests/parser/syntax/test_chainid.py           | 16 ++---
 tests/parser/syntax/test_codehash.py          |  7 ---
 vyper/cli/vyper_compile.py                    |  2 +-
 vyper/cli/vyper_json.py                       | 10 ++-
 vyper/codegen/arithmetic.py                   | 11 +---
 vyper/codegen/core.py                         | 14 +----
 vyper/codegen/expr.py                         |  5 --
 vyper/codegen/external_call.py                |  3 +-
 vyper/evm/opcodes.py                          | 63 +++++++------------
 vyper/ir/optimizer.py                         |  9 +--
 16 files changed, 95 insertions(+), 169 deletions(-)

diff --git a/docs/compiling-a-contract.rst b/docs/compiling-a-contract.rst
index 4a03347536..36d0c8cb74 100644
--- a/docs/compiling-a-contract.rst
+++ b/docs/compiling-a-contract.rst
@@ -140,24 +140,29 @@ Target Options
 The following is a list of supported EVM versions, and changes in the compiler introduced with each version. Backward compatibility is not guaranteed between each version.
 
 
-.. py:attribute:: byzantium
+.. py:attribute:: istanbul
 
-   - The oldest EVM version supported by Vyper.
+   - The ``CHAINID`` opcode is accessible via ``chain.id``
+   - The ``SELFBALANCE`` opcode is used for calls to ``self.balance``
+   - Gas estimates changed for ``SLOAD`` and ``BALANCE``
 
-.. py:attribute:: constantinople
+.. py:attribute:: berlin
+   - Gas estimates changed for ``EXTCODESIZE``, ``EXTCODECOPY``, ``EXTCODEHASH``, ``SLOAD``, ``SSTORE``, ``CALL``, ``CALLCODE``, ``DELEGATECALL`` and ``STATICCALL``
+   - Functions marked with ``@nonreentrant`` are protected with different values (3 and 2) than contracts targeting pre-berlin.
+   - ``BASEFEE`` is accessible via ``block.basefee``
 
-   - The ``EXTCODEHASH`` opcode is accessible via ``address.codehash``
-   - ``shift`` makes use of ``SHL``/``SHR`` opcodes.
+.. py:attribute:: paris
+   - ``block.difficulty`` is deprecated in favor of its new alias, ``block.prevrandao``.
 
-.. py:attribute:: petersburg
+.. py:attribute:: shanghai
+   - The ``PUSH0`` opcode is automatically generated by the compiler instead of ``PUSH1 0``
 
-   - The compiler behaves the same way as with constantinople.
+.. py:attribute:: cancun (experimental)
+
+   - The ``transient`` keyword allows declaration of variables which live in transient storage
+   - Functions marked with ``@nonreentrant`` are protected with TLOAD/TSTORE instead of SLOAD/SSTORE
 
-.. py:attribute:: istanbul (default)
 
-   - The ``CHAINID`` opcode is accessible via ``chain.id``
-   - The ``SELFBALANCE`` opcode is used for calls to ``self.balance``
-   - Gas estimates changed for ``SLOAD`` and ``BALANCE``
 
 
 Compiler Input and Output JSON Description
@@ -204,7 +209,7 @@ The following example describes the expected input format of ``vyper-json``. Com
         },
         // Optional
         "settings": {
-            "evmVersion": "istanbul",  // EVM version to compile for. Can be byzantium, constantinople, petersburg or istanbul.
+            "evmVersion": "shanghai",  // EVM version to compile for. Can be istanbul, berlin, paris, shanghai (default) or cancun (experimental!).
             // optional, whether or not optimizations are turned on
             // defaults to true
             "optimize": true,
diff --git a/tests/cli/vyper_compile/test_compile_files.py b/tests/cli/vyper_compile/test_compile_files.py
index 796976ae0e..31cf622658 100644
--- a/tests/cli/vyper_compile/test_compile_files.py
+++ b/tests/cli/vyper_compile/test_compile_files.py
@@ -28,29 +28,3 @@ def test_combined_json_keys(tmp_path):
 def test_invalid_root_path():
     with pytest.raises(FileNotFoundError):
         compile_files([], [], root_folder="path/that/does/not/exist")
-
-
-def test_evm_versions(tmp_path):
-    # should compile differently because of SELFBALANCE
-    code = """
-@external
-def foo() -> uint256:
-    return self.balance
-"""
-
-    bar_path = tmp_path.joinpath("bar.vy")
-    with bar_path.open("w") as fp:
-        fp.write(code)
-
-    byzantium_bytecode = compile_files(
-        [bar_path], output_formats=["bytecode"], evm_version="byzantium"
-    )[str(bar_path)]["bytecode"]
-    istanbul_bytecode = compile_files(
-        [bar_path], output_formats=["bytecode"], evm_version="istanbul"
-    )[str(bar_path)]["bytecode"]
-
-    assert byzantium_bytecode != istanbul_bytecode
-
-    # SELFBALANCE opcode is 0x47
-    assert "47" not in byzantium_bytecode
-    assert "47" in istanbul_bytecode
diff --git a/tests/cli/vyper_json/test_compile_from_input_dict.py b/tests/cli/vyper_json/test_compile_from_input_dict.py
index a5a31a522b..a6d0a23100 100644
--- a/tests/cli/vyper_json/test_compile_from_input_dict.py
+++ b/tests/cli/vyper_json/test_compile_from_input_dict.py
@@ -130,12 +130,3 @@ def test_relative_import_paths():
     input_json["sources"]["contracts/potato/baz/potato.vy"] = {"content": """from . import baz"""}
     input_json["sources"]["contracts/potato/footato.vy"] = {"content": """from baz import baz"""}
     compile_from_input_dict(input_json)
-
-
-def test_evm_version():
-    # should compile differently because of SELFBALANCE
-    input_json = deepcopy(INPUT_JSON)
-    input_json["settings"]["evmVersion"] = "byzantium"
-    compiled = compile_from_input_dict(input_json)
-    input_json["settings"]["evmVersion"] = "istanbul"
-    assert compiled != compile_from_input_dict(input_json)
diff --git a/tests/cli/vyper_json/test_get_settings.py b/tests/cli/vyper_json/test_get_settings.py
index ca60d2cf5a..7530e85ef8 100644
--- a/tests/cli/vyper_json/test_get_settings.py
+++ b/tests/cli/vyper_json/test_get_settings.py
@@ -12,13 +12,23 @@ def test_unknown_evm():
         get_evm_version({"settings": {"evmVersion": "foo"}})
 
 
-@pytest.mark.parametrize("evm_version", ["homestead", "tangerineWhistle", "spuriousDragon"])
+@pytest.mark.parametrize(
+    "evm_version",
+    [
+        "homestead",
+        "tangerineWhistle",
+        "spuriousDragon",
+        "byzantium",
+        "constantinople",
+        "petersburg",
+    ],
+)
 def test_early_evm(evm_version):
     with pytest.raises(JSONError):
         get_evm_version({"settings": {"evmVersion": evm_version}})
 
 
-@pytest.mark.parametrize("evm_version", ["byzantium", "constantinople", "petersburg"])
+@pytest.mark.parametrize("evm_version", ["istanbul", "berlin", "paris", "shanghai", "cancun"])
 def test_valid_evm(evm_version):
     assert evm_version == get_evm_version({"settings": {"evmVersion": evm_version}})
 
diff --git a/tests/compiler/test_opcodes.py b/tests/compiler/test_opcodes.py
index 3c595dee44..b9841b92f0 100644
--- a/tests/compiler/test_opcodes.py
+++ b/tests/compiler/test_opcodes.py
@@ -37,30 +37,27 @@ def test_version_check(evm_version):
     assert opcodes.version_check(begin=evm_version)
     assert opcodes.version_check(end=evm_version)
     assert opcodes.version_check(begin=evm_version, end=evm_version)
-    if evm_version not in ("byzantium", "atlantis"):
-        assert not opcodes.version_check(end="byzantium")
+    if evm_version not in ("istanbul"):
+        assert not opcodes.version_check(end="istanbul")
     istanbul_check = opcodes.version_check(begin="istanbul")
     assert istanbul_check == (opcodes.EVM_VERSIONS[evm_version] >= opcodes.EVM_VERSIONS["istanbul"])
 
 
 def test_get_opcodes(evm_version):
     ops = opcodes.get_opcodes()
-    if evm_version in ("paris", "berlin", "shanghai", "cancun"):
-        assert "CHAINID" in ops
+
+    assert "CHAINID" in ops
+    assert ops["CREATE2"][-1] == 32000
+
+    if evm_version in ("london", "berlin", "paris", "shanghai", "cancun"):
         assert ops["SLOAD"][-1] == 2100
-        if evm_version in ("shanghai", "cancun"):
-            assert "PUSH0" in ops
-        if evm_version in ("cancun",):
-            assert "TLOAD" in ops
-            assert "TSTORE" in ops
-    elif evm_version == "istanbul":
-        assert "CHAINID" in ops
-        assert ops["SLOAD"][-1] == 800
     else:
-        assert "CHAINID" not in ops
-        assert ops["SLOAD"][-1] == 200
+        assert evm_version == "istanbul"
+        assert ops["SLOAD"][-1] == 800
 
-    if evm_version in ("byzantium", "atlantis"):
-        assert "CREATE2" not in ops
-    else:
-        assert ops["CREATE2"][-1] == 32000
+    if evm_version in ("shanghai", "cancun"):
+        assert "PUSH0" in ops
+
+    if evm_version in ("cancun",):
+        assert "TLOAD" in ops
+        assert "TSTORE" in ops
diff --git a/tests/parser/functions/test_bitwise.py b/tests/parser/functions/test_bitwise.py
index 800803907a..3e18bd292c 100644
--- a/tests/parser/functions/test_bitwise.py
+++ b/tests/parser/functions/test_bitwise.py
@@ -35,12 +35,8 @@ def _shr(x: uint256, y: uint256) -> uint256:
 @pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
 def test_bitwise_opcodes(evm_version):
     opcodes = compile_code(code, ["opcodes"], evm_version=evm_version)["opcodes"]
-    if evm_version in ("byzantium", "atlantis"):
-        assert "SHL" not in opcodes
-        assert "SHR" not in opcodes
-    else:
-        assert "SHL" in opcodes
-        assert "SHR" in opcodes
+    assert "SHL" in opcodes
+    assert "SHR" in opcodes
 
 
 @pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
@@ -59,10 +55,7 @@ def test_test_bitwise(get_contract_with_gas_estimation, evm_version):
             assert c._shl(t, s) == (t << s) % (2**256)
 
 
-POST_BYZANTIUM = [k for (k, v) in EVM_VERSIONS.items() if v > 0]
-
-
-@pytest.mark.parametrize("evm_version", POST_BYZANTIUM)
+@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS.keys()))
 def test_signed_shift(get_contract_with_gas_estimation, evm_version):
     code = """
 @external
diff --git a/tests/parser/syntax/test_chainid.py b/tests/parser/syntax/test_chainid.py
index eb2ed36325..be960f2fc5 100644
--- a/tests/parser/syntax/test_chainid.py
+++ b/tests/parser/syntax/test_chainid.py
@@ -2,7 +2,7 @@
 
 from vyper import compiler
 from vyper.evm.opcodes import EVM_VERSIONS
-from vyper.exceptions import EvmVersionException, InvalidType, TypeMismatch
+from vyper.exceptions import InvalidType, TypeMismatch
 
 
 @pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
@@ -13,11 +13,7 @@ def foo():
     a: uint256 = chain.id
     """
 
-    if EVM_VERSIONS[evm_version] < 2:
-        with pytest.raises(EvmVersionException):
-            compiler.compile_code(code, evm_version=evm_version)
-    else:
-        compiler.compile_code(code, evm_version=evm_version)
+    assert compiler.compile_code(code, evm_version=evm_version) is not None
 
 
 fail_list = [
@@ -71,10 +67,10 @@ def foo(inp: Bytes[10]) -> Bytes[3]:
 def test_chain_fail(bad_code):
     if isinstance(bad_code, tuple):
         with pytest.raises(bad_code[1]):
-            compiler.compile_code(bad_code[0], evm_version="istanbul")
+            compiler.compile_code(bad_code[0])
     else:
         with pytest.raises(TypeMismatch):
-            compiler.compile_code(bad_code, evm_version="istanbul")
+            compiler.compile_code(bad_code)
 
 
 valid_list = [
@@ -95,7 +91,7 @@ def check_chain_id(c: uint256) -> bool:
 
 @pytest.mark.parametrize("good_code", valid_list)
 def test_chain_success(good_code):
-    assert compiler.compile_code(good_code, evm_version="istanbul") is not None
+    assert compiler.compile_code(good_code) is not None
 
 
 def test_chainid_operation(get_contract_with_gas_estimation):
@@ -105,5 +101,5 @@ def test_chainid_operation(get_contract_with_gas_estimation):
 def get_chain_id() -> uint256:
     return chain.id
     """
-    c = get_contract_with_gas_estimation(code, evm_version="istanbul")
+    c = get_contract_with_gas_estimation(code)
     assert c.get_chain_id() == 131277322940537  # Default value of py-evm
diff --git a/tests/parser/syntax/test_codehash.py b/tests/parser/syntax/test_codehash.py
index 8c1e430d32..e4b6d90d8d 100644
--- a/tests/parser/syntax/test_codehash.py
+++ b/tests/parser/syntax/test_codehash.py
@@ -2,7 +2,6 @@
 
 from vyper.compiler import compile_code
 from vyper.evm.opcodes import EVM_VERSIONS
-from vyper.exceptions import EvmVersionException
 from vyper.utils import keccak256
 
 
@@ -32,12 +31,6 @@ def foo3() -> bytes32:
 def foo4() -> bytes32:
     return self.a.codehash
     """
-
-    if evm_version in ("byzantium", "atlantis"):
-        with pytest.raises(EvmVersionException):
-            compile_code(code, evm_version=evm_version)
-        return
-
     compiled = compile_code(
         code, ["bytecode_runtime"], evm_version=evm_version, no_optimize=no_optimize
     )
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 4dfc87639a..f5e113116d 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -102,7 +102,7 @@ def _parse_args(argv):
     parser.add_argument(
         "--evm-version",
         help=f"Select desired EVM version (default {DEFAULT_EVM_VERSION}). "
-        " note: cancun support is EXPERIMENTAL",
+        "note: cancun support is EXPERIMENTAL",
         choices=list(EVM_VERSIONS),
         default=DEFAULT_EVM_VERSION,
         dest="evm_version",
diff --git a/vyper/cli/vyper_json.py b/vyper/cli/vyper_json.py
index 2fbf58aec4..9778848aa2 100755
--- a/vyper/cli/vyper_json.py
+++ b/vyper/cli/vyper_json.py
@@ -149,8 +149,14 @@ def get_evm_version(input_dict: Dict) -> str:
         return DEFAULT_EVM_VERSION
 
     evm_version = input_dict["settings"].get("evmVersion", DEFAULT_EVM_VERSION)
-    if evm_version in ("homestead", "tangerineWhistle", "spuriousDragon"):
-        raise JSONError("Vyper does not support pre-byzantium EVM versions")
+    if evm_version in (
+        "homestead",
+        "tangerineWhistle",
+        "spuriousDragon",
+        "byzantium",
+        "constantinople",
+    ):
+        raise JSONError("Vyper does not support pre-istanbul EVM versions")
     if evm_version not in EVM_VERSIONS:
         raise JSONError(f"Unknown EVM version - '{evm_version}'")
 
diff --git a/vyper/codegen/arithmetic.py b/vyper/codegen/arithmetic.py
index eb2df20922..f14069384a 100644
--- a/vyper/codegen/arithmetic.py
+++ b/vyper/codegen/arithmetic.py
@@ -10,7 +10,6 @@
     is_numeric_type,
 )
 from vyper.codegen.ir_node import IRnode
-from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, TypeCheckFailure, UnimplementedException
 
 
@@ -243,10 +242,7 @@ def safe_mul(x, y):
             # in the above sdiv check, if (r==-1 and l==-2**255),
             # -2**255<res> / -1<r> will return -2**255<l>.
             # need to check: not (r == -1 and l == -2**255)
-            if version_check(begin="constantinople"):
-                upper_bound = ["shl", 255, 1]
-            else:
-                upper_bound = -(2**255)
+            upper_bound = ["shl", 255, 1]
 
             check_x = ["ne", x, upper_bound]
             check_y = ["ne", ["not", y], 0]
@@ -301,10 +297,7 @@ def safe_div(x, y):
     with res.cache_when_complex("res") as (b1, res):
         # TODO: refactor this condition / push some things into the optimizer
         if typ.is_signed and typ.bits == 256:
-            if version_check(begin="constantinople"):
-                upper_bound = ["shl", 255, 1]
-            else:
-                upper_bound = -(2**255)
+            upper_bound = ["shl", 255, 1]
 
             if not x.is_literal and not y.is_literal:
                 ok = ["or", ["ne", y, ["not", 0]], ["ne", x, upper_bound]]
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 06140f3f52..58d9db9889 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -1,7 +1,6 @@
 from vyper import ast as vy_ast
 from vyper.codegen.ir_node import Encoding, IRnode
 from vyper.evm.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE, TRANSIENT
-from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StructureException, TypeCheckFailure, TypeMismatch
 from vyper.semantics.types import (
     AddressT,
@@ -997,23 +996,16 @@ def zero_pad(bytez_placeholder):
 
 # convenience rewrites for shr/sar/shl
 def shr(bits, x):
-    if version_check(begin="constantinople"):
-        return ["shr", bits, x]
-    return ["div", x, ["exp", 2, bits]]
+    return ["shr", bits, x]
 
 
 # convenience rewrites for shr/sar/shl
 def shl(bits, x):
-    if version_check(begin="constantinople"):
-        return ["shl", bits, x]
-    return ["mul", x, ["exp", 2, bits]]
+    return ["shl", bits, x]
 
 
 def sar(bits, x):
-    if version_check(begin="constantinople"):
-        return ["sar", bits, x]
-
-    raise NotImplementedError("no SAR emulation for pre-constantinople EVM")
+    return ["sar", bits, x]
 
 
 def clamp_bytestring(ir_node):
diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index ac7290836b..d637a454bc 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -242,10 +242,6 @@ def parse_Attribute(self):
         # x.codehash: keccak of address x
         elif self.expr.attr == "codehash":
             addr = Expr.parse_value_expr(self.expr.value, self.context)
-            if not version_check(begin="constantinople"):
-                raise EvmVersionException(
-                    "address.codehash is unavailable prior to constantinople ruleset", self.expr
-                )
             if addr.typ == AddressT():
                 return IRnode.from_list(["extcodehash", addr], typ=BYTES32_T)
         # x.code: codecopy/extcodecopy of address x
@@ -401,7 +397,6 @@ def parse_BinOp(self):
                 # TODO implement me. promote_signed_int(op(right, left), bits)
                 return
             op = shr if not left.typ.is_signed else sar
-            # note: sar NotImplementedError for pre-constantinople
             return IRnode.from_list(op(right, left), typ=new_typ)
 
         # enums can only do bit ops, not arithmetic.
diff --git a/vyper/codegen/external_call.py b/vyper/codegen/external_call.py
index c4eb182eb1..ba89f3cace 100644
--- a/vyper/codegen/external_call.py
+++ b/vyper/codegen/external_call.py
@@ -63,8 +63,7 @@ def _pack_arguments(fn_type, args, context):
     # 32 bytes                 | args
     # 0x..00<method_id_4bytes> | args
     # the reason for the left padding is just so the alignment is easier.
-    # if we were only targeting constantinople, we could align
-    # to buf (and also keep code size small) by using
+    # XXX: we could align to buf (and also keep code size small) by using
     # (mstore buf (shl signature.method_id 224))
     pack_args = ["seq"]
     pack_args.append(["mstore", buf, util.method_id_int(abi_signature)])
diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index c447fd863c..00e0986939 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -7,28 +7,13 @@
 # 1. Fork rules go from oldest (lowest value) to newest (highest value).
 # 2. Fork versions aren't actually tied to anything. They are not a part of our
 #    official API. *DO NOT USE THE VALUES FOR ANYTHING IMPORTANT* besides versioning.
-# 3. When support for an older version is dropped, the numbers should *not* change to
-#    reflect it (i.e. dropping support for version 0 removes version 0 entirely).
-# 4. There can be multiple aliases to the same version number (but not the reverse).
-# 5. When supporting multiple chains, if a chain gets a fix first, it increments the
-#    number first.
-# 6. Yes, this will probably have to be rethought if there's ever conflicting support
-#    between multiple chains for a specific feature. Let's hope not.
-# 7. We support at a maximum 3 hard forks (for any given chain).
-EVM_VERSIONS: dict[str, int] = {
-    # ETH Forks
-    "byzantium": 0,
-    "constantinople": 1,
-    "petersburg": 1,
-    "istanbul": 2,
-    "berlin": 3,
-    "paris": 4,
-    "shanghai": 5,
-    "cancun": 6,
-    # ETC Forks
-    "atlantis": 0,
-    "agharta": 1,
-}
+# 3. Per VIP-3365, we support mainnet fork choice rules up to 1 year old
+#    (and may optionally have forward support for experimental/unreleased
+#    fork choice rules)
+_evm_versions = ("istanbul", "berlin", "london", "paris", "shanghai", "cancun")
+EVM_VERSIONS: dict[str, int] = dict((v, i) for i, v in enumerate(_evm_versions))
+
+
 DEFAULT_EVM_VERSION: str = "shanghai"
 active_evm_version: int = EVM_VERSIONS[DEFAULT_EVM_VERSION]
 
@@ -36,7 +21,7 @@
 # opcode as hex value
 # number of values removed from stack
 # number of values added to stack
-# gas cost (byzantium, constantinople, istanbul, berlin)
+# gas cost (istanbul, berlin, paris, shanghai, cancun)
 OPCODES: OpcodeMap = {
     "STOP": (0x00, 0, 0, 0),
     "ADD": (0x01, 2, 1, 3),
@@ -61,12 +46,12 @@
     "XOR": (0x18, 2, 1, 3),
     "NOT": (0x19, 1, 1, 3),
     "BYTE": (0x1A, 2, 1, 3),
-    "SHL": (0x1B, 2, 1, (None, 3)),
-    "SHR": (0x1C, 2, 1, (None, 3)),
-    "SAR": (0x1D, 2, 1, (None, 3)),
+    "SHL": (0x1B, 2, 1, 3),
+    "SHR": (0x1C, 2, 1, 3),
+    "SAR": (0x1D, 2, 1, 3),
     "SHA3": (0x20, 2, 1, 30),
     "ADDRESS": (0x30, 0, 1, 2),
-    "BALANCE": (0x31, 1, 1, (400, 400, 700)),
+    "BALANCE": (0x31, 1, 1, 700),
     "ORIGIN": (0x32, 0, 1, 2),
     "CALLER": (0x33, 0, 1, 2),
     "CALLVALUE": (0x34, 0, 1, 2),
@@ -76,11 +61,11 @@
     "CODESIZE": (0x38, 0, 1, 2),
     "CODECOPY": (0x39, 3, 0, 3),
     "GASPRICE": (0x3A, 0, 1, 2),
-    "EXTCODESIZE": (0x3B, 1, 1, (700, 700, 700, 2600)),
-    "EXTCODECOPY": (0x3C, 4, 0, (700, 700, 700, 2600)),
+    "EXTCODESIZE": (0x3B, 1, 1, (700, 2600)),
+    "EXTCODECOPY": (0x3C, 4, 0, (700, 2600)),
     "RETURNDATASIZE": (0x3D, 0, 1, 2),
     "RETURNDATACOPY": (0x3E, 3, 0, 3),
-    "EXTCODEHASH": (0x3F, 1, 1, (None, 400, 700, 2600)),
+    "EXTCODEHASH": (0x3F, 1, 1, (700, 2600)),
     "BLOCKHASH": (0x40, 1, 1, 20),
     "COINBASE": (0x41, 0, 1, 2),
     "TIMESTAMP": (0x42, 0, 1, 2),
@@ -88,14 +73,14 @@
     "DIFFICULTY": (0x44, 0, 1, 2),
     "PREVRANDAO": (0x44, 0, 1, 2),
     "GASLIMIT": (0x45, 0, 1, 2),
-    "CHAINID": (0x46, 0, 1, (None, None, 2)),
-    "SELFBALANCE": (0x47, 0, 1, (None, None, 5)),
-    "BASEFEE": (0x48, 0, 1, (None, None, None, 2)),
+    "CHAINID": (0x46, 0, 1, 2),
+    "SELFBALANCE": (0x47, 0, 1, 5),
+    "BASEFEE": (0x48, 0, 1, (None, 2)),
     "POP": (0x50, 1, 0, 2),
     "MLOAD": (0x51, 1, 1, 3),
     "MSTORE": (0x52, 2, 0, 3),
     "MSTORE8": (0x53, 2, 0, 3),
-    "SLOAD": (0x54, 1, 1, (200, 200, 800, 2100)),
+    "SLOAD": (0x54, 1, 1, (800, 2100)),
     "SSTORE": (0x55, 2, 0, 20000),
     "JUMP": (0x56, 1, 0, 8),
     "JUMPI": (0x57, 2, 0, 10),
@@ -174,13 +159,13 @@
     "LOG3": (0xA3, 5, 0, 1500),
     "LOG4": (0xA4, 6, 0, 1875),
     "CREATE": (0xF0, 3, 1, 32000),
-    "CALL": (0xF1, 7, 1, (700, 700, 700, 2100)),
-    "CALLCODE": (0xF2, 7, 1, (700, 700, 700, 2100)),
+    "CALL": (0xF1, 7, 1, (700, 2100)),
+    "CALLCODE": (0xF2, 7, 1, (700, 2100)),
     "RETURN": (0xF3, 2, 0, 0),
-    "DELEGATECALL": (0xF4, 6, 1, (700, 700, 700, 2100)),
-    "CREATE2": (0xF5, 4, 1, (None, 32000)),
+    "DELEGATECALL": (0xF4, 6, 1, (700, 2100)),
+    "CREATE2": (0xF5, 4, 1, 32000),
     "SELFDESTRUCT": (0xFF, 1, 0, 25000),
-    "STATICCALL": (0xFA, 6, 1, (700, 700, 700, 2100)),
+    "STATICCALL": (0xFA, 6, 1, (700, 2100)),
     "REVERT": (0xFD, 2, 0, 0),
     "INVALID": (0xFE, 0, 0, 0),
     "DEBUG": (0xA5, 1, 0, 0),
diff --git a/vyper/ir/optimizer.py b/vyper/ir/optimizer.py
index fb10b515cc..b13c6f79f8 100644
--- a/vyper/ir/optimizer.py
+++ b/vyper/ir/optimizer.py
@@ -2,7 +2,6 @@
 from typing import List, Optional, Tuple, Union
 
 from vyper.codegen.ir_node import IRnode
-from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StaticAssertionException
 from vyper.utils import (
     ceil32,
@@ -340,19 +339,17 @@ def _conservative_eq(x, y):
         if binop == "mod":
             return finalize("and", [args[0], _int(args[1]) - 1])
 
-        if binop == "div" and version_check(begin="constantinople"):
+        if binop == "div":
             # x / 2**n == x >> n
             # recall shr/shl have unintuitive arg order
             return finalize("shr", [int_log2(_int(args[1])), args[0]])
 
         # note: no rule for sdiv since it rounds differently from sar
-        if binop == "mul" and version_check(begin="constantinople"):
+        if binop == "mul":
             # x * 2**n == x << n
             return finalize("shl", [int_log2(_int(args[1])), args[0]])
 
-        # reachable but only before constantinople
-        if version_check(begin="constantinople"):  # pragma: no cover
-            raise CompilerPanic("unreachable")
+        raise CompilerPanic("unreachable")  # pragma: no cover
 
     ##
     # COMPARISONS

From 795d9f5a389b4c4e05869be06ae016e47a2f0173 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 1 Jun 2023 17:26:15 -0400
Subject: [PATCH 068/161] docs: fix borked formatting for rulesets (#3476)

---
 docs/compiling-a-contract.rst | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/docs/compiling-a-contract.rst b/docs/compiling-a-contract.rst
index 36d0c8cb74..6295226bca 100644
--- a/docs/compiling-a-contract.rst
+++ b/docs/compiling-a-contract.rst
@@ -147,14 +147,17 @@ The following is a list of supported EVM versions, and changes in the compiler i
    - Gas estimates changed for ``SLOAD`` and ``BALANCE``
 
 .. py:attribute:: berlin
+
    - Gas estimates changed for ``EXTCODESIZE``, ``EXTCODECOPY``, ``EXTCODEHASH``, ``SLOAD``, ``SSTORE``, ``CALL``, ``CALLCODE``, ``DELEGATECALL`` and ``STATICCALL``
    - Functions marked with ``@nonreentrant`` are protected with different values (3 and 2) than contracts targeting pre-berlin.
    - ``BASEFEE`` is accessible via ``block.basefee``
 
 .. py:attribute:: paris
+
    - ``block.difficulty`` is deprecated in favor of its new alias, ``block.prevrandao``.
 
-.. py:attribute:: shanghai
+.. py:attribute:: shanghai (default)
+
    - The ``PUSH0`` opcode is automatically generated by the compiler instead of ``PUSH1 0``
 
 .. py:attribute:: cancun (experimental)

From 0e201316e63284d52bbe1410fdfaafe2a378616a Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 1 Jun 2023 23:55:42 -0400
Subject: [PATCH 069/161] chore: fix era compiler tester workflow (#3477)

auto-detect vyper version
only run full llvm matrix on push to master
---
 .github/workflows/era-tester.yml | 23 ++++++++++++++++++-----
 1 file changed, 18 insertions(+), 5 deletions(-)

diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index a693d2c97d..8a2a3e50ce 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -85,14 +85,27 @@ jobs:
           **/era-compiler-tester
         key: ${{ runner.os }}-${{ env.ERA_HASH }}-${{ env.ERA_VYPER_HASH }}
 
-    - name: Install Vyper
+    - name: Build Vyper
       run: |
+        set -Eeuxo pipefail
         pip install .
+        echo "VYPER_VERSION=$(vyper --version | cut -f1 -d'+')" >> $GITHUB_ENV
+
+    - name: Install Vyper
+      run: |
         mkdir era-compiler-tester/vyper-bin
-        echo $(which vyper)
-        cp $(which vyper) era-compiler-tester/vyper-bin/vyper-0.3.8
+        cp $(which vyper) era-compiler-tester/vyper-bin/vyper-${{ env.VYPER_VERSION }}
+
+    - name: Run tester (fast)
+      # Run era tester with no LLVM optimizations
+      if: ${{ github.ref != 'refs/heads/master' }}
+      run: |
+        cd era-compiler-tester
+        cargo run --release --bin compiler-tester -- -v --path=tests/vyper/ --mode="M0B0 ${{ env.VYPER_VERSION }}"
 
-    - name: Run tester
+    - name: Run tester (slow)
+      # Run era tester across the LLVM optimization matrix
+      if: ${{ github.ref == 'refs/heads/master' }}
       run: |
         cd era-compiler-tester
-        cargo run --release --bin compiler-tester -- -v --path='tests/vyper/' --mode='M*B* 0.3.8'
+        cargo run --release --bin compiler-tester -- -v --path=tests/vyper/ --mode="M*B* ${{ env.VYPER_VERSION }}"

From a71d604513c1cf711b188ca3826325ffb58e35a0 Mon Sep 17 00:00:00 2001
From: antazoey <jules@apeworx.io>
Date: Fri, 2 Jun 2023 09:27:23 -0600
Subject: [PATCH 070/161] chore: rm redundant var declaration (#3478)

it was apparently there as a type hint but it is no longer needed
---
 vyper/codegen/module.py | 5 +----
 1 file changed, 1 insertion(+), 4 deletions(-)

diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 64d5a8b70c..b98e4d0f86 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -1,8 +1,7 @@
 # a contract.vy -- all functions and constructor
 
-from typing import Any, List, Optional
+from typing import Any, List
 
-from vyper import ast as vy_ast
 from vyper.codegen.core import shr
 from vyper.codegen.function_definitions import generate_ir_for_function
 from vyper.codegen.global_context import GlobalContext
@@ -141,8 +140,6 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
     # order functions so that each function comes after all of its callees
     function_defs = _topsort(global_ctx.functions)
 
-    init_function: Optional[vy_ast.FunctionDef] = None
-
     runtime_functions = [f for f in function_defs if not _is_constructor(f)]
     init_function = next((f for f in function_defs if _is_constructor(f)), None)
 

From f0f9377748a6089dc8a39db692c8ad4c51a11f40 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 8 Jun 2023 13:30:14 -0700
Subject: [PATCH 071/161] chore: update tload/tstore opcodes per latest 1153
 (#3484)

---
 vyper/evm/opcodes.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index 00e0986939..7550d047b5 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -170,8 +170,8 @@
     "INVALID": (0xFE, 0, 0, 0),
     "DEBUG": (0xA5, 1, 0, 0),
     "BREAKPOINT": (0xA6, 0, 0, 0),
-    "TLOAD": (0xB3, 1, 1, 100),
-    "TSTORE": (0xB4, 2, 0, 100),
+    "TLOAD": (0x5C, 1, 1, 100),
+    "TSTORE": (0x5D, 2, 0, 100),
 }
 
 PSEUDO_OPCODES: OpcodeMap = {

From c90ab2fb26d66ad2121bf967dabe738ee8eaf21e Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Thu, 15 Jun 2023 00:57:27 +0800
Subject: [PATCH 072/161] feat: let params of internal functions be mutable
 (#3473)

params to internal functions are never in calldata, so we don't need to
have any write restrictions.
---
 tests/parser/features/test_assignment.py      | 115 +++++++++++++++++-
 .../function_definitions/internal_function.py |   4 +-
 vyper/semantics/analysis/local.py             |   9 +-
 3 files changed, 121 insertions(+), 7 deletions(-)

diff --git a/tests/parser/features/test_assignment.py b/tests/parser/features/test_assignment.py
index 0dd63a0d09..29ec820484 100644
--- a/tests/parser/features/test_assignment.py
+++ b/tests/parser/features/test_assignment.py
@@ -39,7 +39,118 @@ def augmod(x: int128, y: int128) -> int128:
     print("Passed aug-assignment test")
 
 
-def test_invalid_assign(assert_compile_failed, get_contract_with_gas_estimation):
+@pytest.mark.parametrize(
+    "typ,in_val,out_val",
+    [
+        ("uint256", 77, 123),
+        ("uint256[3]", [1, 2, 3], [4, 5, 6]),
+        ("DynArray[uint256, 3]", [1, 2, 3], [4, 5, 6]),
+        ("Bytes[5]", b"vyper", b"conda"),
+    ],
+)
+def test_internal_assign(get_contract_with_gas_estimation, typ, in_val, out_val):
+    code = f"""
+@internal
+def foo(x: {typ}) -> {typ}:
+    x = {out_val}
+    return x
+
+@external
+def bar(x: {typ}) -> {typ}:
+    return self.foo(x)
+    """
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.bar(in_val) == out_val
+
+
+def test_internal_assign_struct(get_contract_with_gas_estimation):
+    code = """
+enum Bar:
+    BAD
+    BAK
+    BAZ
+
+struct Foo:
+    a: uint256
+    b: DynArray[Bar, 3]
+    c: String[5]
+
+@internal
+def foo(x: Foo) -> Foo:
+    x = Foo({a: 789, b: [Bar.BAZ, Bar.BAK, Bar.BAD], c: \"conda\"})
+    return x
+
+@external
+def bar(x: Foo) -> Foo:
+    return self.foo(x)
+    """
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.bar((123, [1, 2, 4], "vyper")) == (789, [4, 2, 1], "conda")
+
+
+def test_internal_assign_struct_member(get_contract_with_gas_estimation):
+    code = """
+enum Bar:
+    BAD
+    BAK
+    BAZ
+
+struct Foo:
+    a: uint256
+    b: DynArray[Bar, 3]
+    c: String[5]
+
+@internal
+def foo(x: Foo) -> Foo:
+    x.a = 789
+    x.b.pop()
+    return x
+
+@external
+def bar(x: Foo) -> Foo:
+    return self.foo(x)
+    """
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.bar((123, [1, 2, 4], "vyper")) == (789, [1, 2], "vyper")
+
+
+def test_internal_augassign(get_contract_with_gas_estimation):
+    code = """
+@internal
+def foo(x: int128) -> int128:
+    x += 77
+    return x
+
+@external
+def bar(x: int128) -> int128:
+    return self.foo(x)
+    """
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.bar(123) == 200
+
+
+@pytest.mark.parametrize("typ", ["DynArray[uint256, 3]", "uint256[3]"])
+def test_internal_augassign_arrays(get_contract_with_gas_estimation, typ):
+    code = f"""
+@internal
+def foo(x: {typ}) -> {typ}:
+    x[1] += 77
+    return x
+
+@external
+def bar(x: {typ}) -> {typ}:
+    return self.foo(x)
+    """
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.bar([1, 2, 3]) == [1, 79, 3]
+
+
+def test_invalid_external_assign(assert_compile_failed, get_contract_with_gas_estimation):
     code = """
 @external
 def foo(x: int128):
@@ -48,7 +159,7 @@ def foo(x: int128):
     assert_compile_failed(lambda: get_contract_with_gas_estimation(code), ImmutableViolation)
 
 
-def test_invalid_augassign(assert_compile_failed, get_contract_with_gas_estimation):
+def test_invalid_external_augassign(assert_compile_failed, get_contract_with_gas_estimation):
     code = """
 @external
 def foo(x: int128):
diff --git a/vyper/codegen/function_definitions/internal_function.py b/vyper/codegen/function_definitions/internal_function.py
index 17479c4c07..228191e3ca 100644
--- a/vyper/codegen/function_definitions/internal_function.py
+++ b/vyper/codegen/function_definitions/internal_function.py
@@ -41,8 +41,8 @@ def generate_ir_for_internal_function(
 
     for arg in func_t.arguments:
         # allocate a variable for every arg, setting mutability
-        # to False to comply with vyper semantics, function arguments are immutable
-        context.new_variable(arg.name, arg.typ, is_mutable=False)
+        # to True to allow internal function arguments to be mutable
+        context.new_variable(arg.name, arg.typ, is_mutable=True)
 
     nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_t)
 
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index 790cee52d6..c99b582ad3 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -173,10 +173,13 @@ def __init__(
         self.func = fn_node._metadata["type"]
         self.annotation_visitor = StatementAnnotationVisitor(fn_node, namespace)
         self.expr_visitor = _LocalExpressionVisitor()
+
+        # allow internal function params to be mutable
+        location, is_immutable = (
+            (DataLocation.MEMORY, False) if self.func.is_internal else (DataLocation.CALLDATA, True)
+        )
         for arg in self.func.arguments:
-            namespace[arg.name] = VarInfo(
-                arg.typ, location=DataLocation.CALLDATA, is_immutable=True
-            )
+            namespace[arg.name] = VarInfo(arg.typ, location=location, is_immutable=is_immutable)
 
         for node in fn_node.body:
             self.visit(node)

From 2704ff0140c3f08372720c95c92e0b0071211726 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 29 Jun 2023 17:02:45 -0700
Subject: [PATCH 073/161] fix: pycryptodome on arm (#3485)

---
 .github/workflows/build.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index f891ff7e1d..b4be1043c1 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -38,7 +38,7 @@ jobs:
 
       - name: Generate Binary
         run: >-
-          pip install . &&
+          pip install --no-binary pycryptodome . &&
           pip install pyinstaller &&
           make freeze
 

From c1f0bd5a87e2f7fa10dec41639e8e37f9692e62c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 29 Jun 2023 17:51:37 -0700
Subject: [PATCH 074/161] chore: polish some codegen issues (#3488)

fix some issues with well-formedness of generated IR (which were getting
hidden by the `rewrite_return_sequences` routine). this shouldn't affect
correctness of current vyper programs, but may help programs which
consume vyper IR directly.

* fix push_label_to_stack - use dedicated symbol instruction
* remove busted return_pc forwarding in external functions
* remove weird `_sym_` prefix in `exit_to`
---
 vyper/codegen/ir_node.py   | 5 -----
 vyper/codegen/return_.py   | 5 +++--
 vyper/codegen/self_call.py | 4 ++--
 vyper/ir/compile_ir.py     | 8 ++++----
 4 files changed, 9 insertions(+), 13 deletions(-)

diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index d36a18ec66..f7698fbabb 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -38,11 +38,6 @@ def __repr__(self) -> str:
     __mul__ = __add__
 
 
-def push_label_to_stack(labelname: str) -> str:
-    #  items prefixed with `_sym_` are ignored until asm phase
-    return "_sym_" + labelname
-
-
 class Encoding(Enum):
     # vyper encoding, default for memory variables
     VYPER = auto()
diff --git a/vyper/codegen/return_.py b/vyper/codegen/return_.py
index b8468f3eb1..56bea2b8da 100644
--- a/vyper/codegen/return_.py
+++ b/vyper/codegen/return_.py
@@ -21,7 +21,7 @@
 def make_return_stmt(ir_val: IRnode, stmt: Any, context: Context) -> Optional[IRnode]:
     func_t = context.func_t
 
-    jump_to_exit = ["exit_to", f"_sym_{func_t._ir_info.exit_sequence_label}"]
+    jump_to_exit = ["exit_to", func_t._ir_info.exit_sequence_label]
 
     if context.return_type is None:
         if stmt.value is not None:
@@ -43,7 +43,8 @@ def finalize(fill_return_buffer):
         return IRnode.from_list(["seq", fill_return_buffer, cleanup_loops, jump_to_exit])
 
     if context.return_type is None:
-        jump_to_exit += ["return_pc"]
+        if context.is_internal:
+            jump_to_exit += ["return_pc"]
         return finalize(["seq"])
 
     if context.is_internal:
diff --git a/vyper/codegen/self_call.py b/vyper/codegen/self_call.py
index 311576194b..c320e6889c 100644
--- a/vyper/codegen/self_call.py
+++ b/vyper/codegen/self_call.py
@@ -1,5 +1,5 @@
 from vyper.codegen.core import _freshname, eval_once_check, make_setter
-from vyper.codegen.ir_node import IRnode, push_label_to_stack
+from vyper.codegen.ir_node import IRnode
 from vyper.evm.address_space import MEMORY
 from vyper.exceptions import StateAccessViolation
 from vyper.semantics.types.subscriptable import TupleT
@@ -104,7 +104,7 @@ def ir_for_self_call(stmt_expr, context):
     if return_buffer is not None:
         goto_op += [return_buffer]
     # pass return label to subroutine
-    goto_op += [push_label_to_stack(return_label)]
+    goto_op.append(["symbol", return_label])
 
     call_sequence = ["seq"]
     call_sequence.append(eval_once_check(_freshname(stmt_expr.node_source_code)))
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index b2a58fa8c9..9d7ef4691f 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -118,14 +118,14 @@ def _rewrite_return_sequences(ir_node, label_params=None):
             args[0].value = "pass"
         else:
             # handle jump to cleanup
-            assert is_symbol(args[0].value)
             ir_node.value = "seq"
 
             _t = ["seq"]
             if "return_buffer" in label_params:
                 _t.append(["pop", "pass"])
 
-            dest = args[0].value[5:]  # `_sym_foo` -> `foo`
+            dest = args[0].value
+            # works for both internal and external exit_to
             more_args = ["pass" if t.value == "return_pc" else t for t in args[1:]]
             _t.append(["goto", dest] + more_args)
             ir_node.args = IRnode.from_list(_t, source_pos=ir_node.source_pos).args
@@ -667,8 +667,8 @@ def _height_of(witharg):
         o.extend(["_sym_" + str(code.args[0]), "JUMP"])
         return o
     # push a literal symbol
-    elif isinstance(code.value, str) and is_symbol(code.value):
-        return [code.value]
+    elif code.value == "symbol":
+        return ["_sym_" + str(code.args[0])]
     # set a symbol as a location.
     elif code.value == "label":
         label_name = code.args[0].value

From ae608368f6a3ea6fd7cb16e685d95018ad0efcd0 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 29 Jun 2023 22:58:40 -0700
Subject: [PATCH 075/161] chore: add __new__ to Namespace (#3489)

this makes it picklable, otherwise it fails with `_scope` not being
available during `__setitem__`
---
 vyper/semantics/analysis/module.py | 2 +-
 vyper/semantics/namespace.py       | 6 +++++-
 2 files changed, 6 insertions(+), 2 deletions(-)

diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index cb8e93ff28..d916dcf119 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -98,7 +98,7 @@ def __init__(
         _ns = Namespace()
         # note that we don't just copy the namespace because
         # there are constructor issues.
-        _ns.update({k: namespace[k] for k in namespace._scopes[-1]})
+        _ns.update({k: namespace[k] for k in namespace._scopes[-1]})  # type: ignore
         module_node._metadata["namespace"] = _ns
 
         # check for collisions between 4byte function selectors
diff --git a/vyper/semantics/namespace.py b/vyper/semantics/namespace.py
index 82a5d5cf3e..b88bc3d817 100644
--- a/vyper/semantics/namespace.py
+++ b/vyper/semantics/namespace.py
@@ -20,9 +20,13 @@ class Namespace(dict):
         List of sets containing the key names for each scope
     """
 
+    def __new__(cls, *args, **kwargs):
+        self = super().__new__(cls, *args, **kwargs)
+        self._scopes = []
+        return self
+
     def __init__(self):
         super().__init__()
-        self._scopes = []
         # NOTE cyclic imports!
         # TODO: break this cycle by providing an `init_vyper_namespace` in 3rd module
         from vyper.builtins.functions import get_builtin_functions

From bc723d2645aeec94bec1d83cdcbb8b41f7f807d3 Mon Sep 17 00:00:00 2001
From: trocher <rocher14@live.fr>
Date: Fri, 30 Jun 2023 08:01:14 +0200
Subject: [PATCH 076/161] fix: improve error message for conflicting methods
 IDs (#3491)

Before this commit: `Methods have conflicting IDs: `
Now: `Methods produce colliding method ID '0x2e1a7d4d': OwnerTransferV7b711143(uint256), withdraw(uint256)`

for the following contract:
```
@external
def OwnerTransferV7b711143(a : uint256) :
    pass
@external
def withdraw(a : uint256):
    pass
```

Co-authored-by: Tanguy Rocher <tanguy.rocher@protonmail.com>
---
 tests/signatures/test_method_id_conflicts.py |  7 +++++++
 vyper/semantics/analysis/utils.py            | 11 ++++++++---
 2 files changed, 15 insertions(+), 3 deletions(-)

diff --git a/tests/signatures/test_method_id_conflicts.py b/tests/signatures/test_method_id_conflicts.py
index 262348c12a..35c10300b4 100644
--- a/tests/signatures/test_method_id_conflicts.py
+++ b/tests/signatures/test_method_id_conflicts.py
@@ -67,6 +67,13 @@ def gfah(): pass
 @view
 def eexo(): pass
     """,
+    """
+# check collision with ID = 0x00000000
+wycpnbqcyf:public(uint256)
+
+@external
+def randallsRevenge_ilxaotc(): pass
+    """,
 ]
 
 
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index 26f3fd1827..f16b0c8c33 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -24,7 +24,7 @@
 from vyper.semantics.types.bytestrings import BytesT, StringT
 from vyper.semantics.types.primitives import AddressT, BoolT, BytesM_T, IntegerT
 from vyper.semantics.types.subscriptable import DArrayT, SArrayT, TupleT
-from vyper.utils import checksum_encode
+from vyper.utils import checksum_encode, int_to_fourbytes
 
 
 def _validate_op(node, types_list, validation_fn_name):
@@ -593,8 +593,13 @@ def validate_unique_method_ids(functions: List) -> None:
     seen = set()
     for method_id in method_ids:
         if method_id in seen:
-            collision_str = ", ".join(i.name for i in functions if method_id in i.method_ids)
-            raise StructureException(f"Methods have conflicting IDs: {collision_str}")
+            collision_str = ", ".join(
+                x for i in functions for x in i.method_ids.keys() if i.method_ids[x] == method_id
+            )
+            collision_hex = int_to_fourbytes(method_id).hex()
+            raise StructureException(
+                f"Methods produce colliding method ID `0x{collision_hex}`: {collision_str}"
+            )
         seen.add(method_id)
 
 

From 9e363e89fb9a67984b29590da3f821c767622c8c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 30 Jun 2023 15:31:40 -0700
Subject: [PATCH 077/161] chore: remove vyper signature from runtime (#3471)

it's going at the end of initcode instead, which is cheaper but still
possible to pick up the vyper version by looking at the create tx.
---
 vyper/compiler/output.py |  4 +---
 vyper/compiler/phases.py | 17 +++++------------
 vyper/ir/compile_ir.py   | 12 +++---------
 3 files changed, 9 insertions(+), 24 deletions(-)

diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index f061bd8e18..63d92d9a47 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -218,9 +218,7 @@ def _build_asm(asm_list):
 
 def build_source_map_output(compiler_data: CompilerData) -> OrderedDict:
     _, line_number_map = compile_ir.assembly_to_evm(
-        compiler_data.assembly_runtime,
-        insert_vyper_signature=True,
-        disable_bytecode_metadata=compiler_data.no_bytecode_metadata,
+        compiler_data.assembly_runtime, insert_vyper_signature=False
     )
     # Sort line_number_map
     out = OrderedDict()
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 5156aa1bbd..c759f6e272 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -150,15 +150,12 @@ def assembly_runtime(self) -> list:
 
     @cached_property
     def bytecode(self) -> bytes:
-        return generate_bytecode(
-            self.assembly, is_runtime=False, no_bytecode_metadata=self.no_bytecode_metadata
-        )
+        insert_vyper_signature = not self.no_bytecode_metadata
+        return generate_bytecode(self.assembly, insert_vyper_signature=insert_vyper_signature)
 
     @cached_property
     def bytecode_runtime(self) -> bytes:
-        return generate_bytecode(
-            self.assembly_runtime, is_runtime=True, no_bytecode_metadata=self.no_bytecode_metadata
-        )
+        return generate_bytecode(self.assembly_runtime, insert_vyper_signature=False)
 
     @cached_property
     def blueprint_bytecode(self) -> bytes:
@@ -295,9 +292,7 @@ def _find_nested_opcode(assembly, key):
         return any(_find_nested_opcode(x, key) for x in sublists)
 
 
-def generate_bytecode(
-    assembly: list, is_runtime: bool = False, no_bytecode_metadata: bool = False
-) -> bytes:
+def generate_bytecode(assembly: list, insert_vyper_signature: bool) -> bytes:
     """
     Generate bytecode from assembly instructions.
 
@@ -311,6 +306,4 @@ def generate_bytecode(
     bytes
         Final compiled bytecode.
     """
-    return compile_ir.assembly_to_evm(
-        assembly, insert_vyper_signature=is_runtime, disable_bytecode_metadata=no_bytecode_metadata
-    )[0]
+    return compile_ir.assembly_to_evm(assembly, insert_vyper_signature=insert_vyper_signature)[0]
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 9d7ef4691f..5a35b8f932 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -968,9 +968,7 @@ def adjust_pc_maps(pc_maps, ofst):
     return ret
 
 
-def assembly_to_evm(
-    assembly, pc_ofst=0, insert_vyper_signature=False, disable_bytecode_metadata=False
-):
+def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
     """
     Assembles assembly into EVM
 
@@ -994,7 +992,7 @@ def assembly_to_evm(
     runtime_code, runtime_code_start, runtime_code_end = None, None, None
 
     bytecode_suffix = b""
-    if (not disable_bytecode_metadata) and insert_vyper_signature:
+    if insert_vyper_signature:
         # CBOR encoded: {"vyper": [major,minor,patch]}
         bytecode_suffix += b"\xa1\x65vyper\x83" + bytes(list(version_tuple))
         bytecode_suffix += len(bytecode_suffix).to_bytes(2, "big")
@@ -1011,11 +1009,7 @@ def assembly_to_evm(
     for i, item in enumerate(assembly):
         if isinstance(item, list):
             assert runtime_code is None, "Multiple subcodes"
-            runtime_code, runtime_map = assembly_to_evm(
-                item,
-                insert_vyper_signature=True,
-                disable_bytecode_metadata=disable_bytecode_metadata,
-            )
+            runtime_code, runtime_map = assembly_to_evm(item)
 
             assert item[0].startswith("_DEPLOY_MEM_OFST_")
             assert ctor_mem_size is None

From 3d01e947276481d49390aaf3dce6d09a216ea004 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 30 Jun 2023 15:32:41 -0700
Subject: [PATCH 078/161] chore: add test for complex storage assignment
 (#3472)

add a test for complex make_setter when location is storage to prevent
future regressions
---
 tests/parser/features/test_assignment.py | 22 +++++++++++++++++++---
 1 file changed, 19 insertions(+), 3 deletions(-)

diff --git a/tests/parser/features/test_assignment.py b/tests/parser/features/test_assignment.py
index 29ec820484..e550f60541 100644
--- a/tests/parser/features/test_assignment.py
+++ b/tests/parser/features/test_assignment.py
@@ -367,17 +367,33 @@ def foo():
 """
     assert_compile_failed(lambda: get_contract_with_gas_estimation(code), InvalidType)
 
-
-def test_assign_rhs_lhs_overlap(get_contract):
     # GH issue 2418
-    code = """
+
+
+overlap_codes = [
+    """
 @external
 def bug(xs: uint256[2]) -> uint256[2]:
     # Initial value
     ys: uint256[2] = xs
     ys = [ys[1], ys[0]]
     return ys
+    """,
     """
+foo: uint256[2]
+@external
+def bug(xs: uint256[2]) -> uint256[2]:
+    # Initial value
+    self.foo = xs
+    self.foo = [self.foo[1], self.foo[0]]
+    return self.foo
+    """,
+    # TODO add transient tests when it's available
+]
+
+
+@pytest.mark.parametrize("code", overlap_codes)
+def test_assign_rhs_lhs_overlap(get_contract, code):
     c = get_contract(code)
 
     assert c.bug([1, 2]) == [2, 1]

From 29b02dd5b88a951c3791affc2062cca81701745d Mon Sep 17 00:00:00 2001
From: trocher <rocher14@live.fr>
Date: Sat, 1 Jul 2023 22:53:00 +0200
Subject: [PATCH 079/161] fix: typechecking of folded builtins (#3490)

some builtins would allow decimals during typechecking and then panic
during codegen

---------

Co-authored-by: Tanguy Rocher <tanguy.rocher@protonmail.com>
---
 tests/parser/syntax/test_addmulmod.py | 27 +++++++++++++++++++++++++++
 vyper/builtins/functions.py           | 14 +++++++-------
 2 files changed, 34 insertions(+), 7 deletions(-)
 create mode 100644 tests/parser/syntax/test_addmulmod.py

diff --git a/tests/parser/syntax/test_addmulmod.py b/tests/parser/syntax/test_addmulmod.py
new file mode 100644
index 0000000000..ddff4d3e01
--- /dev/null
+++ b/tests/parser/syntax/test_addmulmod.py
@@ -0,0 +1,27 @@
+import pytest
+
+from vyper.exceptions import InvalidType
+
+fail_list = [
+    (  # bad AST nodes given as arguments
+        """
+@external
+def foo() -> uint256:
+    return uint256_addmod(1.1, 1.2, 3.0)
+    """,
+        InvalidType,
+    ),
+    (  # bad AST nodes given as arguments
+        """
+@external
+def foo() -> uint256:
+    return uint256_mulmod(1.1, 1.2, 3.0)
+    """,
+        InvalidType,
+    ),
+]
+
+
+@pytest.mark.parametrize("code,exc", fail_list)
+def test_add_mod_fail(assert_compile_failed, get_contract, code, exc):
+    assert_compile_failed(lambda: get_contract(code), exc)
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index af965afe0a..90214554b0 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -1370,7 +1370,7 @@ def evaluate(self, node):
 
         validate_call_args(node, 2)
         for arg in node.args:
-            if not isinstance(arg, vy_ast.Num):
+            if not isinstance(arg, vy_ast.Int):
                 raise UnfoldableNode
             if arg.value < 0 or arg.value >= 2**256:
                 raise InvalidLiteral("Value out of range for uint256", arg)
@@ -1396,7 +1396,7 @@ def evaluate(self, node):
 
         validate_call_args(node, 2)
         for arg in node.args:
-            if not isinstance(arg, vy_ast.Num):
+            if not isinstance(arg, vy_ast.Int):
                 raise UnfoldableNode
             if arg.value < 0 or arg.value >= 2**256:
                 raise InvalidLiteral("Value out of range for uint256", arg)
@@ -1422,7 +1422,7 @@ def evaluate(self, node):
 
         validate_call_args(node, 2)
         for arg in node.args:
-            if not isinstance(arg, vy_ast.Num):
+            if not isinstance(arg, vy_ast.Int):
                 raise UnfoldableNode
             if arg.value < 0 or arg.value >= 2**256:
                 raise InvalidLiteral("Value out of range for uint256", arg)
@@ -1447,7 +1447,7 @@ def evaluate(self, node):
             self.__class__._warned = True
 
         validate_call_args(node, 1)
-        if not isinstance(node.args[0], vy_ast.Num):
+        if not isinstance(node.args[0], vy_ast.Int):
             raise UnfoldableNode
 
         value = node.args[0].value
@@ -1474,7 +1474,7 @@ def evaluate(self, node):
             self.__class__._warned = True
 
         validate_call_args(node, 2)
-        if [i for i in node.args if not isinstance(i, vy_ast.Num)]:
+        if [i for i in node.args if not isinstance(i, vy_ast.Int)]:
             raise UnfoldableNode
         value, shift = [i.value for i in node.args]
         if value < 0 or value >= 2**256:
@@ -1522,10 +1522,10 @@ class _AddMulMod(BuiltinFunction):
 
     def evaluate(self, node):
         validate_call_args(node, 3)
-        if isinstance(node.args[2], vy_ast.Num) and node.args[2].value == 0:
+        if isinstance(node.args[2], vy_ast.Int) and node.args[2].value == 0:
             raise ZeroDivisionException("Modulo by 0", node.args[2])
         for arg in node.args:
-            if not isinstance(arg, vy_ast.Num):
+            if not isinstance(arg, vy_ast.Int):
                 raise UnfoldableNode
             if arg.value < 0 or arg.value >= 2**256:
                 raise InvalidLiteral("Value out of range for uint256", arg)

From 593c9b86cfea23f624655d5847ef36ae00d7ccdc Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 11 Jul 2023 08:35:39 -0400
Subject: [PATCH 080/161] feat: add optimization mode to vyper compiler (#3493)

this commit adds the `--optimize` flag to the vyper cli, and as an
option in vyper json. it is to be used separately from the
`--no-optimize` flag. this commit does not actually change codegen,
just adds the flag and threads it through the codebase so it is
available once we want to start differentiating between the two modes,
and sets up the test harness to test both modes.

it also makes the `optimize` and `evm-version` available as source code
pragmas, and adds an additional syntax for specifying the compiler
version (`#pragma version X.Y.Z`). if the CLI / JSON options conflict
with the source code pragmas, an exception is raised.

this commit also:
* bumps mypy - it was needed to bump to 0.940 to handle match/case, and
  discovered we could bump all the way to 0.98* without breaking
  anything
* removes evm_version from bitwise op tests - it was probably important
  when we supported pre-constantinople targets, which we don't anymore
---
 .github/workflows/test.yml                    |  4 +-
 docs/compiling-a-contract.rst                 | 31 +++++--
 docs/structure-of-a-contract.rst              | 39 ++++++++-
 setup.py                                      |  2 +-
 tests/ast/test_pre_parser.py                  | 85 +++++++++++++++++--
 tests/base_conftest.py                        | 25 +++---
 tests/cli/vyper_json/test_get_settings.py     |  5 --
 tests/compiler/asm/test_asm_optimizer.py      |  5 +-
 tests/compiler/test_pre_parser.py             | 61 ++++++++++++-
 tests/conftest.py                             | 31 ++++---
 tests/examples/factory/test_factory.py        |  5 +-
 tests/grammar/test_grammar.py                 |  3 +-
 tests/parser/features/test_immutable.py       |  4 +-
 tests/parser/features/test_transient.py       | 15 ++--
 tests/parser/functions/test_bitwise.py        | 21 ++---
 .../parser/functions/test_create_functions.py |  5 +-
 .../test_annotate_and_optimize_ast.py         |  2 +-
 tests/parser/syntax/test_address_code.py      |  6 +-
 tests/parser/syntax/test_chainid.py           |  4 +-
 tests/parser/syntax/test_codehash.py          |  8 +-
 tests/parser/syntax/test_self_balance.py      |  4 +-
 tests/parser/types/test_dynamic_array.py      |  5 +-
 tox.ini                                       |  3 +-
 vyper/ast/__init__.py                         |  2 +-
 vyper/ast/nodes.pyi                           |  1 +
 vyper/ast/pre_parser.py                       | 57 ++++++++++---
 vyper/ast/utils.py                            | 17 ++--
 vyper/cli/vyper_compile.py                    | 35 +++++---
 vyper/cli/vyper_json.py                       | 34 ++++++--
 vyper/compiler/__init__.py                    | 73 ++++++++--------
 vyper/compiler/phases.py                      | 66 ++++++++++----
 vyper/compiler/settings.py                    | 30 +++++++
 vyper/evm/opcodes.py                          | 24 +++---
 vyper/ir/compile_ir.py                        |  5 +-
 34 files changed, 524 insertions(+), 193 deletions(-)

diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index 42e0524b13..b6399b3ae9 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -79,8 +79,8 @@ jobs:
     strategy:
       matrix:
         python-version: [["3.10", "310"], ["3.11", "311"]]
-        # run in default (optimized) and --no-optimize mode
-        flag: ["core", "no-opt"]
+        # run in modes: --optimize [gas, none, codesize]
+        flag: ["core", "no-opt", "codesize"]
 
     name: py${{ matrix.python-version[1] }}-${{ matrix.flag }}
 
diff --git a/docs/compiling-a-contract.rst b/docs/compiling-a-contract.rst
index 6295226bca..208771a5a9 100644
--- a/docs/compiling-a-contract.rst
+++ b/docs/compiling-a-contract.rst
@@ -99,6 +99,11 @@ See :ref:`searching_for_imports` for more information on Vyper's import system.
 Online Compilers
 ================
 
+Try VyperLang!
+-----------------
+
+`Try VyperLang! <https://try.vyperlang.org>`_ is a JupterHub instance hosted by the Vyper team as a sandbox for developing and testing contracts in Vyper. It requires github for login, and supports deployment via the browser.
+
 Remix IDE
 ---------
 
@@ -109,22 +114,33 @@ Remix IDE
    While the Vyper version of the Remix IDE compiler is updated on a regular basis, it might be a bit behind the latest version found in the master branch of the repository. Make sure the byte code matches the output from your local compiler.
 
 
+.. _evm-version:
+
 Setting the Target EVM Version
 ==============================
 
-When you compile your contract code, you can specify the Ethereum Virtual Machine version to compile for, to avoid particular features or behaviours.
+When you compile your contract code, you can specify the target Ethereum Virtual Machine version to compile for, to access or avoid particular features. You can specify the version either with a source code pragma or as a compiler option. It is recommended to use the compiler option when you want flexibility (for instance, ease of deploying across different chains), and the source code pragma when you want bytecode reproducibility (for instance, when verifying code on a block explorer).
+
+.. note::
+   If the evm version specified by the compiler options conflicts with the source code pragma, an exception will be raised and compilation will not continue.
+
+For instance, the adding the following pragma to a contract indicates that it should be compiled for the "shanghai" fork of the EVM.
+
+.. code-block:: python
+
+   #pragma evm-version shanghai
 
 .. warning::
 
-    Compiling for the wrong EVM version can result in wrong, strange and failing behaviour. Please ensure, especially if running a private chain, that you use matching EVM versions.
+    Compiling for the wrong EVM version can result in wrong, strange, or failing behavior. Please ensure, especially if running a private chain, that you use matching EVM versions.
 
-When compiling via ``vyper``, include the ``--evm-version`` flag:
+When compiling via the ``vyper`` CLI, you can specify the EVM version option using the ``--evm-version`` flag:
 
 ::
 
     $ vyper --evm-version [VERSION]
 
-When using the JSON interface, include the ``"evmVersion"`` key within the ``"settings"`` field:
+When using the JSON interface, you can include the ``"evmVersion"`` key within the ``"settings"`` field:
 
 .. code-block:: javascript
 
@@ -213,9 +229,10 @@ The following example describes the expected input format of ``vyper-json``. Com
         // Optional
         "settings": {
             "evmVersion": "shanghai",  // EVM version to compile for. Can be istanbul, berlin, paris, shanghai (default) or cancun (experimental!).
-            // optional, whether or not optimizations are turned on
-            // defaults to true
-            "optimize": true,
+            // optional, optimization mode
+            // defaults to "gas". can be one of "gas", "codesize", "none",
+            // false  and true (the last two are for backwards compatibility).
+            "optimize": "gas",
             // optional, whether or not the bytecode should include Vyper's signature
             // defaults to true
             "bytecodeMetadata": true,
diff --git a/docs/structure-of-a-contract.rst b/docs/structure-of-a-contract.rst
index 8eb2c1da78..c7abb3e645 100644
--- a/docs/structure-of-a-contract.rst
+++ b/docs/structure-of-a-contract.rst
@@ -9,16 +9,47 @@ This section provides a quick overview of the types of data present within a con
 
 .. _structure-versions:
 
-Version Pragma
+Pragmas
 ==============
 
-Vyper supports a version pragma to ensure that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax.
+Vyper supports several source code directives to control compiler modes and help with build reproducibility.
+
+Version Pragma
+--------------
+
+The version pragma ensures that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax.
+
+As of 0.3.10, the recommended way to specify the version pragma is as follows:
 
 .. code-block:: python
 
-    # @version ^0.2.0
+    #pragma version ^0.3.0
+
+The following declaration is equivalent, and, prior to 0.3.10, was the only supported method to specify the compiler version:
+
+.. code-block:: python
+
+    # @version ^0.3.0
+
+
+In the above examples, the contract will only compile with Vyper versions ``0.3.x``.
+
+Optimization Mode
+-----------------
+
+The optimization mode can be one of ``"none"``, ``"codesize"``, or ``"gas"`` (default). For instance, the following contract will be compiled in a way which tries to minimize codesize:
+
+.. code-block:: python
+
+   #pragma optimize codesize
+
+The optimization mode can also be set as a compiler option. If the compiler option conflicts with the source code pragma, an exception will be raised and compilation will not continue.
+
+EVM Version
+-----------------
+
+The EVM version can be set with the ``evm-version`` pragma, which is documented in :ref:`evm-version`.
 
-In the above example, the contract only compiles with Vyper versions ``0.2.x``.
 
 .. _structure-state-variables:
 
diff --git a/setup.py b/setup.py
index 05cb52259d..36a138aacd 100644
--- a/setup.py
+++ b/setup.py
@@ -28,7 +28,7 @@
         "flake8-bugbear==20.1.4",
         "flake8-use-fstring==1.1",
         "isort==5.9.3",
-        "mypy==0.910",
+        "mypy==0.982",
     ],
     "docs": ["recommonmark", "sphinx>=6.0,<7.0", "sphinx_rtd_theme>=1.2,<1.3"],
     "dev": ["ipython", "pre-commit", "pyinstaller", "twine"],
diff --git a/tests/ast/test_pre_parser.py b/tests/ast/test_pre_parser.py
index 8501bb8749..150ee55edf 100644
--- a/tests/ast/test_pre_parser.py
+++ b/tests/ast/test_pre_parser.py
@@ -1,6 +1,7 @@
 import pytest
 
-from vyper.ast.pre_parser import validate_version_pragma
+from vyper.ast.pre_parser import pre_parse, validate_version_pragma
+from vyper.compiler.settings import OptimizationLevel, Settings
 from vyper.exceptions import VersionException
 
 SRC_LINE = (1, 0)  # Dummy source line
@@ -51,14 +52,14 @@ def set_version(version):
 @pytest.mark.parametrize("file_version", valid_versions)
 def test_valid_version_pragma(file_version, mock_version):
     mock_version(COMPILER_VERSION)
-    validate_version_pragma(f" @version {file_version}", (SRC_LINE))
+    validate_version_pragma(f"{file_version}", (SRC_LINE))
 
 
 @pytest.mark.parametrize("file_version", invalid_versions)
 def test_invalid_version_pragma(file_version, mock_version):
     mock_version(COMPILER_VERSION)
     with pytest.raises(VersionException):
-        validate_version_pragma(f" @version {file_version}", (SRC_LINE))
+        validate_version_pragma(f"{file_version}", (SRC_LINE))
 
 
 prerelease_valid_versions = [
@@ -98,11 +99,85 @@ def test_invalid_version_pragma(file_version, mock_version):
 @pytest.mark.parametrize("file_version", prerelease_valid_versions)
 def test_prerelease_valid_version_pragma(file_version, mock_version):
     mock_version(PRERELEASE_COMPILER_VERSION)
-    validate_version_pragma(f" @version {file_version}", (SRC_LINE))
+    validate_version_pragma(file_version, (SRC_LINE))
 
 
 @pytest.mark.parametrize("file_version", prerelease_invalid_versions)
 def test_prerelease_invalid_version_pragma(file_version, mock_version):
     mock_version(PRERELEASE_COMPILER_VERSION)
     with pytest.raises(VersionException):
-        validate_version_pragma(f" @version {file_version}", (SRC_LINE))
+        validate_version_pragma(file_version, (SRC_LINE))
+
+
+pragma_examples = [
+    (
+        """
+    """,
+        Settings(),
+    ),
+    (
+        """
+    #pragma optimize codesize
+    """,
+        Settings(optimize=OptimizationLevel.CODESIZE),
+    ),
+    (
+        """
+    #pragma optimize none
+    """,
+        Settings(optimize=OptimizationLevel.NONE),
+    ),
+    (
+        """
+    #pragma optimize gas
+    """,
+        Settings(optimize=OptimizationLevel.GAS),
+    ),
+    (
+        """
+    #pragma version 0.3.10
+    """,
+        Settings(compiler_version="0.3.10"),
+    ),
+    (
+        """
+    #pragma evm-version shanghai
+    """,
+        Settings(evm_version="shanghai"),
+    ),
+    (
+        """
+    #pragma optimize codesize
+    #pragma evm-version shanghai
+    """,
+        Settings(evm_version="shanghai", optimize=OptimizationLevel.GAS),
+    ),
+    (
+        """
+    #pragma version 0.3.10
+    #pragma evm-version shanghai
+    """,
+        Settings(evm_version="shanghai", compiler_version="0.3.10"),
+    ),
+    (
+        """
+    #pragma version 0.3.10
+    #pragma optimize gas
+    """,
+        Settings(compiler_version="0.3.10", optimize=OptimizationLevel.GAS),
+    ),
+    (
+        """
+    #pragma version 0.3.10
+    #pragma evm-version shanghai
+    #pragma optimize gas
+    """,
+        Settings(compiler_version="0.3.10", optimize=OptimizationLevel.GAS, evm_version="shanghai"),
+    ),
+]
+
+
+@pytest.mark.parametrize("code, expected_pragmas", pragma_examples)
+def parse_pragmas(code, expected_pragmas):
+    pragmas, _, _ = pre_parse(code)
+    assert pragmas == expected_pragmas
diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index 29809a074d..a78562e982 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -12,6 +12,7 @@
 
 from vyper import compiler
 from vyper.ast.grammar import parse_vyper_source
+from vyper.compiler.settings import Settings
 
 
 class VyperMethod:
@@ -111,14 +112,16 @@ def w3(tester):
     return w3
 
 
-def _get_contract(w3, source_code, no_optimize, *args, **kwargs):
+def _get_contract(w3, source_code, optimize, *args, **kwargs):
+    settings = Settings()
+    settings.evm_version = kwargs.pop("evm_version", None)
+    settings.optimize = optimize
     out = compiler.compile_code(
         source_code,
         # test that metadata gets generated
         ["abi", "bytecode", "metadata"],
+        settings=settings,
         interface_codes=kwargs.pop("interface_codes", None),
-        no_optimize=no_optimize,
-        evm_version=kwargs.pop("evm_version", None),
         show_gas_estimates=True,  # Enable gas estimates for testing
     )
     parse_vyper_source(source_code)  # Test grammar.
@@ -135,13 +138,15 @@ def _get_contract(w3, source_code, no_optimize, *args, **kwargs):
     return w3.eth.contract(address, abi=abi, bytecode=bytecode, ContractFactoryClass=VyperContract)
 
 
-def _deploy_blueprint_for(w3, source_code, no_optimize, initcode_prefix=b"", **kwargs):
+def _deploy_blueprint_for(w3, source_code, optimize, initcode_prefix=b"", **kwargs):
+    settings = Settings()
+    settings.evm_version = kwargs.pop("evm_version", None)
+    settings.optimize = optimize
     out = compiler.compile_code(
         source_code,
         ["abi", "bytecode"],
         interface_codes=kwargs.pop("interface_codes", None),
-        no_optimize=no_optimize,
-        evm_version=kwargs.pop("evm_version", None),
+        settings=settings,
         show_gas_estimates=True,  # Enable gas estimates for testing
     )
     parse_vyper_source(source_code)  # Test grammar.
@@ -173,17 +178,17 @@ def factory(address):
 
 
 @pytest.fixture(scope="module")
-def deploy_blueprint_for(w3, no_optimize):
+def deploy_blueprint_for(w3, optimize):
     def deploy_blueprint_for(source_code, *args, **kwargs):
-        return _deploy_blueprint_for(w3, source_code, no_optimize, *args, **kwargs)
+        return _deploy_blueprint_for(w3, source_code, optimize, *args, **kwargs)
 
     return deploy_blueprint_for
 
 
 @pytest.fixture(scope="module")
-def get_contract(w3, no_optimize):
+def get_contract(w3, optimize):
     def get_contract(source_code, *args, **kwargs):
-        return _get_contract(w3, source_code, no_optimize, *args, **kwargs)
+        return _get_contract(w3, source_code, optimize, *args, **kwargs)
 
     return get_contract
 
diff --git a/tests/cli/vyper_json/test_get_settings.py b/tests/cli/vyper_json/test_get_settings.py
index 7530e85ef8..bbe5dab113 100644
--- a/tests/cli/vyper_json/test_get_settings.py
+++ b/tests/cli/vyper_json/test_get_settings.py
@@ -3,7 +3,6 @@
 import pytest
 
 from vyper.cli.vyper_json import get_evm_version
-from vyper.evm.opcodes import DEFAULT_EVM_VERSION
 from vyper.exceptions import JSONError
 
 
@@ -31,7 +30,3 @@ def test_early_evm(evm_version):
 @pytest.mark.parametrize("evm_version", ["istanbul", "berlin", "paris", "shanghai", "cancun"])
 def test_valid_evm(evm_version):
     assert evm_version == get_evm_version({"settings": {"evmVersion": evm_version}})
-
-
-def test_default_evm():
-    assert get_evm_version({}) == DEFAULT_EVM_VERSION
diff --git a/tests/compiler/asm/test_asm_optimizer.py b/tests/compiler/asm/test_asm_optimizer.py
index f4a245e168..47b70a8c70 100644
--- a/tests/compiler/asm/test_asm_optimizer.py
+++ b/tests/compiler/asm/test_asm_optimizer.py
@@ -1,6 +1,7 @@
 import pytest
 
 from vyper.compiler.phases import CompilerData
+from vyper.compiler.settings import OptimizationLevel, Settings
 
 codes = [
     """
@@ -72,7 +73,7 @@ def __init__():
 
 @pytest.mark.parametrize("code", codes)
 def test_dead_code_eliminator(code):
-    c = CompilerData(code, no_optimize=True)
+    c = CompilerData(code, settings=Settings(optimize=OptimizationLevel.NONE))
     initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
     runtime_asm = c.assembly_runtime
 
@@ -87,7 +88,7 @@ def test_dead_code_eliminator(code):
     for s in (ctor_only_label, runtime_only_label):
         assert s + "_runtime" in runtime_asm
 
-    c = CompilerData(code, no_optimize=False)
+    c = CompilerData(code, settings=Settings(optimize=OptimizationLevel.GAS))
     initcode_asm = [i for i in c.assembly if not isinstance(i, list)]
     runtime_asm = c.assembly_runtime
 
diff --git a/tests/compiler/test_pre_parser.py b/tests/compiler/test_pre_parser.py
index 4b747bb7d1..1761e74bad 100644
--- a/tests/compiler/test_pre_parser.py
+++ b/tests/compiler/test_pre_parser.py
@@ -1,6 +1,8 @@
-from pytest import raises
+import pytest
 
-from vyper.exceptions import SyntaxException
+from vyper.compiler import compile_code
+from vyper.compiler.settings import OptimizationLevel, Settings
+from vyper.exceptions import StructureException, SyntaxException
 
 
 def test_semicolon_prohibited(get_contract):
@@ -10,7 +12,7 @@ def test() -> int128:
     return a + b
     """
 
-    with raises(SyntaxException):
+    with pytest.raises(SyntaxException):
         get_contract(code)
 
 
@@ -70,6 +72,57 @@ def test():
     assert get_contract(code)
 
 
+def test_version_pragma2(get_contract):
+    # new, `#pragma` way of doing things
+    from vyper import __version__
+
+    installed_version = ".".join(__version__.split(".")[:3])
+
+    code = f"""
+#pragma version {installed_version}
+
+@external
+def test():
+    pass
+    """
+    assert get_contract(code)
+
+
+def test_evm_version_check(assert_compile_failed):
+    code = """
+#pragma evm-version berlin
+    """
+    assert compile_code(code, settings=Settings(evm_version=None)) is not None
+    assert compile_code(code, settings=Settings(evm_version="berlin")) is not None
+    # should fail if compile options indicate different evm version
+    # from source pragma
+    with pytest.raises(StructureException):
+        compile_code(code, settings=Settings(evm_version="shanghai"))
+
+
+def test_optimization_mode_check():
+    code = """
+#pragma optimize codesize
+    """
+    assert compile_code(code, settings=Settings(optimize=None))
+    # should fail if compile options indicate different optimization mode
+    # from source pragma
+    with pytest.raises(StructureException):
+        compile_code(code, settings=Settings(optimize=OptimizationLevel.GAS))
+    with pytest.raises(StructureException):
+        compile_code(code, settings=Settings(optimize=OptimizationLevel.NONE))
+
+
+def test_optimization_mode_check_none():
+    code = """
+#pragma optimize none
+    """
+    assert compile_code(code, settings=Settings(optimize=None))
+    # "none" conflicts with "gas"
+    with pytest.raises(StructureException):
+        compile_code(code, settings=Settings(optimize=OptimizationLevel.GAS))
+
+
 def test_version_empty_version(assert_compile_failed, get_contract):
     code = """
 #@version
@@ -110,5 +163,5 @@ def foo():
     convert(
     """
 
-    with raises(SyntaxException):
+    with pytest.raises(SyntaxException):
         get_contract(code)
diff --git a/tests/conftest.py b/tests/conftest.py
index 1cc9e4e72e..9c9c4191b9 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -10,6 +10,7 @@
 
 from vyper import compiler
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.settings import OptimizationLevel
 from vyper.ir import compile_ir, optimizer
 
 from .base_conftest import VyperContract, _get_contract, zero_gas_price_strategy
@@ -36,12 +37,18 @@ def set_evm_verbose_logging():
 
 
 def pytest_addoption(parser):
-    parser.addoption("--no-optimize", action="store_true", help="disable asm and IR optimizations")
+    parser.addoption(
+        "--optimize",
+        choices=["codesize", "gas", "none"],
+        default="gas",
+        help="change optimization mode",
+    )
 
 
 @pytest.fixture(scope="module")
-def no_optimize(pytestconfig):
-    return pytestconfig.getoption("no_optimize")
+def optimize(pytestconfig):
+    flag = pytestconfig.getoption("optimize")
+    return OptimizationLevel.from_string(flag)
 
 
 @pytest.fixture
@@ -58,13 +65,13 @@ def bytes_helper(str, length):
 
 
 @pytest.fixture
-def get_contract_from_ir(w3, no_optimize):
+def get_contract_from_ir(w3, optimize):
     def ir_compiler(ir, *args, **kwargs):
         ir = IRnode.from_list(ir)
-        if not no_optimize:
+        if optimize != OptimizationLevel.NONE:
             ir = optimizer.optimize(ir)
         bytecode, _ = compile_ir.assembly_to_evm(
-            compile_ir.compile_to_assembly(ir, no_optimize=no_optimize)
+            compile_ir.compile_to_assembly(ir, optimize=optimize)
         )
         abi = kwargs.get("abi") or []
         c = w3.eth.contract(abi=abi, bytecode=bytecode)
@@ -80,7 +87,7 @@ def ir_compiler(ir, *args, **kwargs):
 
 
 @pytest.fixture(scope="module")
-def get_contract_module(no_optimize):
+def get_contract_module(optimize):
     """
     This fixture is used for Hypothesis tests to ensure that
     the same contract is called over multiple runs of the test.
@@ -93,7 +100,7 @@ def get_contract_module(no_optimize):
     w3.eth.set_gas_price_strategy(zero_gas_price_strategy)
 
     def get_contract_module(source_code, *args, **kwargs):
-        return _get_contract(w3, source_code, no_optimize, *args, **kwargs)
+        return _get_contract(w3, source_code, optimize, *args, **kwargs)
 
     return get_contract_module
 
@@ -138,9 +145,9 @@ def set_decorator_to_contract_function(w3, tester, contract, source_code, func):
 
 
 @pytest.fixture
-def get_contract_with_gas_estimation(tester, w3, no_optimize):
+def get_contract_with_gas_estimation(tester, w3, optimize):
     def get_contract_with_gas_estimation(source_code, *args, **kwargs):
-        contract = _get_contract(w3, source_code, no_optimize, *args, **kwargs)
+        contract = _get_contract(w3, source_code, optimize, *args, **kwargs)
         for abi_ in contract._classic_contract.functions.abi:
             if abi_["type"] == "function":
                 set_decorator_to_contract_function(w3, tester, contract, source_code, abi_["name"])
@@ -150,9 +157,9 @@ def get_contract_with_gas_estimation(source_code, *args, **kwargs):
 
 
 @pytest.fixture
-def get_contract_with_gas_estimation_for_constants(w3, no_optimize):
+def get_contract_with_gas_estimation_for_constants(w3, optimize):
     def get_contract_with_gas_estimation_for_constants(source_code, *args, **kwargs):
-        return _get_contract(w3, source_code, no_optimize, *args, **kwargs)
+        return _get_contract(w3, source_code, optimize, *args, **kwargs)
 
     return get_contract_with_gas_estimation_for_constants
 
diff --git a/tests/examples/factory/test_factory.py b/tests/examples/factory/test_factory.py
index 15becc05f1..0c5cf61b04 100644
--- a/tests/examples/factory/test_factory.py
+++ b/tests/examples/factory/test_factory.py
@@ -2,6 +2,7 @@
 from eth_utils import keccak
 
 import vyper
+from vyper.compiler.settings import Settings
 
 
 @pytest.fixture
@@ -30,12 +31,12 @@ def create_exchange(token, factory):
 
 
 @pytest.fixture
-def factory(get_contract, no_optimize):
+def factory(get_contract, optimize):
     with open("examples/factory/Exchange.vy") as f:
         code = f.read()
 
     exchange_interface = vyper.compile_code(
-        code, output_formats=["bytecode_runtime"], no_optimize=no_optimize
+        code, output_formats=["bytecode_runtime"], settings=Settings(optimize=optimize)
     )
     exchange_deployed_bytecode = exchange_interface["bytecode_runtime"]
 
diff --git a/tests/grammar/test_grammar.py b/tests/grammar/test_grammar.py
index 7e220b58ae..d665ca2544 100644
--- a/tests/grammar/test_grammar.py
+++ b/tests/grammar/test_grammar.py
@@ -106,5 +106,6 @@ def has_no_docstrings(c):
 @hypothesis.settings(deadline=400, max_examples=500, suppress_health_check=(HealthCheck.too_slow,))
 def test_grammar_bruteforce(code):
     if utf8_encodable(code):
-        tree = parse_to_ast(pre_parse(code + "\n")[1])
+        _, _, reformatted_code = pre_parse(code + "\n")
+        tree = parse_to_ast(reformatted_code)
         assert isinstance(tree, Module)
diff --git a/tests/parser/features/test_immutable.py b/tests/parser/features/test_immutable.py
index 7300d0f2d9..47f7fc748e 100644
--- a/tests/parser/features/test_immutable.py
+++ b/tests/parser/features/test_immutable.py
@@ -1,5 +1,7 @@
 import pytest
 
+from vyper.compiler.settings import OptimizationLevel
+
 
 @pytest.mark.parametrize(
     "typ,value",
@@ -269,7 +271,7 @@ def __init__(to_copy: address):
 # GH issue 3101, take 2
 def test_immutables_initialized2(get_contract, get_contract_from_ir):
     dummy_contract = get_contract_from_ir(
-        ["deploy", 0, ["seq"] + ["invalid"] * 600, 0], no_optimize=True
+        ["deploy", 0, ["seq"] + ["invalid"] * 600, 0], optimize=OptimizationLevel.NONE
     )
 
     # rekt because immutables section extends past allocated memory
diff --git a/tests/parser/features/test_transient.py b/tests/parser/features/test_transient.py
index 53354beca8..718f5ae314 100644
--- a/tests/parser/features/test_transient.py
+++ b/tests/parser/features/test_transient.py
@@ -1,6 +1,7 @@
 import pytest
 
 from vyper.compiler import compile_code
+from vyper.compiler.settings import Settings
 from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.exceptions import StructureException
 
@@ -13,20 +14,22 @@ def test_transient_blocked(evm_version):
     code = """
 my_map: transient(HashMap[address, uint256])
     """
+    settings = Settings(evm_version=evm_version)
     if EVM_VERSIONS[evm_version] >= EVM_VERSIONS["cancun"]:
-        assert compile_code(code, evm_version=evm_version) is not None
+        assert compile_code(code, settings=settings) is not None
     else:
         with pytest.raises(StructureException):
-            compile_code(code, evm_version=evm_version)
+            compile_code(code, settings=settings)
 
 
 @pytest.mark.parametrize("evm_version", list(post_cancun.keys()))
 def test_transient_compiles(evm_version):
     # test transient keyword at least generates TLOAD/TSTORE opcodes
+    settings = Settings(evm_version=evm_version)
     getter_code = """
 my_map: public(transient(HashMap[address, uint256]))
     """
-    t = compile_code(getter_code, evm_version=evm_version, output_formats=["opcodes_runtime"])
+    t = compile_code(getter_code, settings=settings, output_formats=["opcodes_runtime"])
     t = t["opcodes_runtime"].split(" ")
 
     assert "TLOAD" in t
@@ -39,7 +42,7 @@ def test_transient_compiles(evm_version):
 def setter(k: address, v: uint256):
     self.my_map[k] = v
     """
-    t = compile_code(setter_code, evm_version=evm_version, output_formats=["opcodes_runtime"])
+    t = compile_code(setter_code, settings=settings, output_formats=["opcodes_runtime"])
     t = t["opcodes_runtime"].split(" ")
 
     assert "TLOAD" not in t
@@ -52,9 +55,7 @@ def setter(k: address, v: uint256):
 def setter(k: address, v: uint256):
     self.my_map[k] = v
     """
-    t = compile_code(
-        getter_setter_code, evm_version=evm_version, output_formats=["opcodes_runtime"]
-    )
+    t = compile_code(getter_setter_code, settings=settings, output_formats=["opcodes_runtime"])
     t = t["opcodes_runtime"].split(" ")
 
     assert "TLOAD" in t
diff --git a/tests/parser/functions/test_bitwise.py b/tests/parser/functions/test_bitwise.py
index 3e18bd292c..3ba74034ac 100644
--- a/tests/parser/functions/test_bitwise.py
+++ b/tests/parser/functions/test_bitwise.py
@@ -1,7 +1,6 @@
 import pytest
 
 from vyper.compiler import compile_code
-from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.exceptions import InvalidLiteral, InvalidOperation, TypeMismatch
 from vyper.utils import unsigned_to_signed
 
@@ -32,16 +31,14 @@ def _shr(x: uint256, y: uint256) -> uint256:
     """
 
 
-@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
-def test_bitwise_opcodes(evm_version):
-    opcodes = compile_code(code, ["opcodes"], evm_version=evm_version)["opcodes"]
+def test_bitwise_opcodes():
+    opcodes = compile_code(code, ["opcodes"])["opcodes"]
     assert "SHL" in opcodes
     assert "SHR" in opcodes
 
 
-@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
-def test_test_bitwise(get_contract_with_gas_estimation, evm_version):
-    c = get_contract_with_gas_estimation(code, evm_version=evm_version)
+def test_test_bitwise(get_contract_with_gas_estimation):
+    c = get_contract_with_gas_estimation(code)
     x = 126416208461208640982146408124
     y = 7128468721412412459
     assert c._bitwise_and(x, y) == (x & y)
@@ -55,8 +52,7 @@ def test_test_bitwise(get_contract_with_gas_estimation, evm_version):
             assert c._shl(t, s) == (t << s) % (2**256)
 
 
-@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS.keys()))
-def test_signed_shift(get_contract_with_gas_estimation, evm_version):
+def test_signed_shift(get_contract_with_gas_estimation):
     code = """
 @external
 def _sar(x: int256, y: uint256) -> int256:
@@ -66,7 +62,7 @@ def _sar(x: int256, y: uint256) -> int256:
 def _shl(x: int256, y: uint256) -> int256:
     return x << y
     """
-    c = get_contract_with_gas_estimation(code, evm_version=evm_version)
+    c = get_contract_with_gas_estimation(code)
     x = 126416208461208640982146408124
     y = 7128468721412412459
     cases = [x, y, -x, -y]
@@ -97,8 +93,7 @@ def baz(a: uint256, b: uint256, c: uint256) -> (uint256, uint256):
     assert tuple(c.baz(1, 6, 14)) == (1 + 8 | ~6 & 14 * 2, (1 + 8 | ~6) & 14 * 2) == (25, 24)
 
 
-@pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
-def test_literals(get_contract, evm_version):
+def test_literals(get_contract):
     code = """
 @external
 def _shr(x: uint256) -> uint256:
@@ -109,7 +104,7 @@ def _shl(x: uint256) -> uint256:
     return x << 3
     """
 
-    c = get_contract(code, evm_version=evm_version)
+    c = get_contract(code)
     assert c._shr(80) == 10
     assert c._shl(80) == 640
 
diff --git a/tests/parser/functions/test_create_functions.py b/tests/parser/functions/test_create_functions.py
index 64e0823146..876d50b27d 100644
--- a/tests/parser/functions/test_create_functions.py
+++ b/tests/parser/functions/test_create_functions.py
@@ -5,6 +5,7 @@
 
 import vyper.ir.compile_ir as compile_ir
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.settings import OptimizationLevel
 from vyper.utils import EIP_170_LIMIT, checksum_encode, keccak256
 
 
@@ -232,7 +233,9 @@ def test(code_ofst: uint256) -> address:
     # zeroes (so no matter which offset, create_from_blueprint will
     # return empty code)
     ir = IRnode.from_list(["deploy", 0, ["seq"] + ["stop"] * initcode_len, 0])
-    bytecode, _ = compile_ir.assembly_to_evm(compile_ir.compile_to_assembly(ir, no_optimize=True))
+    bytecode, _ = compile_ir.assembly_to_evm(
+        compile_ir.compile_to_assembly(ir, optimize=OptimizationLevel.NONE)
+    )
     # manually deploy the bytecode
     c = w3.eth.contract(abi=[], bytecode=bytecode)
     deploy_transaction = c.constructor()
diff --git a/tests/parser/parser_utils/test_annotate_and_optimize_ast.py b/tests/parser/parser_utils/test_annotate_and_optimize_ast.py
index 6f2246c6c0..68a07178bb 100644
--- a/tests/parser/parser_utils/test_annotate_and_optimize_ast.py
+++ b/tests/parser/parser_utils/test_annotate_and_optimize_ast.py
@@ -29,7 +29,7 @@ def foo() -> int128:
 
 
 def get_contract_info(source_code):
-    class_types, reformatted_code = pre_parse(source_code)
+    _, class_types, reformatted_code = pre_parse(source_code)
     py_ast = python_ast.parse(reformatted_code)
 
     annotate_python_ast(py_ast, reformatted_code, class_types)
diff --git a/tests/parser/syntax/test_address_code.py b/tests/parser/syntax/test_address_code.py
index 25fe1be0b4..70ba5cbbf7 100644
--- a/tests/parser/syntax/test_address_code.py
+++ b/tests/parser/syntax/test_address_code.py
@@ -5,6 +5,7 @@
 from web3 import Web3
 
 from vyper import compiler
+from vyper.compiler.settings import Settings
 from vyper.exceptions import NamespaceCollision, StructureException, VyperException
 
 # For reproducibility, use precompiled data of `hello: public(uint256)` using vyper 0.3.1
@@ -161,7 +162,7 @@ def test_address_code_compile_success(code: str):
     compiler.compile_code(code)
 
 
-def test_address_code_self_success(get_contract, no_optimize: bool):
+def test_address_code_self_success(get_contract, optimize):
     code = """
 code_deployment: public(Bytes[32])
 
@@ -174,8 +175,9 @@ def code_runtime() -> Bytes[32]:
     return slice(self.code, 0, 32)
 """
     contract = get_contract(code)
+    settings = Settings(optimize=optimize)
     code_compiled = compiler.compile_code(
-        code, output_formats=["bytecode", "bytecode_runtime"], no_optimize=no_optimize
+        code, output_formats=["bytecode", "bytecode_runtime"], settings=settings
     )
     assert contract.code_deployment() == bytes.fromhex(code_compiled["bytecode"][2:])[:32]
     assert contract.code_runtime() == bytes.fromhex(code_compiled["bytecode_runtime"][2:])[:32]
diff --git a/tests/parser/syntax/test_chainid.py b/tests/parser/syntax/test_chainid.py
index be960f2fc5..2b6e08cbc4 100644
--- a/tests/parser/syntax/test_chainid.py
+++ b/tests/parser/syntax/test_chainid.py
@@ -1,6 +1,7 @@
 import pytest
 
 from vyper import compiler
+from vyper.compiler.settings import Settings
 from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.exceptions import InvalidType, TypeMismatch
 
@@ -12,8 +13,9 @@ def test_evm_version(evm_version):
 def foo():
     a: uint256 = chain.id
     """
+    settings = Settings(evm_version=evm_version)
 
-    assert compiler.compile_code(code, evm_version=evm_version) is not None
+    assert compiler.compile_code(code, settings=settings) is not None
 
 
 fail_list = [
diff --git a/tests/parser/syntax/test_codehash.py b/tests/parser/syntax/test_codehash.py
index e4b6d90d8d..5074d14636 100644
--- a/tests/parser/syntax/test_codehash.py
+++ b/tests/parser/syntax/test_codehash.py
@@ -1,12 +1,13 @@
 import pytest
 
 from vyper.compiler import compile_code
+from vyper.compiler.settings import Settings
 from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.utils import keccak256
 
 
 @pytest.mark.parametrize("evm_version", list(EVM_VERSIONS))
-def test_get_extcodehash(get_contract, evm_version, no_optimize):
+def test_get_extcodehash(get_contract, evm_version, optimize):
     code = """
 a: address
 
@@ -31,9 +32,8 @@ def foo3() -> bytes32:
 def foo4() -> bytes32:
     return self.a.codehash
     """
-    compiled = compile_code(
-        code, ["bytecode_runtime"], evm_version=evm_version, no_optimize=no_optimize
-    )
+    settings = Settings(evm_version=evm_version, optimize=optimize)
+    compiled = compile_code(code, ["bytecode_runtime"], settings=settings)
     bytecode = bytes.fromhex(compiled["bytecode_runtime"][2:])
     hash_ = keccak256(bytecode)
 
diff --git a/tests/parser/syntax/test_self_balance.py b/tests/parser/syntax/test_self_balance.py
index 949cdde324..63db58e347 100644
--- a/tests/parser/syntax/test_self_balance.py
+++ b/tests/parser/syntax/test_self_balance.py
@@ -1,6 +1,7 @@
 import pytest
 
 from vyper import compiler
+from vyper.compiler.settings import Settings
 from vyper.evm.opcodes import EVM_VERSIONS
 
 
@@ -18,7 +19,8 @@ def get_balance() -> uint256:
 def __default__():
     pass
     """
-    opcodes = compiler.compile_code(code, ["opcodes"], evm_version=evm_version)["opcodes"]
+    settings = Settings(evm_version=evm_version)
+    opcodes = compiler.compile_code(code, ["opcodes"], settings=settings)["opcodes"]
     if EVM_VERSIONS[evm_version] >= EVM_VERSIONS["istanbul"]:
         assert "SELFBALANCE" in opcodes
     else:
diff --git a/tests/parser/types/test_dynamic_array.py b/tests/parser/types/test_dynamic_array.py
index cb55c42870..cbae183fe4 100644
--- a/tests/parser/types/test_dynamic_array.py
+++ b/tests/parser/types/test_dynamic_array.py
@@ -2,6 +2,7 @@
 
 import pytest
 
+from vyper.compiler.settings import OptimizationLevel
 from vyper.exceptions import (
     ArgumentException,
     ArrayIndexException,
@@ -1543,7 +1544,7 @@ def bar(x: int128) -> DynArray[int128, 3]:
     assert c.bar(7) == [7, 14]
 
 
-def test_nested_struct_of_lists(get_contract, assert_compile_failed, no_optimize):
+def test_nested_struct_of_lists(get_contract, assert_compile_failed, optimize):
     code = """
 struct nestedFoo:
     a1: DynArray[DynArray[DynArray[uint256, 2], 2], 2]
@@ -1585,7 +1586,7 @@ def bar2() -> uint256:
         newFoo.b1[0][1][0].a1[0][0][0]
     """
 
-    if no_optimize:
+    if optimize == OptimizationLevel.NONE:
         # fails at assembly stage with too many stack variables
         assert_compile_failed(lambda: get_contract(code), Exception)
     else:
diff --git a/tox.ini b/tox.ini
index 5ddd01d7d4..9b63630f58 100644
--- a/tox.ini
+++ b/tox.ini
@@ -9,7 +9,8 @@ envlist =
 usedevelop = True
 commands =
     core: pytest -m "not fuzzing" --showlocals {posargs:tests/}
-    no-opt: pytest -m "not fuzzing" --showlocals --no-optimize {posargs:tests/}
+    no-opt: pytest -m "not fuzzing" --showlocals --optimize none {posargs:tests/}
+    codesize: pytest -m "not fuzzing" --showlocals --optimize codesize {posargs:tests/}
 basepython =
     py310: python3.10
     py311: python3.11
diff --git a/vyper/ast/__init__.py b/vyper/ast/__init__.py
index 5695ceab7c..e5b81f1e7f 100644
--- a/vyper/ast/__init__.py
+++ b/vyper/ast/__init__.py
@@ -6,7 +6,7 @@
 from . import nodes, validation
 from .natspec import parse_natspec
 from .nodes import compare_nodes
-from .utils import ast_to_dict, parse_to_ast
+from .utils import ast_to_dict, parse_to_ast, parse_to_ast_with_settings
 
 # adds vyper.ast.nodes classes into the local namespace
 for name, obj in (
diff --git a/vyper/ast/nodes.pyi b/vyper/ast/nodes.pyi
index 3d83ae7506..0d59a2fa63 100644
--- a/vyper/ast/nodes.pyi
+++ b/vyper/ast/nodes.pyi
@@ -4,6 +4,7 @@ from typing import Any, Optional, Sequence, Type, Union
 from .natspec import parse_natspec as parse_natspec
 from .utils import ast_to_dict as ast_to_dict
 from .utils import parse_to_ast as parse_to_ast
+from .utils import parse_to_ast_with_settings as parse_to_ast_with_settings
 
 NODE_BASE_ATTRIBUTES: Any
 NODE_SRC_ATTRIBUTES: Any
diff --git a/vyper/ast/pre_parser.py b/vyper/ast/pre_parser.py
index f29150a5d3..35153af9d5 100644
--- a/vyper/ast/pre_parser.py
+++ b/vyper/ast/pre_parser.py
@@ -1,11 +1,15 @@
 import io
 import re
 from tokenize import COMMENT, NAME, OP, TokenError, TokenInfo, tokenize, untokenize
-from typing import Tuple
 
 from semantic_version import NpmSpec, Version
 
-from vyper.exceptions import SyntaxException, VersionException
+from vyper.compiler.settings import OptimizationLevel, Settings
+
+# seems a bit early to be importing this but we want it to validate the
+# evm-version pragma
+from vyper.evm.opcodes import EVM_VERSIONS
+from vyper.exceptions import StructureException, SyntaxException, VersionException
 from vyper.typing import ModificationOffsets, ParserPosition
 
 VERSION_ALPHA_RE = re.compile(r"(?<=\d)a(?=\d)")  # 0.1.0a17
@@ -33,10 +37,7 @@ def validate_version_pragma(version_str: str, start: ParserPosition) -> None:
     # NOTE: should be `x.y.z.*`
     installed_version = ".".join(__version__.split(".")[:3])
 
-    version_arr = version_str.split("@version")
-
-    raw_file_version = version_arr[1].strip()
-    strict_file_version = _convert_version_str(raw_file_version)
+    strict_file_version = _convert_version_str(version_str)
     strict_compiler_version = Version(_convert_version_str(installed_version))
 
     if len(strict_file_version) == 0:
@@ -46,14 +47,14 @@ def validate_version_pragma(version_str: str, start: ParserPosition) -> None:
         npm_spec = NpmSpec(strict_file_version)
     except ValueError:
         raise VersionException(
-            f'Version specification "{raw_file_version}" is not a valid NPM semantic '
+            f'Version specification "{version_str}" is not a valid NPM semantic '
             f"version specification",
             start,
         )
 
     if not npm_spec.match(strict_compiler_version):
         raise VersionException(
-            f'Version specification "{raw_file_version}" is not compatible '
+            f'Version specification "{version_str}" is not compatible '
             f'with compiler version "{installed_version}"',
             start,
         )
@@ -66,7 +67,7 @@ def validate_version_pragma(version_str: str, start: ParserPosition) -> None:
 VYPER_EXPRESSION_TYPES = {"log"}
 
 
-def pre_parse(code: str) -> Tuple[ModificationOffsets, str]:
+def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
     """
     Re-formats a vyper source string into a python source string and performs
     some validation.  More specifically,
@@ -93,6 +94,7 @@ def pre_parse(code: str) -> Tuple[ModificationOffsets, str]:
     """
     result = []
     modification_offsets: ModificationOffsets = {}
+    settings = Settings()
 
     try:
         code_bytes = code.encode("utf-8")
@@ -108,8 +110,39 @@ def pre_parse(code: str) -> Tuple[ModificationOffsets, str]:
             end = token.end
             line = token.line
 
-            if typ == COMMENT and "@version" in string:
-                validate_version_pragma(string[1:], start)
+            if typ == COMMENT:
+                contents = string[1:].strip()
+                if contents.startswith("@version"):
+                    if settings.compiler_version is not None:
+                        raise StructureException("compiler version specified twice!", start)
+                    compiler_version = contents.removeprefix("@version ").strip()
+                    validate_version_pragma(compiler_version, start)
+                    settings.compiler_version = compiler_version
+
+                if string.startswith("#pragma "):
+                    pragma = string.removeprefix("#pragma").strip()
+                    if pragma.startswith("version "):
+                        if settings.compiler_version is not None:
+                            raise StructureException("pragma version specified twice!", start)
+                        compiler_version = pragma.removeprefix("version ".strip())
+                        validate_version_pragma(compiler_version, start)
+                        settings.compiler_version = compiler_version
+
+                    if pragma.startswith("optimize "):
+                        if settings.optimize is not None:
+                            raise StructureException("pragma optimize specified twice!", start)
+                        try:
+                            mode = pragma.removeprefix("optimize").strip()
+                            settings.optimize = OptimizationLevel.from_string(mode)
+                        except ValueError:
+                            raise StructureException(f"Invalid optimization mode `{mode}`", start)
+                    if pragma.startswith("evm-version "):
+                        if settings.evm_version is not None:
+                            raise StructureException("pragma evm-version specified twice!", start)
+                        evm_version = pragma.removeprefix("evm-version").strip()
+                        if evm_version not in EVM_VERSIONS:
+                            raise StructureException("Invalid evm version: `{evm_version}`", start)
+                        settings.evm_version = evm_version
 
             if typ == NAME and string in ("class", "yield"):
                 raise SyntaxException(
@@ -130,4 +163,4 @@ def pre_parse(code: str) -> Tuple[ModificationOffsets, str]:
     except TokenError as e:
         raise SyntaxException(e.args[0], code, e.args[1][0], e.args[1][1]) from e
 
-    return modification_offsets, untokenize(result).decode("utf-8")
+    return settings, modification_offsets, untokenize(result).decode("utf-8")
diff --git a/vyper/ast/utils.py b/vyper/ast/utils.py
index fc8aad227c..4e669385ab 100644
--- a/vyper/ast/utils.py
+++ b/vyper/ast/utils.py
@@ -1,18 +1,23 @@
 import ast as python_ast
-from typing import Dict, List, Optional, Union
+from typing import Any, Dict, List, Optional, Union
 
 from vyper.ast import nodes as vy_ast
 from vyper.ast.annotation import annotate_python_ast
 from vyper.ast.pre_parser import pre_parse
+from vyper.compiler.settings import Settings
 from vyper.exceptions import CompilerPanic, ParserException, SyntaxException
 
 
-def parse_to_ast(
+def parse_to_ast(*args: Any, **kwargs: Any) -> vy_ast.Module:
+    return parse_to_ast_with_settings(*args, **kwargs)[1]
+
+
+def parse_to_ast_with_settings(
     source_code: str,
     source_id: int = 0,
     contract_name: Optional[str] = None,
     add_fn_node: Optional[str] = None,
-) -> vy_ast.Module:
+) -> tuple[Settings, vy_ast.Module]:
     """
     Parses a Vyper source string and generates basic Vyper AST nodes.
 
@@ -34,7 +39,7 @@ def parse_to_ast(
     """
     if "\x00" in source_code:
         raise ParserException("No null bytes (\\x00) allowed in the source code.")
-    class_types, reformatted_code = pre_parse(source_code)
+    settings, class_types, reformatted_code = pre_parse(source_code)
     try:
         py_ast = python_ast.parse(reformatted_code)
     except SyntaxError as e:
@@ -51,7 +56,9 @@ def parse_to_ast(
     annotate_python_ast(py_ast, source_code, class_types, source_id, contract_name)
 
     # Convert to Vyper AST.
-    return vy_ast.get_node(py_ast)  # type: ignore
+    module = vy_ast.get_node(py_ast)
+    assert isinstance(module, vy_ast.Module)  # mypy hint
+    return settings, module
 
 
 def ast_to_dict(ast_struct: Union[vy_ast.VyperNode, List]) -> Union[Dict, List]:
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index f5e113116d..71e78dd666 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -5,13 +5,13 @@
 import warnings
 from collections import OrderedDict
 from pathlib import Path
-from typing import Dict, Iterable, Iterator, Set, TypeVar
+from typing import Dict, Iterable, Iterator, Optional, Set, TypeVar
 
 import vyper
 import vyper.codegen.ir_node as ir_node
 from vyper.cli import vyper_json
 from vyper.cli.utils import extract_file_interface_imports, get_interface_file_path
-from vyper.compiler.settings import VYPER_TRACEBACK_LIMIT
+from vyper.compiler.settings import VYPER_TRACEBACK_LIMIT, OptimizationLevel, Settings
 from vyper.evm.opcodes import DEFAULT_EVM_VERSION, EVM_VERSIONS
 from vyper.typing import ContractCodes, ContractPath, OutputFormats
 
@@ -37,8 +37,6 @@
 ir                 - Intermediate representation in list format
 ir_json            - Intermediate representation in JSON format
 hex-ir             - Output IR and assembly constants in hex instead of decimal
-no-optimize        - Do not optimize (don't use this for production code)
-no-bytecode-metadata - Do not add metadata to bytecode
 """
 
 combined_json_outputs = [
@@ -104,10 +102,10 @@ def _parse_args(argv):
         help=f"Select desired EVM version (default {DEFAULT_EVM_VERSION}). "
         "note: cancun support is EXPERIMENTAL",
         choices=list(EVM_VERSIONS),
-        default=DEFAULT_EVM_VERSION,
         dest="evm_version",
     )
     parser.add_argument("--no-optimize", help="Do not optimize", action="store_true")
+    parser.add_argument("--optimize", help="Optimization flag", choices=["gas", "codesize"])
     parser.add_argument(
         "--no-bytecode-metadata", help="Do not add metadata to bytecode", action="store_true"
     )
@@ -153,13 +151,28 @@ def _parse_args(argv):
 
     output_formats = tuple(uniq(args.format.split(",")))
 
+    if args.no_optimize and args.optimize:
+        raise ValueError("Cannot use `--no-optimize` and `--optimize` at the same time!")
+
+    settings = Settings()
+
+    if args.no_optimize:
+        settings.optimize = OptimizationLevel.NONE
+    elif args.optimize is not None:
+        settings.optimize = OptimizationLevel.from_string(args.optimize)
+
+    if args.evm_version:
+        settings.evm_version = args.evm_version
+
+    if args.verbose:
+        print(f"using `{settings}`", file=sys.stderr)
+
     compiled = compile_files(
         args.input_files,
         output_formats,
         args.root_folder,
         args.show_gas_estimates,
-        args.evm_version,
-        args.no_optimize,
+        settings,
         args.storage_layout,
         args.no_bytecode_metadata,
     )
@@ -253,9 +266,8 @@ def compile_files(
     output_formats: OutputFormats,
     root_folder: str = ".",
     show_gas_estimates: bool = False,
-    evm_version: str = DEFAULT_EVM_VERSION,
-    no_optimize: bool = False,
-    storage_layout: Iterable[str] = None,
+    settings: Optional[Settings] = None,
+    storage_layout: Optional[Iterable[str]] = None,
     no_bytecode_metadata: bool = False,
 ) -> OrderedDict:
     root_path = Path(root_folder).resolve()
@@ -296,8 +308,7 @@ def compile_files(
         final_formats,
         exc_handler=exc_handler,
         interface_codes=get_interface_codes(root_path, contract_sources),
-        evm_version=evm_version,
-        no_optimize=no_optimize,
+        settings=settings,
         storage_layouts=storage_layouts,
         show_gas_estimates=show_gas_estimates,
         no_bytecode_metadata=no_bytecode_metadata,
diff --git a/vyper/cli/vyper_json.py b/vyper/cli/vyper_json.py
index 9778848aa2..4a1c91550e 100755
--- a/vyper/cli/vyper_json.py
+++ b/vyper/cli/vyper_json.py
@@ -5,11 +5,12 @@
 import sys
 import warnings
 from pathlib import Path
-from typing import Any, Callable, Dict, Hashable, List, Tuple, Union
+from typing import Any, Callable, Dict, Hashable, List, Optional, Tuple, Union
 
 import vyper
 from vyper.cli.utils import extract_file_interface_imports, get_interface_file_path
-from vyper.evm.opcodes import DEFAULT_EVM_VERSION, EVM_VERSIONS
+from vyper.compiler.settings import OptimizationLevel, Settings
+from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.exceptions import JSONError
 from vyper.typing import ContractCodes, ContractPath
 from vyper.utils import keccak256
@@ -144,11 +145,15 @@ def _standardize_path(path_str: str) -> str:
     return path.as_posix()
 
 
-def get_evm_version(input_dict: Dict) -> str:
+def get_evm_version(input_dict: Dict) -> Optional[str]:
     if "settings" not in input_dict:
-        return DEFAULT_EVM_VERSION
+        return None
+
+    # TODO: move this validation somewhere it can be reused more easily
+    evm_version = input_dict["settings"].get("evmVersion")
+    if evm_version is None:
+        return None
 
-    evm_version = input_dict["settings"].get("evmVersion", DEFAULT_EVM_VERSION)
     if evm_version in (
         "homestead",
         "tangerineWhistle",
@@ -360,7 +365,21 @@ def compile_from_input_dict(
         raise JSONError(f"Invalid language '{input_dict['language']}' - Only Vyper is supported.")
 
     evm_version = get_evm_version(input_dict)
-    no_optimize = not input_dict["settings"].get("optimize", True)
+
+    optimize = input_dict["settings"].get("optimize")
+    if isinstance(optimize, bool):
+        # bool optimization level for backwards compatibility
+        warnings.warn(
+            "optimize: <bool> is deprecated! please use one of 'gas', 'codesize', 'none'."
+        )
+        optimize = OptimizationLevel.default() if optimize else OptimizationLevel.NONE
+    elif isinstance(optimize, str):
+        optimize = OptimizationLevel.from_string(optimize)
+    else:
+        assert optimize is None
+
+    settings = Settings(evm_version=evm_version, optimize=optimize)
+
     no_bytecode_metadata = not input_dict["settings"].get("bytecodeMetadata", True)
 
     contract_sources: ContractCodes = get_input_dict_contracts(input_dict)
@@ -383,8 +402,7 @@ def compile_from_input_dict(
                     output_formats[contract_path],
                     interface_codes=interface_codes,
                     initial_id=id_,
-                    no_optimize=no_optimize,
-                    evm_version=evm_version,
+                    settings=settings,
                     no_bytecode_metadata=no_bytecode_metadata,
                 )
             except Exception as exc:
diff --git a/vyper/compiler/__init__.py b/vyper/compiler/__init__.py
index 7be45ce832..0b3c0d8191 100644
--- a/vyper/compiler/__init__.py
+++ b/vyper/compiler/__init__.py
@@ -5,7 +5,8 @@
 import vyper.codegen.core as codegen
 import vyper.compiler.output as output
 from vyper.compiler.phases import CompilerData
-from vyper.evm.opcodes import DEFAULT_EVM_VERSION, evm_wrapper
+from vyper.compiler.settings import Settings
+from vyper.evm.opcodes import DEFAULT_EVM_VERSION, anchor_evm_version
 from vyper.typing import (
     ContractCodes,
     ContractPath,
@@ -46,15 +47,14 @@
 }
 
 
-@evm_wrapper
 def compile_codes(
     contract_sources: ContractCodes,
     output_formats: Union[OutputDict, OutputFormats, None] = None,
     exc_handler: Union[Callable, None] = None,
     interface_codes: Union[InterfaceDict, InterfaceImports, None] = None,
     initial_id: int = 0,
-    no_optimize: bool = False,
-    storage_layouts: Dict[ContractPath, StorageLayout] = None,
+    settings: Settings = None,
+    storage_layouts: Optional[dict[ContractPath, Optional[StorageLayout]]] = None,
     show_gas_estimates: bool = False,
     no_bytecode_metadata: bool = False,
 ) -> OrderedDict:
@@ -73,11 +73,8 @@ def compile_codes(
         two arguments - the name of the contract, and the exception that was raised
     initial_id: int, optional
         The lowest source ID value to be used when generating the source map.
-    evm_version: str, optional
-        The target EVM ruleset to compile for. If not given, defaults to the latest
-        implemented ruleset.
-    no_optimize: bool, optional
-        Turn off optimizations. Defaults to False
+    settings: Settings, optional
+        Compiler settings
     show_gas_estimates: bool, optional
         Show gas estimates for abi and ir output modes
     interface_codes: Dict, optional
@@ -98,6 +95,7 @@ def compile_codes(
     Dict
         Compiler output as `{'contract name': {'output key': "output data"}}`
     """
+    settings = settings or Settings()
 
     if output_formats is None:
         output_formats = ("bytecode",)
@@ -121,27 +119,30 @@ def compile_codes(
 
         # make IR output the same between runs
         codegen.reset_names()
-        compiler_data = CompilerData(
-            source_code,
-            contract_name,
-            interfaces,
-            source_id,
-            no_optimize,
-            storage_layout_override,
-            show_gas_estimates,
-            no_bytecode_metadata,
-        )
-        for output_format in output_formats[contract_name]:
-            if output_format not in OUTPUT_FORMATS:
-                raise ValueError(f"Unsupported format type {repr(output_format)}")
-            try:
-                out.setdefault(contract_name, {})
-                out[contract_name][output_format] = OUTPUT_FORMATS[output_format](compiler_data)
-            except Exception as exc:
-                if exc_handler is not None:
-                    exc_handler(contract_name, exc)
-                else:
-                    raise exc
+
+        with anchor_evm_version(settings.evm_version):
+            compiler_data = CompilerData(
+                source_code,
+                contract_name,
+                interfaces,
+                source_id,
+                settings,
+                storage_layout_override,
+                show_gas_estimates,
+                no_bytecode_metadata,
+            )
+            for output_format in output_formats[contract_name]:
+                if output_format not in OUTPUT_FORMATS:
+                    raise ValueError(f"Unsupported format type {repr(output_format)}")
+                try:
+                    out.setdefault(contract_name, {})
+                    formatter = OUTPUT_FORMATS[output_format]
+                    out[contract_name][output_format] = formatter(compiler_data)
+                except Exception as exc:
+                    if exc_handler is not None:
+                        exc_handler(contract_name, exc)
+                    else:
+                        raise exc
 
     return out
 
@@ -153,9 +154,8 @@ def compile_code(
     contract_source: str,
     output_formats: Optional[OutputFormats] = None,
     interface_codes: Optional[InterfaceImports] = None,
-    evm_version: str = DEFAULT_EVM_VERSION,
-    no_optimize: bool = False,
-    storage_layout_override: StorageLayout = None,
+    settings: Settings = None,
+    storage_layout_override: Optional[StorageLayout] = None,
     show_gas_estimates: bool = False,
 ) -> dict:
     """
@@ -171,8 +171,8 @@ def compile_code(
     evm_version: str, optional
         The target EVM ruleset to compile for. If not given, defaults to the latest
         implemented ruleset.
-    no_optimize: bool, optional
-        Turn off optimizations. Defaults to False
+    settings: Settings, optional
+        Compiler settings.
     show_gas_estimates: bool, optional
         Show gas estimates for abi and ir output modes
     interface_codes: Dict, optional
@@ -194,8 +194,7 @@ def compile_code(
         contract_sources,
         output_formats,
         interface_codes=interface_codes,
-        evm_version=evm_version,
-        no_optimize=no_optimize,
+        settings=settings,
         storage_layouts=storage_layouts,
         show_gas_estimates=show_gas_estimates,
     )[UNKNOWN_CONTRACT_NAME]
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index c759f6e272..99465809bd 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -7,6 +7,8 @@
 from vyper.codegen import module
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.settings import OptimizationLevel, Settings
+from vyper.exceptions import StructureException
 from vyper.ir import compile_ir, optimizer
 from vyper.semantics import set_data_positions, validate_semantics
 from vyper.semantics.types.function import ContractFunctionT
@@ -49,7 +51,7 @@ def __init__(
         contract_name: str = "VyperContract",
         interface_codes: Optional[InterfaceImports] = None,
         source_id: int = 0,
-        no_optimize: bool = False,
+        settings: Settings = None,
         storage_layout: StorageLayout = None,
         show_gas_estimates: bool = False,
         no_bytecode_metadata: bool = False,
@@ -69,8 +71,8 @@ def __init__(
             * JSON interfaces are given as lists, vyper interfaces as strings
         source_id : int, optional
             ID number used to identify this contract in the source map.
-        no_optimize: bool, optional
-            Turn off optimizations. Defaults to False
+        settings: Settings
+            Set optimization mode.
         show_gas_estimates: bool, optional
             Show gas estimates for abi and ir output modes
         no_bytecode_metadata: bool, optional
@@ -80,14 +82,45 @@ def __init__(
         self.source_code = source_code
         self.interface_codes = interface_codes
         self.source_id = source_id
-        self.no_optimize = no_optimize
         self.storage_layout_override = storage_layout
         self.show_gas_estimates = show_gas_estimates
         self.no_bytecode_metadata = no_bytecode_metadata
+        self.settings = settings or Settings()
 
     @cached_property
-    def vyper_module(self) -> vy_ast.Module:
-        return generate_ast(self.source_code, self.source_id, self.contract_name)
+    def _generate_ast(self):
+        settings, ast = generate_ast(self.source_code, self.source_id, self.contract_name)
+        # validate the compiler settings
+        # XXX: this is a bit ugly, clean up later
+        if settings.evm_version is not None:
+            if (
+                self.settings.evm_version is not None
+                and self.settings.evm_version != settings.evm_version
+            ):
+                raise StructureException(
+                    f"compiler settings indicate evm version {self.settings.evm_version}, "
+                    f"but source pragma indicates {settings.evm_version}."
+                )
+
+            self.settings.evm_version = settings.evm_version
+
+        if settings.optimize is not None:
+            if self.settings.optimize is not None and self.settings.optimize != settings.optimize:
+                raise StructureException(
+                    f"compiler options indicate optimization mode {self.settings.optimize}, "
+                    f"but source pragma indicates {settings.optimize}."
+                )
+            self.settings.optimize = settings.optimize
+
+        # ensure defaults
+        if self.settings.optimize is None:
+            self.settings.optimize = OptimizationLevel.default()
+
+        return ast
+
+    @cached_property
+    def vyper_module(self):
+        return self._generate_ast
 
     @cached_property
     def vyper_module_unfolded(self) -> vy_ast.Module:
@@ -119,7 +152,7 @@ def global_ctx(self) -> GlobalContext:
     @cached_property
     def _ir_output(self):
         # fetch both deployment and runtime IR
-        return generate_ir_nodes(self.global_ctx, self.no_optimize)
+        return generate_ir_nodes(self.global_ctx, self.settings.optimize)
 
     @property
     def ir_nodes(self) -> IRnode:
@@ -142,11 +175,11 @@ def function_signatures(self) -> dict[str, ContractFunctionT]:
 
     @cached_property
     def assembly(self) -> list:
-        return generate_assembly(self.ir_nodes, self.no_optimize)
+        return generate_assembly(self.ir_nodes, self.settings.optimize)
 
     @cached_property
     def assembly_runtime(self) -> list:
-        return generate_assembly(self.ir_runtime, self.no_optimize)
+        return generate_assembly(self.ir_runtime, self.settings.optimize)
 
     @cached_property
     def bytecode(self) -> bytes:
@@ -169,7 +202,9 @@ def blueprint_bytecode(self) -> bytes:
         return deploy_bytecode + blueprint_bytecode
 
 
-def generate_ast(source_code: str, source_id: int, contract_name: str) -> vy_ast.Module:
+def generate_ast(
+    source_code: str, source_id: int, contract_name: str
+) -> tuple[Settings, vy_ast.Module]:
     """
     Generate a Vyper AST from source code.
 
@@ -187,7 +222,7 @@ def generate_ast(source_code: str, source_id: int, contract_name: str) -> vy_ast
     vy_ast.Module
         Top-level Vyper AST node
     """
-    return vy_ast.parse_to_ast(source_code, source_id, contract_name)
+    return vy_ast.parse_to_ast_with_settings(source_code, source_id, contract_name)
 
 
 def generate_unfolded_ast(
@@ -233,7 +268,7 @@ def generate_folded_ast(
     return vyper_module_folded, symbol_tables
 
 
-def generate_ir_nodes(global_ctx: GlobalContext, no_optimize: bool) -> tuple[IRnode, IRnode]:
+def generate_ir_nodes(global_ctx: GlobalContext, optimize: bool) -> tuple[IRnode, IRnode]:
     """
     Generate the intermediate representation (IR) from the contextualized AST.
 
@@ -254,13 +289,13 @@ def generate_ir_nodes(global_ctx: GlobalContext, no_optimize: bool) -> tuple[IRn
         IR to generate runtime bytecode
     """
     ir_nodes, ir_runtime = module.generate_ir_for_module(global_ctx)
-    if not no_optimize:
+    if optimize != OptimizationLevel.NONE:
         ir_nodes = optimizer.optimize(ir_nodes)
         ir_runtime = optimizer.optimize(ir_runtime)
     return ir_nodes, ir_runtime
 
 
-def generate_assembly(ir_nodes: IRnode, no_optimize: bool = False) -> list:
+def generate_assembly(ir_nodes: IRnode, optimize: Optional[OptimizationLevel] = None) -> list:
     """
     Generate assembly instructions from IR.
 
@@ -274,7 +309,8 @@ def generate_assembly(ir_nodes: IRnode, no_optimize: bool = False) -> list:
     list
         List of assembly instructions.
     """
-    assembly = compile_ir.compile_to_assembly(ir_nodes, no_optimize=no_optimize)
+    optimize = optimize or OptimizationLevel.default()
+    assembly = compile_ir.compile_to_assembly(ir_nodes, optimize=optimize)
 
     if _find_nested_opcode(assembly, "DEBUG"):
         warnings.warn(
diff --git a/vyper/compiler/settings.py b/vyper/compiler/settings.py
index 09ced0dcb8..bb5e9cdc25 100644
--- a/vyper/compiler/settings.py
+++ b/vyper/compiler/settings.py
@@ -1,4 +1,6 @@
 import os
+from dataclasses import dataclass
+from enum import Enum
 from typing import Optional
 
 VYPER_COLOR_OUTPUT = os.environ.get("VYPER_COLOR_OUTPUT", "0") == "1"
@@ -12,3 +14,31 @@
     VYPER_TRACEBACK_LIMIT = int(_tb_limit_str)
 else:
     VYPER_TRACEBACK_LIMIT = None
+
+
+class OptimizationLevel(Enum):
+    NONE = 1
+    GAS = 2
+    CODESIZE = 3
+
+    @classmethod
+    def from_string(cls, val):
+        match val:
+            case "none":
+                return cls.NONE
+            case "gas":
+                return cls.GAS
+            case "codesize":
+                return cls.CODESIZE
+        raise ValueError(f"unrecognized optimization level: {val}")
+
+    @classmethod
+    def default(cls):
+        return cls.GAS
+
+
+@dataclass
+class Settings:
+    compiler_version: Optional[str] = None
+    optimize: Optional[OptimizationLevel] = None
+    evm_version: Optional[str] = None
diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index 7550d047b5..4fec13e897 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -1,4 +1,5 @@
-from typing import Dict, Optional
+import contextlib
+from typing import Dict, Generator, Optional
 
 from vyper.exceptions import CompilerPanic
 from vyper.typing import OpcodeGasCost, OpcodeMap, OpcodeRulesetMap, OpcodeRulesetValue, OpcodeValue
@@ -206,17 +207,16 @@
 IR_OPCODES: OpcodeMap = {**OPCODES, **PSEUDO_OPCODES}
 
 
-def evm_wrapper(fn, *args, **kwargs):
-    def _wrapper(*args, **kwargs):
-        global active_evm_version
-        evm_version = kwargs.pop("evm_version", None) or DEFAULT_EVM_VERSION
-        active_evm_version = EVM_VERSIONS[evm_version]
-        try:
-            return fn(*args, **kwargs)
-        finally:
-            active_evm_version = EVM_VERSIONS[DEFAULT_EVM_VERSION]
-
-    return _wrapper
+@contextlib.contextmanager
+def anchor_evm_version(evm_version: Optional[str] = None) -> Generator:
+    global active_evm_version
+    anchor = active_evm_version
+    evm_version = evm_version or DEFAULT_EVM_VERSION
+    active_evm_version = EVM_VERSIONS[evm_version]
+    try:
+        yield
+    finally:
+        active_evm_version = anchor
 
 
 def _gas(value: OpcodeValue, idx: int) -> Optional[OpcodeRulesetValue]:
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 5a35b8f932..15a68a5079 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -3,6 +3,7 @@
 import math
 
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.settings import OptimizationLevel
 from vyper.evm.opcodes import get_opcodes, version_check
 from vyper.exceptions import CodegenPanic, CompilerPanic
 from vyper.utils import MemoryPositions
@@ -201,7 +202,7 @@ def apply_line_no_wrapper(*args, **kwargs):
 
 
 @apply_line_numbers
-def compile_to_assembly(code, no_optimize=False):
+def compile_to_assembly(code, optimize=OptimizationLevel.GAS):
     global _revert_label
     _revert_label = mksymbol("revert")
 
@@ -212,7 +213,7 @@ def compile_to_assembly(code, no_optimize=False):
     res = _compile_to_assembly(code)
 
     _add_postambles(res)
-    if not no_optimize:
+    if optimize != OptimizationLevel.NONE:
         _optimize_assembly(res)
     return res
 

From 5dc3ac7ec700d85886eda3d53a03abcf5c7efc9c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sat, 15 Jul 2023 11:20:53 -0400
Subject: [PATCH 081/161] feat: improve batch copy performance (#3483)

per cancun, eip-5656, this commit adds the use of mcopy for memory
copies. it also
- adds heuristics to use loops vs unrolled loops for batch copies.
- adds helper functions `vyper.codegen.core._opt_[gas,codesize,none]()`
  to detect optimization mode during codegen
- adds `--optimize none` to CLI options, with the intent of phasing out
  `--no-optimize` if the ergonomics are better.
---
 .github/workflows/era-tester.yml         |   4 +-
 setup.cfg                                |   1 -
 tests/compiler/test_opcodes.py           |   7 +-
 tests/parser/functions/test_slice.py     |  89 ++++++++--------
 tests/parser/types/test_dynamic_array.py |  12 +--
 vyper/cli/vyper_compile.py               |   2 +-
 vyper/codegen/core.py                    | 128 ++++++++++++++++++++---
 vyper/codegen/ir_node.py                 |  16 +--
 vyper/compiler/phases.py                 |   8 +-
 vyper/evm/opcodes.py                     |   5 +-
 vyper/ir/compile_ir.py                   |   1 +
 vyper/ir/optimizer.py                    |  44 +++++---
 vyper/utils.py                           |   3 +-
 13 files changed, 221 insertions(+), 99 deletions(-)

diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index 8a2a3e50ce..187b5c03a2 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -101,11 +101,11 @@ jobs:
       if: ${{ github.ref != 'refs/heads/master' }}
       run: |
         cd era-compiler-tester
-        cargo run --release --bin compiler-tester -- -v --path=tests/vyper/ --mode="M0B0 ${{ env.VYPER_VERSION }}"
+        cargo run --release --bin compiler-tester -- --path=tests/vyper/ --mode="M0B0 ${{ env.VYPER_VERSION }}"
 
     - name: Run tester (slow)
       # Run era tester across the LLVM optimization matrix
       if: ${{ github.ref == 'refs/heads/master' }}
       run: |
         cd era-compiler-tester
-        cargo run --release --bin compiler-tester -- -v --path=tests/vyper/ --mode="M*B* ${{ env.VYPER_VERSION }}"
+        cargo run --release --bin compiler-tester -- --path=tests/vyper/ --mode="M*B* ${{ env.VYPER_VERSION }}"
diff --git a/setup.cfg b/setup.cfg
index d18ffe2ac7..dd4a32a3ac 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -31,7 +31,6 @@ addopts = -n auto
 	--cov-report html
 	--cov-report xml
 	--cov=vyper
-	--hypothesis-show-statistics
 python_files = test_*.py
 testpaths = tests
 markers =
diff --git a/tests/compiler/test_opcodes.py b/tests/compiler/test_opcodes.py
index b9841b92f0..20f45ced6b 100644
--- a/tests/compiler/test_opcodes.py
+++ b/tests/compiler/test_opcodes.py
@@ -59,5 +59,8 @@ def test_get_opcodes(evm_version):
         assert "PUSH0" in ops
 
     if evm_version in ("cancun",):
-        assert "TLOAD" in ops
-        assert "TSTORE" in ops
+        for op in ("TLOAD", "TSTORE", "MCOPY"):
+            assert op in ops
+    else:
+        for op in ("TLOAD", "TSTORE", "MCOPY"):
+            assert op not in ops
diff --git a/tests/parser/functions/test_slice.py b/tests/parser/functions/test_slice.py
index 11d834bf42..f1b642b28d 100644
--- a/tests/parser/functions/test_slice.py
+++ b/tests/parser/functions/test_slice.py
@@ -1,4 +1,6 @@
+import hypothesis.strategies as st
 import pytest
+from hypothesis import given, settings
 
 from vyper.exceptions import ArgumentException
 
@@ -9,14 +11,6 @@ def _generate_bytes(length):
     return bytes(list(range(length)))
 
 
-# good numbers to try
-_fun_numbers = [0, 1, 5, 31, 32, 33, 64, 99, 100, 101]
-
-
-# [b"", b"\x01", b"\x02"...]
-_bytes_examples = [_generate_bytes(i) for i in _fun_numbers if i <= 100]
-
-
 def test_basic_slice(get_contract_with_gas_estimation):
     code = """
 @external
@@ -31,12 +25,16 @@ def slice_tower_test(inp1: Bytes[50]) -> Bytes[50]:
     assert x == b"klmnopqrst", x
 
 
-@pytest.mark.parametrize("bytesdata", _bytes_examples)
-@pytest.mark.parametrize("start", _fun_numbers)
+# note: optimization boundaries at 32, 64 and 320 depending on mode
+_draw_1024 = st.integers(min_value=0, max_value=1024)
+_draw_1024_1 = st.integers(min_value=1, max_value=1024)
+_bytes_1024 = st.binary(min_size=0, max_size=1024)
+
+
 @pytest.mark.parametrize("literal_start", (True, False))
-@pytest.mark.parametrize("length", _fun_numbers)
 @pytest.mark.parametrize("literal_length", (True, False))
-@pytest.mark.fuzzing
+@given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
+@settings(max_examples=25, deadline=None)
 def test_slice_immutable(
     get_contract,
     assert_compile_failed,
@@ -46,47 +44,48 @@ def test_slice_immutable(
     literal_start,
     length,
     literal_length,
+    length_bound,
 ):
     _start = start if literal_start else "start"
     _length = length if literal_length else "length"
 
     code = f"""
-IMMUTABLE_BYTES: immutable(Bytes[100])
-IMMUTABLE_SLICE: immutable(Bytes[100])
+IMMUTABLE_BYTES: immutable(Bytes[{length_bound}])
+IMMUTABLE_SLICE: immutable(Bytes[{length_bound}])
 
 @external
-def __init__(inp: Bytes[100], start: uint256, length: uint256):
+def __init__(inp: Bytes[{length_bound}], start: uint256, length: uint256):
     IMMUTABLE_BYTES = inp
     IMMUTABLE_SLICE = slice(IMMUTABLE_BYTES, {_start}, {_length})
 
 @external
-def do_splice() -> Bytes[100]:
+def do_splice() -> Bytes[{length_bound}]:
     return IMMUTABLE_SLICE
     """
 
+    def _get_contract():
+        return get_contract(code, bytesdata, start, length)
+
     if (
-        (start + length > 100 and literal_start and literal_length)
-        or (literal_length and length > 100)
-        or (literal_start and start > 100)
+        (start + length > length_bound and literal_start and literal_length)
+        or (literal_length and length > length_bound)
+        or (literal_start and start > length_bound)
         or (literal_length and length < 1)
     ):
-        assert_compile_failed(
-            lambda: get_contract(code, bytesdata, start, length), ArgumentException
-        )
-    elif start + length > len(bytesdata):
-        assert_tx_failed(lambda: get_contract(code, bytesdata, start, length))
+        assert_compile_failed(lambda: _get_contract(), ArgumentException)
+    elif start + length > len(bytesdata) or (len(bytesdata) > length_bound):
+        # deploy fail
+        assert_tx_failed(lambda: _get_contract())
     else:
-        c = get_contract(code, bytesdata, start, length)
+        c = _get_contract()
         assert c.do_splice() == bytesdata[start : start + length]
 
 
 @pytest.mark.parametrize("location", ("storage", "calldata", "memory", "literal", "code"))
-@pytest.mark.parametrize("bytesdata", _bytes_examples)
-@pytest.mark.parametrize("start", _fun_numbers)
 @pytest.mark.parametrize("literal_start", (True, False))
-@pytest.mark.parametrize("length", _fun_numbers)
 @pytest.mark.parametrize("literal_length", (True, False))
-@pytest.mark.fuzzing
+@given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
+@settings(max_examples=25, deadline=None)
 def test_slice_bytes(
     get_contract,
     assert_compile_failed,
@@ -97,9 +96,10 @@ def test_slice_bytes(
     literal_start,
     length,
     literal_length,
+    length_bound,
 ):
     if location == "memory":
-        spliced_code = "foo: Bytes[100] = inp"
+        spliced_code = f"foo: Bytes[{length_bound}] = inp"
         foo = "foo"
     elif location == "storage":
         spliced_code = "self.foo = inp"
@@ -120,31 +120,38 @@ def test_slice_bytes(
     _length = length if literal_length else "length"
 
     code = f"""
-foo: Bytes[100]
-IMMUTABLE_BYTES: immutable(Bytes[100])
+foo: Bytes[{length_bound}]
+IMMUTABLE_BYTES: immutable(Bytes[{length_bound}])
 @external
-def __init__(foo: Bytes[100]):
+def __init__(foo: Bytes[{length_bound}]):
     IMMUTABLE_BYTES = foo
 
 @external
-def do_slice(inp: Bytes[100], start: uint256, length: uint256) -> Bytes[100]:
+def do_slice(inp: Bytes[{length_bound}], start: uint256, length: uint256) -> Bytes[{length_bound}]:
     {spliced_code}
     return slice({foo}, {_start}, {_length})
     """
 
-    length_bound = len(bytesdata) if location == "literal" else 100
+    def _get_contract():
+        return get_contract(code, bytesdata)
+
+    data_length = len(bytesdata) if location == "literal" else length_bound
     if (
-        (start + length > length_bound and literal_start and literal_length)
-        or (literal_length and length > length_bound)
-        or (literal_start and start > length_bound)
+        (start + length > data_length and literal_start and literal_length)
+        or (literal_length and length > data_length)
+        or (location == "literal" and len(bytesdata) > length_bound)
+        or (literal_start and start > data_length)
         or (literal_length and length < 1)
     ):
-        assert_compile_failed(lambda: get_contract(code, bytesdata), ArgumentException)
+        assert_compile_failed(lambda: _get_contract(), ArgumentException)
+    elif len(bytesdata) > data_length:
+        # deploy fail
+        assert_tx_failed(lambda: _get_contract())
     elif start + length > len(bytesdata):
-        c = get_contract(code, bytesdata)
+        c = _get_contract()
         assert_tx_failed(lambda: c.do_slice(bytesdata, start, length))
     else:
-        c = get_contract(code, bytesdata)
+        c = _get_contract()
         assert c.do_slice(bytesdata, start, length) == bytesdata[start : start + length], code
 
 
diff --git a/tests/parser/types/test_dynamic_array.py b/tests/parser/types/test_dynamic_array.py
index cbae183fe4..9231d1979f 100644
--- a/tests/parser/types/test_dynamic_array.py
+++ b/tests/parser/types/test_dynamic_array.py
@@ -2,7 +2,6 @@
 
 import pytest
 
-from vyper.compiler.settings import OptimizationLevel
 from vyper.exceptions import (
     ArgumentException,
     ArrayIndexException,
@@ -1585,14 +1584,9 @@ def bar2() -> uint256:
         newFoo.b1[1][0][0].a1[0][1][1] + \\
         newFoo.b1[0][1][0].a1[0][0][0]
     """
-
-    if optimize == OptimizationLevel.NONE:
-        # fails at assembly stage with too many stack variables
-        assert_compile_failed(lambda: get_contract(code), Exception)
-    else:
-        c = get_contract(code)
-        assert c.bar() == [[[3, 7], [7, 3]], [[7, 3], [0, 0]]]
-        assert c.bar2() == 0
+    c = get_contract(code)
+    assert c.bar() == [[[3, 7], [7, 3]], [[7, 3], [0, 0]]]
+    assert c.bar2() == 0
 
 
 def test_tuple_of_lists(get_contract):
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 71e78dd666..55e0fc82b2 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -105,7 +105,7 @@ def _parse_args(argv):
         dest="evm_version",
     )
     parser.add_argument("--no-optimize", help="Do not optimize", action="store_true")
-    parser.add_argument("--optimize", help="Optimization flag", choices=["gas", "codesize"])
+    parser.add_argument("--optimize", help="Optimization flag", choices=["gas", "codesize", "none"])
     parser.add_argument(
         "--no-bytecode-metadata", help="Do not add metadata to bytecode", action="store_true"
     )
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 58d9db9889..5b16938e99 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -1,6 +1,11 @@
+import contextlib
+from typing import Generator
+
 from vyper import ast as vy_ast
 from vyper.codegen.ir_node import Encoding, IRnode
+from vyper.compiler.settings import OptimizationLevel
 from vyper.evm.address_space import CALLDATA, DATA, IMMUTABLES, MEMORY, STORAGE, TRANSIENT
+from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StructureException, TypeCheckFailure, TypeMismatch
 from vyper.semantics.types import (
     AddressT,
@@ -19,13 +24,7 @@
 from vyper.semantics.types.shortcuts import BYTES32_T, INT256_T, UINT256_T
 from vyper.semantics.types.subscriptable import SArrayT
 from vyper.semantics.types.user import EnumT
-from vyper.utils import (
-    GAS_CALLDATACOPY_WORD,
-    GAS_CODECOPY_WORD,
-    GAS_IDENTITY,
-    GAS_IDENTITYWORD,
-    ceil32,
-)
+from vyper.utils import GAS_COPY_WORD, GAS_IDENTITY, GAS_IDENTITYWORD, ceil32
 
 DYNAMIC_ARRAY_OVERHEAD = 1
 
@@ -90,12 +89,16 @@ def _identity_gas_bound(num_bytes):
     return GAS_IDENTITY + GAS_IDENTITYWORD * (ceil32(num_bytes) // 32)
 
 
+def _mcopy_gas_bound(num_bytes):
+    return GAS_COPY_WORD * ceil32(num_bytes) // 32
+
+
 def _calldatacopy_gas_bound(num_bytes):
-    return GAS_CALLDATACOPY_WORD * ceil32(num_bytes) // 32
+    return GAS_COPY_WORD * ceil32(num_bytes) // 32
 
 
 def _codecopy_gas_bound(num_bytes):
-    return GAS_CODECOPY_WORD * ceil32(num_bytes) // 32
+    return GAS_COPY_WORD * ceil32(num_bytes) // 32
 
 
 # Copy byte array word-for-word (including layout)
@@ -258,7 +261,6 @@ def copy_bytes(dst, src, length, length_bound):
         assert src.is_pointer and dst.is_pointer
 
         # fast code for common case where num bytes is small
-        # TODO expand this for more cases where num words is less than ~8
         if length_bound <= 32:
             copy_op = STORE(dst, LOAD(src))
             ret = IRnode.from_list(copy_op, annotation=annotation)
@@ -268,8 +270,12 @@ def copy_bytes(dst, src, length, length_bound):
             # special cases: batch copy to memory
             # TODO: iloadbytes
             if src.location == MEMORY:
-                copy_op = ["staticcall", "gas", 4, src, length, dst, length]
-                gas_bound = _identity_gas_bound(length_bound)
+                if version_check(begin="cancun"):
+                    copy_op = ["mcopy", dst, src, length]
+                    gas_bound = _mcopy_gas_bound(length_bound)
+                else:
+                    copy_op = ["staticcall", "gas", 4, src, length, dst, length]
+                    gas_bound = _identity_gas_bound(length_bound)
             elif src.location == CALLDATA:
                 copy_op = ["calldatacopy", dst, src, length]
                 gas_bound = _calldatacopy_gas_bound(length_bound)
@@ -876,6 +882,38 @@ def make_setter(left, right):
     return _complex_make_setter(left, right)
 
 
+_opt_level = OptimizationLevel.GAS
+
+
+@contextlib.contextmanager
+def anchor_opt_level(new_level: OptimizationLevel) -> Generator:
+    """
+    Set the global optimization level variable for the duration of this
+    context manager.
+    """
+    assert isinstance(new_level, OptimizationLevel)
+
+    global _opt_level
+    try:
+        tmp = _opt_level
+        _opt_level = new_level
+        yield
+    finally:
+        _opt_level = tmp
+
+
+def _opt_codesize():
+    return _opt_level == OptimizationLevel.CODESIZE
+
+
+def _opt_gas():
+    return _opt_level == OptimizationLevel.GAS
+
+
+def _opt_none():
+    return _opt_level == OptimizationLevel.NONE
+
+
 def _complex_make_setter(left, right):
     if right.value == "~empty" and left.location == MEMORY:
         # optimized memzero
@@ -891,11 +929,69 @@ def _complex_make_setter(left, right):
         assert is_tuple_like(left.typ)
         keys = left.typ.tuple_keys()
 
-    # if len(keyz) == 0:
-    #    return IRnode.from_list(["pass"])
+    if left.is_pointer and right.is_pointer and right.encoding == Encoding.VYPER:
+        # both left and right are pointers, see if we want to batch copy
+        # instead of unrolling the loop.
+        assert left.encoding == Encoding.VYPER
+        len_ = left.typ.memory_bytes_required
+
+        has_storage = STORAGE in (left.location, right.location)
+        if has_storage:
+            if _opt_codesize():
+                # assuming PUSH2, a single sstore(dst (sload src)) is 8 bytes,
+                # sstore(add (dst ofst), (sload (add (src ofst)))) is 16 bytes,
+                # whereas loop overhead is 16-17 bytes.
+                base_cost = 3
+                if left._optimized.is_literal:
+                    # code size is smaller since add is performed at compile-time
+                    base_cost += 1
+                if right._optimized.is_literal:
+                    base_cost += 1
+                # the formula is a heuristic, but it works.
+                # (CMC 2023-07-14 could get more detailed for PUSH1 vs
+                # PUSH2 etc but not worried about that too much now,
+                # it's probably better to add a proper unroll rule in the
+                # optimizer.)
+                should_batch_copy = len_ >= 32 * base_cost
+            elif _opt_gas():
+                # kind of arbitrary, but cut off when code used > ~160 bytes
+                should_batch_copy = len_ >= 32 * 10
+            else:
+                assert _opt_none()
+                # don't care, just generate the most readable version
+                should_batch_copy = True
+        else:
+            # find a cutoff for memory copy where identity is cheaper
+            # than unrolled mloads/mstores
+            # if MCOPY is available, mcopy is *always* better (except in
+            # the 1 word case, but that is already handled by copy_bytes).
+            if right.location == MEMORY and _opt_gas() and not version_check(begin="cancun"):
+                # cost for 0th word - (mstore dst (mload src))
+                base_unroll_cost = 12
+                nth_word_cost = base_unroll_cost
+                if not left._optimized.is_literal:
+                    # (mstore (add N dst) (mload src))
+                    nth_word_cost += 6
+                if not right._optimized.is_literal:
+                    # (mstore dst (mload (add N src)))
+                    nth_word_cost += 6
+
+                identity_base_cost = 115  # staticcall 4 gas dst len src len
+
+                n_words = ceil32(len_) // 32
+                should_batch_copy = (
+                    base_unroll_cost + (nth_word_cost * (n_words - 1)) >= identity_base_cost
+                )
+
+            # calldata to memory, code to memory, cancun, or codesize -
+            # batch copy is always better.
+            else:
+                should_batch_copy = True
+
+        if should_batch_copy:
+            return copy_bytes(left, right, len_, len_)
 
-    # general case
-    # TODO use copy_bytes when the generated code is above a certain size
+    # general case, unroll
     with left.cache_when_complex("_L") as (b1, left), right.cache_when_complex("_R") as (b2, right):
         for k in keys:
             l_i = get_element_ptr(left, k, array_bounds_check=False)
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index f7698fbabb..0895e5f02d 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -49,10 +49,7 @@ class Encoding(Enum):
 # this creates a magical block which maps to IR `with`
 class _WithBuilder:
     def __init__(self, ir_node, name, should_inline=False):
-        # TODO figure out how to fix this circular import
-        from vyper.ir.optimizer import optimize
-
-        if should_inline and optimize(ir_node).is_complex_ir:
+        if should_inline and ir_node._optimized.is_complex_ir:
             # this can only mean trouble
             raise CompilerPanic("trying to inline a complex IR node")
 
@@ -366,6 +363,13 @@ def is_pointer(self):
         # eventually
         return self.location is not None
 
+    @property  # probably could be cached_property but be paranoid
+    def _optimized(self):
+        # TODO figure out how to fix this circular import
+        from vyper.ir.optimizer import optimize
+
+        return optimize(self)
+
     # This function is slightly confusing but abstracts a common pattern:
     # when an IR value needs to be computed once and then cached as an
     # IR value (if it is expensive, or more importantly if its computation
@@ -382,13 +386,11 @@ def is_pointer(self):
     #   return builder.resolve(ret)
     # ```
     def cache_when_complex(self, name):
-        from vyper.ir.optimizer import optimize
-
         # for caching purposes, see if the ir_node will be optimized
         # because a non-literal expr could turn into a literal,
         # (e.g. `(add 1 2)`)
         # TODO this could really be moved into optimizer.py
-        should_inline = not optimize(self).is_complex_ir
+        should_inline = not self._optimized.is_complex_ir
 
         return _WithBuilder(self, name, should_inline)
 
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 99465809bd..4e1bd9e6c3 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -5,6 +5,7 @@
 
 from vyper import ast as vy_ast
 from vyper.codegen import module
+from vyper.codegen.core import anchor_opt_level
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
 from vyper.compiler.settings import OptimizationLevel, Settings
@@ -268,7 +269,9 @@ def generate_folded_ast(
     return vyper_module_folded, symbol_tables
 
 
-def generate_ir_nodes(global_ctx: GlobalContext, optimize: bool) -> tuple[IRnode, IRnode]:
+def generate_ir_nodes(
+    global_ctx: GlobalContext, optimize: OptimizationLevel
+) -> tuple[IRnode, IRnode]:
     """
     Generate the intermediate representation (IR) from the contextualized AST.
 
@@ -288,7 +291,8 @@ def generate_ir_nodes(global_ctx: GlobalContext, optimize: bool) -> tuple[IRnode
         IR to generate deployment bytecode
         IR to generate runtime bytecode
     """
-    ir_nodes, ir_runtime = module.generate_ir_for_module(global_ctx)
+    with anchor_opt_level(optimize):
+        ir_nodes, ir_runtime = module.generate_ir_for_module(global_ctx)
     if optimize != OptimizationLevel.NONE:
         ir_nodes = optimizer.optimize(ir_nodes)
         ir_runtime = optimizer.optimize(ir_runtime)
diff --git a/vyper/evm/opcodes.py b/vyper/evm/opcodes.py
index 4fec13e897..767d634c89 100644
--- a/vyper/evm/opcodes.py
+++ b/vyper/evm/opcodes.py
@@ -89,6 +89,7 @@
     "MSIZE": (0x59, 0, 1, 2),
     "GAS": (0x5A, 0, 1, 2),
     "JUMPDEST": (0x5B, 0, 0, 1),
+    "MCOPY": (0x5E, 3, 0, (None, None, None, None, None, 3)),
     "PUSH0": (0x5F, 0, 1, 2),
     "PUSH1": (0x60, 0, 1, 3),
     "PUSH2": (0x61, 0, 1, 3),
@@ -171,8 +172,8 @@
     "INVALID": (0xFE, 0, 0, 0),
     "DEBUG": (0xA5, 1, 0, 0),
     "BREAKPOINT": (0xA6, 0, 0, 0),
-    "TLOAD": (0x5C, 1, 1, 100),
-    "TSTORE": (0x5D, 2, 0, 100),
+    "TLOAD": (0x5C, 1, 1, (None, None, None, None, None, 100)),
+    "TSTORE": (0x5D, 2, 0, (None, None, None, None, None, 100)),
 }
 
 PSEUDO_OPCODES: OpcodeMap = {
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 15a68a5079..a9064a44fa 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -297,6 +297,7 @@ def _height_of(witharg):
         return o
 
     # batch copy from data section of the currently executing code to memory
+    # (probably should have named this dcopy but oh well)
     elif code.value == "dloadbytes":
         dst = code.args[0]
         src = code.args[1]
diff --git a/vyper/ir/optimizer.py b/vyper/ir/optimizer.py
index b13c6f79f8..40e02e79c7 100644
--- a/vyper/ir/optimizer.py
+++ b/vyper/ir/optimizer.py
@@ -2,6 +2,7 @@
 from typing import List, Optional, Tuple, Union
 
 from vyper.codegen.ir_node import IRnode
+from vyper.evm.opcodes import version_check
 from vyper.exceptions import CompilerPanic, StaticAssertionException
 from vyper.utils import (
     ceil32,
@@ -472,6 +473,7 @@ def finalize(val, args):
     if value == "seq":
         changed |= _merge_memzero(argz)
         changed |= _merge_calldataload(argz)
+        changed |= _merge_mload(argz)
         changed |= _remove_empty_seqs(argz)
 
         # (seq x) => (x) for cleanliness and
@@ -636,12 +638,26 @@ def _remove_empty_seqs(argz):
 
 
 def _merge_calldataload(argz):
-    # look for sequential operations copying from calldata to memory
-    # and merge them into a single calldatacopy operation
+    return _merge_load(argz, "calldataload", "calldatacopy")
+
+
+def _merge_dload(argz):
+    return _merge_load(argz, "dload", "dloadbytes")
+
+
+def _merge_mload(argz):
+    if not version_check(begin="cancun"):
+        return False
+    return _merge_load(argz, "mload", "mcopy")
+
+
+def _merge_load(argz, _LOAD, _COPY):
+    # look for sequential operations copying from X to Y
+    # and merge them into a single copy operation
     changed = False
     mstore_nodes: List = []
-    initial_mem_offset = 0
-    initial_calldata_offset = 0
+    initial_dst_offset = 0
+    initial_src_offset = 0
     total_length = 0
     idx = None
     for i, ir_node in enumerate(argz):
@@ -649,19 +665,19 @@ def _merge_calldataload(argz):
         if (
             ir_node.value == "mstore"
             and isinstance(ir_node.args[0].value, int)
-            and ir_node.args[1].value == "calldataload"
+            and ir_node.args[1].value == _LOAD
             and isinstance(ir_node.args[1].args[0].value, int)
         ):
             # mstore of a zero value
-            mem_offset = ir_node.args[0].value
-            calldata_offset = ir_node.args[1].args[0].value
+            dst_offset = ir_node.args[0].value
+            src_offset = ir_node.args[1].args[0].value
             if not mstore_nodes:
-                initial_mem_offset = mem_offset
-                initial_calldata_offset = calldata_offset
+                initial_dst_offset = dst_offset
+                initial_src_offset = src_offset
                 idx = i
             if (
-                initial_mem_offset + total_length == mem_offset
-                and initial_calldata_offset + total_length == calldata_offset
+                initial_dst_offset + total_length == dst_offset
+                and initial_src_offset + total_length == src_offset
             ):
                 mstore_nodes.append(ir_node)
                 total_length += 32
@@ -676,7 +692,7 @@ def _merge_calldataload(argz):
         if len(mstore_nodes) > 1:
             changed = True
             new_ir = IRnode.from_list(
-                ["calldatacopy", initial_mem_offset, initial_calldata_offset, total_length],
+                [_COPY, initial_dst_offset, initial_src_offset, total_length],
                 source_pos=mstore_nodes[0].source_pos,
             )
             # replace first copy operation with optimized node and remove the rest
@@ -684,8 +700,8 @@ def _merge_calldataload(argz):
             # note: del xs[k:l] deletes l - k items
             del argz[idx + 1 : idx + len(mstore_nodes)]
 
-        initial_mem_offset = 0
-        initial_calldata_offset = 0
+        initial_dst_offset = 0
+        initial_src_offset = 0
         total_length = 0
         mstore_nodes.clear()
 
diff --git a/vyper/utils.py b/vyper/utils.py
index 2440117d0c..3d9d9cb416 100644
--- a/vyper/utils.py
+++ b/vyper/utils.py
@@ -196,8 +196,7 @@ def calc_mem_gas(memsize):
 # Specific gas usage
 GAS_IDENTITY = 15
 GAS_IDENTITYWORD = 3
-GAS_CODECOPY_WORD = 3
-GAS_CALLDATACOPY_WORD = 3
+GAS_COPY_WORD = 3  # i.e., W_copy from YP
 
 # A decimal value can store multiples of 1/DECIMAL_DIVISOR
 MAX_DECIMAL_PLACES = 10

From 91d6e240f770414e1fbfd8648a166e9d2dba1698 Mon Sep 17 00:00:00 2001
From: trocher <rocher14@live.fr>
Date: Sun, 16 Jul 2023 18:24:44 +0200
Subject: [PATCH 082/161] fix displaying of ArgumentException (#3500)

The change is pretty self-explanatory.
```vyper
@internal
@view
def bar():
    pass

@external
def foo():
    self.bar(12)
```
Was failing to compile with:
`vyper.exceptions.ArgumentException: Invalid argument count for call to 'bar': expected 0 to 0, got 1`

And now fail to compile with:

`vyper.exceptions.ArgumentException: Invalid argument count for call to 'bar': expected 0, got 1`

Co-authored-by: Tanguy Rocher <tanguy.rocher@protonmail.com>
---
 vyper/ast/validation.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vyper/ast/validation.py b/vyper/ast/validation.py
index 7742d60c01..36a6a0484c 100644
--- a/vyper/ast/validation.py
+++ b/vyper/ast/validation.py
@@ -48,7 +48,7 @@ def validate_call_args(
             arg_count = (arg_count[0], 2**64)
 
         if arg_count[0] == arg_count[1]:
-            arg_count == arg_count[0]
+            arg_count = arg_count[0]
 
     if isinstance(node.func, vy_ast.Attribute):
         msg = f" for call to '{node.func.attr}'"

From 9e3b9a2b8ae55aa83b5450080f750be15f819de7 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 16 Jul 2023 20:14:35 -0400
Subject: [PATCH 083/161] feat: optimize dynarray and bytearray copies (#3499)

include the length word in the batch copy instead of issuing a separate
store instruction.

brings CurveStableSwapMetaNG.vy down by 315 bytes (~1.5%) and VaultV3.vy
by 45 bytes (0.25%) in both `--optimize codesize` and `--optimize gas`
modes.
---
 tests/parser/functions/test_slice.py |  4 +--
 vyper/codegen/core.py                | 46 ++++++++++++++++------------
 2 files changed, 28 insertions(+), 22 deletions(-)

diff --git a/tests/parser/functions/test_slice.py b/tests/parser/functions/test_slice.py
index f1b642b28d..3064ee308e 100644
--- a/tests/parser/functions/test_slice.py
+++ b/tests/parser/functions/test_slice.py
@@ -2,7 +2,7 @@
 import pytest
 from hypothesis import given, settings
 
-from vyper.exceptions import ArgumentException
+from vyper.exceptions import ArgumentException, TypeMismatch
 
 _fun_bytes32_bounds = [(0, 32), (3, 29), (27, 5), (0, 5), (5, 3), (30, 2)]
 
@@ -143,7 +143,7 @@ def _get_contract():
         or (literal_start and start > data_length)
         or (literal_length and length < 1)
     ):
-        assert_compile_failed(lambda: _get_contract(), ArgumentException)
+        assert_compile_failed(lambda: _get_contract(), (ArgumentException, TypeMismatch))
     elif len(bytesdata) > data_length:
         # deploy fail
         assert_tx_failed(lambda: _get_contract())
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 5b16938e99..f47f88ac85 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -110,25 +110,33 @@ def make_byte_array_copier(dst, src):
     _check_assign_bytes(dst, src)
 
     # TODO: remove this branch, copy_bytes and get_bytearray_length should handle
-    if src.value == "~empty":
+    if src.value == "~empty" or src.typ.maxlen == 0:
         # set length word to 0.
         return STORE(dst, 0)
 
     with src.cache_when_complex("src") as (b1, src):
-        with get_bytearray_length(src).cache_when_complex("len") as (b2, len_):
-            max_bytes = src.typ.maxlen
+        has_storage = STORAGE in (src.location, dst.location)
+        is_memory_copy = dst.location == src.location == MEMORY
+        batch_uses_identity = is_memory_copy and not version_check(begin="cancun")
+        if src.typ.maxlen <= 32 and (has_storage or batch_uses_identity):
+            # it's cheaper to run two load/stores instead of copy_bytes
 
             ret = ["seq"]
-
-            dst_ = bytes_data_ptr(dst)
-            src_ = bytes_data_ptr(src)
-
-            ret.append(copy_bytes(dst_, src_, len_, max_bytes))
-
-            # store length
+            # store length word
+            len_ = get_bytearray_length(src)
             ret.append(STORE(dst, len_))
 
-            return b1.resolve(b2.resolve(ret))
+            # store the single data word.
+            dst_data_ptr = bytes_data_ptr(dst)
+            src_data_ptr = bytes_data_ptr(src)
+            ret.append(STORE(dst_data_ptr, LOAD(src_data_ptr)))
+            return b1.resolve(ret)
+
+        # batch copy the bytearray (including length word) using copy_bytes
+        len_ = add_ofst(get_bytearray_length(src), 32)
+        max_bytes = src.typ.maxlen + 32
+        ret = copy_bytes(dst, src, len_, max_bytes)
+        return b1.resolve(ret)
 
 
 def bytes_data_ptr(ptr):
@@ -213,19 +221,17 @@ def _dynarray_make_setter(dst, src):
                 loop_body.annotation = f"{dst}[i] = {src}[i]"
 
                 ret.append(["repeat", i, 0, count, src.typ.count, loop_body])
+                # write the length word after data is copied
+                ret.append(STORE(dst, count))
 
             else:
                 element_size = src.typ.value_type.memory_bytes_required
-                # number of elements * size of element in bytes
-                n_bytes = _mul(count, element_size)
-                max_bytes = src.typ.count * element_size
-
-                src_ = dynarray_data_ptr(src)
-                dst_ = dynarray_data_ptr(dst)
-                ret.append(copy_bytes(dst_, src_, n_bytes, max_bytes))
+                # number of elements * size of element in bytes + length word
+                n_bytes = add_ofst(_mul(count, element_size), 32)
+                max_bytes = 32 + src.typ.count * element_size
 
-            # write the length word after data is copied
-            ret.append(STORE(dst, count))
+                # batch copy the entire dynarray, including length word
+                ret.append(copy_bytes(dst, src, n_bytes, max_bytes))
 
             return b1.resolve(b2.resolve(ret))
 

From cfba51719e10923cc93e40f6bca9a9d1d0d4a328 Mon Sep 17 00:00:00 2001
From: antazoey <jules@apeworx.io>
Date: Wed, 19 Jul 2023 11:27:10 -0500
Subject: [PATCH 084/161] fix: `tests` being imported in editable mode (#3510)

the `tests` package was being imported when vyper installed in editable
mode. this commit fixes by restricting the packages being exported in
`setup.py`.
---
 setup.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/setup.py b/setup.py
index 36a138aacd..bbf6e60f55 100644
--- a/setup.py
+++ b/setup.py
@@ -4,7 +4,7 @@
 import re
 import subprocess
 
-from setuptools import find_packages, setup
+from setuptools import setup
 
 extras_require = {
     "test": [
@@ -88,7 +88,7 @@ def _global_version(version):
     license="Apache License 2.0",
     keywords="ethereum evm smart contract language",
     include_package_data=True,
-    packages=find_packages(exclude=("tests", "docs")),
+    packages=["vyper"],
     python_requires=">=3.10,<4",
     py_modules=["vyper"],
     install_requires=[

From 6bd81dea55d0d0ef71b192bf30331a48a409f1d4 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 19 Jul 2023 10:15:57 -0700
Subject: [PATCH 085/161] chore: relax pragma parsing (#3511)

allow `# pragma ...` in addition to `#pragma ...`

also fix a small bug in version parsing (it only affected the error
message formatting, not the parsed version)
---
 vyper/ast/pre_parser.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/vyper/ast/pre_parser.py b/vyper/ast/pre_parser.py
index 35153af9d5..7e677b3b92 100644
--- a/vyper/ast/pre_parser.py
+++ b/vyper/ast/pre_parser.py
@@ -119,12 +119,12 @@ def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
                     validate_version_pragma(compiler_version, start)
                     settings.compiler_version = compiler_version
 
-                if string.startswith("#pragma "):
-                    pragma = string.removeprefix("#pragma").strip()
+                if contents.startswith("pragma "):
+                    pragma = contents.removeprefix("pragma ").strip()
                     if pragma.startswith("version "):
                         if settings.compiler_version is not None:
                             raise StructureException("pragma version specified twice!", start)
-                        compiler_version = pragma.removeprefix("version ".strip())
+                        compiler_version = pragma.removeprefix("version ").strip()
                         validate_version_pragma(compiler_version, start)
                         settings.compiler_version = compiler_version
 

From f928a0ff64bd3355f6410e460f6a710000e5f9d7 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Fri, 21 Jul 2023 23:32:06 +0800
Subject: [PATCH 086/161] chore: improve error message for invalid references
 to constants and immutables (#3529)

---
 .../exceptions/test_invalid_reference.py       | 18 ++++++++++++++++++
 vyper/semantics/analysis/utils.py              | 16 +++++++++++-----
 2 files changed, 29 insertions(+), 5 deletions(-)

diff --git a/tests/parser/exceptions/test_invalid_reference.py b/tests/parser/exceptions/test_invalid_reference.py
index 3aec6028e4..fe315e5cbf 100644
--- a/tests/parser/exceptions/test_invalid_reference.py
+++ b/tests/parser/exceptions/test_invalid_reference.py
@@ -37,6 +37,24 @@ def foo():
 def foo():
     int128 = 5
     """,
+    """
+a: public(constant(uint256)) = 1
+
+@external
+def foo():
+    b: uint256 = self.a
+    """,
+    """
+a: public(immutable(uint256))
+
+@external
+def __init__():
+    a = 123
+
+@external
+def foo():
+    b: uint256 = self.a
+    """,
 ]
 
 
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index f16b0c8c33..4f911764e0 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -180,24 +180,30 @@ def _find_fn(self, node):
         raise StructureException("Cannot determine type of this object", node)
 
     def types_from_Attribute(self, node):
+        is_self_reference = node.get("value.id") == "self"
         # variable attribute, e.g. `foo.bar`
         t = self.get_exact_type_from_node(node.value, include_type_exprs=True)
         name = node.attr
+
+        def _raise_invalid_reference(name, node):
+            raise InvalidReference(
+                f"'{name}' is not a storage variable, it should not be prepended with self", node
+            )
+
         try:
             s = t.get_member(name, node)
             if isinstance(s, VyperType):
                 # ex. foo.bar(). bar() is a ContractFunctionT
                 return [s]
+            if is_self_reference and (s.is_constant or s.is_immutable):
+                _raise_invalid_reference(name, node)
             # general case. s is a VarInfo, e.g. self.foo
             return [s.typ]
         except UnknownAttribute:
-            if node.get("value.id") != "self":
+            if not is_self_reference:
                 raise
             if name in self.namespace:
-                raise InvalidReference(
-                    f"'{name}' is not a storage variable, it should not be prepended with self",
-                    node,
-                ) from None
+                _raise_invalid_reference(name, node)
 
             suggestions_str = get_levenshtein_error_suggestions(name, t.members, 0.4)
             raise UndeclaredDefinition(

From 299352ef5ee3b9be2b334120091a7e80e10d2022 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Sun, 23 Jul 2023 15:11:29 -0700
Subject: [PATCH 087/161] feat: optimize dload/mstore sequences (#3525)

merge_dload was defined in 5dc3ac7, but was not applied.

this commit also adds a rewrite rule for single dload/mstore patterns,
any `(mstore dst (dload src))` (which compiles to a `codecopy` followed
by an `mload` and `mstore`) is rewritten to a `dloadbytes` (which
compiles directly to a `codecopy`).

this rule saves 4 bytes / ~10 gas per rewrite. for instance, it shaves
25 bytes off `VaultV3.vy`, 50 bytes off `CurveTricryptoOptimizedWETH.vy`
and 75 bytes off `CurveStableSwapMetaNG.vy` (basically 0.1%-0.3%).
---
 vyper/ir/optimizer.py | 14 ++++++++++++++
 1 file changed, 14 insertions(+)

diff --git a/vyper/ir/optimizer.py b/vyper/ir/optimizer.py
index 40e02e79c7..08c2168381 100644
--- a/vyper/ir/optimizer.py
+++ b/vyper/ir/optimizer.py
@@ -473,6 +473,8 @@ def finalize(val, args):
     if value == "seq":
         changed |= _merge_memzero(argz)
         changed |= _merge_calldataload(argz)
+        changed |= _merge_dload(argz)
+        changed |= _rewrite_mstore_dload(argz)
         changed |= _merge_mload(argz)
         changed |= _remove_empty_seqs(argz)
 
@@ -645,6 +647,18 @@ def _merge_dload(argz):
     return _merge_load(argz, "dload", "dloadbytes")
 
 
+def _rewrite_mstore_dload(argz):
+    changed = False
+    for i, arg in enumerate(argz):
+        if arg.value == "mstore" and arg.args[1].value == "dload":
+            dst = arg.args[0]
+            src = arg.args[1].args[0]
+            len_ = 32
+            argz[i] = IRnode.from_list(["dloadbytes", dst, src, len_], source_pos=arg.source_pos)
+            changed = True
+    return changed
+
+
 def _merge_mload(argz):
     if not version_check(begin="cancun"):
         return False

From 4ca1c81aaa4f3e950522a2115aa5fcd7d80c1b27 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 24 Jul 2023 09:23:04 -0700
Subject: [PATCH 088/161] chore: improve some error messages (#3524)

fix array bounds check and `create_*` builtin error messages

- array bounds checks, previously were something like

`clamp lt [mload, 640 <result>]`

- codesize check error message was missing for create builtins
- create failure error message was also missing
---
 vyper/builtins/functions.py | 16 +++++++++++++---
 vyper/codegen/core.py       |  1 +
 vyper/codegen/ir_node.py    |  8 ++++++++
 3 files changed, 22 insertions(+), 3 deletions(-)

diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 90214554b0..e1dcee6b8d 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -1634,7 +1634,9 @@ def _create_ir(value, buf, length, salt=None, checked=True):
     if not checked:
         return ret
 
-    return clamp_nonzero(ret)
+    ret = clamp_nonzero(ret)
+    ret.set_error_msg(f"{create_op} failed")
+    return ret
 
 
 # calculate the gas used by create for a given number of bytes
@@ -1830,7 +1832,10 @@ def _build_create_IR(self, expr, args, context, value, salt):
                 ir = ["seq"]
 
                 # make sure there is actually code at the target
-                ir.append(["assert", codesize])
+                check_codesize = ["assert", codesize]
+                ir.append(
+                    IRnode.from_list(check_codesize, error_msg="empty target (create_copy_of)")
+                )
 
                 # store the preamble at msize + 22 (zero padding)
                 preamble, preamble_len = _create_preamble(codesize)
@@ -1920,7 +1925,12 @@ def _build_create_IR(self, expr, args, context, value, salt, code_offset, raw_ar
                 # (code_ofst == (extcodesize target) would be empty
                 # initcode, which we disallow for hygiene reasons -
                 # same as `create_copy_of` on an empty target).
-                ir.append(["assert", ["sgt", codesize, 0]])
+                check_codesize = ["assert", ["sgt", codesize, 0]]
+                ir.append(
+                    IRnode.from_list(
+                        check_codesize, error_msg="empty target (create_from_blueprint)"
+                    )
+                )
 
                 # copy the target code into memory.
                 # layout starting from mem_ofst:
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index f47f88ac85..47a2c8c8d0 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -539,6 +539,7 @@ def _get_element_ptr_array(parent, key, array_bounds_check):
         # an array index, and the clamp will throw an error.
         # NOTE: there are optimization rules for this when ix or bound is literal
         ix = clamp("lt", ix, bound)
+        ix.set_error_msg(f"{parent.typ} bounds check")
 
     if parent.encoding == Encoding.ABI:
         if parent.location == STORAGE:
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index 0895e5f02d..fa015b293e 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -330,6 +330,14 @@ def is_complex_ir(self):
             and self.value.lower() not in do_not_cache
         )
 
+    # set an error message and push down into all children.
+    # useful for overriding an error message generated by a helper
+    # function with a more specific error message.
+    def set_error_msg(self, error_msg: str) -> None:
+        self.error_msg = error_msg
+        for arg in self.args:
+            arg.set_error_msg(error_msg)
+
     # get the unique symbols contained in this node, which provides
     # sanity check invariants for the optimizer.
     # cache because it's a perf hotspot. note that this (and other cached

From 408929fa31ae01dde4f7566bb7babbc7da5b6620 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 24 Jul 2023 18:55:13 -0700
Subject: [PATCH 089/161] feat: O(1) selector tables (#3496)

this commit replaces the existing linear entry point search with an O(1)
implementation. there are two methods depending on whether optimizing
for code size or gas, hash table with probing and perfect hashing using
a two-level technique.

the first method divides the selectors into buckets, uses
`method_id % n_buckets` as a "guess" to where to enter the selector
table and then jumps there and performs the familiar linear search for
the selector ("probing"). to avoid too large buckets, the jumptable
generator searches a range from ~`n_buckets * 0.85` to
`n_buckets * 1.15` to minimize worst-case probe depth; the average worst
case for 80-100 methods is 3 items per bucket and the worst worst case
is 4 items per bucket (presumably if you get really unlucky), see
`_bench_sparse()` in `vyper/codegen/jumptable_utils.py`. the average
bucket size is 1.6 methods.

the second method uses a perfect hashing technique. finding a single
magic which produces a perfect hash is infeasible for large `N`
(exponential, and in practice seems to run off a cliff around 10
 methods). to "get around" this, the methods are divided into buckets of
roughly size 10, and a magic is computed per bucket. several `n_buckets`
are tried, trying to minimize `n_buckets`. the code size overhead of
each bucket is roughly 5 bytes per bucket, which works out to ~20% per
method, see `_bench_dense()` in `vyper/codegen/jumptable_utils.py`.
then, the function selector is looked up in two steps - it loads the
magic for the bucket given by `method_id % n_buckets`, and then uses the
magic to compute the location of the function selector (and associated
metadata) in the data section. from there it loads the function
metadata, performs the calldatasize, callvalue and method id checks and
jumps into the function.

there is a gas vs code size tradeoff between the two methods - roughly
speaking, the sparse method requires ~69 gas in the best case (~109 gas
in the "average" case) and 12-22 bytes of code per method, while the
dense method requires ~212 gas across the board, and ~8 bytes of code
per method.

to accomplish this implementation-wise, the jumptable info is generated
in a new helper module, `vyper/codegen/jumptable_utils.py`. some
refactoring had to be additionally done to pull the calldatasize,
callvalue and method id checks from external function generation out
into a new selector section construction step in
`vyper/codegen/module.py`.

additionally, a new IR "data" directive was added, and an associated
assembly directive. the data segments in assembly are moved to the end
of the bytecode to ensure that data bytes which happen to look like
`PUSH` instructions do not mangle valid bytecode which comes after the
data section.
---
 .github/workflows/test.yml                    |  15 +-
 docs/compiling-a-contract.rst                 |  17 +
 docs/structure-of-a-contract.rst              |   4 +-
 tests/base_conftest.py                        |   4 +-
 .../vyper_json/test_parse_args_vyperjson.py   |   4 +-
 tests/compiler/__init__.py                    |   2 +
 tests/compiler/test_default_settings.py       |  27 ++
 tests/conftest.py                             |  10 +-
 tests/parser/functions/test_slice.py          |  15 +-
 tests/parser/test_selector_table.py           | 198 ++++++++
 tox.ini                                       |   6 +-
 vyper/ast/grammar.lark                        |   2 +-
 vyper/cli/vyper_compile.py                    |  19 +-
 vyper/cli/vyper_ir.py                         |   2 +-
 vyper/codegen/core.py                         |   3 +-
 .../codegen/function_definitions/__init__.py  |   2 +-
 vyper/codegen/function_definitions/common.py  |  59 ++-
 .../function_definitions/external_function.py |  63 +--
 vyper/codegen/ir_node.py                      |  14 +-
 vyper/codegen/jumptable_utils.py              | 195 ++++++++
 vyper/codegen/module.py                       | 442 +++++++++++++++---
 vyper/compiler/output.py                      |   6 +-
 vyper/compiler/settings.py                    |  13 +
 vyper/ir/compile_ir.py                        | 241 +++++++---
 24 files changed, 1133 insertions(+), 230 deletions(-)
 create mode 100644 tests/compiler/test_default_settings.py
 create mode 100644 tests/parser/test_selector_table.py
 create mode 100644 vyper/codegen/jumptable_utils.py

diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index b6399b3ae9..fd78e2fff8 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -78,11 +78,18 @@ jobs:
     runs-on: ubuntu-latest
     strategy:
       matrix:
-        python-version: [["3.10", "310"], ["3.11", "311"]]
+        python-version: [["3.11", "311"]]
         # run in modes: --optimize [gas, none, codesize]
-        flag: ["core", "no-opt", "codesize"]
+        opt-mode: ["gas", "none", "codesize"]
+        debug: [true, false]
+        # run across other python versions.# we don't really need to run all
+        # modes across all python versions - one is enough
+        include:
+          - python-version: ["3.10", "310"]
+            opt-mode: gas
+            debug: false
 
-    name: py${{ matrix.python-version[1] }}-${{ matrix.flag }}
+    name: py${{ matrix.python-version[1] }}-opt-${{ matrix.opt-mode }}${{ matrix.debug && '-debug' || '' }}
 
     steps:
     - uses: actions/checkout@v1
@@ -97,7 +104,7 @@ jobs:
       run: pip install tox
 
     - name: Run Tox
-      run: TOXENV=py${{ matrix.python-version[1] }}-${{ matrix.flag }} tox -r -- --reruns 10 --reruns-delay 1 -r aR tests/
+      run: TOXENV=py${{ matrix.python-version[1] }} tox -r -- --optimize ${{ matrix.opt-mode }} ${{ matrix.debug && '--enable-compiler-debug-mode' || '' }} --reruns 10 --reruns-delay 1 -r aR tests/
 
     - name: Upload Coverage
       uses: codecov/codecov-action@v1
diff --git a/docs/compiling-a-contract.rst b/docs/compiling-a-contract.rst
index 208771a5a9..6d1cdf98d7 100644
--- a/docs/compiling-a-contract.rst
+++ b/docs/compiling-a-contract.rst
@@ -113,6 +113,23 @@ Remix IDE
 
    While the Vyper version of the Remix IDE compiler is updated on a regular basis, it might be a bit behind the latest version found in the master branch of the repository. Make sure the byte code matches the output from your local compiler.
 
+.. _optimization-mode:
+
+Compiler Optimization Modes
+===========================
+
+The vyper CLI tool accepts an optimization mode ``"none"``, ``"codesize"``, or ``"gas"`` (default). It can be set using the ``--optimize`` flag. For example, invoking ``vyper --optimize codesize MyContract.vy`` will compile the contract, optimizing for code size. As a rough summary of the differences between gas and codesize mode, in gas optimized mode, the compiler will try to generate bytecode which minimizes gas (up to a point), including:
+
+* using a sparse selector table which optimizes for gas over codesize
+* inlining some constants, and
+* trying to unroll some loops, especially for data copies.
+
+In codesize optimized mode, the compiler will try hard to minimize codesize by
+
+* using a dense selector table
+* out-lining code, and
+* using more loops for data copies.
+
 
 .. _evm-version:
 
diff --git a/docs/structure-of-a-contract.rst b/docs/structure-of-a-contract.rst
index c7abb3e645..f58ab3b067 100644
--- a/docs/structure-of-a-contract.rst
+++ b/docs/structure-of-a-contract.rst
@@ -37,13 +37,13 @@ In the above examples, the contract will only compile with Vyper versions ``0.3.
 Optimization Mode
 -----------------
 
-The optimization mode can be one of ``"none"``, ``"codesize"``, or ``"gas"`` (default). For instance, the following contract will be compiled in a way which tries to minimize codesize:
+The optimization mode can be one of ``"none"``, ``"codesize"``, or ``"gas"`` (default). For example, adding the following line to a contract will cause it to try to optimize for codesize:
 
 .. code-block:: python
 
    #pragma optimize codesize
 
-The optimization mode can also be set as a compiler option. If the compiler option conflicts with the source code pragma, an exception will be raised and compilation will not continue.
+The optimization mode can also be set as a compiler option, which is documented in :ref:`optimization-mode`. If the compiler option conflicts with the source code pragma, an exception will be raised and compilation will not continue.
 
 EVM Version
 -----------------
diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index a78562e982..81e8dedc36 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -112,10 +112,10 @@ def w3(tester):
     return w3
 
 
-def _get_contract(w3, source_code, optimize, *args, **kwargs):
+def _get_contract(w3, source_code, optimize, *args, override_opt_level=None, **kwargs):
     settings = Settings()
     settings.evm_version = kwargs.pop("evm_version", None)
-    settings.optimize = optimize
+    settings.optimize = override_opt_level or optimize
     out = compiler.compile_code(
         source_code,
         # test that metadata gets generated
diff --git a/tests/cli/vyper_json/test_parse_args_vyperjson.py b/tests/cli/vyper_json/test_parse_args_vyperjson.py
index 08da5f1888..11e527843a 100644
--- a/tests/cli/vyper_json/test_parse_args_vyperjson.py
+++ b/tests/cli/vyper_json/test_parse_args_vyperjson.py
@@ -57,7 +57,7 @@ def test_to_stdout(tmp_path, capfd):
     _parse_args([path.absolute().as_posix()])
     out, _ = capfd.readouterr()
     output_json = json.loads(out)
-    assert _no_errors(output_json)
+    assert _no_errors(output_json), (INPUT_JSON, output_json)
     assert "contracts/foo.vy" in output_json["sources"]
     assert "contracts/bar.vy" in output_json["sources"]
 
@@ -71,7 +71,7 @@ def test_to_file(tmp_path):
     assert output_path.exists()
     with output_path.open() as fp:
         output_json = json.load(fp)
-    assert _no_errors(output_json)
+    assert _no_errors(output_json), (INPUT_JSON, output_json)
     assert "contracts/foo.vy" in output_json["sources"]
     assert "contracts/bar.vy" in output_json["sources"]
 
diff --git a/tests/compiler/__init__.py b/tests/compiler/__init__.py
index e69de29bb2..35a11f851b 100644
--- a/tests/compiler/__init__.py
+++ b/tests/compiler/__init__.py
@@ -0,0 +1,2 @@
+# prevent module name collision between tests/compiler/test_pre_parser.py
+# and tests/ast/test_pre_parser.py
diff --git a/tests/compiler/test_default_settings.py b/tests/compiler/test_default_settings.py
new file mode 100644
index 0000000000..ca05170b61
--- /dev/null
+++ b/tests/compiler/test_default_settings.py
@@ -0,0 +1,27 @@
+from vyper.codegen import core
+from vyper.compiler.phases import CompilerData
+from vyper.compiler.settings import OptimizationLevel, _is_debug_mode
+
+
+def test_default_settings():
+    source_code = ""
+    compiler_data = CompilerData(source_code)
+    _ = compiler_data.vyper_module  # force settings to be computed
+
+    assert compiler_data.settings.optimize == OptimizationLevel.GAS
+
+
+def test_default_opt_level():
+    assert OptimizationLevel.default() == OptimizationLevel.GAS
+
+
+def test_codegen_opt_level():
+    assert core._opt_level == OptimizationLevel.GAS
+    assert core._opt_gas() is True
+    assert core._opt_none() is False
+    assert core._opt_codesize() is False
+
+
+def test_debug_mode(pytestconfig):
+    debug_mode = pytestconfig.getoption("enable_compiler_debug_mode")
+    assert _is_debug_mode() == debug_mode
diff --git a/tests/conftest.py b/tests/conftest.py
index 9c9c4191b9..d519ca3100 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -10,7 +10,7 @@
 
 from vyper import compiler
 from vyper.codegen.ir_node import IRnode
-from vyper.compiler.settings import OptimizationLevel
+from vyper.compiler.settings import OptimizationLevel, _set_debug_mode
 from vyper.ir import compile_ir, optimizer
 
 from .base_conftest import VyperContract, _get_contract, zero_gas_price_strategy
@@ -43,6 +43,7 @@ def pytest_addoption(parser):
         default="gas",
         help="change optimization mode",
     )
+    parser.addoption("--enable-compiler-debug-mode", action="store_true")
 
 
 @pytest.fixture(scope="module")
@@ -51,6 +52,13 @@ def optimize(pytestconfig):
     return OptimizationLevel.from_string(flag)
 
 
+@pytest.fixture(scope="session", autouse=True)
+def debug(pytestconfig):
+    debug = pytestconfig.getoption("enable_compiler_debug_mode")
+    assert isinstance(debug, bool)
+    _set_debug_mode(debug)
+
+
 @pytest.fixture
 def keccak():
     return Web3.keccak
diff --git a/tests/parser/functions/test_slice.py b/tests/parser/functions/test_slice.py
index 3064ee308e..6229b47921 100644
--- a/tests/parser/functions/test_slice.py
+++ b/tests/parser/functions/test_slice.py
@@ -2,6 +2,7 @@
 import pytest
 from hypothesis import given, settings
 
+from vyper.compiler.settings import OptimizationLevel
 from vyper.exceptions import ArgumentException, TypeMismatch
 
 _fun_bytes32_bounds = [(0, 32), (3, 29), (27, 5), (0, 5), (5, 3), (30, 2)]
@@ -33,12 +34,15 @@ def slice_tower_test(inp1: Bytes[50]) -> Bytes[50]:
 
 @pytest.mark.parametrize("literal_start", (True, False))
 @pytest.mark.parametrize("literal_length", (True, False))
+@pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
-@settings(max_examples=25, deadline=None)
+@settings(max_examples=100, deadline=None)
+@pytest.mark.fuzzing
 def test_slice_immutable(
     get_contract,
     assert_compile_failed,
     assert_tx_failed,
+    opt_level,
     bytesdata,
     start,
     literal_start,
@@ -64,7 +68,7 @@ def do_splice() -> Bytes[{length_bound}]:
     """
 
     def _get_contract():
-        return get_contract(code, bytesdata, start, length)
+        return get_contract(code, bytesdata, start, length, override_opt_level=opt_level)
 
     if (
         (start + length > length_bound and literal_start and literal_length)
@@ -84,12 +88,15 @@ def _get_contract():
 @pytest.mark.parametrize("location", ("storage", "calldata", "memory", "literal", "code"))
 @pytest.mark.parametrize("literal_start", (True, False))
 @pytest.mark.parametrize("literal_length", (True, False))
+@pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
-@settings(max_examples=25, deadline=None)
+@settings(max_examples=100, deadline=None)
+@pytest.mark.fuzzing
 def test_slice_bytes(
     get_contract,
     assert_compile_failed,
     assert_tx_failed,
+    opt_level,
     location,
     bytesdata,
     start,
@@ -133,7 +140,7 @@ def do_slice(inp: Bytes[{length_bound}], start: uint256, length: uint256) -> Byt
     """
 
     def _get_contract():
-        return get_contract(code, bytesdata)
+        return get_contract(code, bytesdata, override_opt_level=opt_level)
 
     data_length = len(bytesdata) if location == "literal" else length_bound
     if (
diff --git a/tests/parser/test_selector_table.py b/tests/parser/test_selector_table.py
new file mode 100644
index 0000000000..01a83698b7
--- /dev/null
+++ b/tests/parser/test_selector_table.py
@@ -0,0 +1,198 @@
+import hypothesis.strategies as st
+import pytest
+from hypothesis import given, settings
+
+import vyper.utils as utils
+from vyper.codegen.jumptable_utils import (
+    generate_dense_jumptable_info,
+    generate_sparse_jumptable_buckets,
+)
+from vyper.compiler.settings import OptimizationLevel
+
+
+@given(
+    n_methods=st.integers(min_value=1, max_value=100),
+    seed=st.integers(min_value=0, max_value=2**64 - 1),
+)
+@pytest.mark.fuzzing
+@settings(max_examples=10, deadline=None)
+def test_sparse_jumptable_probe_depth(n_methods, seed):
+    sigs = [f"foo{i + seed}()" for i in range(n_methods)]
+    _, buckets = generate_sparse_jumptable_buckets(sigs)
+    bucket_sizes = [len(bucket) for bucket in buckets.values()]
+
+    # generally bucket sizes should be bounded at around 4, but
+    # just test that they don't get really out of hand
+    assert max(bucket_sizes) <= 8
+
+    # generally mean bucket size should be around 1.6, here just
+    # test they don't get really out of hand
+    assert sum(bucket_sizes) / len(bucket_sizes) <= 4
+
+
+@given(
+    n_methods=st.integers(min_value=4, max_value=100),
+    seed=st.integers(min_value=0, max_value=2**64 - 1),
+)
+@pytest.mark.fuzzing
+@settings(max_examples=10, deadline=None)
+def test_dense_jumptable_bucket_size(n_methods, seed):
+    sigs = [f"foo{i + seed}()" for i in range(n_methods)]
+    n = len(sigs)
+    buckets = generate_dense_jumptable_info(sigs)
+    n_buckets = len(buckets)
+
+    # generally should be around 14 buckets per 100 methods, here
+    # we test they don't get really out of hand
+    assert n_buckets / n < 0.4 or n < 10
+
+
+@pytest.mark.parametrize("opt_level", list(OptimizationLevel))
+# dense selector table packing boundaries at 256 and 65336
+@pytest.mark.parametrize("max_calldata_bytes", [255, 256, 65336])
+@settings(max_examples=5, deadline=None)
+@given(
+    seed=st.integers(min_value=0, max_value=2**64 - 1),
+    max_default_args=st.integers(min_value=0, max_value=4),
+    default_fn_mutability=st.sampled_from(["", "@pure", "@view", "@nonpayable", "@payable"]),
+)
+@pytest.mark.fuzzing
+def test_selector_table_fuzz(
+    max_calldata_bytes,
+    seed,
+    max_default_args,
+    opt_level,
+    default_fn_mutability,
+    w3,
+    get_contract,
+    assert_tx_failed,
+    get_logs,
+):
+    def abi_sig(calldata_words, i, n_default_args):
+        args = [] if not calldata_words else [f"uint256[{calldata_words}]"]
+        args.extend(["uint256"] * n_default_args)
+        argstr = ",".join(args)
+        return f"foo{seed + i}({argstr})"
+
+    def generate_func_def(mutability, calldata_words, i, n_default_args):
+        arglist = [] if not calldata_words else [f"x: uint256[{calldata_words}]"]
+        for j in range(n_default_args):
+            arglist.append(f"x{j}: uint256 = 0")
+        args = ", ".join(arglist)
+        _log_return = f"log _Return({i})" if mutability == "@payable" else ""
+
+        return f"""
+@external
+{mutability}
+def foo{seed + i}({args}) -> uint256:
+    {_log_return}
+    return {i}
+    """
+
+    @given(
+        methods=st.lists(
+            st.tuples(
+                st.sampled_from(["@pure", "@view", "@nonpayable", "@payable"]),
+                st.integers(min_value=0, max_value=max_calldata_bytes // 32),
+                # n bytes to strip from calldata
+                st.integers(min_value=1, max_value=4),
+                # n default args
+                st.integers(min_value=0, max_value=max_default_args),
+            ),
+            min_size=1,
+            max_size=100,
+        )
+    )
+    @settings(max_examples=25)
+    def _test(methods):
+        func_defs = "\n".join(
+            generate_func_def(m, s, i, d) for i, (m, s, _, d) in enumerate(methods)
+        )
+
+        if default_fn_mutability == "":
+            default_fn_code = ""
+        elif default_fn_mutability in ("@nonpayable", "@payable"):
+            default_fn_code = f"""
+@external
+{default_fn_mutability}
+def __default__():
+    log CalledDefault()
+            """
+        else:
+            # can't log from pure/view functions, just test that it returns
+            default_fn_code = """
+@external
+def __default__():
+    pass
+            """
+
+        code = f"""
+event CalledDefault:
+    pass
+
+event _Return:
+    val: uint256
+
+{func_defs}
+
+{default_fn_code}
+        """
+
+        c = get_contract(code, override_opt_level=opt_level)
+
+        for i, (mutability, n_calldata_words, n_strip_bytes, n_default_args) in enumerate(methods):
+            funcname = f"foo{seed + i}"
+            func = getattr(c, funcname)
+
+            for j in range(n_default_args + 1):
+                args = [[1] * n_calldata_words] if n_calldata_words else []
+                args.extend([1] * j)
+
+                # check the function returns as expected
+                assert func(*args) == i
+
+                method_id = utils.method_id(abi_sig(n_calldata_words, i, j))
+
+                argsdata = b"\x00" * (n_calldata_words * 32 + j * 32)
+
+                # do payable check
+                if mutability == "@payable":
+                    tx = func(*args, transact={"value": 1})
+                    (event,) = get_logs(tx, c, "_Return")
+                    assert event.args.val == i
+                else:
+                    hexstr = (method_id + argsdata).hex()
+                    txdata = {"to": c.address, "data": hexstr, "value": 1}
+                    assert_tx_failed(lambda: w3.eth.send_transaction(txdata))
+
+                # now do calldatasize check
+                # strip some bytes
+                calldata = (method_id + argsdata)[:-n_strip_bytes]
+                hexstr = calldata.hex()
+                tx_params = {"to": c.address, "data": hexstr}
+                if n_calldata_words == 0 and j == 0:
+                    # no args, hit default function
+                    if default_fn_mutability == "":
+                        assert_tx_failed(lambda: w3.eth.send_transaction(tx_params))
+                    elif default_fn_mutability == "@payable":
+                        # we should be able to send eth to it
+                        tx_params["value"] = 1
+                        tx = w3.eth.send_transaction(tx_params)
+                        logs = get_logs(tx, c, "CalledDefault")
+                        assert len(logs) == 1
+                    else:
+                        tx = w3.eth.send_transaction(tx_params)
+
+                        # note: can't emit logs from view/pure functions,
+                        # so the logging is not tested.
+                        if default_fn_mutability == "@nonpayable":
+                            logs = get_logs(tx, c, "CalledDefault")
+                            assert len(logs) == 1
+
+                        # check default function reverts
+                        tx_params["value"] = 1
+                        assert_tx_failed(lambda: w3.eth.send_transaction(tx_params))
+                else:
+                    assert_tx_failed(lambda: w3.eth.send_transaction(tx_params))
+
+    _test()
diff --git a/tox.ini b/tox.ini
index 9b63630f58..c949354dfe 100644
--- a/tox.ini
+++ b/tox.ini
@@ -1,6 +1,6 @@
 [tox]
 envlist =
-    py{310,311}-{core,no-opt}
+    py{310,311}
     lint
     mypy
     docs
@@ -8,9 +8,7 @@ envlist =
 [testenv]
 usedevelop = True
 commands =
-    core: pytest -m "not fuzzing" --showlocals {posargs:tests/}
-    no-opt: pytest -m "not fuzzing" --showlocals --optimize none {posargs:tests/}
-    codesize: pytest -m "not fuzzing" --showlocals --optimize codesize {posargs:tests/}
+    pytest -m "not fuzzing" --showlocals {posargs:tests/}
 basepython =
     py310: python3.10
     py311: python3.11
diff --git a/vyper/ast/grammar.lark b/vyper/ast/grammar.lark
index 77806d734c..ca9979b2a3 100644
--- a/vyper/ast/grammar.lark
+++ b/vyper/ast/grammar.lark
@@ -72,8 +72,8 @@ function_def: [decorators] function_sig ":" body
 _EVENT_DECL: "event"
 event_member: NAME ":" type
 indexed_event_arg: NAME ":" "indexed" "(" type ")"
-event_body: _NEWLINE _INDENT ((event_member | indexed_event_arg) _NEWLINE)+ _DEDENT
 // Events which use no args use a pass statement instead
+event_body: _NEWLINE _INDENT (((event_member | indexed_event_arg ) _NEWLINE)+ | _PASS _NEWLINE) _DEDENT
 event_def: _EVENT_DECL NAME ":" ( event_body | _PASS )
 
 // Enums
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 55e0fc82b2..9c96d55040 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -11,7 +11,12 @@
 import vyper.codegen.ir_node as ir_node
 from vyper.cli import vyper_json
 from vyper.cli.utils import extract_file_interface_imports, get_interface_file_path
-from vyper.compiler.settings import VYPER_TRACEBACK_LIMIT, OptimizationLevel, Settings
+from vyper.compiler.settings import (
+    VYPER_TRACEBACK_LIMIT,
+    OptimizationLevel,
+    Settings,
+    _set_debug_mode,
+)
 from vyper.evm.opcodes import DEFAULT_EVM_VERSION, EVM_VERSIONS
 from vyper.typing import ContractCodes, ContractPath, OutputFormats
 
@@ -105,7 +110,12 @@ def _parse_args(argv):
         dest="evm_version",
     )
     parser.add_argument("--no-optimize", help="Do not optimize", action="store_true")
-    parser.add_argument("--optimize", help="Optimization flag", choices=["gas", "codesize", "none"])
+    parser.add_argument(
+        "--optimize",
+        help="Optimization flag (defaults to 'gas')",
+        choices=["gas", "codesize", "none"],
+    )
+    parser.add_argument("--debug", help="Compile in debug mode", action="store_true")
     parser.add_argument(
         "--no-bytecode-metadata", help="Do not add metadata to bytecode", action="store_true"
     )
@@ -151,6 +161,9 @@ def _parse_args(argv):
 
     output_formats = tuple(uniq(args.format.split(",")))
 
+    if args.debug:
+        _set_debug_mode(True)
+
     if args.no_optimize and args.optimize:
         raise ValueError("Cannot use `--no-optimize` and `--optimize` at the same time!")
 
@@ -165,7 +178,7 @@ def _parse_args(argv):
         settings.evm_version = args.evm_version
 
     if args.verbose:
-        print(f"using `{settings}`", file=sys.stderr)
+        print(f"cli specified: `{settings}`", file=sys.stderr)
 
     compiled = compile_files(
         args.input_files,
diff --git a/vyper/cli/vyper_ir.py b/vyper/cli/vyper_ir.py
index 6831f39473..1f90badcaa 100755
--- a/vyper/cli/vyper_ir.py
+++ b/vyper/cli/vyper_ir.py
@@ -55,7 +55,7 @@ def compile_to_ir(input_file, output_formats, show_gas_estimates=False):
         compiler_data["asm"] = asm
 
     if "bytecode" in output_formats:
-        (bytecode, _srcmap) = compile_ir.assembly_to_evm(asm)
+        bytecode, _ = compile_ir.assembly_to_evm(asm)
         compiler_data["bytecode"] = "0x" + bytecode.hex()
 
     return compiler_data
diff --git a/vyper/codegen/core.py b/vyper/codegen/core.py
index 47a2c8c8d0..e1d3ea12b4 100644
--- a/vyper/codegen/core.py
+++ b/vyper/codegen/core.py
@@ -1033,7 +1033,6 @@ def eval_seq(ir_node):
     return None
 
 
-# TODO move return checks to vyper/semantics/validation
 def is_return_from_function(node):
     if isinstance(node, vy_ast.Expr) and node.get("value.func.id") in (
         "raw_revert",
@@ -1045,6 +1044,8 @@ def is_return_from_function(node):
     return False
 
 
+# TODO this is almost certainly duplicated with check_terminus_node
+# in vyper/semantics/analysis/local.py
 def check_single_exit(fn_node):
     _check_return_body(fn_node, fn_node.body)
     for node in fn_node.get_descendants(vy_ast.If):
diff --git a/vyper/codegen/function_definitions/__init__.py b/vyper/codegen/function_definitions/__init__.py
index 08bebbb4a5..94617bef35 100644
--- a/vyper/codegen/function_definitions/__init__.py
+++ b/vyper/codegen/function_definitions/__init__.py
@@ -1 +1 @@
-from .common import generate_ir_for_function  # noqa
+from .common import FuncIR, generate_ir_for_function  # noqa
diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index fd65b12265..3fd5ce0b29 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -4,7 +4,7 @@
 
 import vyper.ast as vy_ast
 from vyper.codegen.context import Constancy, Context
-from vyper.codegen.core import check_single_exit, getpos
+from vyper.codegen.core import check_single_exit
 from vyper.codegen.function_definitions.external_function import generate_ir_for_external_function
 from vyper.codegen.function_definitions.internal_function import generate_ir_for_internal_function
 from vyper.codegen.global_context import GlobalContext
@@ -63,12 +63,32 @@ def internal_function_label(self, is_ctor_context: bool = False) -> str:
         return self.ir_identifier + suffix
 
 
+class FuncIR:
+    pass
+
+
+@dataclass
+class EntryPointInfo:
+    func_t: ContractFunctionT
+    min_calldatasize: int  # the min calldata required for this entry point
+    ir_node: IRnode  # the ir for this entry point
+
+
+@dataclass
+class ExternalFuncIR(FuncIR):
+    entry_points: dict[str, EntryPointInfo]  # map from abi sigs to entry points
+    common_ir: IRnode  # the "common" code for the function
+
+
+@dataclass
+class InternalFuncIR(FuncIR):
+    func_ir: IRnode  # the code for the function
+
+
+# TODO: should split this into external and internal ir generation?
 def generate_ir_for_function(
-    code: vy_ast.FunctionDef,
-    global_ctx: GlobalContext,
-    skip_nonpayable_check: bool,
-    is_ctor_context: bool = False,
-) -> IRnode:
+    code: vy_ast.FunctionDef, global_ctx: GlobalContext, is_ctor_context: bool = False
+) -> FuncIR:
     """
     Parse a function and produce IR code for the function, includes:
         - Signature method if statement
@@ -82,6 +102,7 @@ def generate_ir_for_function(
     func_t._ir_info = _FuncIRInfo(func_t)
 
     # Validate return statements.
+    # XXX: This should really be in semantics pass.
     check_single_exit(code)
 
     callees = func_t.called_functions
@@ -106,19 +127,23 @@ def generate_ir_for_function(
     )
 
     if func_t.is_internal:
-        assert skip_nonpayable_check is False
-        o = generate_ir_for_internal_function(code, func_t, context)
+        ret: FuncIR = InternalFuncIR(generate_ir_for_internal_function(code, func_t, context))
+        func_t._ir_info.gas_estimate = ret.func_ir.gas  # type: ignore
     else:
-        if func_t.is_payable:
-            assert skip_nonpayable_check is False  # nonsense
-        o = generate_ir_for_external_function(code, func_t, context, skip_nonpayable_check)
-
-    o.source_pos = getpos(code)
+        kwarg_handlers, common = generate_ir_for_external_function(code, func_t, context)
+        entry_points = {
+            k: EntryPointInfo(func_t, mincalldatasize, ir_node)
+            for k, (mincalldatasize, ir_node) in kwarg_handlers.items()
+        }
+        ret = ExternalFuncIR(entry_points, common)
+        # note: this ignores the cost of traversing selector table
+        func_t._ir_info.gas_estimate = ret.common_ir.gas
 
     frame_size = context.memory_allocator.size_of_mem - MemoryPositions.RESERVED_MEMORY
 
     frame_info = FrameInfo(allocate_start, frame_size, context.vars)
 
+    # XXX: when can this happen?
     if func_t._ir_info.frame_info is None:
         func_t._ir_info.set_frame_info(frame_info)
     else:
@@ -128,9 +153,7 @@ def generate_ir_for_function(
         # adjust gas estimate to include cost of mem expansion
         # frame_size of external function includes all private functions called
         # (note: internal functions do not need to adjust gas estimate since
-        # it is already accounted for by the caller.)
-        o.add_gas_estimate += calc_mem_gas(func_t._ir_info.frame_info.mem_used)  # type: ignore
-
-    func_t._ir_info.gas_estimate = o.gas
+        mem_expansion_cost = calc_mem_gas(func_t._ir_info.frame_info.mem_used)  # type: ignore
+        ret.common_ir.add_gas_estimate += mem_expansion_cost  # type: ignore
 
-    return o
+    return ret
diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 207356860b..32236e9aad 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -1,6 +1,3 @@
-from typing import Any, List
-
-import vyper.utils as util
 from vyper.codegen.abi_encoder import abi_encoding_matches_vyper
 from vyper.codegen.context import Context, VariableRecord
 from vyper.codegen.core import get_element_ptr, getpos, make_setter, needs_clamp
@@ -15,7 +12,7 @@
 
 # register function args with the local calling context.
 # also allocate the ones that live in memory (i.e. kwargs)
-def _register_function_args(func_t: ContractFunctionT, context: Context) -> List[IRnode]:
+def _register_function_args(func_t: ContractFunctionT, context: Context) -> list[IRnode]:
     ret = []
     # the type of the calldata
     base_args_t = TupleT(tuple(arg.typ for arg in func_t.positional_args))
@@ -52,13 +49,9 @@ def _register_function_args(func_t: ContractFunctionT, context: Context) -> List
     return ret
 
 
-def _annotated_method_id(abi_sig):
-    method_id = util.method_id_int(abi_sig)
-    annotation = f"{hex(method_id)}: {abi_sig}"
-    return IRnode(method_id, annotation=annotation)
-
-
-def _generate_kwarg_handlers(func_t: ContractFunctionT, context: Context) -> List[Any]:
+def _generate_kwarg_handlers(
+    func_t: ContractFunctionT, context: Context
+) -> dict[str, tuple[int, IRnode]]:
     # generate kwarg handlers.
     # since they might come in thru calldata or be default,
     # allocate them in memory and then fill it in based on calldata or default,
@@ -75,7 +68,6 @@ def handler_for(calldata_kwargs, default_kwargs):
         calldata_args_t = TupleT(list(arg.typ for arg in calldata_args))
 
         abi_sig = func_t.abi_signature_for_kwargs(calldata_kwargs)
-        method_id = _annotated_method_id(abi_sig)
 
         calldata_kwargs_ofst = IRnode(
             4, location=CALLDATA, typ=calldata_args_t, encoding=Encoding.ABI
@@ -88,11 +80,6 @@ def handler_for(calldata_kwargs, default_kwargs):
         args_abi_t = calldata_args_t.abi_type
         calldata_min_size = args_abi_t.min_size() + 4
 
-        # note we don't need the check if calldata_min_size == 4,
-        # because the global calldatasize check ensures that already.
-        if calldata_min_size > 4:
-            ret.append(["assert", ["ge", "calldatasize", calldata_min_size]])
-
         # TODO optimize make_setter by using
         # TupleT(list(arg.typ for arg in calldata_kwargs + default_kwargs))
         # (must ensure memory area is contiguous)
@@ -123,11 +110,10 @@ def handler_for(calldata_kwargs, default_kwargs):
 
         ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
 
-        method_id_check = ["eq", "_calldata_method_id", method_id]
-        ret = ["if", method_id_check, ret]
-        return ret
+        # return something we can turn into ExternalFuncIR
+        return abi_sig, calldata_min_size, ret
 
-    ret = ["seq"]
+    ret = {}
 
     keyword_args = func_t.keyword_args
 
@@ -139,9 +125,12 @@ def handler_for(calldata_kwargs, default_kwargs):
         calldata_kwargs = keyword_args[:i]
         default_kwargs = keyword_args[i:]
 
-        ret.append(handler_for(calldata_kwargs, default_kwargs))
+        sig, calldata_min_size, ir_node = handler_for(calldata_kwargs, default_kwargs)
+        ret[sig] = calldata_min_size, ir_node
+
+    sig, calldata_min_size, ir_node = handler_for(keyword_args, [])
 
-    ret.append(handler_for(keyword_args, []))
+    ret[sig] = calldata_min_size, ir_node
 
     return ret
 
@@ -149,7 +138,7 @@ def handler_for(calldata_kwargs, default_kwargs):
 # TODO it would be nice if this returned a data structure which were
 # amenable to generating a jump table instead of the linear search for
 # method_id we have now.
-def generate_ir_for_external_function(code, func_t, context, skip_nonpayable_check):
+def generate_ir_for_external_function(code, func_t, context):
     # TODO type hints:
     # def generate_ir_for_external_function(
     #    code: vy_ast.FunctionDef,
@@ -174,14 +163,6 @@ def generate_ir_for_external_function(code, func_t, context, skip_nonpayable_che
     # generate the main body of the function
     body += handle_base_args
 
-    if not func_t.is_payable and not skip_nonpayable_check:
-        # if the contract contains payable functions, but this is not one of them
-        # add an assertion that the value of the call is zero
-        nonpayable_check = IRnode.from_list(
-            ["assert", ["iszero", "callvalue"]], error_msg="nonpayable check"
-        )
-        body.append(nonpayable_check)
-
     body += nonreentrant_pre
 
     body += [parse_body(code.body, context, ensure_terminated=True)]
@@ -201,22 +182,10 @@ def generate_ir_for_external_function(code, func_t, context, skip_nonpayable_che
     if context.return_type is not None:
         exit_sequence_args += ["ret_ofst", "ret_len"]
     # wrap the exit in a labeled block
-    exit = ["label", func_t._ir_info.exit_sequence_label, exit_sequence_args, exit_sequence]
+    exit_ = ["label", func_t._ir_info.exit_sequence_label, exit_sequence_args, exit_sequence]
 
     # the ir which comprises the main body of the function,
     # besides any kwarg handling
-    func_common_ir = ["seq", body, exit]
-
-    if func_t.is_fallback or func_t.is_constructor:
-        ret = ["seq"]
-        # add a goto to make the function entry look like other functions
-        # (for zksync interpreter)
-        ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
-        ret.append(func_common_ir)
-    else:
-        ret = kwarg_handlers
-        # sneak the base code into the kwarg handler
-        # TODO rethink this / make it clearer
-        ret[-1][-1].append(func_common_ir)
+    func_common_ir = IRnode.from_list(["seq", body, exit_], source_pos=getpos(code))
 
-    return IRnode.from_list(ret, source_pos=getpos(code))
+    return kwarg_handlers, func_common_ir
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index fa015b293e..6cb0a07281 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -148,6 +148,13 @@ def _check(condition, err):
 
             self.valency = 1
             self._gas = 5
+        elif isinstance(self.value, bytes):
+            # a literal bytes value, probably inside a "data" node.
+            _check(len(self.args) == 0, "bytes can't have arguments")
+
+            self.valency = 0
+            self._gas = 0
+
         elif isinstance(self.value, str):
             # Opcodes and pseudo-opcodes (e.g. clamp)
             if self.value.upper() in get_ir_opcodes():
@@ -264,8 +271,11 @@ def _check(condition, err):
                 self.valency = 0
                 self._gas = sum([arg.gas for arg in self.args])
             elif self.value == "label":
-                if not self.args[1].value == "var_list":
-                    raise CodegenPanic(f"2nd argument to label must be var_list, {self}")
+                _check(
+                    self.args[1].value == "var_list",
+                    f"2nd argument to label must be var_list, {self}",
+                )
+                _check(len(args) == 3, f"label should have 3 args but has {len(args)}, {self}")
                 self.valency = 0
                 self._gas = 1 + sum(t.gas for t in self.args)
             elif self.value == "unique_symbol":
diff --git a/vyper/codegen/jumptable_utils.py b/vyper/codegen/jumptable_utils.py
new file mode 100644
index 0000000000..6987ce90bd
--- /dev/null
+++ b/vyper/codegen/jumptable_utils.py
@@ -0,0 +1,195 @@
+# helper module which implements jumptable for function selection
+import math
+from dataclasses import dataclass
+
+from vyper.utils import method_id_int
+
+
+@dataclass
+class Signature:
+    method_id: int
+    payable: bool
+
+
+# bucket for dense function
+@dataclass
+class Bucket:
+    bucket_id: int
+    magic: int
+    method_ids: list[int]
+
+    @property
+    def image(self):
+        return _image_of([s for s in self.method_ids], self.magic)
+
+    @property
+    # return method ids, sorted by by their image
+    def method_ids_image_order(self):
+        return [x[1] for x in sorted(zip(self.image, self.method_ids))]
+
+    @property
+    def bucket_size(self):
+        return len(self.method_ids)
+
+
+BITS_MAGIC = 24  # a constant which produced good results, see _bench_dense()
+
+
+def _image_of(xs, magic):
+    bits_shift = BITS_MAGIC
+
+    # take the upper bits from the multiplication for more entropy
+    # can we do better using primes of some sort?
+    return [((x * magic) >> bits_shift) % len(xs) for x in xs]
+
+
+class _Failure(Exception):
+    pass
+
+
+def find_magic_for(xs):
+    for m in range(2**16):
+        test = _image_of(xs, m)
+        if len(test) == len(set(test)):
+            return m
+
+    raise _Failure(f"Could not find hash for {xs}")
+
+
+def _mk_buckets(method_ids, n_buckets):
+    buckets = {}
+    for x in method_ids:
+        t = x % n_buckets
+        buckets.setdefault(t, [])
+        buckets[t].append(x)
+    return buckets
+
+
+# two layer method for generating perfect hash
+# first get "reasonably good" distribution by using
+# method_id % len(method_ids)
+# second, get the magic for the bucket.
+def _dense_jumptable_info(method_ids, n_buckets):
+    buckets = _mk_buckets(method_ids, n_buckets)
+
+    ret = {}
+    for bucket_id, method_ids in buckets.items():
+        magic = find_magic_for(method_ids)
+        ret[bucket_id] = Bucket(bucket_id, magic, method_ids)
+
+    return ret
+
+
+START_BUCKET_SIZE = 5
+
+
+# this is expensive! for 80 methods, costs about 350ms and probably
+# linear in # of methods.
+# see _bench_perfect()
+# note the buckets are NOT in order!
+def generate_dense_jumptable_info(signatures):
+    method_ids = [method_id_int(sig) for sig in signatures]
+    n = len(signatures)
+    # start at bucket size of 5 and try to improve (generally
+    # speaking we want as few buckets as possible)
+    n_buckets = (n // START_BUCKET_SIZE) + 1
+    ret = None
+    tried_exhaustive = False
+    while n_buckets > 0:
+        try:
+            # print(f"trying {n_buckets} (bucket size {n // n_buckets})")
+            ret = _dense_jumptable_info(method_ids, n_buckets)
+        except _Failure:
+            if ret is not None:
+                break
+
+            # we have not tried exhaustive search. try really hard
+            # to find a valid jumptable at the cost of performance
+            if not tried_exhaustive:
+                # print("failed with guess! trying exhaustive search.")
+                n_buckets = n
+                tried_exhaustive = True
+                continue
+            else:
+                raise RuntimeError(f"Could not generate jumptable! {signatures}")
+        n_buckets -= 1
+
+    return ret
+
+
+# note the buckets are NOT in order!
+def generate_sparse_jumptable_buckets(signatures):
+    method_ids = [method_id_int(sig) for sig in signatures]
+    n = len(signatures)
+
+    # search a range of buckets to try to minimize bucket size
+    # (doing the range search improves worst worst bucket size from 9 to 4,
+    # see _bench_sparse)
+    lo = max(1, math.floor(n * 0.85))
+    hi = max(1, math.ceil(n * 1.15))
+    stats = {}
+    for i in range(lo, hi + 1):
+        buckets = _mk_buckets(method_ids, i)
+
+        stats[i] = buckets
+
+    min_max_bucket_size = hi + 1  # smallest max_bucket_size
+    # find the smallest i which gives us the smallest max_bucket_size
+    for i, buckets in stats.items():
+        max_bucket_size = max(len(bucket) for bucket in buckets.values())
+        if max_bucket_size < min_max_bucket_size:
+            min_max_bucket_size = max_bucket_size
+            ret = i, buckets
+
+    assert ret is not None
+    return ret
+
+
+# benchmark for quality of buckets
+def _bench_dense(N=1_000, n_methods=100):
+    import random
+
+    stats = []
+    for i in range(N):
+        seed = random.randint(0, 2**64 - 1)
+        # "large" contracts in prod hit about ~50 methods, test with
+        # double the limit
+        sigs = [f"foo{i + seed}()" for i in range(n_methods)]
+
+        xs = generate_dense_jumptable_info(sigs)
+        print(f"found. n buckets {len(xs)}")
+        stats.append(xs)
+
+    def mean(xs):
+        return sum(xs) / len(xs)
+
+    avg_n_buckets = mean([len(jt) for jt in stats])
+    # usually around ~14 buckets per 100 sigs
+    # N=10, time=3.6s
+    print(f"average N buckets: {avg_n_buckets}")
+
+
+def _bench_sparse(N=10_000, n_methods=80):
+    import random
+
+    stats = []
+    for _ in range(N):
+        seed = random.randint(0, 2**64 - 1)
+        sigs = [f"foo{i + seed}()" for i in range(n_methods)]
+        _, buckets = generate_sparse_jumptable_buckets(sigs)
+
+        bucket_sizes = [len(bucket) for bucket in buckets.values()]
+        worst_bucket_size = max(bucket_sizes)
+        mean_bucket_size = sum(bucket_sizes) / len(bucket_sizes)
+        stats.append((worst_bucket_size, mean_bucket_size))
+
+    # N=10_000, time=9s
+    # range 0.85*n - 1.15*n
+    # worst worst bucket size: 4
+    # avg worst bucket size: 3.0018
+    # worst mean bucket size: 2.0
+    # avg mean bucket size: 1.579112583664968
+    print("worst worst bucket size:", max(x[0] for x in stats))
+    print("avg worst bucket size:", sum(x[0] for x in stats) / len(stats))
+    print("worst mean bucket size:", max(x[1] for x in stats))
+    print("avg mean bucket size:", sum(x[1] for x in stats) / len(stats))
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index b98e4d0f86..ebe7f92cf2 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -1,12 +1,15 @@
-# a contract.vy -- all functions and constructor
+# a compilation unit -- all functions and constructor
 
 from typing import Any, List
 
+from vyper.codegen import core, jumptable_utils
 from vyper.codegen.core import shr
 from vyper.codegen.function_definitions import generate_ir_for_function
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.settings import _is_debug_mode
 from vyper.exceptions import CompilerPanic
+from vyper.utils import method_id_int
 
 
 def _topsort_helper(functions, lookup):
@@ -47,92 +50,349 @@ def _is_payable(func_ast):
     return func_ast._metadata["type"].is_payable
 
 
-# codegen for all runtime functions + callvalue/calldata checks + method selector routines
-def _runtime_ir(runtime_functions, global_ctx):
-    # categorize the runtime functions because we will organize the runtime
-    # code into the following sections:
-    # payable functions, nonpayable functions, fallback function, internal_functions
-    internal_functions = [f for f in runtime_functions if _is_internal(f)]
+def _annotated_method_id(abi_sig):
+    method_id = method_id_int(abi_sig)
+    annotation = f"{hex(method_id)}: {abi_sig}"
+    return IRnode(method_id, annotation=annotation)
 
-    external_functions = [f for f in runtime_functions if not _is_internal(f)]
-    default_function = next((f for f in external_functions if _is_fallback(f)), None)
 
-    # functions that need to go exposed in the selector section
-    regular_functions = [f for f in external_functions if not _is_fallback(f)]
-    payables = [f for f in regular_functions if _is_payable(f)]
-    nonpayables = [f for f in regular_functions if not _is_payable(f)]
+def label_for_entry_point(abi_sig, entry_point):
+    method_id = method_id_int(abi_sig)
+    return f"{entry_point.func_t._ir_info.ir_identifier}{method_id}"
 
-    # create a map of the IR functions since they might live in both
-    # runtime and deploy code (if init function calls them)
-    internal_functions_ir: list[IRnode] = []
 
-    for func_ast in internal_functions:
-        func_ir = generate_ir_for_function(func_ast, global_ctx, False)
-        internal_functions_ir.append(func_ir)
+# adapt whatever generate_ir_for_function gives us into an IR node
+def _ir_for_fallback_or_ctor(func_ast, *args, **kwargs):
+    func_t = func_ast._metadata["type"]
+    assert func_t.is_fallback or func_t.is_constructor
+
+    ret = ["seq"]
+    if not func_t.is_payable:
+        callvalue_check = ["assert", ["iszero", "callvalue"]]
+        ret.append(IRnode.from_list(callvalue_check, error_msg="nonpayable check"))
+
+    func_ir = generate_ir_for_function(func_ast, *args, **kwargs)
+    assert len(func_ir.entry_points) == 1
+
+    # add a goto to make the function entry look like other functions
+    # (for zksync interpreter)
+    ret.append(["goto", func_t._ir_info.external_function_base_entry_label])
+    ret.append(func_ir.common_ir)
+
+    return IRnode.from_list(ret)
+
+
+def _ir_for_internal_function(func_ast, *args, **kwargs):
+    return generate_ir_for_function(func_ast, *args, **kwargs).func_ir
+
+
+def _generate_external_entry_points(external_functions, global_ctx):
+    entry_points = {}  # map from ABI sigs to ir code
+    sig_of = {}  # reverse map from method ids to abi sig
+
+    for code in external_functions:
+        func_ir = generate_ir_for_function(code, global_ctx)
+        for abi_sig, entry_point in func_ir.entry_points.items():
+            assert abi_sig not in entry_points
+            entry_points[abi_sig] = entry_point
+            sig_of[method_id_int(abi_sig)] = abi_sig
+
+        # stick function common body into final entry point to save a jump
+        ir_node = IRnode.from_list(["seq", entry_point.ir_node, func_ir.common_ir])
+        entry_point.ir_node = ir_node
+
+    return entry_points, sig_of
+
+
+# codegen for all runtime functions + callvalue/calldata checks,
+# with O(1) jumptable for selector table.
+# uses two level strategy: uses `method_id % n_buckets` to descend
+# into a bucket (of about 8-10 items), and then uses perfect hash
+# to select the final function.
+# costs about 212 gas for typical function and 8 bytes of code (+ ~87 bytes of global overhead)
+def _selector_section_dense(external_functions, global_ctx):
+    function_irs = []
 
-    # for some reason, somebody may want to deploy a contract with no
-    # external functions, or more likely, a "pure data" contract which
-    # contains immutables
     if len(external_functions) == 0:
-        # TODO: prune internal functions in this case? dead code eliminator
-        # might not eliminate them, since internal function jumpdest is at the
-        # first instruction in the contract.
-        runtime = ["seq"] + internal_functions_ir
-        return runtime
+        return IRnode.from_list(["seq"])
 
-    # note: if the user does not provide one, the default fallback function
-    # reverts anyway. so it does not hurt to batch the payable check.
-    default_is_nonpayable = default_function is None or not _is_payable(default_function)
+    entry_points, sig_of = _generate_external_entry_points(external_functions, global_ctx)
 
-    # when a contract has a nonpayable default function,
-    # we can do a single check for all nonpayable functions
-    batch_payable_check = len(nonpayables) > 0 and default_is_nonpayable
-    skip_nonpayable_check = batch_payable_check
+    # generate the label so the jumptable works
+    for abi_sig, entry_point in entry_points.items():
+        label = label_for_entry_point(abi_sig, entry_point)
+        ir_node = ["label", label, ["var_list"], entry_point.ir_node]
+        function_irs.append(IRnode.from_list(ir_node))
 
-    selector_section = ["seq"]
+    jumptable_info = jumptable_utils.generate_dense_jumptable_info(entry_points.keys())
+    n_buckets = len(jumptable_info)
+
+    #  bucket magic <2 bytes> | bucket location <2 bytes> | bucket size <1 byte>
+    # TODO: can make it smaller if the largest bucket magic <= 255
+    SZ_BUCKET_HEADER = 5
 
-    for func_ast in payables:
-        func_ir = generate_ir_for_function(func_ast, global_ctx, False)
-        selector_section.append(func_ir)
+    selector_section = ["seq"]
 
-    if batch_payable_check:
-        nonpayable_check = IRnode.from_list(
-            ["assert", ["iszero", "callvalue"]], error_msg="nonpayable check"
+    bucket_id = ["mod", "_calldata_method_id", n_buckets]
+    bucket_hdr_location = [
+        "add",
+        ["symbol", "BUCKET_HEADERS"],
+        ["mul", bucket_id, SZ_BUCKET_HEADER],
+    ]
+    # get bucket header
+    dst = 32 - SZ_BUCKET_HEADER
+    assert dst >= 0
+
+    if _is_debug_mode():
+        selector_section.append(["assert", ["eq", "msize", 0]])
+
+    selector_section.append(["codecopy", dst, bucket_hdr_location, SZ_BUCKET_HEADER])
+
+    # figure out the minimum number of bytes we can use to encode
+    # min_calldatasize in function info
+    largest_mincalldatasize = max(f.min_calldatasize for f in entry_points.values())
+    FN_METADATA_BYTES = (largest_mincalldatasize.bit_length() + 7) // 8
+
+    func_info_size = 4 + 2 + FN_METADATA_BYTES
+    # grab function info.
+    # method id <4 bytes> | label <2 bytes> | func info <1-3 bytes>
+    # func info (1-3 bytes, packed) for: expected calldatasize, is_nonpayable bit
+    # NOTE: might be able to improve codesize if we use variable # of bytes
+    # per bucket
+
+    hdr_info = IRnode.from_list(["mload", 0])
+    with hdr_info.cache_when_complex("hdr_info") as (b1, hdr_info):
+        bucket_location = ["and", 0xFFFF, shr(8, hdr_info)]
+        bucket_magic = shr(24, hdr_info)
+        bucket_size = ["and", 0xFF, hdr_info]
+        # ((method_id * bucket_magic) >> BITS_MAGIC) % bucket_size
+        func_id = [
+            "mod",
+            shr(jumptable_utils.BITS_MAGIC, ["mul", bucket_magic, "_calldata_method_id"]),
+            bucket_size,
+        ]
+        func_info_location = ["add", bucket_location, ["mul", func_id, func_info_size]]
+        dst = 32 - func_info_size
+        assert func_info_size >= SZ_BUCKET_HEADER  # otherwise mload will have dirty bytes
+        assert dst >= 0
+        selector_section.append(b1.resolve(["codecopy", dst, func_info_location, func_info_size]))
+
+    func_info = IRnode.from_list(["mload", 0])
+    fn_metadata_mask = 2 ** (FN_METADATA_BYTES * 8) - 1
+    calldatasize_mask = fn_metadata_mask - 1  # ex. 0xFFFE
+    with func_info.cache_when_complex("func_info") as (b1, func_info):
+        x = ["seq"]
+
+        # expected calldatasize always satisfies (x - 4) % 32 == 0
+        # the lower 5 bits are always 0b00100, so we can use those
+        # bits for other purposes.
+        is_nonpayable = ["and", 1, func_info]
+        expected_calldatasize = ["and", calldatasize_mask, func_info]
+
+        label_bits_ofst = FN_METADATA_BYTES * 8
+        function_label = ["and", 0xFFFF, shr(label_bits_ofst, func_info)]
+        method_id_bits_ofst = (FN_METADATA_BYTES + 2) * 8
+        function_method_id = shr(method_id_bits_ofst, func_info)
+
+        # check method id is right, if not then fallback.
+        # need to check calldatasize >= 4 in case there are
+        # trailing 0s in the method id.
+        calldatasize_valid = ["gt", "calldatasize", 3]
+        method_id_correct = ["eq", function_method_id, "_calldata_method_id"]
+        should_fallback = ["iszero", ["and", calldatasize_valid, method_id_correct]]
+        x.append(["if", should_fallback, ["goto", "fallback"]])
+
+        # assert callvalue == 0 if nonpayable
+        bad_callvalue = ["mul", is_nonpayable, "callvalue"]
+        # assert calldatasize at least minimum for the abi type
+        bad_calldatasize = ["lt", "calldatasize", expected_calldatasize]
+        failed_entry_conditions = ["or", bad_callvalue, bad_calldatasize]
+        check_entry_conditions = IRnode.from_list(
+            ["assert", ["iszero", failed_entry_conditions]],
+            error_msg="bad calldatasize or callvalue",
         )
-        selector_section.append(nonpayable_check)
+        x.append(check_entry_conditions)
+        x.append(["jump", function_label])
+        selector_section.append(b1.resolve(x))
+
+    bucket_headers = ["data", "BUCKET_HEADERS"]
+
+    for bucket_id, bucket in sorted(jumptable_info.items()):
+        bucket_headers.append(bucket.magic.to_bytes(2, "big"))
+        bucket_headers.append(["symbol", f"bucket_{bucket_id}"])
+        # note: buckets are usually ~10 items. to_bytes would
+        # fail if the int is too big.
+        bucket_headers.append(bucket.bucket_size.to_bytes(1, "big"))
+
+    selector_section.append(bucket_headers)
+
+    for bucket_id, bucket in jumptable_info.items():
+        function_infos = ["data", f"bucket_{bucket_id}"]
+        # sort function infos by their image.
+        for method_id in bucket.method_ids_image_order:
+            abi_sig = sig_of[method_id]
+            entry_point = entry_points[abi_sig]
+
+            method_id_bytes = method_id.to_bytes(4, "big")
+            symbol = ["symbol", label_for_entry_point(abi_sig, entry_point)]
+            func_metadata_int = entry_point.min_calldatasize | int(
+                not entry_point.func_t.is_payable
+            )
+            func_metadata = func_metadata_int.to_bytes(FN_METADATA_BYTES, "big")
 
-    for func_ast in nonpayables:
-        func_ir = generate_ir_for_function(func_ast, global_ctx, skip_nonpayable_check)
-        selector_section.append(func_ir)
+            function_infos.extend([method_id_bytes, symbol, func_metadata])
 
-    if default_function:
-        fallback_ir = generate_ir_for_function(
-            default_function, global_ctx, skip_nonpayable_check=False
-        )
-    else:
-        fallback_ir = IRnode.from_list(
-            ["revert", 0, 0], annotation="Default function", error_msg="fallback function"
-        )
+        selector_section.append(function_infos)
 
-    # ensure the external jumptable section gets closed out
-    # (for basic block hygiene and also for zksync interpreter)
-    # NOTE: this jump gets optimized out in assembly since the
-    # fallback label is the immediate next instruction,
-    close_selector_section = ["goto", "fallback"]
+    ret = ["seq", ["with", "_calldata_method_id", shr(224, ["calldataload", 0]), selector_section]]
 
-    global_calldatasize_check = ["if", ["lt", "calldatasize", 4], ["goto", "fallback"]]
+    ret.extend(function_irs)
 
-    runtime = [
-        "seq",
-        global_calldatasize_check,
-        ["with", "_calldata_method_id", shr(224, ["calldataload", 0]), selector_section],
-        close_selector_section,
-        ["label", "fallback", ["var_list"], fallback_ir],
-    ]
+    return ret
 
-    runtime.extend(internal_functions_ir)
 
-    return runtime
+# codegen for all runtime functions + callvalue/calldata checks,
+# with O(1) jumptable for selector table.
+# uses two level strategy: uses `method_id % n_methods` to calculate
+# a bucket, and then descends into linear search from there.
+# costs about 126 gas for typical (nonpayable, >0 args, avg bucket size 1.5)
+# function and 24 bytes of code (+ ~23 bytes of global overhead)
+def _selector_section_sparse(external_functions, global_ctx):
+    ret = ["seq"]
+
+    if len(external_functions) == 0:
+        return ret
+
+    entry_points, sig_of = _generate_external_entry_points(external_functions, global_ctx)
+
+    n_buckets, buckets = jumptable_utils.generate_sparse_jumptable_buckets(entry_points.keys())
+
+    # 2 bytes for bucket location
+    SZ_BUCKET_HEADER = 2
+
+    if n_buckets > 1:
+        bucket_id = ["mod", "_calldata_method_id", n_buckets]
+        bucket_hdr_location = [
+            "add",
+            ["symbol", "selector_buckets"],
+            ["mul", bucket_id, SZ_BUCKET_HEADER],
+        ]
+        # get bucket header
+        dst = 32 - SZ_BUCKET_HEADER
+        assert dst >= 0
+
+        if _is_debug_mode():
+            ret.append(["assert", ["eq", "msize", 0]])
+
+        ret.append(["codecopy", dst, bucket_hdr_location, SZ_BUCKET_HEADER])
+
+        jumpdest = IRnode.from_list(["mload", 0])
+        # don't particularly like using `jump` here since it can cause
+        # issues for other backends, consider changing `goto` to allow
+        # dynamic jumps, or adding some kind of jumptable instruction
+        ret.append(["jump", jumpdest])
+
+        jumptable_data = ["data", "selector_buckets"]
+        for i in range(n_buckets):
+            if i in buckets:
+                bucket_label = f"selector_bucket_{i}"
+                jumptable_data.append(["symbol", bucket_label])
+            else:
+                # empty bucket
+                jumptable_data.append(["symbol", "fallback"])
+
+        ret.append(jumptable_data)
+
+    for bucket_id, bucket in buckets.items():
+        bucket_label = f"selector_bucket_{bucket_id}"
+        ret.append(["label", bucket_label, ["var_list"], ["seq"]])
+
+        handle_bucket = ["seq"]
+
+        for method_id in bucket:
+            sig = sig_of[method_id]
+            entry_point = entry_points[sig]
+            func_t = entry_point.func_t
+            expected_calldatasize = entry_point.min_calldatasize
+
+            dispatch = ["seq"]  # code to dispatch into the function
+            skip_callvalue_check = func_t.is_payable
+            skip_calldatasize_check = expected_calldatasize == 4
+            bad_callvalue = [0] if skip_callvalue_check else ["callvalue"]
+            bad_calldatasize = (
+                [0] if skip_calldatasize_check else ["lt", "calldatasize", expected_calldatasize]
+            )
+
+            dispatch.append(
+                IRnode.from_list(
+                    ["assert", ["iszero", ["or", bad_callvalue, bad_calldatasize]]],
+                    error_msg="bad calldatasize or callvalue",
+                )
+            )
+            # we could skip a jumpdest per method if we out-lined the entry point
+            # so the dispatcher looks just like -
+            # ```(if (eq <calldata_method_id> method_id)
+            #   (goto entry_point_label))```
+            # it would another optimization for patterns like
+            # `if ... (goto)` though.
+            dispatch.append(entry_point.ir_node)
+
+            method_id_check = ["eq", "_calldata_method_id", _annotated_method_id(sig)]
+            has_trailing_zeroes = method_id.to_bytes(4, "big").endswith(b"\x00")
+            if has_trailing_zeroes:
+                # if the method id check has trailing 0s, we need to include
+                # a calldatasize check to distinguish from when not enough
+                # bytes are provided for the method id in calldata.
+                method_id_check = ["and", ["ge", "calldatasize", 4], method_id_check]
+            handle_bucket.append(["if", method_id_check, dispatch])
+
+        # close out the bucket with a goto fallback so we don't keep searching
+        handle_bucket.append(["goto", "fallback"])
+
+        ret.append(handle_bucket)
+
+    ret = ["seq", ["with", "_calldata_method_id", shr(224, ["calldataload", 0]), ret]]
+
+    return ret
+
+
+# codegen for all runtime functions + callvalue/calldata checks,
+# O(n) linear search for the method id
+# mainly keep this in for backends which cannot handle the indirect jump
+# in selector_section_dense and selector_section_sparse
+def _selector_section_linear(external_functions, global_ctx):
+    ret = ["seq"]
+    if len(external_functions) == 0:
+        return ret
+
+    ret.append(["if", ["lt", "calldatasize", 4], ["goto", "fallback"]])
+
+    entry_points, sig_of = _generate_external_entry_points(external_functions, global_ctx)
+
+    dispatcher = ["seq"]
+
+    for sig, entry_point in entry_points.items():
+        func_t = entry_point.func_t
+        expected_calldatasize = entry_point.min_calldatasize
+
+        dispatch = ["seq"]  # code to dispatch into the function
+
+        if not func_t.is_payable:
+            callvalue_check = ["assert", ["iszero", "callvalue"]]
+            dispatch.append(IRnode.from_list(callvalue_check, error_msg="nonpayable check"))
+
+        good_calldatasize = ["ge", "calldatasize", expected_calldatasize]
+        calldatasize_check = ["assert", good_calldatasize]
+        dispatch.append(IRnode.from_list(calldatasize_check, error_msg="calldatasize check"))
+
+        dispatch.append(entry_point.ir_node)
+
+        method_id_check = ["eq", "_calldata_method_id", _annotated_method_id(sig)]
+        dispatcher.append(["if", method_id_check, dispatch])
+
+    ret.append(["with", "_calldata_method_id", shr(224, ["calldataload", 0]), dispatcher])
+
+    return ret
 
 
 # take a GlobalContext, and generate the runtime and deploy IR
@@ -143,15 +403,47 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
     runtime_functions = [f for f in function_defs if not _is_constructor(f)]
     init_function = next((f for f in function_defs if _is_constructor(f)), None)
 
-    runtime = _runtime_ir(runtime_functions, global_ctx)
+    internal_functions = [f for f in runtime_functions if _is_internal(f)]
+
+    external_functions = [
+        f for f in runtime_functions if not _is_internal(f) and not _is_fallback(f)
+    ]
+    default_function = next((f for f in runtime_functions if _is_fallback(f)), None)
+
+    internal_functions_ir: list[IRnode] = []
+
+    # compile internal functions first so we have the function info
+    for func_ast in internal_functions:
+        func_ir = _ir_for_internal_function(func_ast, global_ctx, False)
+        internal_functions_ir.append(IRnode.from_list(func_ir))
+
+    if core._opt_none():
+        selector_section = _selector_section_linear(external_functions, global_ctx)
+    # dense vs sparse global overhead is amortized after about 4 methods.
+    # (--debug will force dense selector table anyway if _opt_codesize is selected.)
+    elif core._opt_codesize() and (len(external_functions) > 4 or _is_debug_mode()):
+        selector_section = _selector_section_dense(external_functions, global_ctx)
+    else:
+        selector_section = _selector_section_sparse(external_functions, global_ctx)
+
+    if default_function:
+        fallback_ir = _ir_for_fallback_or_ctor(default_function, global_ctx)
+    else:
+        fallback_ir = IRnode.from_list(
+            ["revert", 0, 0], annotation="Default function", error_msg="fallback function"
+        )
+
+    runtime = ["seq", selector_section]
+    runtime.append(["goto", "fallback"])
+    runtime.append(["label", "fallback", ["var_list"], fallback_ir])
+
+    runtime.extend(internal_functions_ir)
 
     deploy_code: List[Any] = ["seq"]
     immutables_len = global_ctx.immutable_section_bytes
     if init_function:
         # TODO might be cleaner to separate this into an _init_ir helper func
-        init_func_ir = generate_ir_for_function(
-            init_function, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
-        )
+        init_func_ir = _ir_for_fallback_or_ctor(init_function, global_ctx, is_ctor_context=True)
 
         # pass the amount of memory allocated for the init function
         # so that deployment does not clobber while preparing immutables
@@ -184,12 +476,10 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
         for f in internal_functions:
             init_func_t = init_function._metadata["type"]
             if f.name not in init_func_t.recursive_calls:
-                # unreachable
+                # unreachable code, delete it
                 continue
 
-            func_ir = generate_ir_for_function(
-                f, global_ctx, skip_nonpayable_check=False, is_ctor_context=True
-            )
+            func_ir = _ir_for_internal_function(f, global_ctx, is_ctor_context=True)
             deploy_code.append(func_ir)
 
     else:
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 63d92d9a47..69fcbf1f1f 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -300,9 +300,13 @@ def _build_opcodes(bytecode: bytes) -> str:
 
     while bytecode_sequence:
         op = bytecode_sequence.popleft()
-        opcode_output.append(opcode_map[op])
+        opcode_output.append(opcode_map.get(op, f"VERBATIM_{hex(op)}"))
         if "PUSH" in opcode_output[-1] and opcode_output[-1] != "PUSH0":
             push_len = int(opcode_map[op][4:])
+            # we can have push_len > len(bytecode_sequence) when there is data
+            # (instead of code) at end of contract
+            # CMC 2023-07-13 maybe just strip known data segments?
+            push_len = min(push_len, len(bytecode_sequence))
             push_values = [hex(bytecode_sequence.popleft())[2:] for i in range(push_len)]
             opcode_output.append(f"0x{''.join(push_values).upper()}")
 
diff --git a/vyper/compiler/settings.py b/vyper/compiler/settings.py
index bb5e9cdc25..d2c88a8592 100644
--- a/vyper/compiler/settings.py
+++ b/vyper/compiler/settings.py
@@ -42,3 +42,16 @@ class Settings:
     compiler_version: Optional[str] = None
     optimize: Optional[OptimizationLevel] = None
     evm_version: Optional[str] = None
+
+
+_DEBUG = False
+
+
+def _is_debug_mode():
+    global _DEBUG
+    return _DEBUG
+
+
+def _set_debug_mode(dbg: bool = False) -> None:
+    global _DEBUG
+    _DEBUG = dbg
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index a9064a44fa..5e29bad0b5 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -158,11 +158,20 @@ def _add_postambles(asm_ops):
         to_append.extend(_revert_string)
 
     if len(to_append) > 0:
+        # insert the postambles *before* runtime code
+        # so the data section of the runtime code can't bork the postambles.
+        runtime = None
+        if isinstance(asm_ops[-1], list) and isinstance(asm_ops[-1][0], _RuntimeHeader):
+            runtime = asm_ops.pop()
+
         # for some reason there might not be a STOP at the end of asm_ops.
         # (generally vyper programs will have it but raw IR might not).
         asm_ops.append("STOP")
         asm_ops.extend(to_append)
 
+        if runtime:
+            asm_ops.append(runtime)
+
     # need to do this recursively since every sublist is basically
     # treated as its own program (there are no global labels.)
     for t in asm_ops:
@@ -213,6 +222,9 @@ def compile_to_assembly(code, optimize=OptimizationLevel.GAS):
     res = _compile_to_assembly(code)
 
     _add_postambles(res)
+
+    _relocate_segments(res)
+
     if optimize != OptimizationLevel.NONE:
         _optimize_assembly(res)
     return res
@@ -500,14 +512,14 @@ def _height_of(witharg):
         assert isinstance(memsize, int), "non-int memsize"
         assert isinstance(padding, int), "non-int padding"
 
-        begincode = mksymbol("runtime_begin")
+        runtime_begin = mksymbol("runtime_begin")
 
         subcode = _compile_to_assembly(ir)
 
         o = []
 
         # COPY the code to memory for deploy
-        o.extend(["_sym_subcode_size", begincode, "_mem_deploy_start", "CODECOPY"])
+        o.extend(["_sym_subcode_size", runtime_begin, "_mem_deploy_start", "CODECOPY"])
 
         # calculate the len of runtime code
         o.extend(["_OFST", "_sym_subcode_size", padding])  # stack: len
@@ -517,10 +529,9 @@ def _height_of(witharg):
         # since the asm data structures are very primitive, to make sure
         # assembly_to_evm is able to calculate data offsets correctly,
         # we pass the memsize via magic opcodes to the subcode
-        subcode = [f"_DEPLOY_MEM_OFST_{memsize}"] + subcode
+        subcode = [_RuntimeHeader(runtime_begin, memsize)] + subcode
 
         # append the runtime code after the ctor code
-        o.extend([begincode, "BLANK"])
         # `append(...)` call here is intentional.
         # each sublist is essentially its own program with its
         # own symbols.
@@ -661,16 +672,36 @@ def _height_of(witharg):
             height,
         )
 
+    elif code.value == "data":
+        data_node = [_DataHeader("_sym_" + code.args[0].value)]
+
+        for c in code.args[1:]:
+            if isinstance(c.value, int):
+                assert 0 <= c < 256, f"invalid data byte {c}"
+                data_node.append(c.value)
+            elif isinstance(c.value, bytes):
+                data_node.append(c.value)
+            elif isinstance(c, IRnode):
+                assert c.value == "symbol"
+                data_node.extend(
+                    _compile_to_assembly(c, withargs, existing_labels, break_dest, height)
+                )
+            else:
+                raise ValueError(f"Invalid data: {type(c)} {c}")
+
+        # intentionally return a sublist.
+        return [data_node]
+
     # jump to a symbol, and push variable # of arguments onto stack
     elif code.value == "goto":
         o = []
         for i, c in enumerate(reversed(code.args[1:])):
             o.extend(_compile_to_assembly(c, withargs, existing_labels, break_dest, height + i))
-        o.extend(["_sym_" + str(code.args[0]), "JUMP"])
+        o.extend(["_sym_" + code.args[0].value, "JUMP"])
         return o
     # push a literal symbol
     elif code.value == "symbol":
-        return ["_sym_" + str(code.args[0])]
+        return ["_sym_" + code.args[0].value]
     # set a symbol as a location.
     elif code.value == "label":
         label_name = code.args[0].value
@@ -728,8 +759,8 @@ def _height_of(witharg):
     # inject debug opcode.
     elif code.value == "pc_debugger":
         return mkdebug(pc_debugger=True, source_pos=code.source_pos)
-    else:
-        raise Exception("Weird code element: " + repr(code))
+    else:  # pragma: no cover
+        raise ValueError(f"Weird code element: {type(code)} {code}")
 
 
 def note_line_num(line_number_map, item, pos):
@@ -764,11 +795,8 @@ def note_breakpoint(line_number_map, item, pos):
 
 
 def _prune_unreachable_code(assembly):
-    # In converting IR to assembly we sometimes end up with unreachable
-    # instructions - POPing to clear the stack or STOPing execution at the
-    # end of a function that has already returned or reverted. This should
-    # be addressed in the IR, but for now we do a final sanity check here
-    # to avoid unnecessary bytecode bloat.
+    # delete code between terminal ops and JUMPDESTS as those are
+    # unreachable
     changed = False
     i = 0
     while i < len(assembly) - 2:
@@ -777,7 +805,7 @@ def _prune_unreachable_code(assembly):
             instr = assembly[i][-1]
 
         if assembly[i] in _TERMINAL_OPS and not (
-            is_symbol(assembly[i + 1]) and assembly[i + 2] in ("JUMPDEST", "BLANK")
+            is_symbol(assembly[i + 1]) or isinstance(assembly[i + 1], list)
         ):
             changed = True
             del assembly[i + 1]
@@ -889,6 +917,14 @@ def _merge_iszero(assembly):
     return changed
 
 
+# a symbol _sym_x in assembly can either mean to push _sym_x to the stack,
+# or it can precede a location in code which we want to add to symbol map.
+# this helper function tells us if we want to add the previous instruction
+# to the symbol map.
+def is_symbol_map_indicator(asm_node):
+    return asm_node == "JUMPDEST"
+
+
 def _prune_unused_jumpdests(assembly):
     changed = False
 
@@ -896,9 +932,17 @@ def _prune_unused_jumpdests(assembly):
 
     # find all used jumpdests
     for i in range(len(assembly) - 1):
-        if is_symbol(assembly[i]) and assembly[i + 1] != "JUMPDEST":
+        if is_symbol(assembly[i]) and not is_symbol_map_indicator(assembly[i + 1]):
             used_jumpdests.add(assembly[i])
 
+    for item in assembly:
+        if isinstance(item, list) and isinstance(item[0], _DataHeader):
+            # add symbols used in data sections as they are likely
+            # used for a jumptable.
+            for t in item:
+                if is_symbol(t):
+                    used_jumpdests.add(t)
+
     # delete jumpdests that aren't used
     i = 0
     while i < len(assembly) - 2:
@@ -937,7 +981,7 @@ def _stack_peephole_opts(assembly):
 # optimize assembly, in place
 def _optimize_assembly(assembly):
     for x in assembly:
-        if isinstance(x, list):
+        if isinstance(x, list) and isinstance(x[0], _RuntimeHeader):
             _optimize_assembly(x)
 
     for _ in range(1024):
@@ -970,7 +1014,93 @@ def adjust_pc_maps(pc_maps, ofst):
     return ret
 
 
+SYMBOL_SIZE = 2  # size of a PUSH instruction for a code symbol
+
+
+def _data_to_evm(assembly, symbol_map):
+    ret = bytearray()
+    assert isinstance(assembly[0], _DataHeader)
+    for item in assembly[1:]:
+        if is_symbol(item):
+            symbol = symbol_map[item].to_bytes(SYMBOL_SIZE, "big")
+            ret.extend(symbol)
+        elif isinstance(item, int):
+            ret.append(item)
+        elif isinstance(item, bytes):
+            ret.extend(item)
+        else:
+            raise ValueError(f"invalid data {type(item)} {item}")
+
+    return ret
+
+
+# predict what length of an assembly [data] node will be in bytecode
+def _length_of_data(assembly):
+    ret = 0
+    assert isinstance(assembly[0], _DataHeader)
+    for item in assembly[1:]:
+        if is_symbol(item):
+            ret += SYMBOL_SIZE
+        elif isinstance(item, int):
+            assert 0 <= item < 256, f"invalid data byte {item}"
+            ret += 1
+        elif isinstance(item, bytes):
+            ret += len(item)
+        else:
+            raise ValueError(f"invalid data {type(item)} {item}")
+
+    return ret
+
+
+class _RuntimeHeader:
+    def __init__(self, label, ctor_mem_size):
+        self.label = label
+        self.ctor_mem_size = ctor_mem_size
+
+    def __repr__(self):
+        return f"<RUNTIME {self.label} mem @{self.ctor_mem_size}>"
+
+
+class _DataHeader:
+    def __init__(self, label):
+        self.label = label
+
+    def __repr__(self):
+        return f"DATA {self.label}"
+
+
+def _relocate_segments(assembly):
+    # relocate all data segments to the end, otherwise data could be
+    # interpreted as PUSH instructions and mangle otherwise valid jumpdests
+    # relocate all runtime segments to the end as well
+    data_segments = []
+    non_data_segments = []
+    code_segments = []
+    for t in assembly:
+        if isinstance(t, list):
+            if isinstance(t[0], _DataHeader):
+                data_segments.append(t)
+            else:
+                _relocate_segments(t)  # recurse
+                assert isinstance(t[0], _RuntimeHeader)
+                code_segments.append(t)
+        else:
+            non_data_segments.append(t)
+    assembly.clear()
+    assembly.extend(non_data_segments)
+    assembly.extend(code_segments)
+    assembly.extend(data_segments)
+
+
+# TODO: change API to split assembly_to_evm and assembly_to_source/symbol_maps
 def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
+    bytecode, source_maps, _ = assembly_to_evm_with_symbol_map(
+        assembly, pc_ofst=pc_ofst, insert_vyper_signature=insert_vyper_signature
+    )
+    return bytecode, source_maps
+
+
+def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_vyper_signature=False):
     """
     Assembles assembly into EVM
 
@@ -999,8 +1129,6 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
         bytecode_suffix += b"\xa1\x65vyper\x83" + bytes(list(version_tuple))
         bytecode_suffix += len(bytecode_suffix).to_bytes(2, "big")
 
-    CODE_OFST_SIZE = 2  # size of a PUSH instruction for a code symbol
-
     # to optimize the size of deploy code - we want to use the smallest
     # PUSH instruction possible which can support all memory symbols
     # (and also works with linear pass symbol resolution)
@@ -1009,13 +1137,13 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
     mem_ofst_size, ctor_mem_size = None, None
     max_mem_ofst = 0
     for i, item in enumerate(assembly):
-        if isinstance(item, list):
+        if isinstance(item, list) and isinstance(item[0], _RuntimeHeader):
             assert runtime_code is None, "Multiple subcodes"
-            runtime_code, runtime_map = assembly_to_evm(item)
 
-            assert item[0].startswith("_DEPLOY_MEM_OFST_")
             assert ctor_mem_size is None
-            ctor_mem_size = int(item[0][len("_DEPLOY_MEM_OFST_") :])
+            ctor_mem_size = item[0].ctor_mem_size
+
+            runtime_code, runtime_map = assembly_to_evm(item[1:])
 
             runtime_code_start, runtime_code_end = _runtime_code_offsets(
                 ctor_mem_size, len(runtime_code)
@@ -1053,14 +1181,14 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
 
         # update pc
         if is_symbol(item):
-            if assembly[i + 1] == "JUMPDEST" or assembly[i + 1] == "BLANK":
+            if is_symbol_map_indicator(assembly[i + 1]):
                 # Don't increment pc as the symbol itself doesn't go into code
                 if item in symbol_map:
                     raise CompilerPanic(f"duplicate jumpdest {item}")
 
                 symbol_map[item] = pc
             else:
-                pc += CODE_OFST_SIZE + 1  # PUSH2 highbits lowbits
+                pc += SYMBOL_SIZE + 1  # PUSH2 highbits lowbits
         elif is_mem_sym(item):
             # PUSH<n> item
             pc += mem_ofst_size + 1
@@ -1070,19 +1198,16 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
             # [_OFST, _sym_foo, bar] -> PUSH2 (foo+bar)
             # [_OFST, _mem_foo, bar] -> PUSHN (foo+bar)
             pc -= 1
-        elif item == "BLANK":
-            pc += 0
-        elif isinstance(item, str) and item.startswith("_DEPLOY_MEM_OFST_"):
-            # _DEPLOY_MEM_OFST is assembly magic which will
-            # get removed during final assembly-to-bytecode
-            pc += 0
-        elif isinstance(item, list):
+        elif isinstance(item, list) and isinstance(item[0], _RuntimeHeader):
+            symbol_map[item[0].label] = pc
             # add source map for all items in the runtime map
             t = adjust_pc_maps(runtime_map, pc)
             for key in line_number_map:
                 line_number_map[key].update(t[key])
             pc += len(runtime_code)
-
+        elif isinstance(item, list) and isinstance(item[0], _DataHeader):
+            symbol_map[item[0].label] = pc
+            pc += _length_of_data(item)
         else:
             pc += 1
 
@@ -1094,13 +1219,9 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
     if runtime_code is not None:
         symbol_map["_sym_subcode_size"] = len(runtime_code)
 
-    # (NOTE CMC 2022-06-17 this way of generating bytecode did not
-    # seem to be a perf hotspot. if it is, may want to use bytearray()
-    # instead).
-
-    # TODO refactor into two functions, create posmap and assemble
+    # TODO refactor into two functions, create symbol_map and assemble
 
-    o = b""
+    ret = bytearray()
 
     # now that all symbols have been resolved, generate bytecode
     # using the symbol map
@@ -1110,47 +1231,47 @@ def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
             to_skip -= 1
             continue
 
-        if item in ("DEBUG", "BLANK"):
+        if item in ("DEBUG",):
             continue  # skippable opcodes
 
-        elif isinstance(item, str) and item.startswith("_DEPLOY_MEM_OFST_"):
-            continue
-
         elif is_symbol(item):
-            if assembly[i + 1] != "JUMPDEST" and assembly[i + 1] != "BLANK":
-                bytecode, _ = assembly_to_evm(PUSH_N(symbol_map[item], n=CODE_OFST_SIZE))
-                o += bytecode
+            # push a symbol to stack
+            if not is_symbol_map_indicator(assembly[i + 1]):
+                bytecode, _ = assembly_to_evm(PUSH_N(symbol_map[item], n=SYMBOL_SIZE))
+                ret.extend(bytecode)
 
         elif is_mem_sym(item):
             bytecode, _ = assembly_to_evm(PUSH_N(symbol_map[item], n=mem_ofst_size))
-            o += bytecode
+            ret.extend(bytecode)
 
         elif is_ofst(item):
             # _OFST _sym_foo 32
             ofst = symbol_map[assembly[i + 1]] + assembly[i + 2]
-            n = mem_ofst_size if is_mem_sym(assembly[i + 1]) else CODE_OFST_SIZE
+            n = mem_ofst_size if is_mem_sym(assembly[i + 1]) else SYMBOL_SIZE
             bytecode, _ = assembly_to_evm(PUSH_N(ofst, n))
-            o += bytecode
+            ret.extend(bytecode)
             to_skip = 2
 
         elif isinstance(item, int):
-            o += bytes([item])
+            ret.append(item)
         elif isinstance(item, str) and item.upper() in get_opcodes():
-            o += bytes([get_opcodes()[item.upper()][0]])
+            ret.append(get_opcodes()[item.upper()][0])
         elif item[:4] == "PUSH":
-            o += bytes([PUSH_OFFSET + int(item[4:])])
+            ret.append(PUSH_OFFSET + int(item[4:]))
         elif item[:3] == "DUP":
-            o += bytes([DUP_OFFSET + int(item[3:])])
+            ret.append(DUP_OFFSET + int(item[3:]))
         elif item[:4] == "SWAP":
-            o += bytes([SWAP_OFFSET + int(item[4:])])
-        elif isinstance(item, list):
-            o += runtime_code
-        else:
-            # Should never reach because, assembly is create in _compile_to_assembly.
-            raise Exception("Weird symbol in assembly: " + str(item))  # pragma: no cover
+            ret.append(SWAP_OFFSET + int(item[4:]))
+        elif isinstance(item, list) and isinstance(item[0], _RuntimeHeader):
+            ret.extend(runtime_code)
+        elif isinstance(item, list) and isinstance(item[0], _DataHeader):
+            ret.extend(_data_to_evm(item, symbol_map))
+        else:  # pragma: no cover
+            # unreachable
+            raise ValueError(f"Weird symbol in assembly: {type(item)} {item}")
 
-    o += bytecode_suffix
+    ret.extend(bytecode_suffix)
 
     line_number_map["breakpoints"] = list(line_number_map["breakpoints"])
     line_number_map["pc_breakpoints"] = list(line_number_map["pc_breakpoints"])
-    return o, line_number_map
+    return bytes(ret), line_number_map, symbol_map

From 019a37ab98ff53f04fecfadf602b6cd5ac748f7f Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 25 Jul 2023 07:41:12 -0700
Subject: [PATCH 090/161] Merge pull request from GHSA-f5x6-7qgp-jhf3

---
 tests/parser/functions/test_ecrecover.py | 18 ++++++++++++++
 vyper/builtins/functions.py              | 30 ++++++++----------------
 2 files changed, 28 insertions(+), 20 deletions(-)

diff --git a/tests/parser/functions/test_ecrecover.py b/tests/parser/functions/test_ecrecover.py
index 77e9655b3e..40c9a6a936 100644
--- a/tests/parser/functions/test_ecrecover.py
+++ b/tests/parser/functions/test_ecrecover.py
@@ -40,3 +40,21 @@ def test_ecrecover_uints2() -> address:
     assert c.test_ecrecover_uints2() == local_account.address
 
     print("Passed ecrecover test")
+
+
+def test_invalid_signature(get_contract):
+    code = """
+dummies: HashMap[address, HashMap[address, uint256]]
+
+@external
+def test_ecrecover(hash: bytes32, v: uint8, r: uint256) -> address:
+    # read from hashmap to put garbage in 0 memory location
+    s: uint256 = self.dummies[msg.sender][msg.sender]
+    return ecrecover(hash, v, r, s)
+    """
+    c = get_contract(code)
+    hash_ = bytes(i for i in range(32))
+    v = 0  # invalid v! ecrecover precompile will not write to output buffer
+    r = 0
+    # note web3.py decoding of 0x000..00 address is None.
+    assert c.test_ecrecover(hash_, v, r) is None
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index e1dcee6b8d..685d832c01 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -764,29 +764,19 @@ def infer_arg_types(self, node):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        placeholder_node = IRnode.from_list(
-            context.new_internal_variable(BytesT(128)), typ=BytesT(128), location=MEMORY
-        )
+        input_buf = context.new_internal_variable(get_type_for_exact_size(128))
+        output_buf = MemoryPositions.FREE_VAR_SPACE
         return IRnode.from_list(
             [
                 "seq",
-                ["mstore", placeholder_node, args[0]],
-                ["mstore", ["add", placeholder_node, 32], args[1]],
-                ["mstore", ["add", placeholder_node, 64], args[2]],
-                ["mstore", ["add", placeholder_node, 96], args[3]],
-                [
-                    "pop",
-                    [
-                        "staticcall",
-                        ["gas"],
-                        1,
-                        placeholder_node,
-                        128,
-                        MemoryPositions.FREE_VAR_SPACE,
-                        32,
-                    ],
-                ],
-                ["mload", MemoryPositions.FREE_VAR_SPACE],
+                # clear output memory first, ecrecover can return 0 bytes
+                ["mstore", output_buf, 0],
+                ["mstore", input_buf, args[0]],
+                ["mstore", input_buf + 32, args[1]],
+                ["mstore", input_buf + 64, args[2]],
+                ["mstore", input_buf + 96, args[3]],
+                ["staticcall", "gas", 1, input_buf, 128, output_buf, 32],
+                ["mload", output_buf],
             ],
             typ=AddressT(),
         )

From d48438e10722db8fc9e74d8ed434745e3b0d31cf Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 25 Jul 2023 12:56:31 -0700
Subject: [PATCH 091/161] feat: implement bound= in ranges (#3537)

---
 .../semantics/analysis/test_for_loop.py       | 35 ++++++++++++++++++-
 .../features/iteration/test_for_range.py      | 17 +++++++++
 vyper/codegen/stmt.py                         | 21 ++++++++---
 vyper/ir/compile_ir.py                        |  3 +-
 vyper/semantics/analysis/annotation.py        |  3 ++
 vyper/semantics/analysis/local.py             | 27 ++++++++++----
 6 files changed, 91 insertions(+), 15 deletions(-)

diff --git a/tests/functional/semantics/analysis/test_for_loop.py b/tests/functional/semantics/analysis/test_for_loop.py
index 8707b4c326..0d61a8f8f8 100644
--- a/tests/functional/semantics/analysis/test_for_loop.py
+++ b/tests/functional/semantics/analysis/test_for_loop.py
@@ -1,7 +1,12 @@
 import pytest
 
 from vyper.ast import parse_to_ast
-from vyper.exceptions import ImmutableViolation, TypeMismatch
+from vyper.exceptions import (
+    ArgumentException,
+    ImmutableViolation,
+    StateAccessViolation,
+    TypeMismatch,
+)
 from vyper.semantics.analysis import validate_semantics
 
 
@@ -59,6 +64,34 @@ def bar():
         validate_semantics(vyper_module, {})
 
 
+def test_bad_keywords(namespace):
+    code = """
+
+@internal
+def bar(n: uint256):
+    x: uint256 = 0
+    for i in range(n, boundddd=10):
+        x += i
+    """
+    vyper_module = parse_to_ast(code)
+    with pytest.raises(ArgumentException):
+        validate_semantics(vyper_module, {})
+
+
+def test_bad_bound(namespace):
+    code = """
+
+@internal
+def bar(n: uint256):
+    x: uint256 = 0
+    for i in range(n, bound=n):
+        x += i
+    """
+    vyper_module = parse_to_ast(code)
+    with pytest.raises(StateAccessViolation):
+        validate_semantics(vyper_module, {})
+
+
 def test_modify_iterator_function_call(namespace):
     code = """
 
diff --git a/tests/parser/features/iteration/test_for_range.py b/tests/parser/features/iteration/test_for_range.py
index 30f4bb87e3..395dd28231 100644
--- a/tests/parser/features/iteration/test_for_range.py
+++ b/tests/parser/features/iteration/test_for_range.py
@@ -14,6 +14,23 @@ def repeat(z: int128) -> int128:
     assert c.repeat(9) == 54
 
 
+def test_range_bound(get_contract, assert_tx_failed):
+    code = """
+@external
+def repeat(n: uint256) -> uint256:
+    x: uint256 = 0
+    for i in range(n, bound=6):
+        x += i
+    return x
+    """
+    c = get_contract(code)
+    for n in range(7):
+        assert c.repeat(n) == sum(range(n))
+
+    # check codegen inserts assertion for n greater than bound
+    assert_tx_failed(lambda: c.repeat(7))
+
+
 def test_digit_reverser(get_contract_with_gas_estimation):
     digit_reverser = """
 @external
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 91d45f4916..86ea1813ea 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -258,11 +258,17 @@ def _parse_For_range(self):
         arg0 = self.stmt.iter.args[0]
         num_of_args = len(self.stmt.iter.args)
 
+        kwargs = {
+            s.arg: Expr.parse_value_expr(s.value, self.context)
+            for s in self.stmt.iter.keywords or []
+        }
+
         # Type 1 for, e.g. for i in range(10): ...
         if num_of_args == 1:
-            arg0_val = self._get_range_const_value(arg0)
+            n = Expr.parse_value_expr(arg0, self.context)
             start = IRnode.from_list(0, typ=iter_typ)
-            rounds = arg0_val
+            rounds = n
+            rounds_bound = kwargs.get("bound", rounds)
 
         # Type 2 for, e.g. for i in range(100, 110): ...
         elif self._check_valid_range_constant(self.stmt.iter.args[1]).is_literal:
@@ -270,6 +276,7 @@ def _parse_For_range(self):
             arg1_val = self._get_range_const_value(self.stmt.iter.args[1])
             start = IRnode.from_list(arg0_val, typ=iter_typ)
             rounds = IRnode.from_list(arg1_val - arg0_val, typ=iter_typ)
+            rounds_bound = rounds
 
         # Type 3 for, e.g. for i in range(x, x + 10): ...
         else:
@@ -278,9 +285,10 @@ def _parse_For_range(self):
             start = Expr.parse_value_expr(arg0, self.context)
             _, hi = start.typ.int_bounds
             start = clamp("le", start, hi + 1 - rounds)
+            rounds_bound = rounds
 
-        r = rounds if isinstance(rounds, int) else rounds.value
-        if r < 1:
+        bound = rounds_bound if isinstance(rounds_bound, int) else rounds_bound.value
+        if bound < 1:
             return
 
         varname = self.stmt.target.id
@@ -294,7 +302,10 @@ def _parse_For_range(self):
         loop_body.append(["mstore", iptr, i])
         loop_body.append(parse_body(self.stmt.body, self.context))
 
-        ir_node = IRnode.from_list(["repeat", i, start, rounds, rounds, loop_body])
+        # NOTE: codegen for `repeat` inserts an assertion that rounds <= rounds_bound.
+        # if we ever want to remove that, we need to manually add the assertion
+        # where it makes sense.
+        ir_node = IRnode.from_list(["repeat", i, start, rounds, rounds_bound, loop_body])
         del self.context.forvars[varname]
 
         return ir_node
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 5e29bad0b5..bba3b34515 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -413,9 +413,8 @@ def _height_of(witharg):
             )
             # stack: i, rounds, rounds_bound
             # assert rounds <= rounds_bound
-            # TODO this runtime assertion should never fail for
+            # TODO this runtime assertion shouldn't fail for
             # internally generated repeats.
-            # maybe drop it or jump to 0xFE
             o.extend(["DUP2", "GT"] + _assert_false())
 
             # stack: i, rounds
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index 3ea0319b54..d309f102cd 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -95,6 +95,9 @@ def visit_For(self, node):
             iter_type = node.target._metadata["type"]
             for a in node.iter.args:
                 self.expr_visitor.visit(a, iter_type)
+            for a in node.iter.keywords:
+                if a.arg == "bound":
+                    self.expr_visitor.visit(a.value, iter_type)
 
 
 class ExpressionAnnotationVisitor(_AnnotationVisitorBase):
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index c99b582ad3..c0c05325f2 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -346,17 +346,30 @@ def visit_For(self, node):
                 raise IteratorException(
                     "Cannot iterate over the result of a function call", node.iter
                 )
-            validate_call_args(node.iter, (1, 2))
+            validate_call_args(node.iter, (1, 2), kwargs=["bound"])
 
             args = node.iter.args
+            kwargs = {s.arg: s.value for s in node.iter.keywords or []}
             if len(args) == 1:
                 # range(CONSTANT)
-                if not isinstance(args[0], vy_ast.Num):
-                    raise StateAccessViolation("Value must be a literal", node)
-                if args[0].value <= 0:
-                    raise StructureException("For loop must have at least 1 iteration", args[0])
-                validate_expected_type(args[0], IntegerT.any())
-                type_list = get_possible_types_from_node(args[0])
+                n = args[0]
+                bound = kwargs.pop("bound", None)
+                validate_expected_type(n, IntegerT.any())
+
+                if bound is None:
+                    if not isinstance(n, vy_ast.Num):
+                        raise StateAccessViolation("Value must be a literal", n)
+                    if n.value <= 0:
+                        raise StructureException("For loop must have at least 1 iteration", args[0])
+                    type_list = get_possible_types_from_node(n)
+
+                else:
+                    if not isinstance(bound, vy_ast.Num):
+                        raise StateAccessViolation("bound must be a literal", bound)
+                    if bound.value <= 0:
+                        raise StructureException("bound must be at least 1", args[0])
+                    type_list = get_common_types(n, bound)
+
             else:
                 validate_expected_type(args[0], IntegerT.any())
                 type_list = get_common_types(*args)

From 2f39e69d077fb8ab90bd6fe039372dd4fe5cadde Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 25 Jul 2023 16:33:41 -0700
Subject: [PATCH 092/161] fix: public constant arrays (#3536)

public getters for arrays would panic at codegen because type
information for the array members was not available. this is because
type annotation would occur before getter expansion. this commit moves
the type annotation phase to right before getter expansion, so that the
generated ast nodes will get annotated.

it also fixes a small bug when trying to deepcopy the nodes generated by
ast expansion - the generated nodes have no node_id and raise an
exception when deepcopy tries to perform `__eq__` between two of the
generated FunctionDefs.
---
 tests/parser/globals/test_getters.py | 2 ++
 vyper/ast/expansion.py               | 1 -
 vyper/ast/nodes.py                   | 2 +-
 vyper/compiler/phases.py             | 1 -
 vyper/semantics/analysis/__init__.py | 3 +++
 5 files changed, 6 insertions(+), 3 deletions(-)

diff --git a/tests/parser/globals/test_getters.py b/tests/parser/globals/test_getters.py
index 59c91cbeef..5eac074ef6 100644
--- a/tests/parser/globals/test_getters.py
+++ b/tests/parser/globals/test_getters.py
@@ -35,6 +35,7 @@ def test_getter_code(get_contract_with_gas_estimation_for_constants):
 c: public(constant(uint256)) = 1
 d: public(immutable(uint256))
 e: public(immutable(uint256[2]))
+f: public(constant(uint256[2])) = [3, 7]
 
 @external
 def __init__():
@@ -68,6 +69,7 @@ def __init__():
     assert c.c() == 1
     assert c.d() == 1729
     assert c.e(0) == 2
+    assert [c.f(i) for i in range(2)] == [3, 7]
 
 
 def test_getter_mutability(get_contract):
diff --git a/vyper/ast/expansion.py b/vyper/ast/expansion.py
index 753f2687cd..5471b971a4 100644
--- a/vyper/ast/expansion.py
+++ b/vyper/ast/expansion.py
@@ -49,7 +49,6 @@ def generate_public_variable_getters(vyper_module: vy_ast.Module) -> None:
             # the base return statement is an `Attribute` node, e.g. `self.<var_name>`
             # for each input type we wrap it in a `Subscript` to access a specific member
             return_stmt = vy_ast.Attribute(value=vy_ast.Name(id="self"), attr=func_type.name)
-        return_stmt._metadata["type"] = node._metadata["type"]
 
         for i, type_ in enumerate(input_types):
             if not isinstance(annotation, vy_ast.Subscript):
diff --git a/vyper/ast/nodes.py b/vyper/ast/nodes.py
index 7c907b4d08..2497928035 100644
--- a/vyper/ast/nodes.py
+++ b/vyper/ast/nodes.py
@@ -339,7 +339,7 @@ def __hash__(self):
     def __eq__(self, other):
         if not isinstance(other, type(self)):
             return False
-        if other.node_id != self.node_id:
+        if getattr(other, "node_id", None) != getattr(self, "node_id", None):
             return False
         for field_name in (i for i in self.get_fields() if i not in VyperNode.__slots__):
             if getattr(self, field_name, None) != getattr(other, field_name, None):
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 4e1bd9e6c3..526d2f3253 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -263,7 +263,6 @@ def generate_folded_ast(
     vyper_module_folded = copy.deepcopy(vyper_module)
     vy_ast.folding.fold(vyper_module_folded)
     validate_semantics(vyper_module_folded, interface_codes)
-    vy_ast.expansion.expand_annotated_ast(vyper_module_folded)
     symbol_tables = set_data_positions(vyper_module_folded, storage_layout_overrides)
 
     return vyper_module_folded, symbol_tables
diff --git a/vyper/semantics/analysis/__init__.py b/vyper/semantics/analysis/__init__.py
index 5977a87812..9e987d1cd0 100644
--- a/vyper/semantics/analysis/__init__.py
+++ b/vyper/semantics/analysis/__init__.py
@@ -1,3 +1,5 @@
+import vyper.ast as vy_ast
+
 from .. import types  # break a dependency cycle.
 from ..namespace import get_namespace
 from .local import validate_functions
@@ -11,4 +13,5 @@ def validate_semantics(vyper_ast, interface_codes):
 
     with namespace.enter_scope():
         add_module_namespace(vyper_ast, interface_codes)
+        vy_ast.expansion.expand_annotated_ast(vyper_ast)
         validate_functions(vyper_ast)

From 3c3285c2f15a88c84574dcca1958a282d4910e5f Mon Sep 17 00:00:00 2001
From: Ikko Eltociear Ashimine <eltociear@gmail.com>
Date: Wed, 26 Jul 2023 23:25:47 +0900
Subject: [PATCH 093/161] docs: fix typo in release-notes.rst (#3538)

unitialized -> uninitialized
---
 docs/release-notes.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index dcdbcda74a..5b6880dfdc 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -774,7 +774,7 @@ The following VIPs were implemented for Beta 13:
 
 - Add ``vyper-json`` compilation mode (VIP `#1520 <https://github.com/vyperlang/vyper/issues/1520>`_)
 - Environment variables and constants can now be used as default parameters (VIP `#1525 <https://github.com/vyperlang/vyper/issues/1525>`_)
-- Require unitialized memory be set on creation (VIP `#1493 <https://github.com/vyperlang/vyper/issues/1493>`_)
+- Require uninitialized memory be set on creation (VIP `#1493 <https://github.com/vyperlang/vyper/issues/1493>`_)
 
 Some of the bug and stability fixes:
 

From 76f1cc5a8b288696446ac08d9099bf643d132c73 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 27 Jul 2023 10:48:21 -0700
Subject: [PATCH 094/161] chore: add error message for repeat range check
 (#3542)

since d48438e and 3de1415, loops can revert depending on user input. add
it to the error map so it's easier for users to debug.
---
 vyper/codegen/stmt.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 86ea1813ea..9dc75b46ba 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -305,7 +305,9 @@ def _parse_For_range(self):
         # NOTE: codegen for `repeat` inserts an assertion that rounds <= rounds_bound.
         # if we ever want to remove that, we need to manually add the assertion
         # where it makes sense.
-        ir_node = IRnode.from_list(["repeat", i, start, rounds, rounds_bound, loop_body])
+        ir_node = IRnode.from_list(
+            ["repeat", i, start, rounds, rounds_bound, loop_body], error_msg="range() bounds check"
+        )
         del self.context.forvars[varname]
 
         return ir_node

From cfda16c734ecddc170079817cd96b14e4fe24586 Mon Sep 17 00:00:00 2001
From: Pascal Marco Caversaccio <pcaversaccio@users.noreply.github.com>
Date: Mon, 31 Jul 2023 16:24:11 +0200
Subject: [PATCH 095/161] Use `0.3.7` as example in `Installing Vyper` (#3543)

---
 docs/installing-vyper.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/installing-vyper.rst b/docs/installing-vyper.rst
index 2e2d51bd6e..249182a1c2 100644
--- a/docs/installing-vyper.rst
+++ b/docs/installing-vyper.rst
@@ -76,7 +76,7 @@ Each tagged version of vyper is uploaded to `pypi <https://pypi.org/project/vype
 To install a specific version use:
 ::
 
-    pip install vyper==0.2.15
+    pip install vyper==0.3.7
 
 
 nix

From 246c970a4e2c6355a8c23c11ab43dcde20793e64 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Thu, 3 Aug 2023 09:19:35 +0800
Subject: [PATCH 096/161] docs: fix yanked version in release notes (#3545)

---
 docs/release-notes.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 5b6880dfdc..5dc33a49c6 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -403,6 +403,7 @@ Fixes:
 
 v0.2.14
 *******
+**THIS RELEASE HAS BEEN PULLED**
 
 Date released: 20-07-2021
 
@@ -414,7 +415,6 @@ Fixes:
 
 v0.2.13
 *******
-**THIS RELEASE HAS BEEN PULLED**
 
 Date released: 06-07-2021
 

From 855f7349668d0907f968f0f5f41b64730f4dd13f Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Thu, 3 Aug 2023 16:21:42 +0200
Subject: [PATCH 097/161] docs: update release notes / yanked versions (#3547)

---
 docs/release-notes.rst | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 5dc33a49c6..9a6384697b 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -187,6 +187,7 @@ Bugfixes:
 
 v0.3.5
 ******
+**THIS RELEASE HAS BEEN PULLED**
 
 Date released: 2022-08-05
 
@@ -415,6 +416,7 @@ Fixes:
 
 v0.2.13
 *******
+**THIS RELEASE HAS BEEN PULLED**
 
 Date released: 06-07-2021
 
@@ -521,6 +523,7 @@ Fixes:
 
 v0.2.6
 ******
+**THIS RELEASE HAS BEEN PULLED**
 
 Date released: 10-10-2020
 

From b87889974b9a600624e10ab4c46adfd2c1f930ff Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Sat, 5 Aug 2023 23:47:12 +0800
Subject: [PATCH 098/161] docs: epsilon builtin (#3552)

---
 docs/built-in-functions.rst | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)

diff --git a/docs/built-in-functions.rst b/docs/built-in-functions.rst
index 74e8560498..84859d66c2 100644
--- a/docs/built-in-functions.rst
+++ b/docs/built-in-functions.rst
@@ -573,6 +573,24 @@ Math
         >>> ExampleContract.foo(3.1337)
         4
 
+.. py:function:: epsilon(typename) -> Any
+
+    Returns the smallest non-zero value for a decimal type.
+
+    * ``typename``: Name of the decimal type (currently only ``decimal``)
+
+    .. code-block:: python
+
+        @external
+        @view
+        def foo() -> decimal:
+            return epsilon(decimal)
+
+    .. code-block:: python
+
+        >>> ExampleContract.foo()
+        Decimal('1E-10')
+
 .. py:function:: floor(value: decimal) -> int256
 
     Round a decimal down to the nearest integer.

From cc2a5cd696f9720683a19a9490119ee7297a4192 Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Sun, 6 Aug 2023 17:08:19 +0200
Subject: [PATCH 099/161] docs: note on security advisory in release notes for
 versions `0.2.15`, `0.2.16`, and `0.3.0` (#3553)

* Add note on security advisory in release notes for `0.2.15`, `0.2.16`, and `0.3.0`

* Add link to `0.3.1` release
---
 docs/release-notes.rst | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 9a6384697b..f408c5c0ab 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -336,6 +336,7 @@ Special thanks to @skellet0r for some major features in this release!
 
 v0.3.0
 *******
+⚠️ A critical security vulnerability has been discovered in this version and we strongly recommend using version `0.3.1 <https://github.com/vyperlang/vyper/releases/tag/v0.3.1>`_ or higher. For more information, please see the Security Advisory `GHSA-5824-cm3x-3c38 <https://github.com/vyperlang/vyper/security/advisories/GHSA-5824-cm3x-3c38>`_.
 
 Date released: 2021-10-04
 
@@ -368,6 +369,7 @@ Special thanks to contributions from @skellet0r and @benjyz for this release!
 
 v0.2.16
 *******
+⚠️ A critical security vulnerability has been discovered in this version and we strongly recommend using version `0.3.1 <https://github.com/vyperlang/vyper/releases/tag/v0.3.1>`_ or higher. For more information, please see the Security Advisory `GHSA-5824-cm3x-3c38 <https://github.com/vyperlang/vyper/security/advisories/GHSA-5824-cm3x-3c38>`_.
 
 Date released: 2021-08-27
 
@@ -392,6 +394,7 @@ Special thanks to contributions from @skellet0r, @sambacha and @milancermak for
 
 v0.2.15
 *******
+⚠️ A critical security vulnerability has been discovered in this version and we strongly recommend using version `0.3.1 <https://github.com/vyperlang/vyper/releases/tag/v0.3.1>`_ or higher. For more information, please see the Security Advisory `GHSA-5824-cm3x-3c38 <https://github.com/vyperlang/vyper/security/advisories/GHSA-5824-cm3x-3c38>`_.
 
 Date released: 23-07-2021
 

From 728a27677240fdd55a4144d04b31004f8330847c Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Mon, 7 Aug 2023 06:14:30 +0200
Subject: [PATCH 100/161] docs: add security advisory note for `ecrecover`
 (#3539)

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 docs/built-in-functions.rst | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/docs/built-in-functions.rst b/docs/built-in-functions.rst
index 84859d66c2..bfaa8fdd5e 100644
--- a/docs/built-in-functions.rst
+++ b/docs/built-in-functions.rst
@@ -379,7 +379,11 @@ Cryptography
     * ``s``: second 32 bytes of signature
     * ``v``: final 1 byte of signature
 
-    Returns the associated address, or ``0`` on error.
+    Returns the associated address, or ``empty(address)`` on error.
+
+    .. note::
+
+         Prior to Vyper ``0.3.10``, the ``ecrecover`` function could return an undefined (possibly nonzero) value for invalid inputs to ``ecrecover``. For more information, please see `GHSA-f5x6-7qgp-jhf3 <https://github.com/vyperlang/vyper/security/advisories/GHSA-f5x6-7qgp-jhf3>`_.
 
     .. code-block:: python
 

From 43c8d8519a67a2b5da664d85ab6207a789707c1f Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Tue, 8 Aug 2023 00:35:35 +0800
Subject: [PATCH 101/161] fix: guard against kwargs for `range` expressions
 with two arguments (#3551)

and slight refactor -- extract `node.iter` expr to `range_` for clarity

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/parser/syntax/test_for_range.py | 21 ++++++++++++++++++++-
 vyper/semantics/analysis/local.py     | 14 +++++++++++---
 2 files changed, 31 insertions(+), 4 deletions(-)

diff --git a/tests/parser/syntax/test_for_range.py b/tests/parser/syntax/test_for_range.py
index b2a9491058..e6f35c1d2d 100644
--- a/tests/parser/syntax/test_for_range.py
+++ b/tests/parser/syntax/test_for_range.py
@@ -12,7 +12,26 @@ def foo():
         pass
     """,
         StructureException,
-    )
+    ),
+    (
+        """
+@external
+def bar():
+    for i in range(1,2,bound=2):
+        pass
+    """,
+        StructureException,
+    ),
+    (
+        """
+@external
+def bar():
+    x:uint256 = 1
+    for i in range(x,x+1,bound=2):
+        pass
+    """,
+        StructureException,
+    ),
 ]
 
 
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index c0c05325f2..c10df3b8fd 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -346,10 +346,11 @@ def visit_For(self, node):
                 raise IteratorException(
                     "Cannot iterate over the result of a function call", node.iter
                 )
-            validate_call_args(node.iter, (1, 2), kwargs=["bound"])
+            range_ = node.iter
+            validate_call_args(range_, (1, 2), kwargs=["bound"])
 
-            args = node.iter.args
-            kwargs = {s.arg: s.value for s in node.iter.keywords or []}
+            args = range_.args
+            kwargs = {s.arg: s.value for s in range_.keywords or []}
             if len(args) == 1:
                 # range(CONSTANT)
                 n = args[0]
@@ -371,6 +372,13 @@ def visit_For(self, node):
                     type_list = get_common_types(n, bound)
 
             else:
+                if range_.keywords:
+                    raise StructureException(
+                        "Keyword arguments are not supported for `range(N, M)` and"
+                        "`range(x, x + N)` expressions",
+                        range_.keywords[0],
+                    )
+
                 validate_expected_type(args[0], IntegerT.any())
                 type_list = get_common_types(*args)
                 if not isinstance(args[0], vy_ast.Constant):

From f72ad784d9cbf85235ee61d29f6571e1dfc48229 Mon Sep 17 00:00:00 2001
From: mahdiRostami <rostamimahdi1997@gmail.com>
Date: Mon, 21 Aug 2023 18:18:10 +0330
Subject: [PATCH 102/161] docs: add `vyper --version` (#3558)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

add “vyper --version” to installation instructions
---
 docs/installing-vyper.rst | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/docs/installing-vyper.rst b/docs/installing-vyper.rst
index 249182a1c2..fb2849708d 100644
--- a/docs/installing-vyper.rst
+++ b/docs/installing-vyper.rst
@@ -78,7 +78,11 @@ To install a specific version use:
 
     pip install vyper==0.3.7
 
+You can check if Vyper is installed completely or not by typing the following in your terminal/cmd:
 
+::
+
+    vyper --version
 nix
 ***
 

From 158099b9c1a49b5472293c1fb7a4baf3cd015eb5 Mon Sep 17 00:00:00 2001
From: Shmuel Kroizer <69422117+shmuel44@users.noreply.github.com>
Date: Sun, 27 Aug 2023 05:59:27 +0300
Subject: [PATCH 103/161] chore: update flake8 from gitlab to github (#3566)

---
 .pre-commit-config.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 739e977c96..4b416a4414 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -11,7 +11,7 @@ repos:
       - id: black
         name: black
 
--   repo: https://gitlab.com/pycqa/flake8
+-   repo: https://github.com/PyCQA/flake8
     rev: 3.9.2
     hooks:
     -   id: flake8

From c28f14f757e17a132cff0236ee0cadb61513aa90 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 12:59:02 -0400
Subject: [PATCH 104/161] chore: fix loop variable typing (#3571)

there is an inconsistency between codegen and typechecking types when a
loop iterates over a literal list.

in this code, although it compiles, during typechecking, `i` is typed as
a `uint8` while `[1,2,3]` is annotated with `int8[3]`

```
@external
def foo():
for i in [1,2,3]:
    a: uint8 = i
```

since the iterator type is always correct, this commit is a chore since
it fixes the discrepancy, but there is no known way to "abuse" the
behavior to get a wrong codegen type.

chainsec june 2023 review 5.15
---
 vyper/codegen/stmt.py                  | 4 +---
 vyper/semantics/analysis/annotation.py | 8 ++++----
 2 files changed, 5 insertions(+), 7 deletions(-)

diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 9dc75b46ba..3ecb0afdc3 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -316,10 +316,8 @@ def _parse_For_list(self):
         with self.context.range_scope():
             iter_list = Expr(self.stmt.iter, self.context).ir_node
 
-        # override with type inferred at typechecking time
-        # TODO investigate why stmt.target.type != stmt.iter.type.value_type
         target_type = self.stmt.target._metadata["type"]
-        iter_list.typ.value_type = target_type
+        assert target_type == iter_list.typ.value_type
 
         # user-supplied name for loop variable
         varname = self.stmt.target.id
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
index d309f102cd..01ca51d7f4 100644
--- a/vyper/semantics/analysis/annotation.py
+++ b/vyper/semantics/analysis/annotation.py
@@ -85,14 +85,14 @@ def visit_Return(self, node):
     def visit_For(self, node):
         if isinstance(node.iter, (vy_ast.Name, vy_ast.Attribute)):
             self.expr_visitor.visit(node.iter)
-        # typecheck list literal as static array
+
+        iter_type = node.target._metadata["type"]
         if isinstance(node.iter, vy_ast.List):
-            value_type = get_common_types(*node.iter.elements).pop()
+            # typecheck list literal as static array
             len_ = len(node.iter.elements)
-            self.expr_visitor.visit(node.iter, SArrayT(value_type, len_))
+            self.expr_visitor.visit(node.iter, SArrayT(iter_type, len_))
 
         if isinstance(node.iter, vy_ast.Call) and node.iter.func.id == "range":
-            iter_type = node.target._metadata["type"]
             for a in node.iter.args:
                 self.expr_visitor.visit(a, iter_type)
             for a in node.iter.keywords:

From 6ea56a6eb40a7225f42765d1bedc386bd2c6166d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 13:41:17 -0400
Subject: [PATCH 105/161] chore: fix dead parameter usages (#3575)

`_is_function_implemented` did not use its parameter `fn_name`, it used
the captured `name` variable, which happened to be the same as
`fn_name`.

chainsec june 2023 review 6.2
---
 vyper/codegen/expr.py         | 6 ++----
 vyper/semantics/types/user.py | 6 +++---
 2 files changed, 5 insertions(+), 7 deletions(-)

diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index d637a454bc..fa3b8bb498 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -662,9 +662,7 @@ def parse_Call(self):
             elif isinstance(self.expr._metadata["type"], StructT):
                 args = self.expr.args
                 if len(args) == 1 and isinstance(args[0], vy_ast.Dict):
-                    return Expr.struct_literals(
-                        args[0], function_name, self.context, self.expr._metadata["type"]
-                    )
+                    return Expr.struct_literals(args[0], self.context, self.expr._metadata["type"])
 
             # Interface assignment. Bar(<address>).
             elif isinstance(self.expr._metadata["type"], InterfaceT):
@@ -733,7 +731,7 @@ def parse_IfExp(self):
         return IRnode.from_list(["if", test, body, orelse], typ=typ, location=location)
 
     @staticmethod
-    def struct_literals(expr, name, context, typ):
+    def struct_literals(expr, context, typ):
         member_subs = {}
         member_typs = {}
         for key, value in zip(expr.keys, expr.values):
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index a603691410..a71f852dbf 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -313,11 +313,11 @@ def validate_implements(self, node: vy_ast.ImplementsDecl) -> None:
 
         def _is_function_implemented(fn_name, fn_type):
             vyper_self = namespace["self"].typ
-            if name not in vyper_self.members:
+            if fn_name not in vyper_self.members:
                 return False
-            s = vyper_self.members[name]
+            s = vyper_self.members[fn_name]
             if isinstance(s, ContractFunctionT):
-                to_compare = vyper_self.members[name]
+                to_compare = vyper_self.members[fn_name]
             # this is kludgy, rework order of passes in ModuleNodeVisitor
             elif isinstance(s, VarInfo) and s.is_public:
                 to_compare = s.decl_node._metadata["func_type"]

From 17e730a044c24d4ec99fa766331eccf7a2c1effa Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 14:01:01 -0400
Subject: [PATCH 106/161] chore: add sanity check in parse_BinOp (#3567)

add sanity check in parse_BinOp, we can be stricter in the case where
it's a shift binop.

chainsec june 2023 review 5.4
---
 vyper/codegen/expr.py | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/vyper/codegen/expr.py b/vyper/codegen/expr.py
index fa3b8bb498..dc0e98786f 100644
--- a/vyper/codegen/expr.py
+++ b/vyper/codegen/expr.py
@@ -368,13 +368,17 @@ def parse_BinOp(self):
         left = Expr.parse_value_expr(self.expr.left, self.context)
         right = Expr.parse_value_expr(self.expr.right, self.context)
 
-        if not isinstance(self.expr.op, (vy_ast.LShift, vy_ast.RShift)):
+        is_shift_op = isinstance(self.expr.op, (vy_ast.LShift, vy_ast.RShift))
+
+        if is_shift_op:
+            assert is_numeric_type(left.typ)
+            assert is_numeric_type(right.typ)
+        else:
             # Sanity check - ensure that we aren't dealing with different types
             # This should be unreachable due to the type check pass
             if left.typ != right.typ:
                 raise TypeCheckFailure(f"unreachable, {left.typ} != {right.typ}", self.expr)
-
-        assert is_numeric_type(left.typ) or is_enum_type(left.typ)
+            assert is_numeric_type(left.typ) or is_enum_type(left.typ)
 
         out_typ = left.typ
 

From 6a819b1db8b3812b8e814de680b589aae6ddd203 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 16:20:21 -0400
Subject: [PATCH 107/161] chore: fix args passed to `validate_call_args`
 (#3568)

`validate_call_args` takes kwargs, the list of valid keywords as an
argument and makes sure that when a call is made, the given keywords are
valid according to the passed kwargs. however, vyper does not allow
kwargs when calling internal functions, so we should actually pass no
kwargs to `validate_call_args`.

note that this PR does not actually introduce observed changes in
compiler behavior, as the later check in `fetch_call_return` correctly
validates there are no call site kwargs for internal functions.

chainsec june review 5.7
---
 vyper/semantics/types/function.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index 10711edc8e..506dae135c 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -488,8 +488,8 @@ def fetch_call_return(self, node: vy_ast.Call) -> Optional[VyperType]:
         if node.get("func.value.id") == "self" and self.visibility == FunctionVisibility.EXTERNAL:
             raise CallViolation("Cannot call external functions via 'self'", node)
 
+        kwarg_keys = []
         # for external calls, include gas and value as optional kwargs
-        kwarg_keys = [arg.name for arg in self.keyword_args]
         if not self.is_internal:
             kwarg_keys += list(self.call_site_kwargs.keys())
         validate_call_args(node, (self.n_positional_args, self.n_total_args), kwarg_keys)

From fa89ca2f6d09a42c0349a8b22eeba281039c85a1 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 16:25:39 -0400
Subject: [PATCH 108/161] chore: note `Context.in_assertion` is dead (#3564)

the `Context` class has an `in_assertion` flag which, when set, indicates
that the context should be constant according to the definition of
`is_constant()`. however, this flag is never set during code generation,
specifically, it is possible to have a non-constant expression in an
assert statement. for example, the following contract compiles:

```vyper
x: uint256

@internal
def bar() -> uint256:
    self.x = 1
    return self.x

@external
def foo():
    assert self.bar() == 1
```

chainsec june 2023 review 5.5
---
 vyper/codegen/context.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vyper/codegen/context.py b/vyper/codegen/context.py
index e4b41adbc0..5b79f293bd 100644
--- a/vyper/codegen/context.py
+++ b/vyper/codegen/context.py
@@ -69,6 +69,7 @@ def __init__(
         self.constancy = constancy
 
         # Whether body is currently in an assert statement
+        # XXX: dead, never set to True
         self.in_assertion = False
 
         # Whether we are currently parsing a range expression

From ef1c589f1e3488b26de9edd078a7340cac1298a4 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 31 Aug 2023 16:26:13 -0400
Subject: [PATCH 109/161] refactor: initcode generation (#3574)

move internal function generation to after ctor generation. prior to
this commit, the existing code relies on the fact that the code
generation of runtime internal functions properly sets the frame
information of the ctor's callees. if this precondition is not met in
the future, the compiler could panic because the memory allocation info
will not be available.

chainsec june 2023 review 6.2
---
 vyper/codegen/module.py | 28 ++++++++++++++++------------
 1 file changed, 16 insertions(+), 12 deletions(-)

diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index ebe7f92cf2..8caea9ee9b 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -442,6 +442,20 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
     deploy_code: List[Any] = ["seq"]
     immutables_len = global_ctx.immutable_section_bytes
     if init_function:
+        # cleanly rerun codegen for internal functions with `is_ctor_ctx=True`
+        ctor_internal_func_irs = []
+        internal_functions = [f for f in runtime_functions if _is_internal(f)]
+        for f in internal_functions:
+            init_func_t = init_function._metadata["type"]
+            if f.name not in init_func_t.recursive_calls:
+                # unreachable code, delete it
+                continue
+
+            func_ir = _ir_for_internal_function(f, global_ctx, is_ctor_context=True)
+            ctor_internal_func_irs.append(func_ir)
+
+        # generate init_func_ir after callees to ensure they have analyzed
+        # memory usage.
         # TODO might be cleaner to separate this into an _init_ir helper func
         init_func_ir = _ir_for_fallback_or_ctor(init_function, global_ctx, is_ctor_context=True)
 
@@ -468,19 +482,9 @@ def generate_ir_for_module(global_ctx: GlobalContext) -> tuple[IRnode, IRnode]:
             deploy_code.append(["iload", max(0, immutables_len - 32)])
 
         deploy_code.append(init_func_ir)
-
         deploy_code.append(["deploy", init_mem_used, runtime, immutables_len])
-
-        # internal functions come after everything else
-        internal_functions = [f for f in runtime_functions if _is_internal(f)]
-        for f in internal_functions:
-            init_func_t = init_function._metadata["type"]
-            if f.name not in init_func_t.recursive_calls:
-                # unreachable code, delete it
-                continue
-
-            func_ir = _ir_for_internal_function(f, global_ctx, is_ctor_context=True)
-            deploy_code.append(func_ir)
+        # internal functions come at end of initcode
+        deploy_code.extend(ctor_internal_func_irs)
 
     else:
         if immutables_len != 0:

From a19cdeaf84e4c70aa6517a1535fbe442cd6059f3 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 1 Sep 2023 13:25:12 -0400
Subject: [PATCH 110/161] feat: relax restrictions on internal function
 signatures (#3573)

relax the restriction on unique "method ids" for internal methods. the
check used to be there to avoid collisions between external method ids
and internal "method ids" because the calling convention for internal
functions used to involve the method id as part of the signature, but
that is no longer the case. so we can safely allow collision between
internal "method ids" and external method ids.

cf. issue #1687 which was resolved in in 9e8c661494d84fbf.

chainsec june 2023 review 5.22
---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
Co-authored-by: trocher <rocher14@live.fr>
---
 .../syntax/utils/test_function_names.py       | 40 +++++++++++++++++++
 tests/signatures/test_method_id_conflicts.py  | 20 ----------
 vyper/semantics/analysis/module.py            | 11 +----
 3 files changed, 42 insertions(+), 29 deletions(-)

diff --git a/tests/parser/syntax/utils/test_function_names.py b/tests/parser/syntax/utils/test_function_names.py
index 90e185558c..5489a4f6a0 100644
--- a/tests/parser/syntax/utils/test_function_names.py
+++ b/tests/parser/syntax/utils/test_function_names.py
@@ -23,6 +23,22 @@ def wei(i: int128) -> int128:
     temp_var : int128 = i
     return temp_var1
     """,
+    # collision between getter and external function
+    """
+foo: public(uint256)
+
+@external
+def foo():
+    pass
+    """,
+    # collision between getter and external function, reverse order
+    """
+@external
+def foo():
+    pass
+
+foo: public(uint256)
+    """,
 ]
 
 
@@ -77,6 +93,30 @@ def append():
 def foo():
     self.append()
     """,
+    # "method id" collisions between internal functions are allowed
+    """
+@internal
+@view
+def gfah():
+    pass
+
+@internal
+@view
+def eexo():
+    pass
+    """,
+    # "method id" collisions between internal+external functions are allowed
+    """
+@internal
+@view
+def gfah():
+    pass
+
+@external
+@view
+def eexo():
+    pass
+    """,
 ]
 
 
diff --git a/tests/signatures/test_method_id_conflicts.py b/tests/signatures/test_method_id_conflicts.py
index 35c10300b4..f3312efeab 100644
--- a/tests/signatures/test_method_id_conflicts.py
+++ b/tests/signatures/test_method_id_conflicts.py
@@ -48,26 +48,6 @@ def OwnerTransferV7b711143(a: uint256):
     pass
     """,
     """
-# check collision between private method IDs
-@internal
-@view
-def gfah(): pass
-
-@internal
-@view
-def eexo(): pass
-    """,
-    """
-# check collision between private and public IDs
-@internal
-@view
-def gfah(): pass
-
-@external
-@view
-def eexo(): pass
-    """,
-    """
 # check collision with ID = 0x00000000
 wycpnbqcyf:public(uint256)
 
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index d916dcf119..02ae82faac 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -22,11 +22,7 @@
 from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.common import VyperNodeVisitorBase
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
-from vyper.semantics.analysis.utils import (
-    check_constant,
-    validate_expected_type,
-    validate_unique_method_ids,
-)
+from vyper.semantics.analysis.utils import check_constant, validate_expected_type
 from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import Namespace, get_namespace
 from vyper.semantics.types import EnumT, EventT, InterfaceT, StructT
@@ -90,6 +86,7 @@ def __init__(
                 err_list.raise_if_not_empty()
 
         # generate an `InterfaceT` from the top-level node - used for building the ABI
+        # note: also validates unique method ids
         interface = InterfaceT.from_ast(module_node)
         module_node._metadata["type"] = interface
         self.interface = interface  # this is useful downstream
@@ -102,11 +99,7 @@ def __init__(
         module_node._metadata["namespace"] = _ns
 
         # check for collisions between 4byte function selectors
-        # internal functions are intentionally included in this check, to prevent breaking
-        # changes in in case of a future change to their calling convention
         self_members = namespace["self"].typ.members
-        functions = [i for i in self_members.values() if isinstance(i, ContractFunctionT)]
-        validate_unique_method_ids(functions)
 
         # get list of internal function calls made by each function
         function_defs = self.ast.get_children(vy_ast.FunctionDef)

From 572b38c839c65ef032aa58f656194205bf4ecce7 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 1 Sep 2023 13:32:45 -0400
Subject: [PATCH 111/161] fix: raw_call type when max_outsize=0 is set (#3572)

prior to this commit, when `raw_call` is used with `max_outsize`
explicitly set to 0 (`max_outsize=0`) the compiler incorrectly infers that
raw_call has no return type

```vyper
@external
@payable
def foo(_target: address):
    # compiles
    a: bool = raw_call(_target, method_id("foo()"), revert_on_failure=False)
    # should have same behavior, but prior to this commit does not compile:
    b: bool = raw_call(_target, method_id("foo()"), max_outsize=0, revert_on_failure=False)
```

chainsec june 2023 review 5.16

---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
---
 tests/parser/functions/test_raw_call.py | 63 +++++++++++++++++++++++++
 vyper/builtins/functions.py             |  2 +-
 2 files changed, 64 insertions(+), 1 deletion(-)

diff --git a/tests/parser/functions/test_raw_call.py b/tests/parser/functions/test_raw_call.py
index 95db070ffa..9c6fba79e7 100644
--- a/tests/parser/functions/test_raw_call.py
+++ b/tests/parser/functions/test_raw_call.py
@@ -1,6 +1,7 @@
 import pytest
 from hexbytes import HexBytes
 
+from vyper import compile_code
 from vyper.builtins.functions import eip1167_bytecode
 from vyper.exceptions import ArgumentException, InvalidType, StateAccessViolation
 
@@ -260,6 +261,68 @@ def __default__():
     w3.eth.send_transaction({"to": caller.address, "data": sig})
 
 
+# check max_outsize=0 does same thing as not setting max_outsize.
+# compile to bytecode and compare bytecode directly.
+def test_max_outsize_0():
+    code1 = """
+@external
+def test_raw_call(_target: address):
+    raw_call(_target, method_id("foo()"))
+    """
+    code2 = """
+@external
+def test_raw_call(_target: address):
+    raw_call(_target, method_id("foo()"), max_outsize=0)
+    """
+    output1 = compile_code(code1, ["bytecode", "bytecode_runtime"])
+    output2 = compile_code(code2, ["bytecode", "bytecode_runtime"])
+    assert output1 == output2
+
+
+# check max_outsize=0 does same thing as not setting max_outsize,
+# this time with revert_on_failure set to False
+def test_max_outsize_0_no_revert_on_failure():
+    code1 = """
+@external
+def test_raw_call(_target: address) -> bool:
+    # compile raw_call both ways, with revert_on_failure
+    a: bool = raw_call(_target, method_id("foo()"), revert_on_failure=False)
+    return a
+    """
+    # same code, but with max_outsize=0
+    code2 = """
+@external
+def test_raw_call(_target: address) -> bool:
+    a: bool = raw_call(_target, method_id("foo()"), max_outsize=0, revert_on_failure=False)
+    return a
+    """
+    output1 = compile_code(code1, ["bytecode", "bytecode_runtime"])
+    output2 = compile_code(code2, ["bytecode", "bytecode_runtime"])
+    assert output1 == output2
+
+
+# test functionality of max_outsize=0
+def test_max_outsize_0_call(get_contract):
+    target_source = """
+@external
+@payable
+def bar() -> uint256:
+    return 123
+    """
+
+    caller_source = """
+@external
+@payable
+def foo(_addr: address) -> bool:
+    success: bool = raw_call(_addr, method_id("bar()"), max_outsize=0, revert_on_failure=False)
+    return success
+    """
+
+    target = get_contract(target_source)
+    caller = get_contract(caller_source)
+    assert caller.foo(target.address) is True
+
+
 def test_static_call_fails_nonpayable(get_contract, assert_tx_failed):
     target_source = """
 baz: int128
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 685d832c01..e8e001306c 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -1093,7 +1093,7 @@ def fetch_call_return(self, node):
         revert_on_failure = kwargz.get("revert_on_failure")
         revert_on_failure = revert_on_failure.value if revert_on_failure is not None else True
 
-        if outsize is None:
+        if outsize is None or outsize.value == 0:
             if revert_on_failure:
                 return None
             return BoolT()

From 2c21eab442f6feeac6bc92b95347f2d3968b09a6 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 1 Sep 2023 17:05:44 -0400
Subject: [PATCH 112/161] fix: implements check for indexed event arguments
 (#3570)

prior to this commit, implementing an interface with wrong indexed
arguments for an event would pass the implements check. this commit
fixes the behavior.

chainsec june 2023 review 5.12

---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
---
 tests/parser/functions/test_interfaces.py | 60 +++++++++++++++++-
 tests/parser/syntax/test_interfaces.py    | 76 +++++++++++++++++++++++
 vyper/builtins/interfaces/ERC721.py       | 16 ++---
 vyper/semantics/types/user.py             | 23 +++++--
 4 files changed, 160 insertions(+), 15 deletions(-)

diff --git a/tests/parser/functions/test_interfaces.py b/tests/parser/functions/test_interfaces.py
index e43c080d46..c16e188cfd 100644
--- a/tests/parser/functions/test_interfaces.py
+++ b/tests/parser/functions/test_interfaces.py
@@ -67,7 +67,6 @@ def test_basic_interface_implements(assert_compile_failed):
 
 implements: ERC20
 
-
 @external
 def test() -> bool:
     return True
@@ -146,6 +145,7 @@ def bar() -> uint256:
     )
 
 
+# check that event types match
 def test_malformed_event(assert_compile_failed):
     interface_code = """
 event Foo:
@@ -173,6 +173,64 @@ def bar() -> uint256:
     )
 
 
+# check that event non-indexed arg needs to match interface
+def test_malformed_events_indexed(assert_compile_failed):
+    interface_code = """
+event Foo:
+    a: uint256
+    """
+
+    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+
+    not_implemented_code = """
+import a as FooBarInterface
+
+implements: FooBarInterface
+
+# a should not be indexed
+event Foo:
+    a: indexed(uint256)
+
+@external
+def bar() -> uint256:
+    return 1
+    """
+
+    assert_compile_failed(
+        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
+        InterfaceViolation,
+    )
+
+
+# check that event indexed arg needs to match interface
+def test_malformed_events_indexed2(assert_compile_failed):
+    interface_code = """
+event Foo:
+    a: indexed(uint256)
+    """
+
+    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+
+    not_implemented_code = """
+import a as FooBarInterface
+
+implements: FooBarInterface
+
+# a should be indexed
+event Foo:
+    a: uint256
+
+@external
+def bar() -> uint256:
+    return 1
+    """
+
+    assert_compile_failed(
+        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
+        InterfaceViolation,
+    )
+
+
 VALID_IMPORT_CODE = [
     # import statement, import path without suffix
     ("import a as Foo", "a"),
diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index acadaff20d..5afb34e6bd 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -134,6 +134,82 @@ def f(a: uint256): # visibility is nonpayable instead of view
     """,
         InterfaceViolation,
     ),
+    (
+        # `receiver` of `Transfer` event should be indexed
+        """
+from vyper.interfaces import ERC20
+
+implements: ERC20
+
+event Transfer:
+    sender: indexed(address)
+    receiver: address
+    value: uint256
+
+event Approval:
+    owner: indexed(address)
+    spender: indexed(address)
+    value: uint256
+
+name: public(String[32])
+symbol: public(String[32])
+decimals: public(uint8)
+balanceOf: public(HashMap[address, uint256])
+allowance: public(HashMap[address, HashMap[address, uint256]])
+totalSupply: public(uint256)
+
+@external
+def transfer(_to : address, _value : uint256) -> bool:
+    return True
+
+@external
+def transferFrom(_from : address, _to : address, _value : uint256) -> bool:
+    return True
+
+@external
+def approve(_spender : address, _value : uint256) -> bool:
+    return True
+    """,
+        InterfaceViolation,
+    ),
+    (
+        # `value` of `Transfer` event should not be indexed
+        """
+from vyper.interfaces import ERC20
+
+implements: ERC20
+
+event Transfer:
+    sender: indexed(address)
+    receiver: indexed(address)
+    value: indexed(uint256)
+
+event Approval:
+    owner: indexed(address)
+    spender: indexed(address)
+    value: uint256
+
+name: public(String[32])
+symbol: public(String[32])
+decimals: public(uint8)
+balanceOf: public(HashMap[address, uint256])
+allowance: public(HashMap[address, HashMap[address, uint256]])
+totalSupply: public(uint256)
+
+@external
+def transfer(_to : address, _value : uint256) -> bool:
+    return True
+
+@external
+def transferFrom(_from : address, _to : address, _value : uint256) -> bool:
+    return True
+
+@external
+def approve(_spender : address, _value : uint256) -> bool:
+    return True
+    """,
+        InterfaceViolation,
+    ),
 ]
 
 
diff --git a/vyper/builtins/interfaces/ERC721.py b/vyper/builtins/interfaces/ERC721.py
index 29ef5f4c26..8dea4e4976 100644
--- a/vyper/builtins/interfaces/ERC721.py
+++ b/vyper/builtins/interfaces/ERC721.py
@@ -2,18 +2,18 @@
 # Events
 
 event Transfer:
-    _from: address
-    _to: address
-    _tokenId: uint256
+    _from: indexed(address)
+    _to: indexed(address)
+    _tokenId: indexed(uint256)
 
 event Approval:
-    _owner: address
-    _approved: address
-    _tokenId: uint256
+    _owner: indexed(address)
+    _approved: indexed(address)
+    _tokenId: indexed(uint256)
 
 event ApprovalForAll:
-    _owner: address
-    _operator: address
+    _owner: indexed(address)
+    _operator: indexed(address)
     _approved: bool
 
 # Functions
diff --git a/vyper/semantics/types/user.py b/vyper/semantics/types/user.py
index a71f852dbf..ce82731c34 100644
--- a/vyper/semantics/types/user.py
+++ b/vyper/semantics/types/user.py
@@ -164,6 +164,7 @@ def __init__(self, name: str, arguments: dict, indexed: list) -> None:
         super().__init__(members=arguments)
         self.name = name
         self.indexed = indexed
+        assert len(self.indexed) == len(self.arguments)
         self.event_id = int(keccak256(self.signature.encode()).hex(), 16)
 
     # backward compatible
@@ -172,8 +173,13 @@ def arguments(self):
         return self.members
 
     def __repr__(self):
-        arg_types = ",".join(repr(a) for a in self.arguments.values())
-        return f"event {self.name}({arg_types})"
+        args = []
+        for is_indexed, (_, argtype) in zip(self.indexed, self.arguments.items()):
+            argtype_str = repr(argtype)
+            if is_indexed:
+                argtype_str = f"indexed({argtype_str})"
+            args.append(f"{argtype_str}")
+        return f"event {self.name}({','.join(args)})"
 
     # TODO rename to abi_signature
     @property
@@ -337,12 +343,17 @@ def _is_function_implemented(fn_name, fn_type):
 
         # check for missing events
         for name, event in self.events.items():
+            if name not in namespace:
+                unimplemented.append(name)
+                continue
+
+            if not isinstance(namespace[name], EventT):
+                unimplemented.append(f"{name} is not an event!")
             if (
-                name not in namespace
-                or not isinstance(namespace[name], EventT)
-                or namespace[name].event_id != event.event_id
+                namespace[name].event_id != event.event_id
+                or namespace[name].indexed != event.indexed
             ):
-                unimplemented.append(name)
+                unimplemented.append(f"{name} is not implemented! (should be {event})")
 
         if len(unimplemented) > 0:
             # TODO: improve the error message for cases where the

From 78fa8dd8f91ba0cb26277eeffb585c68c83e7daa Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 5 Sep 2023 08:26:37 -0400
Subject: [PATCH 113/161] fix: order of evaluation for some builtins (#3583)

ecadd, ecmul, addmod, mulmod

in the case that the arguments have side effects, they could be
evaluated out of order

chainsec june 2023 review 5.1

---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
Co-authored-by: trocher <43437004+trocher@users.noreply.github.com>
---
 tests/parser/functions/test_addmod.py | 32 ++++++++++
 tests/parser/functions/test_ec.py     | 40 ++++++++++++
 tests/parser/functions/test_mulmod.py | 32 ++++++++++
 vyper/builtins/functions.py           | 92 ++++++++++++---------------
 4 files changed, 143 insertions(+), 53 deletions(-)

diff --git a/tests/parser/functions/test_addmod.py b/tests/parser/functions/test_addmod.py
index 67a7e9b101..b3135660bb 100644
--- a/tests/parser/functions/test_addmod.py
+++ b/tests/parser/functions/test_addmod.py
@@ -55,3 +55,35 @@ def c() -> uint256:
     c = get_contract_with_gas_estimation(code)
 
     assert c.foo() == 2
+
+
+def test_uint256_addmod_evaluation_order(get_contract_with_gas_estimation):
+    code = """
+a: uint256
+
+@external
+def foo1() -> uint256:
+    self.a = 0
+    return uint256_addmod(self.a, 1, self.bar())
+
+@external
+def foo2() -> uint256:
+    self.a = 0
+    return uint256_addmod(self.a, self.bar(), 3)
+
+@external
+def foo3() -> uint256:
+    self.a = 0
+    return uint256_addmod(1, self.a, self.bar())
+
+@internal
+def bar() -> uint256:
+    self.a = 1
+    return 2
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo1() == 1
+    assert c.foo2() == 2
+    assert c.foo3() == 1
diff --git a/tests/parser/functions/test_ec.py b/tests/parser/functions/test_ec.py
index 9ce37d0721..e1d9e3d2ee 100644
--- a/tests/parser/functions/test_ec.py
+++ b/tests/parser/functions/test_ec.py
@@ -76,6 +76,26 @@ def foo(a: Foo) -> uint256[2]:
     assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
 
 
+def test_ecadd_evaluation_order(get_contract_with_gas_estimation):
+    code = """
+x: uint256[2]
+
+@internal
+def bar() -> uint256[2]:
+    self.x = ecadd([1, 2], [1, 2])
+    return [1, 2]
+
+@external
+def foo() -> bool:
+    self.x = [1, 2]
+    a: uint256[2] = ecadd([1, 2], [1, 2])
+    b: uint256[2] = ecadd(self.x, self.bar())
+    return a[0] == b[0] and a[1] == b[1]
+    """
+    c = get_contract_with_gas_estimation(code)
+    assert c.foo() is True
+
+
 def test_ecmul(get_contract_with_gas_estimation):
     ecmuller = """
 x3: uint256[2]
@@ -136,3 +156,23 @@ def foo(a: Foo) -> uint256[2]:
     assert c2.foo(c1.address) == G1_times_three
 
     assert_side_effects_invoked(c1, lambda: c2.foo(c1.address, transact={}))
+
+
+def test_ecmul_evaluation_order(get_contract_with_gas_estimation):
+    code = """
+x: uint256[2]
+
+@internal
+def bar() -> uint256:
+    self.x = ecmul([1, 2], 3)
+    return 3
+
+@external
+def foo() -> bool:
+    self.x = [1, 2]
+    a: uint256[2] = ecmul([1, 2], 3)
+    b: uint256[2] = ecmul(self.x, self.bar())
+    return a[0] == b[0] and a[1] == b[1]
+    """
+    c = get_contract_with_gas_estimation(code)
+    assert c.foo() is True
diff --git a/tests/parser/functions/test_mulmod.py b/tests/parser/functions/test_mulmod.py
index 1ea7a3f8e8..96477897b9 100644
--- a/tests/parser/functions/test_mulmod.py
+++ b/tests/parser/functions/test_mulmod.py
@@ -73,3 +73,35 @@ def c() -> uint256:
     c = get_contract_with_gas_estimation(code)
 
     assert c.foo() == 600
+
+
+def test_uint256_mulmod_evaluation_order(get_contract_with_gas_estimation):
+    code = """
+a: uint256
+
+@external
+def foo1() -> uint256:
+    self.a = 1
+    return uint256_mulmod(self.a, 2, self.bar())
+
+@external
+def foo2() -> uint256:
+    self.a = 1
+    return uint256_mulmod(self.bar(), self.a, 2)
+
+@external
+def foo3() -> uint256:
+    self.a = 1
+    return uint256_mulmod(2, self.a, self.bar())
+
+@internal
+def bar() -> uint256:
+    self.a = 7
+    return 5
+    """
+
+    c = get_contract_with_gas_estimation(code)
+
+    assert c.foo1() == 2
+    assert c.foo2() == 1
+    assert c.foo3() == 2
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index e8e001306c..053ee512dc 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -25,9 +25,9 @@
     eval_once_check,
     eval_seq,
     get_bytearray_length,
-    get_element_ptr,
     get_type_for_exact_size,
     ir_tuple_from_args,
+    make_setter,
     needs_external_call_wrap,
     promote_signed_int,
     sar,
@@ -782,10 +782,6 @@ def build_IR(self, expr, args, kwargs, context):
         )
 
 
-def _getelem(arg, ind):
-    return unwrap_location(get_element_ptr(arg, IRnode.from_list(ind, typ=INT128_T)))
-
-
 class ECAdd(BuiltinFunction):
     _id = "ecadd"
     _inputs = [("a", SArrayT(UINT256_T, 2)), ("b", SArrayT(UINT256_T, 2))]
@@ -793,28 +789,22 @@ class ECAdd(BuiltinFunction):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        placeholder_node = IRnode.from_list(
-            context.new_internal_variable(BytesT(128)), typ=BytesT(128), location=MEMORY
-        )
+        buf_t = get_type_for_exact_size(128)
 
-        with args[0].cache_when_complex("a") as (b1, a), args[1].cache_when_complex("b") as (b2, b):
-            o = IRnode.from_list(
-                [
-                    "seq",
-                    ["mstore", placeholder_node, _getelem(a, 0)],
-                    ["mstore", ["add", placeholder_node, 32], _getelem(a, 1)],
-                    ["mstore", ["add", placeholder_node, 64], _getelem(b, 0)],
-                    ["mstore", ["add", placeholder_node, 96], _getelem(b, 1)],
-                    [
-                        "assert",
-                        ["staticcall", ["gas"], 6, placeholder_node, 128, placeholder_node, 64],
-                    ],
-                    placeholder_node,
-                ],
-                typ=SArrayT(UINT256_T, 2),
-                location=MEMORY,
-            )
-            return b2.resolve(b1.resolve(o))
+        buf = context.new_internal_variable(buf_t)
+
+        ret = ["seq"]
+
+        dst0 = IRnode.from_list(buf, typ=SArrayT(UINT256_T, 2), location=MEMORY)
+        ret.append(make_setter(dst0, args[0]))
+
+        dst1 = IRnode.from_list(buf + 64, typ=SArrayT(UINT256_T, 2), location=MEMORY)
+        ret.append(make_setter(dst1, args[1]))
+
+        ret.append(["assert", ["staticcall", ["gas"], 6, buf, 128, buf, 64]])
+        ret.append(buf)
+
+        return IRnode.from_list(ret, typ=SArrayT(UINT256_T, 2), location=MEMORY)
 
 
 class ECMul(BuiltinFunction):
@@ -824,27 +814,22 @@ class ECMul(BuiltinFunction):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        placeholder_node = IRnode.from_list(
-            context.new_internal_variable(BytesT(128)), typ=BytesT(128), location=MEMORY
-        )
+        buf_t = get_type_for_exact_size(96)
 
-        with args[0].cache_when_complex("a") as (b1, a), args[1].cache_when_complex("b") as (b2, b):
-            o = IRnode.from_list(
-                [
-                    "seq",
-                    ["mstore", placeholder_node, _getelem(a, 0)],
-                    ["mstore", ["add", placeholder_node, 32], _getelem(a, 1)],
-                    ["mstore", ["add", placeholder_node, 64], b],
-                    [
-                        "assert",
-                        ["staticcall", ["gas"], 7, placeholder_node, 96, placeholder_node, 64],
-                    ],
-                    placeholder_node,
-                ],
-                typ=SArrayT(UINT256_T, 2),
-                location=MEMORY,
-            )
-            return b2.resolve(b1.resolve(o))
+        buf = context.new_internal_variable(buf_t)
+
+        ret = ["seq"]
+
+        dst0 = IRnode.from_list(buf, typ=SArrayT(UINT256_T, 2), location=MEMORY)
+        ret.append(make_setter(dst0, args[0]))
+
+        dst1 = IRnode.from_list(buf + 64, typ=UINT256_T, location=MEMORY)
+        ret.append(make_setter(dst1, args[1]))
+
+        ret.append(["assert", ["staticcall", ["gas"], 7, buf, 96, buf, 64]])
+        ret.append(buf)
+
+        return IRnode.from_list(ret, typ=SArrayT(UINT256_T, 2), location=MEMORY)
 
 
 def _generic_element_getter(op):
@@ -1525,13 +1510,14 @@ def evaluate(self, node):
 
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
-        c = args[2]
-
-        with c.cache_when_complex("c") as (b1, c):
-            ret = IRnode.from_list(
-                ["seq", ["assert", c], [self._opcode, args[0], args[1], c]], typ=UINT256_T
-            )
-            return b1.resolve(ret)
+        x, y, z = args
+        with x.cache_when_complex("x") as (b1, x):
+            with y.cache_when_complex("y") as (b2, y):
+                with z.cache_when_complex("z") as (b3, z):
+                    ret = IRnode.from_list(
+                        ["seq", ["assert", z], [self._opcode, x, y, z]], typ=UINT256_T
+                    )
+                    return b1.resolve(b2.resolve(b3.resolve(ret)))
 
 
 class AddMod(_AddMulMod):

From 8700e6da32189b300896567f30c185338d93fd8f Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Tue, 5 Sep 2023 19:12:34 +0100
Subject: [PATCH 114/161] chore: add `asm` option to cli help (#3585)

* Add `asm` option to CLI help
* Add missing `enum` in function docstring
---
 vyper/ast/pre_parser.py    | 2 +-
 vyper/cli/vyper_compile.py | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/vyper/ast/pre_parser.py b/vyper/ast/pre_parser.py
index 7e677b3b92..788c44ef19 100644
--- a/vyper/ast/pre_parser.py
+++ b/vyper/ast/pre_parser.py
@@ -72,7 +72,7 @@ def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
     Re-formats a vyper source string into a python source string and performs
     some validation.  More specifically,
 
-    * Translates "interface", "struct" and "event" keywords into python "class" keyword
+    * Translates "interface", "struct", "enum, and "event" keywords into python "class" keyword
     * Validates "@version" pragma against current compiler version
     * Prevents direct use of python "class" keyword
     * Prevents use of python semi-colon statement separator
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 9c96d55040..9c97f8c667 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -41,6 +41,7 @@
 opcodes_runtime    - List of runtime opcodes as a string
 ir                 - Intermediate representation in list format
 ir_json            - Intermediate representation in JSON format
+asm                - Output the EVM assembly of the deployable bytecode
 hex-ir             - Output IR and assembly constants in hex instead of decimal
 """
 

From 3900ec0d2970aa8b4fbe64d4d698d4721ad09f21 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 5 Sep 2023 17:44:05 -0400
Subject: [PATCH 115/161] refactor: `ecadd()` and `ecmul()` codegen (#3587)

refactor `ecadd()` and `ecmul()` to use `make_setter` and share code, so
we don't need to do pointer arithmetic
---
 vyper/builtins/functions.py | 66 +++++++++++++++++--------------------
 1 file changed, 31 insertions(+), 35 deletions(-)

diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 053ee512dc..3933ab2de5 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -782,54 +782,50 @@ def build_IR(self, expr, args, kwargs, context):
         )
 
 
-class ECAdd(BuiltinFunction):
-    _id = "ecadd"
-    _inputs = [("a", SArrayT(UINT256_T, 2)), ("b", SArrayT(UINT256_T, 2))]
-    _return_type = SArrayT(UINT256_T, 2)
-
+class _ECArith(BuiltinFunction):
     @process_inputs
-    def build_IR(self, expr, args, kwargs, context):
-        buf_t = get_type_for_exact_size(128)
+    def build_IR(self, expr, _args, kwargs, context):
+        args_tuple = ir_tuple_from_args(_args)
 
-        buf = context.new_internal_variable(buf_t)
+        args_t = args_tuple.typ
+        input_buf = IRnode.from_list(
+            context.new_internal_variable(args_t), typ=args_t, location=MEMORY
+        )
+        ret_t = self._return_type
 
         ret = ["seq"]
+        ret.append(make_setter(input_buf, args_tuple))
 
-        dst0 = IRnode.from_list(buf, typ=SArrayT(UINT256_T, 2), location=MEMORY)
-        ret.append(make_setter(dst0, args[0]))
+        output_buf = context.new_internal_variable(ret_t)
 
-        dst1 = IRnode.from_list(buf + 64, typ=SArrayT(UINT256_T, 2), location=MEMORY)
-        ret.append(make_setter(dst1, args[1]))
+        args_ofst = input_buf
+        args_len = args_t.memory_bytes_required
+        out_ofst = output_buf
+        out_len = ret_t.memory_bytes_required
 
-        ret.append(["assert", ["staticcall", ["gas"], 6, buf, 128, buf, 64]])
-        ret.append(buf)
+        ret.append(
+            [
+                "assert",
+                ["staticcall", ["gas"], self._precompile, args_ofst, args_len, out_ofst, out_len],
+            ]
+        )
+        ret.append(output_buf)
 
-        return IRnode.from_list(ret, typ=SArrayT(UINT256_T, 2), location=MEMORY)
+        return IRnode.from_list(ret, typ=ret_t, location=MEMORY)
 
 
-class ECMul(BuiltinFunction):
-    _id = "ecmul"
-    _inputs = [("point", SArrayT(UINT256_T, 2)), ("scalar", UINT256_T)]
+class ECAdd(_ECArith):
+    _id = "ecadd"
+    _inputs = [("a", SArrayT(UINT256_T, 2)), ("b", SArrayT(UINT256_T, 2))]
     _return_type = SArrayT(UINT256_T, 2)
+    _precompile = 0x6
 
-    @process_inputs
-    def build_IR(self, expr, args, kwargs, context):
-        buf_t = get_type_for_exact_size(96)
-
-        buf = context.new_internal_variable(buf_t)
-
-        ret = ["seq"]
 
-        dst0 = IRnode.from_list(buf, typ=SArrayT(UINT256_T, 2), location=MEMORY)
-        ret.append(make_setter(dst0, args[0]))
-
-        dst1 = IRnode.from_list(buf + 64, typ=UINT256_T, location=MEMORY)
-        ret.append(make_setter(dst1, args[1]))
-
-        ret.append(["assert", ["staticcall", ["gas"], 7, buf, 96, buf, 64]])
-        ret.append(buf)
-
-        return IRnode.from_list(ret, typ=SArrayT(UINT256_T, 2), location=MEMORY)
+class ECMul(_ECArith):
+    _id = "ecmul"
+    _inputs = [("point", SArrayT(UINT256_T, 2)), ("scalar", UINT256_T)]
+    _return_type = SArrayT(UINT256_T, 2)
+    _precompile = 0x7
 
 
 def _generic_element_getter(op):

From a854929b602f8e40728bdc028c2485ec6da4a3ef Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 5 Sep 2023 18:21:32 -0400
Subject: [PATCH 116/161] fix: `ecrecover()` buffer edge case (#3586)

this commit fixes an edge case in `ecrecover()` that was not covered by
019a37ab98ff5. in the case that one of the arguments to ecrecover writes
to memory location 0, and the signature is invalid, `ecrecover()` could
return the data written by the argument. this commit fixes the issue by
allocating fresh memory for the output buffer (which won't be written to
by evaluating any of the arguments unless the memory allocator is
broken).
---
 tests/parser/functions/test_ecrecover.py | 27 ++++++++++++++++++++++++
 vyper/builtins/functions.py              |  2 +-
 2 files changed, 28 insertions(+), 1 deletion(-)

diff --git a/tests/parser/functions/test_ecrecover.py b/tests/parser/functions/test_ecrecover.py
index 40c9a6a936..8571948c3d 100644
--- a/tests/parser/functions/test_ecrecover.py
+++ b/tests/parser/functions/test_ecrecover.py
@@ -58,3 +58,30 @@ def test_ecrecover(hash: bytes32, v: uint8, r: uint256) -> address:
     r = 0
     # note web3.py decoding of 0x000..00 address is None.
     assert c.test_ecrecover(hash_, v, r) is None
+
+
+# slightly more subtle example: get_v() stomps memory location 0,
+# so this tests that the output buffer stays clean during ecrecover()
+# builtin execution.
+def test_invalid_signature2(get_contract):
+    code = """
+
+owner: immutable(address)
+
+@external
+def __init__():
+    owner = 0x7E5F4552091A69125d5DfCb7b8C2659029395Bdf
+
+@internal
+def get_v() -> uint256:
+    assert owner == owner # force a dload to write at index 0 of memory
+    return 21
+
+@payable
+@external
+def test_ecrecover() -> bool:
+    assert ecrecover(empty(bytes32), self.get_v(), 0, 0) == empty(address)
+    return True
+    """
+    c = get_contract(code)
+    assert c.test_ecrecover() is True
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 3933ab2de5..3ec8f69934 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -765,7 +765,7 @@ def infer_arg_types(self, node):
     @process_inputs
     def build_IR(self, expr, args, kwargs, context):
         input_buf = context.new_internal_variable(get_type_for_exact_size(128))
-        output_buf = MemoryPositions.FREE_VAR_SPACE
+        output_buf = context.new_internal_variable(get_type_for_exact_size(32))
         return IRnode.from_list(
             [
                 "seq",

From 39a23137cd1babfb24222e3a9e785e047bba0c6d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 5 Sep 2023 18:44:22 -0400
Subject: [PATCH 117/161] fix: metadata journal can rollback incorrectly
 (#3569)

this commit fixes an issue where multiple writes inside of a checkpoint
lead to journal corruption on rollback. it ensures a call to
`register_update()` when the metadata dict has already been updated
inside of a given checkpoint.

note this does not change any observed functionality in the compiler
because writes to the metadata journal inside for loops only ever happen
to be written once, but it prevents a bug in case we ever add multiple
writes inside of the same checkpoint.

chainsec june review 5.3

---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
---
 tests/ast/test_metadata_journal.py | 82 ++++++++++++++++++++++++++++++
 vyper/ast/metadata.py              |  5 +-
 2 files changed, 86 insertions(+), 1 deletion(-)
 create mode 100644 tests/ast/test_metadata_journal.py

diff --git a/tests/ast/test_metadata_journal.py b/tests/ast/test_metadata_journal.py
new file mode 100644
index 0000000000..34830409fc
--- /dev/null
+++ b/tests/ast/test_metadata_journal.py
@@ -0,0 +1,82 @@
+from vyper.ast.metadata import NodeMetadata
+from vyper.exceptions import VyperException
+
+
+def test_metadata_journal_basic():
+    m = NodeMetadata()
+
+    m["x"] = 1
+    assert m["x"] == 1
+
+
+def test_metadata_journal_commit():
+    m = NodeMetadata()
+
+    with m.enter_typechecker_speculation():
+        m["x"] = 1
+
+    assert m["x"] == 1
+
+
+def test_metadata_journal_exception():
+    m = NodeMetadata()
+
+    m["x"] = 1
+    try:
+        with m.enter_typechecker_speculation():
+            m["x"] = 2
+            m["x"] = 3
+
+            assert m["x"] == 3
+            raise VyperException("dummy exception")
+
+    except VyperException:
+        pass
+
+    # rollback upon exception
+    assert m["x"] == 1
+
+
+def test_metadata_journal_rollback_inner():
+    m = NodeMetadata()
+
+    m["x"] = 1
+    with m.enter_typechecker_speculation():
+        m["x"] = 2
+
+        try:
+            with m.enter_typechecker_speculation():
+                m["x"] = 3
+                m["x"] = 4  # test multiple writes
+
+                assert m["x"] == 4
+                raise VyperException("dummy exception")
+
+        except VyperException:
+            pass
+
+    assert m["x"] == 2
+
+
+def test_metadata_journal_rollback_outer():
+    m = NodeMetadata()
+
+    m["x"] = 1
+    try:
+        with m.enter_typechecker_speculation():
+            m["x"] = 2
+
+            with m.enter_typechecker_speculation():
+                m["x"] = 3
+                m["x"] = 4  # test multiple writes
+
+            assert m["x"] == 4
+
+            m["x"] = 5
+
+            raise VyperException("dummy exception")
+
+    except VyperException:
+        pass
+
+    assert m["x"] == 1
diff --git a/vyper/ast/metadata.py b/vyper/ast/metadata.py
index 30e06e0016..0a419c3732 100644
--- a/vyper/ast/metadata.py
+++ b/vyper/ast/metadata.py
@@ -17,8 +17,11 @@ def __init__(self):
         self._node_updates: list[dict[tuple[int, str, Any], NodeMetadata]] = []
 
     def register_update(self, metadata, k):
+        KEY = (id(metadata), k)
+        if KEY in self._node_updates[-1]:
+            return
         prev = metadata.get(k, self._NOT_FOUND)
-        self._node_updates[-1][(id(metadata), k)] = (metadata, prev)
+        self._node_updates[-1][KEY] = (metadata, prev)
 
     @contextlib.contextmanager
     def enter(self):

From 96d20425fa2fbebb9e9aeb0402399c745eb80cfe Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 5 Sep 2023 19:05:23 -0400
Subject: [PATCH 118/161] feat: add runtime code layout to initcode (#3584)

this commit adds the runtime code layout to the initcode payload (as a
suffix), so that the runtime code can be analyzed without source code.
this is particularly important for disassemblers, which need
demarcations for where the data section starts as distinct from the
runtime code segment itself.

the layout is:

CBOR-encoded list:
  runtime code length
  [<length of data section> for data section in runtime data sections]
  immutable section length
  {"vyper": (major, minor, patch)}
length of CBOR-encoded list + 2, encoded as two big-endian bytes.

note the specific format for the CBOR payload was chosen to avoid
changing the last 13 bytes of the signature compared to previous
versions of vyper. that is, the last 13 bytes still look like
b"\xa1evyper\x83...", this is because, as the last item in a list, its
encoding does not change compared to being the only dict in the payload.

this commit also changes the meaning of the two footer bytes: they now
indicate the length of the entire footer (including the two bytes
indicating the footer length). the sole purpose of this is to be more
intuitive as the two footer bytes indicate offset-from-the-end where the
CBOR-encoded metadata starts, rather than the length of the CBOR
payload (without the two length bytes).

lastly, this commit renames the internal `insert_vyper_signature=` kwarg
to `insert_compiler_metadata=` as the metadata includes more than just
the vyper version now.
---
 setup.py                                |   1 +
 tests/compiler/test_bytecode_runtime.py | 133 ++++++++++++++++++++++--
 vyper/compiler/output.py                |   2 +-
 vyper/compiler/phases.py                |  12 ++-
 vyper/ir/compile_ir.py                  |  64 ++++++++----
 5 files changed, 180 insertions(+), 32 deletions(-)

diff --git a/setup.py b/setup.py
index bbf6e60f55..c251071229 100644
--- a/setup.py
+++ b/setup.py
@@ -92,6 +92,7 @@ def _global_version(version):
     python_requires=">=3.10,<4",
     py_modules=["vyper"],
     install_requires=[
+        "cbor2>=5.4.6,<6",
         "asttokens>=2.0.5,<3",
         "pycryptodome>=3.5.1,<4",
         "semantic-version>=2.10,<3",
diff --git a/tests/compiler/test_bytecode_runtime.py b/tests/compiler/test_bytecode_runtime.py
index 86eff70a50..9519b03772 100644
--- a/tests/compiler/test_bytecode_runtime.py
+++ b/tests/compiler/test_bytecode_runtime.py
@@ -1,14 +1,135 @@
-import vyper
+import cbor2
+import pytest
 
+import vyper
+from vyper.compiler.settings import OptimizationLevel, Settings
 
-def test_bytecode_runtime():
-    code = """
+simple_contract_code = """
 @external
 def a() -> bool:
     return True
-    """
+"""
+
+many_functions = """
+@external
+def foo1():
+    pass
+
+@external
+def foo2():
+    pass
+
+@external
+def foo3():
+    pass
+
+@external
+def foo4():
+    pass
+
+@external
+def foo5():
+    pass
+"""
+
+has_immutables = """
+A_GOOD_PRIME: public(immutable(uint256))
+
+@external
+def __init__():
+    A_GOOD_PRIME = 967
+"""
+
+
+def _parse_cbor_metadata(initcode):
+    metadata_ofst = int.from_bytes(initcode[-2:], "big")
+    metadata = cbor2.loads(initcode[-metadata_ofst:-2])
+    return metadata
 
-    out = vyper.compile_code(code, ["bytecode_runtime", "bytecode"])
+
+def test_bytecode_runtime():
+    out = vyper.compile_code(simple_contract_code, ["bytecode_runtime", "bytecode"])
 
     assert len(out["bytecode"]) > len(out["bytecode_runtime"])
-    assert out["bytecode_runtime"][2:] in out["bytecode"][2:]
+    assert out["bytecode_runtime"].removeprefix("0x") in out["bytecode"].removeprefix("0x")
+
+
+def test_bytecode_signature():
+    out = vyper.compile_code(simple_contract_code, ["bytecode_runtime", "bytecode"])
+
+    runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
+    initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
+
+    metadata = _parse_cbor_metadata(initcode)
+    runtime_len, data_section_lengths, immutables_len, compiler = metadata
+
+    assert runtime_len == len(runtime_code)
+    assert data_section_lengths == []
+    assert immutables_len == 0
+    assert compiler == {"vyper": list(vyper.version.version_tuple)}
+
+
+def test_bytecode_signature_dense_jumptable():
+    settings = Settings(optimize=OptimizationLevel.CODESIZE)
+
+    out = vyper.compile_code(many_functions, ["bytecode_runtime", "bytecode"], settings=settings)
+
+    runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
+    initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
+
+    metadata = _parse_cbor_metadata(initcode)
+    runtime_len, data_section_lengths, immutables_len, compiler = metadata
+
+    assert runtime_len == len(runtime_code)
+    assert data_section_lengths == [5, 35]
+    assert immutables_len == 0
+    assert compiler == {"vyper": list(vyper.version.version_tuple)}
+
+
+def test_bytecode_signature_sparse_jumptable():
+    settings = Settings(optimize=OptimizationLevel.GAS)
+
+    out = vyper.compile_code(many_functions, ["bytecode_runtime", "bytecode"], settings=settings)
+
+    runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
+    initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
+
+    metadata = _parse_cbor_metadata(initcode)
+    runtime_len, data_section_lengths, immutables_len, compiler = metadata
+
+    assert runtime_len == len(runtime_code)
+    assert data_section_lengths == [8]
+    assert immutables_len == 0
+    assert compiler == {"vyper": list(vyper.version.version_tuple)}
+
+
+def test_bytecode_signature_immutables():
+    out = vyper.compile_code(has_immutables, ["bytecode_runtime", "bytecode"])
+
+    runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
+    initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
+
+    metadata = _parse_cbor_metadata(initcode)
+    runtime_len, data_section_lengths, immutables_len, compiler = metadata
+
+    assert runtime_len == len(runtime_code)
+    assert data_section_lengths == []
+    assert immutables_len == 32
+    assert compiler == {"vyper": list(vyper.version.version_tuple)}
+
+
+# check that deployed bytecode actually matches the cbor metadata
+@pytest.mark.parametrize("code", [simple_contract_code, has_immutables, many_functions])
+def test_bytecode_signature_deployed(code, get_contract, w3):
+    c = get_contract(code)
+    deployed_code = w3.eth.get_code(c.address)
+
+    initcode = c._classic_contract.bytecode
+
+    metadata = _parse_cbor_metadata(initcode)
+    runtime_len, data_section_lengths, immutables_len, compiler = metadata
+
+    assert compiler == {"vyper": list(vyper.version.version_tuple)}
+
+    # runtime_len includes data sections but not immutables
+    assert len(deployed_code) == runtime_len + immutables_len
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 69fcbf1f1f..334c5ba613 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -218,7 +218,7 @@ def _build_asm(asm_list):
 
 def build_source_map_output(compiler_data: CompilerData) -> OrderedDict:
     _, line_number_map = compile_ir.assembly_to_evm(
-        compiler_data.assembly_runtime, insert_vyper_signature=False
+        compiler_data.assembly_runtime, insert_compiler_metadata=False
     )
     # Sort line_number_map
     out = OrderedDict()
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 526d2f3253..a1c7342320 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -184,12 +184,12 @@ def assembly_runtime(self) -> list:
 
     @cached_property
     def bytecode(self) -> bytes:
-        insert_vyper_signature = not self.no_bytecode_metadata
-        return generate_bytecode(self.assembly, insert_vyper_signature=insert_vyper_signature)
+        insert_compiler_metadata = not self.no_bytecode_metadata
+        return generate_bytecode(self.assembly, insert_compiler_metadata=insert_compiler_metadata)
 
     @cached_property
     def bytecode_runtime(self) -> bytes:
-        return generate_bytecode(self.assembly_runtime, insert_vyper_signature=False)
+        return generate_bytecode(self.assembly_runtime, insert_compiler_metadata=False)
 
     @cached_property
     def blueprint_bytecode(self) -> bytes:
@@ -331,7 +331,7 @@ def _find_nested_opcode(assembly, key):
         return any(_find_nested_opcode(x, key) for x in sublists)
 
 
-def generate_bytecode(assembly: list, insert_vyper_signature: bool) -> bytes:
+def generate_bytecode(assembly: list, insert_compiler_metadata: bool) -> bytes:
     """
     Generate bytecode from assembly instructions.
 
@@ -345,4 +345,6 @@ def generate_bytecode(assembly: list, insert_vyper_signature: bool) -> bytes:
     bytes
         Final compiled bytecode.
     """
-    return compile_ir.assembly_to_evm(assembly, insert_vyper_signature=insert_vyper_signature)[0]
+    return compile_ir.assembly_to_evm(assembly, insert_compiler_metadata=insert_compiler_metadata)[
+        0
+    ]
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index bba3b34515..7a3e97155b 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -1,6 +1,9 @@
 import copy
 import functools
 import math
+from dataclasses import dataclass
+
+import cbor2
 
 from vyper.codegen.ir_node import IRnode
 from vyper.compiler.settings import OptimizationLevel
@@ -507,9 +510,9 @@ def _height_of(witharg):
     elif code.value == "deploy":
         memsize = code.args[0].value  # used later to calculate _mem_deploy_start
         ir = code.args[1]
-        padding = code.args[2].value
+        immutables_len = code.args[2].value
         assert isinstance(memsize, int), "non-int memsize"
-        assert isinstance(padding, int), "non-int padding"
+        assert isinstance(immutables_len, int), "non-int immutables_len"
 
         runtime_begin = mksymbol("runtime_begin")
 
@@ -521,14 +524,14 @@ def _height_of(witharg):
         o.extend(["_sym_subcode_size", runtime_begin, "_mem_deploy_start", "CODECOPY"])
 
         # calculate the len of runtime code
-        o.extend(["_OFST", "_sym_subcode_size", padding])  # stack: len
+        o.extend(["_OFST", "_sym_subcode_size", immutables_len])  # stack: len
         o.extend(["_mem_deploy_start"])  # stack: len mem_ofst
         o.extend(["RETURN"])
 
         # since the asm data structures are very primitive, to make sure
         # assembly_to_evm is able to calculate data offsets correctly,
         # we pass the memsize via magic opcodes to the subcode
-        subcode = [_RuntimeHeader(runtime_begin, memsize)] + subcode
+        subcode = [_RuntimeHeader(runtime_begin, memsize, immutables_len)] + subcode
 
         # append the runtime code after the ctor code
         # `append(...)` call here is intentional.
@@ -1051,18 +1054,19 @@ def _length_of_data(assembly):
     return ret
 
 
+@dataclass
 class _RuntimeHeader:
-    def __init__(self, label, ctor_mem_size):
-        self.label = label
-        self.ctor_mem_size = ctor_mem_size
+    label: str
+    ctor_mem_size: int
+    immutables_len: int
 
     def __repr__(self):
-        return f"<RUNTIME {self.label} mem @{self.ctor_mem_size}>"
+        return f"<RUNTIME {self.label} mem @{self.ctor_mem_size} imms @{self.immutables_len}>"
 
 
+@dataclass
 class _DataHeader:
-    def __init__(self, label):
-        self.label = label
+    label: str
 
     def __repr__(self):
         return f"DATA {self.label}"
@@ -1092,21 +1096,21 @@ def _relocate_segments(assembly):
 
 
 # TODO: change API to split assembly_to_evm and assembly_to_source/symbol_maps
-def assembly_to_evm(assembly, pc_ofst=0, insert_vyper_signature=False):
+def assembly_to_evm(assembly, pc_ofst=0, insert_compiler_metadata=False):
     bytecode, source_maps, _ = assembly_to_evm_with_symbol_map(
-        assembly, pc_ofst=pc_ofst, insert_vyper_signature=insert_vyper_signature
+        assembly, pc_ofst=pc_ofst, insert_compiler_metadata=insert_compiler_metadata
     )
     return bytecode, source_maps
 
 
-def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_vyper_signature=False):
+def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_compiler_metadata=False):
     """
     Assembles assembly into EVM
 
     assembly: list of asm instructions
     pc_ofst: when constructing the source map, the amount to offset all
              pcs by (no effect until we add deploy code source map)
-    insert_vyper_signature: whether to append vyper metadata to output
+    insert_compiler_metadata: whether to append vyper metadata to output
                             (should be true for runtime code)
     """
     line_number_map = {
@@ -1122,12 +1126,6 @@ def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_vyper_signature=
 
     runtime_code, runtime_code_start, runtime_code_end = None, None, None
 
-    bytecode_suffix = b""
-    if insert_vyper_signature:
-        # CBOR encoded: {"vyper": [major,minor,patch]}
-        bytecode_suffix += b"\xa1\x65vyper\x83" + bytes(list(version_tuple))
-        bytecode_suffix += len(bytecode_suffix).to_bytes(2, "big")
-
     # to optimize the size of deploy code - we want to use the smallest
     # PUSH instruction possible which can support all memory symbols
     # (and also works with linear pass symbol resolution)
@@ -1155,6 +1153,9 @@ def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_vyper_signature=
     if runtime_code_end is not None:
         mem_ofst_size = calc_mem_ofst_size(runtime_code_end + max_mem_ofst)
 
+    data_section_lengths = []
+    immutables_len = None
+
     # go through the code, resolving symbolic locations
     # (i.e. JUMPDEST locations) to actual code locations
     for i, item in enumerate(assembly):
@@ -1198,18 +1199,41 @@ def assembly_to_evm_with_symbol_map(assembly, pc_ofst=0, insert_vyper_signature=
             # [_OFST, _mem_foo, bar] -> PUSHN (foo+bar)
             pc -= 1
         elif isinstance(item, list) and isinstance(item[0], _RuntimeHeader):
+            # we are in initcode
             symbol_map[item[0].label] = pc
             # add source map for all items in the runtime map
             t = adjust_pc_maps(runtime_map, pc)
             for key in line_number_map:
                 line_number_map[key].update(t[key])
+            immutables_len = item[0].immutables_len
             pc += len(runtime_code)
+            # grab lengths of data sections from the runtime
+            for t in item:
+                if isinstance(t, list) and isinstance(t[0], _DataHeader):
+                    data_section_lengths.append(_length_of_data(t))
+
         elif isinstance(item, list) and isinstance(item[0], _DataHeader):
             symbol_map[item[0].label] = pc
             pc += _length_of_data(item)
         else:
             pc += 1
 
+    bytecode_suffix = b""
+    if insert_compiler_metadata:
+        # this will hold true when we are in initcode
+        assert immutables_len is not None
+        metadata = (
+            len(runtime_code),
+            data_section_lengths,
+            immutables_len,
+            {"vyper": version_tuple},
+        )
+        bytecode_suffix += cbor2.dumps(metadata)
+        # append the length of the footer, *including* the length
+        # of the length bytes themselves.
+        suffix_len = len(bytecode_suffix) + 2
+        bytecode_suffix += suffix_len.to_bytes(2, "big")
+
     pc += len(bytecode_suffix)
 
     symbol_map["_sym_code_end"] = pc

From 41c9a3a62f94678aa0a64b4db3676d6da963a1e7 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 11:15:09 -0400
Subject: [PATCH 119/161] chore: `v0.3.10rc1` release notes (#3534)

---------

Co-authored-by: tserg <8017125+tserg@users.noreply.github.com>
---
 docs/release-notes.rst | 58 +++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 57 insertions(+), 1 deletion(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index f408c5c0ab..da86c5c0ce 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -14,8 +14,64 @@ Release Notes
     for advisory links:
     :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/security\/advisories\/)([-A-Za-z0-9]+)/(`\2 <\1\2>`_)/g
 
+..
+    v0.3.10 ("Black Adder")
+    ***********************
+
+v0.3.10rc1
+**********
+
+Date released: 2023-09-06
+=========================
+
+v0.3.10 is a performance focused release. It adds a ``codesize`` optimization mode (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), adds new vyper-specific ``#pragma`` directives  (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), uses Cancun's ``MCOPY`` opcode for some compiler generated code (`#3483 <https://github.com/vyperlang/vyper/pull/3483>`_), and generates selector tables which now feature O(1) performance (`#3496 <https://github.com/vyperlang/vyper/pull/3496>`_).
+
+Breaking changes:
+-----------------
+
+- add runtime code layout to initcode (`#3584 <https://github.com/vyperlang/vyper/pull/3584>`_)
+- drop evm versions through istanbul (`#3470 <https://github.com/vyperlang/vyper/pull/3470>`_)
+- remove vyper signature from runtime (`#3471 <https://github.com/vyperlang/vyper/pull/3471>`_)
+
+Non-breaking changes and improvements:
+--------------------------------------
+
+- O(1) selector tables (`#3496 <https://github.com/vyperlang/vyper/pull/3496>`_)
+- implement bound= in ranges (`#3537 <https://github.com/vyperlang/vyper/pull/3537>`_, `#3551 <https://github.com/vyperlang/vyper/pull/3551>`_)
+- add optimization mode to vyper compiler (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_)
+- improve batch copy performance (`#3483 <https://github.com/vyperlang/vyper/pull/3483>`_, `#3499 <https://github.com/vyperlang/vyper/pull/3499>`_, `#3525 <https://github.com/vyperlang/vyper/pull/3525>`_)
+
+Notable fixes:
+--------------
+
+- fix ``ecrecover()`` behavior when signature is invalid (`GHSA-f5x6-7qgp-jhf3 <https://github.com/vyperlang/vyper/security/advisories/GHSA-f5x6-7qgp-jhf3>`_, `#3586 <https://github.com/vyperlang/vyper/pull/3586>`_)
+- fix: order of evaluation for some builtins (`#3583 <https://github.com/vyperlang/vyper/pull/3583>`_, `#3587 <https://github.com/vyperlang/vyper/pull/3587>`_)
+- fix: pycryptodome for arm builds (`#3485 <https://github.com/vyperlang/vyper/pull/3485>`_)
+- let params of internal functions be mutable (`#3473 <https://github.com/vyperlang/vyper/pull/3473>`_)
+- typechecking of folded builtins in (`#3490 <https://github.com/vyperlang/vyper/pull/3490>`_)
+- update tload/tstore opcodes per latest 1153 EIP spec (`#3484 <https://github.com/vyperlang/vyper/pull/3484>`_)
+- fix: raw_call type when max_outsize=0 is set (`#3572 <https://github.com/vyperlang/vyper/pull/3572>`_)
+- fix: implements check for indexed event arguments (`#3570 <https://github.com/vyperlang/vyper/pull/3570>`_)
+
+Other docs updates, chores and fixes:
+-------------------------------------
+
+- relax restrictions on internal function signatures (`#3573 <https://github.com/vyperlang/vyper/pull/3573>`_)
+- note on security advisory in release notes for versions ``0.2.15``, ``0.2.16``, and ``0.3.0`` (`#3553 <https://github.com/vyperlang/vyper/pull/3553>`_)
+- fix: yanked version in release notes (`#3545 <https://github.com/vyperlang/vyper/pull/3545>`_)
+- update release notes on yanked versions (`#3547 <https://github.com/vyperlang/vyper/pull/3547>`_)
+- improve error message for conflicting methods IDs (`#3491 <https://github.com/vyperlang/vyper/pull/3491>`_)
+- document epsilon builtin (`#3552 <https://github.com/vyperlang/vyper/pull/3552>`_)
+- relax version pragma parsing (`#3511 <https://github.com/vyperlang/vyper/pull/3511>`_)
+- fix: issue with finding installed packages in editable mode (`#3510 <https://github.com/vyperlang/vyper/pull/3510>`_)
+- add note on security advisory for ``ecrecover`` in docs (`#3539 <https://github.com/vyperlang/vyper/pull/3539>`_)
+- add ``asm`` option to cli help (`#3585 <https://github.com/vyperlang/vyper/pull/3585>`_)
+- add message to error map for repeat range check (`#3542 <https://github.com/vyperlang/vyper/pull/3542>`_)
+- fix: public constant arrays (`#3536 <https://github.com/vyperlang/vyper/pull/3536>`_)
+
+
 v0.3.9 ("Common Adder")
-******
+***********************
 
 Date released: 2023-05-29
 

From 09f95c5d3921bb193f35f7fff8f653a1f0bb79b6 Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Wed, 6 Sep 2023 20:14:48 +0100
Subject: [PATCH 120/161] chore: add `ir_runtime` option to cli help (#3592)

---
 vyper/cli/vyper_compile.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index 9c97f8c667..bdd01eebbe 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -41,6 +41,7 @@
 opcodes_runtime    - List of runtime opcodes as a string
 ir                 - Intermediate representation in list format
 ir_json            - Intermediate representation in JSON format
+ir_runtime         - Intermediate representation of runtime bytecode in list format
 asm                - Output the EVM assembly of the deployable bytecode
 hex-ir             - Output IR and assembly constants in hex instead of decimal
 """

From 1ed445765d546437febb7a2d3347d29bea6d943d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 15:18:46 -0400
Subject: [PATCH 121/161] chore(ci): fix macos universal2 build (#3590)

this was a build regression introduced by the inclusion of the `cbor2`
package in 96d20425fa2fb.
---
 .github/workflows/build.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index b4be1043c1..684955bea1 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -38,7 +38,7 @@ jobs:
 
       - name: Generate Binary
         run: >-
-          pip install --no-binary pycryptodome . &&
+          pip install --no-binary pycryptodome --no-binary cbor2 . &&
           pip install pyinstaller &&
           make freeze
 

From 294d97c2b853fb67ec7ca5398dfd60808384d4fb Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 16:02:51 -0400
Subject: [PATCH 122/161] fix: version parsing for release candidates (#3593)

the npm spec library is buggy and does not handle release candidates
correctly. switch to the pypa packaging library which does pep440. note
that we do a hack in order to support commonly used npm prefixes: no
prefix, and `^` as prefix. going forward in v0.4.x, we will switch to
pep440 entirely.
---
 docs/structure-of-a-contract.rst |  2 +-
 tests/ast/test_pre_parser.py     | 32 ++++++------------------
 vyper/ast/pre_parser.py          | 43 ++++++++++----------------------
 3 files changed, 21 insertions(+), 56 deletions(-)

diff --git a/docs/structure-of-a-contract.rst b/docs/structure-of-a-contract.rst
index f58ab3b067..d2c5d48d96 100644
--- a/docs/structure-of-a-contract.rst
+++ b/docs/structure-of-a-contract.rst
@@ -17,7 +17,7 @@ Vyper supports several source code directives to control compiler modes and help
 Version Pragma
 --------------
 
-The version pragma ensures that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax.
+The version pragma ensures that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax. Starting from v0.4.0 and up, version strings will use `PEP440 version specifiers <https://peps.python.org/pep-0440/#version-specifiers>_`.
 
 As of 0.3.10, the recommended way to specify the version pragma is as follows:
 
diff --git a/tests/ast/test_pre_parser.py b/tests/ast/test_pre_parser.py
index 150ee55edf..5427532c16 100644
--- a/tests/ast/test_pre_parser.py
+++ b/tests/ast/test_pre_parser.py
@@ -21,16 +21,9 @@ def set_version(version):
     "0.1.1",
     ">0.0.1",
     "^0.1.0",
-    "<=1.0.0 >=0.1.0",
-    "0.1.0 - 1.0.0",
-    "~0.1.0",
-    "0.1",
-    "0",
-    "*",
-    "x",
-    "0.x",
-    "0.1.x",
-    "0.2.0 || 0.1.1",
+    "<=1.0.0,>=0.1.0",
+    # "0.1.0 - 1.0.0",
+    "~=0.1.0",
 ]
 invalid_versions = [
     "0.1.0",
@@ -44,7 +37,6 @@ def set_version(version):
     "1.x",
     "0.2.x",
     "0.2.0 || 0.1.3",
-    "==0.1.1",
     "abc",
 ]
 
@@ -70,9 +62,10 @@ def test_invalid_version_pragma(file_version, mock_version):
     "<0.1.1-rc.1",
     ">0.1.1a1",
     ">0.1.1-alpha.1",
-    "0.1.1a9 - 0.1.1-rc.10",
+    ">=0.1.1a9,<=0.1.1-rc.10",
     "<0.1.1b8",
     "<0.1.1rc1",
+    "<0.2.0",
 ]
 prerelease_invalid_versions = [
     ">0.1.1-beta.9",
@@ -80,19 +73,8 @@ def test_invalid_version_pragma(file_version, mock_version):
     "0.1.1b8",
     "0.1.1rc2",
     "0.1.1-rc.9 - 0.1.1-rc.10",
-    "<0.2.0",
-    pytest.param(
-        "<0.1.1b1",
-        marks=pytest.mark.xfail(
-            reason="https://github.com/rbarrois/python-semanticversion/issues/100"
-        ),
-    ),
-    pytest.param(
-        "<0.1.1a9",
-        marks=pytest.mark.xfail(
-            reason="https://github.com/rbarrois/python-semanticversion/issues/100"
-        ),
-    ),
+    "<0.1.1b1",
+    "<0.1.1a9",
 ]
 
 
diff --git a/vyper/ast/pre_parser.py b/vyper/ast/pre_parser.py
index 788c44ef19..0ead889787 100644
--- a/vyper/ast/pre_parser.py
+++ b/vyper/ast/pre_parser.py
@@ -2,7 +2,7 @@
 import re
 from tokenize import COMMENT, NAME, OP, TokenError, TokenInfo, tokenize, untokenize
 
-from semantic_version import NpmSpec, Version
+from packaging.specifiers import InvalidSpecifier, SpecifierSet
 
 from vyper.compiler.settings import OptimizationLevel, Settings
 
@@ -12,21 +12,6 @@
 from vyper.exceptions import StructureException, SyntaxException, VersionException
 from vyper.typing import ModificationOffsets, ParserPosition
 
-VERSION_ALPHA_RE = re.compile(r"(?<=\d)a(?=\d)")  # 0.1.0a17
-VERSION_BETA_RE = re.compile(r"(?<=\d)b(?=\d)")  # 0.1.0b17
-VERSION_RC_RE = re.compile(r"(?<=\d)rc(?=\d)")  # 0.1.0rc17
-
-
-def _convert_version_str(version_str: str) -> str:
-    """
-    Convert loose version (0.1.0b17) to strict version (0.1.0-beta.17)
-    """
-    version_str = re.sub(VERSION_ALPHA_RE, "-alpha.", version_str)  # 0.1.0-alpha.17
-    version_str = re.sub(VERSION_BETA_RE, "-beta.", version_str)  # 0.1.0-beta.17
-    version_str = re.sub(VERSION_RC_RE, "-rc.", version_str)  # 0.1.0-rc.17
-
-    return version_str
-
 
 def validate_version_pragma(version_str: str, start: ParserPosition) -> None:
     """
@@ -34,28 +19,26 @@ def validate_version_pragma(version_str: str, start: ParserPosition) -> None:
     """
     from vyper import __version__
 
-    # NOTE: should be `x.y.z.*`
-    installed_version = ".".join(__version__.split(".")[:3])
-
-    strict_file_version = _convert_version_str(version_str)
-    strict_compiler_version = Version(_convert_version_str(installed_version))
-
-    if len(strict_file_version) == 0:
+    if len(version_str) == 0:
         raise VersionException("Version specification cannot be empty", start)
 
+    # X.Y.Z or vX.Y.Z => ==X.Y.Z, ==vX.Y.Z
+    if re.match("[v0-9]", version_str):
+        version_str = "==" + version_str
+    # convert npm to pep440
+    version_str = re.sub("^\\^", "~=", version_str)
+
     try:
-        npm_spec = NpmSpec(strict_file_version)
-    except ValueError:
+        spec = SpecifierSet(version_str)
+    except InvalidSpecifier:
         raise VersionException(
-            f'Version specification "{version_str}" is not a valid NPM semantic '
-            f"version specification",
-            start,
+            f'Version specification "{version_str}" is not a valid PEP440 specifier', start
         )
 
-    if not npm_spec.match(strict_compiler_version):
+    if not spec.contains(__version__, prereleases=True):
         raise VersionException(
             f'Version specification "{version_str}" is not compatible '
-            f'with compiler version "{installed_version}"',
+            f'with compiler version "{__version__}"',
             start,
         )
 

From aca2b4c5e54791943547342fae3c06552db1a3a7 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 16:04:14 -0400
Subject: [PATCH 123/161] chore: CI for pre-release (release candidate) actions
 (#3589)

---
 .github/workflows/build.yml   | 2 +-
 .github/workflows/publish.yml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 684955bea1..e81aa236d1 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -9,7 +9,7 @@ on:
     branches:
       - master
   release:
-    types: [released]
+    types: [published]  # releases and pre-releases (release candidates)
 
 defaults:
   run:
diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index 44c6978295..f268942e7d 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -5,7 +5,7 @@ name: Publish to PyPI
 
 on:
   release:
-    types: [released]
+    types: [published]  # releases and pre-releases (release candidates)
 
 jobs:
 

From bb6e69acc3158f0acf16f23637f053d63d226e5b Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 16:35:03 -0400
Subject: [PATCH 124/161] chore(ci): build binaries on pull requests (#3591)

build binaries on all pull requests, to have better oversight over
binary build success
---
 .github/workflows/build.yml | 14 +++++++++++++-
 1 file changed, 13 insertions(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index e81aa236d1..7243a05408 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -1,4 +1,4 @@
-name: Build and release artifacts
+name: Build artifacts
 
 on:
   workflow_dispatch:
@@ -8,6 +8,7 @@ on:
   push:
     branches:
       - master
+  pull_request:
   release:
     types: [published]  # releases and pre-releases (release candidates)
 
@@ -42,6 +43,7 @@ jobs:
           pip install pyinstaller &&
           make freeze
 
+
       - name: Upload Artifact
         uses: actions/upload-artifact@v3
         with:
@@ -101,3 +103,13 @@ jobs:
               "https://uploads.github.com/repos/${{ github.repository }}/releases/${{ github.event.release.id }}/assets?name=${BIN_NAME}" \
               --data-binary "@${BIN_NAME}"
           done
+
+  # check build success for pull requests
+  build-success:
+    if: always()
+    runs-on: ubuntu-latest
+    needs: [windows-build, unix-build]
+    steps:
+      - name: check that all builds succeeded
+        if: ${{ contains(needs.*.result, 'failure') }}
+        run: exit 1

From 0cb37e3ef96ce374dafec5b1fcb40849fe074c62 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 6 Sep 2023 17:51:33 -0400
Subject: [PATCH 125/161] fix: dependency specification for `packaging` (#3594)

setup.py regression introduced in 294d97c2b853fb
---
 setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/setup.py b/setup.py
index c251071229..c81b9bed4a 100644
--- a/setup.py
+++ b/setup.py
@@ -95,7 +95,7 @@ def _global_version(version):
         "cbor2>=5.4.6,<6",
         "asttokens>=2.0.5,<3",
         "pycryptodome>=3.5.1,<4",
-        "semantic-version>=2.10,<3",
+        "packaging>=23.1,<24",
         "importlib-metadata",
         "wheel",
     ],

From 3b310d5292c4d1448e673d7b3adb223f9353260e Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 7 Sep 2023 17:45:35 -0400
Subject: [PATCH 126/161] chore(ci): fix binary names in release asset upload
 (#3597)

rename binary during asset upload to properly escape the filename for
the github API call.

(Github API states:
> GitHub renames asset filenames that have special characters,
non-alphanumeric characters, and leading or trailing periods. The "List
release assets" endpoint lists the renamed filenames. For more
information and help, contact GitHub Support.
)
---
 .github/workflows/build.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/workflows/build.yml b/.github/workflows/build.yml
index 7243a05408..c8d7f7d6c4 100644
--- a/.github/workflows/build.yml
+++ b/.github/workflows/build.yml
@@ -100,7 +100,7 @@ jobs:
               -X POST \
               -H "Authorization: Bearer ${{ secrets.GITHUB_TOKEN }}"\
               -H "Content-Type: application/octet-stream" \
-              "https://uploads.github.com/repos/${{ github.repository }}/releases/${{ github.event.release.id }}/assets?name=${BIN_NAME}" \
+              "https://uploads.github.com/repos/${{ github.repository }}/releases/${{ github.event.release.id }}/assets?name=${BIN_NAME/+/%2B}" \
               --data-binary "@${BIN_NAME}"
           done
 

From 344fd8f36c7f0cf1e34fd06ec30f34f6c487f340 Mon Sep 17 00:00:00 2001
From: Mikko Ohtamaa <mikko@redinnovation.com>
Date: Sun, 10 Sep 2023 17:30:01 +0200
Subject: [PATCH 127/161] docs: add README banner about Vyper audit competition
 (#3599)

Add a temporary banner at the top of the README to advertise the audit competition

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 README.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/README.md b/README.md
index af987ffd4f..bad929956d 100644
--- a/README.md
+++ b/README.md
@@ -1,3 +1,4 @@
+**Vyper compiler security audit competition starts 14th September with $150k worth of bounties.** [See the competition on CodeHawks](https://www.codehawks.com/contests/cll5rujmw0001js08menkj7hc) and find [more details in this blog post](https://mirror.xyz/0xBA41A04A14aeaEec79e2D694B21ba5Ab610982f1/WTZ3l3MLhTz9P4avq6JqipN5d4HJNiUY-d8zT0pfmXg).
 
 <img src="https://raw.githubusercontent.com/vyperlang/vyper/master/logo/vyper-logo-transparent.svg?sanitize=true" alt="" width="110">
 

From 0b740280c1e3c5528a20d47b29831948ddcc6d83 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 15 Sep 2023 18:01:03 -0400
Subject: [PATCH 128/161] fix: only allow valid identifiers to be nonreentrant
 keys (#3605)

disallow invalid identifiers like `" "`, `"123abc"` from being keys for
non-reentrant locks.

this commit also refactors the `validate_identifiers` helper function to
be in the `ast/` subdirectory, and slightly improves the VyperException
constructor by allowing None (optional) annotations.
---
 .../exceptions/test_structure_exception.py    |  23 +++-
 .../features/decorators/test_nonreentrant.py  |   4 +-
 tests/parser/test_call_graph_stability.py     |   2 +-
 tests/parser/types/test_identifier_naming.py  |   2 +-
 vyper/ast/identifiers.py                      | 111 ++++++++++++++++
 vyper/exceptions.py                           |   4 +-
 vyper/semantics/namespace.py                  | 119 +-----------------
 vyper/semantics/types/base.py                 |   2 +-
 vyper/semantics/types/function.py             |   6 +-
 9 files changed, 147 insertions(+), 126 deletions(-)
 create mode 100644 vyper/ast/identifiers.py

diff --git a/tests/parser/exceptions/test_structure_exception.py b/tests/parser/exceptions/test_structure_exception.py
index 08794b75f2..97ac2b139d 100644
--- a/tests/parser/exceptions/test_structure_exception.py
+++ b/tests/parser/exceptions/test_structure_exception.py
@@ -56,9 +56,26 @@ def double_nonreentrant():
     """,
     """
 @external
-@nonreentrant("B")
-@nonreentrant("C")
-def double_nonreentrant():
+@nonreentrant(" ")
+def invalid_nonreentrant_key():
+    pass
+    """,
+    """
+@external
+@nonreentrant("")
+def invalid_nonreentrant_key():
+    pass
+    """,
+    """
+@external
+@nonreentrant("123")
+def invalid_nonreentrant_key():
+    pass
+    """,
+    """
+@external
+@nonreentrant("!123abcd")
+def invalid_nonreentrant_key():
     pass
     """,
     """
diff --git a/tests/parser/features/decorators/test_nonreentrant.py b/tests/parser/features/decorators/test_nonreentrant.py
index ac73b35bec..9e74019250 100644
--- a/tests/parser/features/decorators/test_nonreentrant.py
+++ b/tests/parser/features/decorators/test_nonreentrant.py
@@ -142,7 +142,7 @@ def set_callback(c: address):
 
 @external
 @payable
-@nonreentrant('default')
+@nonreentrant("lock")
 def protected_function(val: String[100], do_callback: bool) -> uint256:
     self.special_value = val
     _amount: uint256 = msg.value
@@ -166,7 +166,7 @@ def unprotected_function(val: String[100], do_callback: bool):
 
 @external
 @payable
-@nonreentrant('default')
+@nonreentrant("lock")
 def __default__():
     pass
     """
diff --git a/tests/parser/test_call_graph_stability.py b/tests/parser/test_call_graph_stability.py
index b651092d16..a6193610e2 100644
--- a/tests/parser/test_call_graph_stability.py
+++ b/tests/parser/test_call_graph_stability.py
@@ -6,8 +6,8 @@
 from hypothesis import given, settings
 
 import vyper.ast as vy_ast
+from vyper.ast.identifiers import RESERVED_KEYWORDS
 from vyper.compiler.phases import CompilerData
-from vyper.semantics.namespace import RESERVED_KEYWORDS
 
 
 def _valid_identifier(attr):
diff --git a/tests/parser/types/test_identifier_naming.py b/tests/parser/types/test_identifier_naming.py
index f4f602f471..5cfc7e8ed7 100755
--- a/tests/parser/types/test_identifier_naming.py
+++ b/tests/parser/types/test_identifier_naming.py
@@ -1,10 +1,10 @@
 import pytest
 
 from vyper.ast.folding import BUILTIN_CONSTANTS
+from vyper.ast.identifiers import RESERVED_KEYWORDS
 from vyper.builtins.functions import BUILTIN_FUNCTIONS
 from vyper.codegen.expr import ENVIRONMENT_VARIABLES
 from vyper.exceptions import NamespaceCollision, StructureException, SyntaxException
-from vyper.semantics.namespace import RESERVED_KEYWORDS
 from vyper.semantics.types.primitives import AddressT
 
 BUILTIN_CONSTANTS = set(BUILTIN_CONSTANTS.keys())
diff --git a/vyper/ast/identifiers.py b/vyper/ast/identifiers.py
new file mode 100644
index 0000000000..985b04e5cd
--- /dev/null
+++ b/vyper/ast/identifiers.py
@@ -0,0 +1,111 @@
+import re
+
+from vyper.exceptions import StructureException
+
+
+def validate_identifier(attr, ast_node=None):
+    if not re.match("^[_a-zA-Z][a-zA-Z0-9_]*$", attr):
+        raise StructureException(f"'{attr}' contains invalid character(s)", ast_node)
+    if attr.lower() in RESERVED_KEYWORDS:
+        raise StructureException(f"'{attr}' is a reserved keyword", ast_node)
+
+
+# https://docs.python.org/3/reference/lexical_analysis.html#keywords
+# note we don't technically need to block all python reserved keywords,
+# but do it for hygiene
+_PYTHON_RESERVED_KEYWORDS = {
+    "False",
+    "None",
+    "True",
+    "and",
+    "as",
+    "assert",
+    "async",
+    "await",
+    "break",
+    "class",
+    "continue",
+    "def",
+    "del",
+    "elif",
+    "else",
+    "except",
+    "finally",
+    "for",
+    "from",
+    "global",
+    "if",
+    "import",
+    "in",
+    "is",
+    "lambda",
+    "nonlocal",
+    "not",
+    "or",
+    "pass",
+    "raise",
+    "return",
+    "try",
+    "while",
+    "with",
+    "yield",
+}
+_PYTHON_RESERVED_KEYWORDS = {s.lower() for s in _PYTHON_RESERVED_KEYWORDS}
+
+# Cannot be used for variable or member naming
+RESERVED_KEYWORDS = _PYTHON_RESERVED_KEYWORDS | {
+    # decorators
+    "public",
+    "external",
+    "nonpayable",
+    "constant",
+    "immutable",
+    "transient",
+    "internal",
+    "payable",
+    "nonreentrant",
+    # "class" keywords
+    "interface",
+    "struct",
+    "event",
+    "enum",
+    # EVM operations
+    "unreachable",
+    # special functions (no name mangling)
+    "init",
+    "_init_",
+    "___init___",
+    "____init____",
+    "default",
+    "_default_",
+    "___default___",
+    "____default____",
+    # more control flow and special operations
+    "range",
+    # more special operations
+    "indexed",
+    # denominations
+    "ether",
+    "wei",
+    "finney",
+    "szabo",
+    "shannon",
+    "lovelace",
+    "ada",
+    "babbage",
+    "gwei",
+    "kwei",
+    "mwei",
+    "twei",
+    "pwei",
+    # sentinal constant values
+    # TODO remove when these are removed from the language
+    "zero_address",
+    "empty_bytes32",
+    "max_int128",
+    "min_int128",
+    "max_decimal",
+    "min_decimal",
+    "max_uint256",
+    "zero_wei",
+}
diff --git a/vyper/exceptions.py b/vyper/exceptions.py
index aa23614e85..defca7cc53 100644
--- a/vyper/exceptions.py
+++ b/vyper/exceptions.py
@@ -54,7 +54,9 @@ def __init__(self, message="Error Message not found.", *items):
             # support older exceptions that don't annotate - remove this in the future!
             self.lineno, self.col_offset = items[0][:2]
         else:
-            self.annotations = items
+            # strip out None sources so that None can be passed as a valid
+            # annotation (in case it is only available optionally)
+            self.annotations = [k for k in items if k is not None]
 
     def with_annotation(self, *annotations):
         """
diff --git a/vyper/semantics/namespace.py b/vyper/semantics/namespace.py
index b88bc3d817..613ac0c03b 100644
--- a/vyper/semantics/namespace.py
+++ b/vyper/semantics/namespace.py
@@ -1,12 +1,7 @@
 import contextlib
-import re
-
-from vyper.exceptions import (
-    CompilerPanic,
-    NamespaceCollision,
-    StructureException,
-    UndeclaredDefinition,
-)
+
+from vyper.ast.identifiers import validate_identifier
+from vyper.exceptions import CompilerPanic, NamespaceCollision, UndeclaredDefinition
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
 
 
@@ -121,111 +116,3 @@ def override_global_namespace(ns):
     finally:
         # unclobber
         _namespace = tmp
-
-
-def validate_identifier(attr):
-    if not re.match("^[_a-zA-Z][a-zA-Z0-9_]*$", attr):
-        raise StructureException(f"'{attr}' contains invalid character(s)")
-    if attr.lower() in RESERVED_KEYWORDS:
-        raise StructureException(f"'{attr}' is a reserved keyword")
-
-
-# https://docs.python.org/3/reference/lexical_analysis.html#keywords
-# note we don't technically need to block all python reserved keywords,
-# but do it for hygiene
-_PYTHON_RESERVED_KEYWORDS = {
-    "False",
-    "None",
-    "True",
-    "and",
-    "as",
-    "assert",
-    "async",
-    "await",
-    "break",
-    "class",
-    "continue",
-    "def",
-    "del",
-    "elif",
-    "else",
-    "except",
-    "finally",
-    "for",
-    "from",
-    "global",
-    "if",
-    "import",
-    "in",
-    "is",
-    "lambda",
-    "nonlocal",
-    "not",
-    "or",
-    "pass",
-    "raise",
-    "return",
-    "try",
-    "while",
-    "with",
-    "yield",
-}
-_PYTHON_RESERVED_KEYWORDS = {s.lower() for s in _PYTHON_RESERVED_KEYWORDS}
-
-# Cannot be used for variable or member naming
-RESERVED_KEYWORDS = _PYTHON_RESERVED_KEYWORDS | {
-    # decorators
-    "public",
-    "external",
-    "nonpayable",
-    "constant",
-    "immutable",
-    "transient",
-    "internal",
-    "payable",
-    "nonreentrant",
-    # "class" keywords
-    "interface",
-    "struct",
-    "event",
-    "enum",
-    # EVM operations
-    "unreachable",
-    # special functions (no name mangling)
-    "init",
-    "_init_",
-    "___init___",
-    "____init____",
-    "default",
-    "_default_",
-    "___default___",
-    "____default____",
-    # more control flow and special operations
-    "range",
-    # more special operations
-    "indexed",
-    # denominations
-    "ether",
-    "wei",
-    "finney",
-    "szabo",
-    "shannon",
-    "lovelace",
-    "ada",
-    "babbage",
-    "gwei",
-    "kwei",
-    "mwei",
-    "twei",
-    "pwei",
-    # sentinal constant values
-    # TODO remove when these are removed from the language
-    "zero_address",
-    "empty_bytes32",
-    "max_int128",
-    "min_int128",
-    "max_decimal",
-    "min_decimal",
-    "max_uint256",
-    "zero_wei",
-}
diff --git a/vyper/semantics/types/base.py b/vyper/semantics/types/base.py
index af955f6071..c5af5c2a39 100644
--- a/vyper/semantics/types/base.py
+++ b/vyper/semantics/types/base.py
@@ -3,6 +3,7 @@
 
 from vyper import ast as vy_ast
 from vyper.abi_types import ABIType
+from vyper.ast.identifiers import validate_identifier
 from vyper.exceptions import (
     CompilerPanic,
     InvalidLiteral,
@@ -12,7 +13,6 @@
     UnknownAttribute,
 )
 from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
-from vyper.semantics.namespace import validate_identifier
 
 
 # Some fake type with an overridden `compare_type` which accepts any RHS
diff --git a/vyper/semantics/types/function.py b/vyper/semantics/types/function.py
index 506dae135c..77b9efb13d 100644
--- a/vyper/semantics/types/function.py
+++ b/vyper/semantics/types/function.py
@@ -5,6 +5,7 @@
 from typing import Any, Dict, List, Optional, Tuple
 
 from vyper import ast as vy_ast
+from vyper.ast.identifiers import validate_identifier
 from vyper.ast.validation import validate_call_args
 from vyper.exceptions import (
     ArgumentException,
@@ -220,7 +221,10 @@ def from_FunctionDef(
                         msg = "Nonreentrant decorator disallowed on `__init__`"
                         raise FunctionDeclarationException(msg, decorator)
 
-                    kwargs["nonreentrant"] = decorator.args[0].value
+                    nonreentrant_key = decorator.args[0].value
+                    validate_identifier(nonreentrant_key, decorator.args[0])
+
+                    kwargs["nonreentrant"] = nonreentrant_key
 
                 elif isinstance(decorator, vy_ast.Name):
                     if FunctionVisibility.is_valid_value(decorator.id):

From 823675a8dc49e8148b7a8c79e86f01dea7115cd9 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 18 Sep 2023 08:16:51 -0700
Subject: [PATCH 129/161] fix: dense selector table when there are empty
 buckets (#3606)

certain combinations of selectors can result in some buckets being
empty. in this case, the header section is incomplete. this commit fixes
the issue by bailing out of the mkbucket routine when there are empty
buckets (thus treating the configurations with empty buckets as invalid)

---------

Co-authored-by: Tanguy Rocher <tanguy.rocher@protonmail.com>
---
 tests/parser/test_selector_table.py | 431 ++++++++++++++++++++++++++++
 vyper/codegen/jumptable_utils.py    |  25 +-
 vyper/codegen/module.py             |   8 +-
 3 files changed, 458 insertions(+), 6 deletions(-)

diff --git a/tests/parser/test_selector_table.py b/tests/parser/test_selector_table.py
index 01a83698b7..3ac50707c2 100644
--- a/tests/parser/test_selector_table.py
+++ b/tests/parser/test_selector_table.py
@@ -10,6 +10,437 @@
 from vyper.compiler.settings import OptimizationLevel
 
 
+def test_dense_selector_table_empty_buckets(get_contract):
+    # some special combination of selectors which can result in
+    # some empty bucket being returned from _mk_buckets (that is,
+    # len(_mk_buckets(..., n_buckets)) != n_buckets
+    code = """
+@external
+def aX61QLPWF()->uint256:
+    return 1
+@external
+def aQHG0P2L1()->uint256:
+    return 2
+@external
+def a2G8ME94W()->uint256:
+    return 3
+@external
+def a0GNA21AY()->uint256:
+    return 4
+@external
+def a4U1XA4T5()->uint256:
+    return 5
+@external
+def aAYLMGOBZ()->uint256:
+    return 6
+@external
+def a0KXRLHKE()->uint256:
+    return 7
+@external
+def aDQS32HTR()->uint256:
+    return 8
+@external
+def aP4K6SA3S()->uint256:
+    return 9
+@external
+def aEB94ZP5S()->uint256:
+    return 10
+@external
+def aTOIMN0IM()->uint256:
+    return 11
+@external
+def aXV2N81OW()->uint256:
+    return 12
+@external
+def a66PP6Y5X()->uint256:
+    return 13
+@external
+def a5MWMTEWN()->uint256:
+    return 14
+@external
+def a5ZFST4Z8()->uint256:
+    return 15
+@external
+def aR13VXULX()->uint256:
+    return 16
+@external
+def aWITH917Y()->uint256:
+    return 17
+@external
+def a59NP6C5O()->uint256:
+    return 18
+@external
+def aJ02590EX()->uint256:
+    return 19
+@external
+def aUAXAAUQ8()->uint256:
+    return 20
+@external
+def aWR1XNC6J()->uint256:
+    return 21
+@external
+def aJABKZOKH()->uint256:
+    return 22
+@external
+def aO1TT0RJT()->uint256:
+    return 23
+@external
+def a41442IOK()->uint256:
+    return 24
+@external
+def aMVXV9FHQ()->uint256:
+    return 25
+@external
+def aNN0KJDZM()->uint256:
+    return 26
+@external
+def aOX965047()->uint256:
+    return 27
+@external
+def a575NX2J3()->uint256:
+    return 28
+@external
+def a16EN8O7W()->uint256:
+    return 29
+@external
+def aSZXLFF7O()->uint256:
+    return 30
+@external
+def aQKQCIPH9()->uint256:
+    return 31
+@external
+def aIP8021DL()->uint256:
+    return 32
+@external
+def aQAV0HSHX()->uint256:
+    return 33
+@external
+def aZVPAD745()->uint256:
+    return 34
+@external
+def aJYBSNST4()->uint256:
+    return 35
+@external
+def aQGWC4NYQ()->uint256:
+    return 36
+@external
+def aFMBB9CXJ()->uint256:
+    return 37
+@external
+def aYWM7ZUH1()->uint256:
+    return 38
+@external
+def aJAZONIX1()->uint256:
+    return 39
+@external
+def aQZ1HJK0H()->uint256:
+    return 40
+@external
+def aKIH9LOUB()->uint256:
+    return 41
+@external
+def aF4ZT80XL()->uint256:
+    return 42
+@external
+def aYQD8UKR5()->uint256:
+    return 43
+@external
+def aP6NCCAI4()->uint256:
+    return 44
+@external
+def aY92U2EAZ()->uint256:
+    return 45
+@external
+def aHMQ49D7P()->uint256:
+    return 46
+@external
+def aMC6YX8VF()->uint256:
+    return 47
+@external
+def a734X6YSI()->uint256:
+    return 48
+@external
+def aRXXPNSMU()->uint256:
+    return 49
+@external
+def aL5XKDTGT()->uint256:
+    return 50
+@external
+def a86V1Y18A()->uint256:
+    return 51
+@external
+def aAUM8PL5J()->uint256:
+    return 52
+@external
+def aBAEC1ERZ()->uint256:
+    return 53
+@external
+def a1U1VA3UE()->uint256:
+    return 54
+@external
+def aC9FGVAHC()->uint256:
+    return 55
+@external
+def aWN81WYJ3()->uint256:
+    return 56
+@external
+def a3KK1Y07J()->uint256:
+    return 57
+@external
+def aAZ6P6OSG()->uint256:
+    return 58
+@external
+def aWP5HCIB3()->uint256:
+    return 59
+@external
+def aVEK161C5()->uint256:
+    return 60
+@external
+def aY0Q3O519()->uint256:
+    return 61
+@external
+def aDHHHFIAE()->uint256:
+    return 62
+@external
+def aGSJBCZKQ()->uint256:
+    return 63
+@external
+def aZQQIUDHY()->uint256:
+    return 64
+@external
+def a12O9QDH5()->uint256:
+    return 65
+@external
+def aRQ1178XR()->uint256:
+    return 66
+@external
+def aDT25C832()->uint256:
+    return 67
+@external
+def aCSB01C4E()->uint256:
+    return 68
+@external
+def aYGBPKZSD()->uint256:
+    return 69
+@external
+def aP24N3EJ8()->uint256:
+    return 70
+@external
+def a531Y9X3C()->uint256:
+    return 71
+@external
+def a4727IKVS()->uint256:
+    return 72
+@external
+def a2EX1L2BS()->uint256:
+    return 73
+@external
+def a6145RN68()->uint256:
+    return 74
+@external
+def aDO1ZNX97()->uint256:
+    return 75
+@external
+def a3R28EU6M()->uint256:
+    return 76
+@external
+def a9BFC867L()->uint256:
+    return 77
+@external
+def aPL1MBGYC()->uint256:
+    return 78
+@external
+def aI6H11O48()->uint256:
+    return 79
+@external
+def aX0248DZY()->uint256:
+    return 80
+@external
+def aE4JBUJN4()->uint256:
+    return 81
+@external
+def aXBDB2ZBO()->uint256:
+    return 82
+@external
+def a7O7MYYHL()->uint256:
+    return 83
+@external
+def aERFF4PB6()->uint256:
+    return 84
+@external
+def aJCUBG6TJ()->uint256:
+    return 85
+@external
+def aQ5ELXM0F()->uint256:
+    return 86
+@external
+def aWDT9UQVV()->uint256:
+    return 87
+@external
+def a7UU40DJK()->uint256:
+    return 88
+@external
+def aH01IT5VS()->uint256:
+    return 89
+@external
+def aSKYTZ0FC()->uint256:
+    return 90
+@external
+def aNX5LYRAW()->uint256:
+    return 91
+@external
+def aUDKAOSGG()->uint256:
+    return 92
+@external
+def aZ86YGAAO()->uint256:
+    return 93
+@external
+def aIHWQGKLO()->uint256:
+    return 94
+@external
+def aKIKFLAR9()->uint256:
+    return 95
+@external
+def aCTPE0KRS()->uint256:
+    return 96
+@external
+def aAD75X00P()->uint256:
+    return 97
+@external
+def aDROUEF2F()->uint256:
+    return 98
+@external
+def a8CDIF6YN()->uint256:
+    return 99
+@external
+def aD2X7TM83()->uint256:
+    return 100
+@external
+def a3W5UUB4L()->uint256:
+    return 101
+@external
+def aG4MOBN4B()->uint256:
+    return 102
+@external
+def aPRS0MSG7()->uint256:
+    return 103
+@external
+def aKN3GHBUR()->uint256:
+    return 104
+@external
+def aGE435RHQ()->uint256:
+    return 105
+@external
+def a4E86BNFE()->uint256:
+    return 106
+@external
+def aYDG928YW()->uint256:
+    return 107
+@external
+def a2HFP5GQE()->uint256:
+    return 108
+@external
+def a5DPMVXKA()->uint256:
+    return 109
+@external
+def a3OFVC3DR()->uint256:
+    return 110
+@external
+def aK8F62DAN()->uint256:
+    return 111
+@external
+def aJS9EY3U6()->uint256:
+    return 112
+@external
+def aWW789JQH()->uint256:
+    return 113
+@external
+def a8AJJN3YR()->uint256:
+    return 114
+@external
+def a4D0MUIDU()->uint256:
+    return 115
+@external
+def a35W41JQR()->uint256:
+    return 116
+@external
+def a07DQOI1E()->uint256:
+    return 117
+@external
+def aFT43YNCT()->uint256:
+    return 118
+@external
+def a0E75I8X3()->uint256:
+    return 119
+@external
+def aT6NXIRO4()->uint256:
+    return 120
+@external
+def aXB2UBAKQ()->uint256:
+    return 121
+@external
+def aHWH55NW6()->uint256:
+    return 122
+@external
+def a7TCFE6C2()->uint256:
+    return 123
+@external
+def a8XYAM81I()->uint256:
+    return 124
+@external
+def aHQTQ4YBY()->uint256:
+    return 125
+@external
+def aGCZEHG6Y()->uint256:
+    return 126
+@external
+def a6LJTKIW0()->uint256:
+    return 127
+@external
+def aBDIXTD9S()->uint256:
+    return 128
+@external
+def aCB83G21P()->uint256:
+    return 129
+@external
+def aZC525N4K()->uint256:
+    return 130
+@external
+def a40LC94U6()->uint256:
+    return 131
+@external
+def a8X9TI93D()->uint256:
+    return 132
+@external
+def aGUG9CD8Y()->uint256:
+    return 133
+@external
+def a0LAERVAY()->uint256:
+    return 134
+@external
+def aXQ0UEX19()->uint256:
+    return 135
+@external
+def aKK9C7NE7()->uint256:
+    return 136
+@external
+def aS2APW8UE()->uint256:
+    return 137
+@external
+def a65NT07MM()->uint256:
+    return 138
+@external
+def aGRMT6ZW5()->uint256:
+    return 139
+@external
+def aILR4U1Z()->uint256:
+    return 140
+    """
+    c = get_contract(code)
+
+    assert c.aX61QLPWF() == 1  # will revert if the header section is misaligned
+
+
 @given(
     n_methods=st.integers(min_value=1, max_value=100),
     seed=st.integers(min_value=0, max_value=2**64 - 1),
diff --git a/vyper/codegen/jumptable_utils.py b/vyper/codegen/jumptable_utils.py
index 6987ce90bd..6404b75532 100644
--- a/vyper/codegen/jumptable_utils.py
+++ b/vyper/codegen/jumptable_utils.py
@@ -43,7 +43,11 @@ def _image_of(xs, magic):
     return [((x * magic) >> bits_shift) % len(xs) for x in xs]
 
 
-class _Failure(Exception):
+class _FindMagicFailure(Exception):
+    pass
+
+
+class _HasEmptyBuckets(Exception):
     pass
 
 
@@ -53,7 +57,7 @@ def find_magic_for(xs):
         if len(test) == len(set(test)):
             return m
 
-    raise _Failure(f"Could not find hash for {xs}")
+    raise _FindMagicFailure(f"Could not find hash for {xs}")
 
 
 def _mk_buckets(method_ids, n_buckets):
@@ -72,6 +76,11 @@ def _mk_buckets(method_ids, n_buckets):
 def _dense_jumptable_info(method_ids, n_buckets):
     buckets = _mk_buckets(method_ids, n_buckets)
 
+    # if there are somehow empty buckets, bail out as that can mess up
+    # the bucket header layout
+    if len(buckets) != n_buckets:
+        raise _HasEmptyBuckets()
+
     ret = {}
     for bucket_id, method_ids in buckets.items():
         magic = find_magic_for(method_ids)
@@ -98,8 +107,16 @@ def generate_dense_jumptable_info(signatures):
     while n_buckets > 0:
         try:
             # print(f"trying {n_buckets} (bucket size {n // n_buckets})")
-            ret = _dense_jumptable_info(method_ids, n_buckets)
-        except _Failure:
+            solution = _dense_jumptable_info(method_ids, n_buckets)
+            assert len(solution) == n_buckets
+            ret = n_buckets, solution
+
+        except _HasEmptyBuckets:
+            # found a solution which has empty buckets; skip it since
+            # it will break the bucket layout.
+            pass
+
+        except _FindMagicFailure:
             if ret is not None:
                 break
 
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 8caea9ee9b..6445a5e1e0 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -124,8 +124,12 @@ def _selector_section_dense(external_functions, global_ctx):
         ir_node = ["label", label, ["var_list"], entry_point.ir_node]
         function_irs.append(IRnode.from_list(ir_node))
 
-    jumptable_info = jumptable_utils.generate_dense_jumptable_info(entry_points.keys())
-    n_buckets = len(jumptable_info)
+    n_buckets, jumptable_info = jumptable_utils.generate_dense_jumptable_info(entry_points.keys())
+    # note: we are guaranteed by jumptable_utils that there are no buckets
+    # which are empty. sanity check that the bucket ids are well-behaved:
+    assert n_buckets == len(jumptable_info)
+    for i, (bucket_id, _) in enumerate(sorted(jumptable_info.items())):
+        assert i == bucket_id
 
     #  bucket magic <2 bytes> | bucket location <2 bytes> | bucket size <1 byte>
     # TODO: can make it smaller if the largest bucket magic <= 255

From ecf3050782ae15e40e27a338db3f29f296e94bfe Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 18 Sep 2023 14:48:29 -0700
Subject: [PATCH 130/161] chore: add tests for selector table stability (#3608)

---
 tests/parser/test_selector_table_stability.py | 53 +++++++++++++++++++
 1 file changed, 53 insertions(+)
 create mode 100644 tests/parser/test_selector_table_stability.py

diff --git a/tests/parser/test_selector_table_stability.py b/tests/parser/test_selector_table_stability.py
new file mode 100644
index 0000000000..abc2c17b8f
--- /dev/null
+++ b/tests/parser/test_selector_table_stability.py
@@ -0,0 +1,53 @@
+from vyper.codegen.jumptable_utils import generate_sparse_jumptable_buckets
+from vyper.compiler import compile_code
+from vyper.compiler.settings import OptimizationLevel, Settings
+
+
+def test_dense_jumptable_stability():
+    function_names = [f"foo{i}" for i in range(30)]
+
+    code = "\n".join(f"@external\ndef {name}():\n  pass" for name in function_names)
+
+    output = compile_code(code, ["asm"], settings=Settings(optimize=OptimizationLevel.CODESIZE))
+
+    # test that the selector table data is stable across different runs
+    # (tox should provide different PYTHONHASHSEEDs).
+    expected_asm = """{ DATA _sym_BUCKET_HEADERS b'\\x0bB' _sym_bucket_0 b'\\n' b'+\\x8d' _sym_bucket_1 b'\\x0c' b'\\x00\\x85' _sym_bucket_2 b'\\x08' } { DATA _sym_bucket_1 b'\\xd8\\xee\\xa1\\xe8' _sym_external_foo6___3639517672 b'\\x05' b'\\xd2\\x9e\\xe0\\xf9' _sym_external_foo0___3533627641 b'\\x05' b'\\x05\\xf1\\xe0_' _sym_external_foo2___99737695 b'\\x05' b'\\x91\\t\\xb4{' _sym_external_foo23___2433332347 b'\\x05' b'np3\\x7f' _sym_external_foo11___1852846975 b'\\x05' b'&\\xf5\\x96\\xf9' _sym_external_foo13___653629177 b'\\x05' b'\\x04ga\\xeb' _sym_external_foo14___73884139 b'\\x05' b'\\x89\\x06\\xad\\xc6' _sym_external_foo17___2298916294 b'\\x05' b'\\xe4%\\xac\\xd1' _sym_external_foo4___3827674321 b'\\x05' b'yj\\x01\\xac' _sym_external_foo7___2036990380 b'\\x05' b'\\xf1\\xe6K\\xe5' _sym_external_foo29___4058401765 b'\\x05' b'\\xd2\\x89X\\xb8' _sym_external_foo3___3532216504 b'\\x05' } { DATA _sym_bucket_2 b'\\x06p\\xffj' _sym_external_foo25___108068714 b'\\x05' b'\\x964\\x99I' _sym_external_foo24___2520029513 b'\\x05' b's\\x81\\xe7\\xc1' _sym_external_foo10___1937893313 b'\\x05' b'\\x85\\xad\\xc11' _sym_external_foo28___2242756913 b'\\x05' b'\\xfa"\\xb1\\xed' _sym_external_foo5___4196577773 b'\\x05' b'A\\xe7[\\x05' _sym_external_foo22___1105681157 b'\\x05' b'\\xd3\\x89U\\xe8' _sym_external_foo1___3548993000 b'\\x05' b'hL\\xf8\\xf3' _sym_external_foo20___1749874931 b'\\x05' } { DATA _sym_bucket_0 b'\\xee\\xd9\\x1d\\xe3' _sym_external_foo9___4007206371 b'\\x05' b'a\\xbc\\x1ch' _sym_external_foo16___1639717992 b'\\x05' b'\\xd3*\\xa7\\x0c' _sym_external_foo21___3542787852 b'\\x05' b'\\x18iG\\xd9' _sym_external_foo19___409552857 b'\\x05' b'\\n\\xf1\\xf9\\x7f' _sym_external_foo18___183630207 b'\\x05' b')\\xda\\xd7`' _sym_external_foo27___702207840 b'\\x05' b'2\\xf6\\xaa\\xda' _sym_external_foo12___855026394 b'\\x05' b'\\xbe\\xb5\\x05\\xf5' _sym_external_foo15___3199534581 b'\\x05' b'\\xfc\\xa7_\\xe6' _sym_external_foo8___4238827494 b'\\x05' b'\\x1b\\x12C8' _sym_external_foo26___454181688 b'\\x05' } }"""  # noqa: E501
+    assert expected_asm in output["asm"]
+
+
+def test_sparse_jumptable_stability():
+    function_names = [f"foo{i}()" for i in range(30)]
+
+    # sparse jumptable is not as complicated in assembly.
+    # here just test the data structure is stable
+
+    n_buckets, buckets = generate_sparse_jumptable_buckets(function_names)
+    assert n_buckets == 33
+
+    # the buckets sorted by id are what go into the IR, check equality against
+    # expected:
+    assert sorted(buckets.items()) == [
+        (0, [4238827494, 1639717992]),
+        (1, [1852846975]),
+        (2, [1749874931]),
+        (3, [4007206371]),
+        (4, [2298916294]),
+        (7, [2036990380]),
+        (10, [3639517672, 73884139]),
+        (12, [3199534581]),
+        (13, [99737695]),
+        (14, [3548993000, 4196577773]),
+        (15, [454181688, 702207840]),
+        (16, [3533627641]),
+        (17, [108068714]),
+        (20, [1105681157]),
+        (21, [409552857, 3542787852]),
+        (22, [4058401765]),
+        (23, [2520029513, 2242756913]),
+        (24, [855026394, 183630207]),
+        (25, [3532216504, 653629177]),
+        (26, [1937893313]),
+        (28, [2433332347]),
+        (31, [3827674321]),
+    ]

From 1711569f0852fa487d8677b0e9984b5692dfc4e6 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Wed, 20 Sep 2023 10:47:07 +0800
Subject: [PATCH 131/161] chore: always pass era-tester CI (#3415)

This PR relaxes the check for era-tester CI
so that it always succeeds as a non-blocking
CI.

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 .github/workflows/era-tester.yml | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/.github/workflows/era-tester.yml b/.github/workflows/era-tester.yml
index 187b5c03a2..3e0bb3e941 100644
--- a/.github/workflows/era-tester.yml
+++ b/.github/workflows/era-tester.yml
@@ -98,6 +98,7 @@ jobs:
 
     - name: Run tester (fast)
       # Run era tester with no LLVM optimizations
+      continue-on-error: true
       if: ${{ github.ref != 'refs/heads/master' }}
       run: |
         cd era-compiler-tester
@@ -105,7 +106,12 @@ jobs:
 
     - name: Run tester (slow)
       # Run era tester across the LLVM optimization matrix
+      continue-on-error: true
       if: ${{ github.ref == 'refs/heads/master' }}
       run: |
         cd era-compiler-tester
         cargo run --release --bin compiler-tester -- --path=tests/vyper/ --mode="M*B* ${{ env.VYPER_VERSION }}"
+
+    - name: Mark as success
+      run: |
+        exit 0

From f224d83a91d7ff5097dafaa715d53c6c1a88f502 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 20 Sep 2023 06:12:09 -0700
Subject: [PATCH 132/161] chore: tighten bounds for setuptools_scm (#3613)

there is a regression in 8.0.0 which results in the following invalid
code being generated for `vyper/version.py`:

```python
from __future__ import annotations
__version__ : str = version : str = '0.3.11'
__version_tuple__ : 'tuple[int | str, ...]' = \
  version_tuple : 'tuple[int | str, ...]' = (0, 3, 11)
```

this commit also removes some bad fuzzer deadlines.
---
 setup.py                                       | 2 +-
 tests/ast/nodes/test_evaluate_binop_decimal.py | 4 ++--
 2 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/setup.py b/setup.py
index c81b9bed4a..40efb436c5 100644
--- a/setup.py
+++ b/setup.py
@@ -99,7 +99,7 @@ def _global_version(version):
         "importlib-metadata",
         "wheel",
     ],
-    setup_requires=["pytest-runner", "setuptools_scm"],
+    setup_requires=["pytest-runner", "setuptools_scm>=7.1.0,<8.0.0"],
     tests_require=extras_require["test"],
     extras_require=extras_require,
     entry_points={
diff --git a/tests/ast/nodes/test_evaluate_binop_decimal.py b/tests/ast/nodes/test_evaluate_binop_decimal.py
index c6c69626b8..3c8ba0888c 100644
--- a/tests/ast/nodes/test_evaluate_binop_decimal.py
+++ b/tests/ast/nodes/test_evaluate_binop_decimal.py
@@ -13,7 +13,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50, deadline=None)
 @given(left=st_decimals, right=st_decimals)
 @example(left=Decimal("0.9999999999"), right=Decimal("0.0000000001"))
 @example(left=Decimal("0.0000000001"), right=Decimal("0.9999999999"))
@@ -52,7 +52,7 @@ def test_binop_pow():
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50, deadline=None)
 @given(
     values=st.lists(st_decimals, min_size=2, max_size=10),
     ops=st.lists(st.sampled_from("+-*/%"), min_size=11, max_size=11),

From 79303fc4fcba06994ee5c6a7baef57bdb185006c Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 21 Sep 2023 07:51:41 -0700
Subject: [PATCH 133/161] fix: memory allocation in certain builtins using
 `msize` (#3610)

in certain builtins which use `msize` to allocate a buffer for their
arguments (specifically, `raw_call()`, `create_copy_of()` and
`create_from_blueprint()`), corruption of the buffer can occur when
`msize` is not properly initialized. (this usually happens when there
are no variables which are held in memory in the outer external
function). what can happen is that some arguments can be evaluated after
`msize` is evaluated, leading to overwriting the memory region for the
argument buffer with other arguments. specifically, combined with the
condition that `msize` is underinitialized, this can happen with:

- the buffer for the initcode of `create_copy_of()` and
  `create_from_blueprint()` can be overwritten when the `salt=` or
  `value=` arguments write to memory

- the buffer for the `data` argument (when `msg.data` is provided,
  prompting the use of `msize`) of `raw_call()` can be overwritten when
  the `to`, `gas=` or `value=` arguments write to memory

this commit fixes the issue by using a variant of `cache_when_complex()`
to ensure that the relevant arguments are evaluated before `msize` is
evaluated.

this is a patch for GHSA-c647-pxm2-c52w.

summarized changelog:
* fix raw_call
* test: raw_call with msg.data buffer clean memory
* force memory effects in some clean_mem tests
* add tests for clean memory in create_* functions
* add scope_multi abstraction
* refactor raw_call to use scope_multi
* add fixes for create_* memory cleanliness
* update optimizer tests -- callvalue is now considered constant
* move salt back into scope_multi
* add a note on reads in cache_when_complex

---------

Co-authored-by: Tanguy Rocher <tanguy.rocher@protonmail.com>
---
 tests/compiler/ir/test_optimize_ir.py         |   8 +-
 .../parser/functions/test_create_functions.py | 209 ++++++++++++++++++
 tests/parser/functions/test_raw_call.py       | 158 +++++++++++++
 vyper/builtins/functions.py                   |  63 +++---
 vyper/codegen/ir_node.py                      |  81 ++++++-
 5 files changed, 487 insertions(+), 32 deletions(-)

diff --git a/tests/compiler/ir/test_optimize_ir.py b/tests/compiler/ir/test_optimize_ir.py
index b679e55453..1466166501 100644
--- a/tests/compiler/ir/test_optimize_ir.py
+++ b/tests/compiler/ir/test_optimize_ir.py
@@ -143,7 +143,9 @@
     (["sub", "x", 0], ["x"]),
     (["sub", "x", "x"], [0]),
     (["sub", ["sload", 0], ["sload", 0]], None),
-    (["sub", ["callvalue"], ["callvalue"]], None),
+    (["sub", ["callvalue"], ["callvalue"]], [0]),
+    (["sub", ["msize"], ["msize"]], None),
+    (["sub", ["gas"], ["gas"]], None),
     (["sub", -1, ["sload", 0]], ["not", ["sload", 0]]),
     (["mul", "x", 1], ["x"]),
     (["div", "x", 1], ["x"]),
@@ -210,7 +212,9 @@
     (["eq", -1, ["add", -(2**255), 2**255 - 1]], [1]),  # test compile-time wrapping
     (["eq", -2, ["add", 2**256 - 1, 2**256 - 1]], [1]),  # test compile-time wrapping
     (["eq", "x", "x"], [1]),
-    (["eq", "callvalue", "callvalue"], None),
+    (["eq", "gas", "gas"], None),
+    (["eq", "msize", "msize"], None),
+    (["eq", "callvalue", "callvalue"], [1]),
     (["ne", "x", "x"], [0]),
 ]
 
diff --git a/tests/parser/functions/test_create_functions.py b/tests/parser/functions/test_create_functions.py
index 876d50b27d..fa7729d98e 100644
--- a/tests/parser/functions/test_create_functions.py
+++ b/tests/parser/functions/test_create_functions.py
@@ -431,3 +431,212 @@ def test2(target: address, salt: bytes32) -> address:
     # test2 = c.test2(b"\x01", salt)
     # assert HexBytes(test2) == create2_address_of(c.address, salt, vyper_initcode(b"\x01"))
     # assert_tx_failed(lambda: c.test2(bytecode, salt))
+
+
+# XXX: these various tests to check the msize allocator for
+# create_copy_of and create_from_blueprint depend on calling convention
+# and variables writing to memory. think of ways to make more robust to
+# changes in calling convention and memory layout
+@pytest.mark.parametrize("blueprint_prefix", [b"", b"\xfe", b"\xfe\71\x00"])
+def test_create_from_blueprint_complex_value(
+    get_contract, deploy_blueprint_for, w3, blueprint_prefix
+):
+    # check msize allocator does not get trampled by value= kwarg
+    code = """
+var: uint256
+
+@external
+@payable
+def __init__(x: uint256):
+    self.var = x
+
+@external
+def foo()-> uint256:
+    return self.var
+    """
+
+    prefix_len = len(blueprint_prefix)
+
+    some_constant = b"\00" * 31 + b"\x0c"
+
+    deployer_code = f"""
+created_address: public(address)
+x: constant(Bytes[32]) = {some_constant}
+
+@internal
+def foo() -> uint256:
+    g:uint256 = 42
+    return 3
+
+@external
+@payable
+def test(target: address):
+    self.created_address = create_from_blueprint(
+        target,
+        x,
+        code_offset={prefix_len},
+        value=self.foo(),
+        raw_args=True
+    )
+    """
+
+    foo_contract = get_contract(code, 12)
+    expected_runtime_code = w3.eth.get_code(foo_contract.address)
+
+    f, FooContract = deploy_blueprint_for(code, initcode_prefix=blueprint_prefix)
+
+    d = get_contract(deployer_code)
+
+    d.test(f.address, transact={"value": 3})
+
+    test = FooContract(d.created_address())
+    assert w3.eth.get_code(test.address) == expected_runtime_code
+    assert test.foo() == 12
+
+
+@pytest.mark.parametrize("blueprint_prefix", [b"", b"\xfe", b"\xfe\71\x00"])
+def test_create_from_blueprint_complex_salt_raw_args(
+    get_contract, deploy_blueprint_for, w3, blueprint_prefix
+):
+    # test msize allocator does not get trampled by salt= kwarg
+    code = """
+var: uint256
+
+@external
+@payable
+def __init__(x: uint256):
+    self.var = x
+
+@external
+def foo()-> uint256:
+    return self.var
+    """
+
+    some_constant = b"\00" * 31 + b"\x0c"
+    prefix_len = len(blueprint_prefix)
+
+    deployer_code = f"""
+created_address: public(address)
+
+x: constant(Bytes[32]) = {some_constant}
+salt: constant(bytes32) = keccak256("kebab")
+
+@internal
+def foo() -> bytes32:
+    g:uint256 = 42
+    return salt
+
+@external
+@payable
+def test(target: address):
+    self.created_address = create_from_blueprint(
+        target,
+        x,
+        code_offset={prefix_len},
+        salt=self.foo(),
+        raw_args= True
+    )
+    """
+
+    foo_contract = get_contract(code, 12)
+    expected_runtime_code = w3.eth.get_code(foo_contract.address)
+
+    f, FooContract = deploy_blueprint_for(code, initcode_prefix=blueprint_prefix)
+
+    d = get_contract(deployer_code)
+
+    d.test(f.address, transact={})
+
+    test = FooContract(d.created_address())
+    assert w3.eth.get_code(test.address) == expected_runtime_code
+    assert test.foo() == 12
+
+
+@pytest.mark.parametrize("blueprint_prefix", [b"", b"\xfe", b"\xfe\71\x00"])
+def test_create_from_blueprint_complex_salt_no_constructor_args(
+    get_contract, deploy_blueprint_for, w3, blueprint_prefix
+):
+    # test msize allocator does not get trampled by salt= kwarg
+    code = """
+var: uint256
+
+@external
+@payable
+def __init__():
+    self.var = 12
+
+@external
+def foo()-> uint256:
+    return self.var
+    """
+
+    prefix_len = len(blueprint_prefix)
+    deployer_code = f"""
+created_address: public(address)
+
+salt: constant(bytes32) = keccak256("kebab")
+
+@external
+@payable
+def test(target: address):
+    self.created_address = create_from_blueprint(
+        target,
+        code_offset={prefix_len},
+        salt=keccak256(_abi_encode(target))
+    )
+    """
+
+    foo_contract = get_contract(code)
+    expected_runtime_code = w3.eth.get_code(foo_contract.address)
+
+    f, FooContract = deploy_blueprint_for(code, initcode_prefix=blueprint_prefix)
+
+    d = get_contract(deployer_code)
+
+    d.test(f.address, transact={})
+
+    test = FooContract(d.created_address())
+    assert w3.eth.get_code(test.address) == expected_runtime_code
+    assert test.foo() == 12
+
+
+def test_create_copy_of_complex_kwargs(get_contract, w3):
+    # test msize allocator does not get trampled by salt= kwarg
+    complex_salt = """
+created_address: public(address)
+
+@external
+def test(target: address) -> address:
+    self.created_address = create_copy_of(
+        target,
+        salt=keccak256(_abi_encode(target))
+    )
+    return self.created_address
+
+    """
+
+    c = get_contract(complex_salt)
+    bytecode = w3.eth.get_code(c.address)
+    c.test(c.address, transact={})
+    test1 = c.created_address()
+    assert w3.eth.get_code(test1) == bytecode
+
+    # test msize allocator does not get trampled by value= kwarg
+    complex_value = """
+created_address: public(address)
+
+@external
+@payable
+def test(target: address) -> address:
+    value: uint256 = 2
+    self.created_address = create_copy_of(target, value = [2,2,2][value])
+    return self.created_address
+
+    """
+
+    c = get_contract(complex_value)
+    bytecode = w3.eth.get_code(c.address)
+
+    c.test(c.address, transact={"value": 2})
+    test1 = c.created_address()
+    assert w3.eth.get_code(test1) == bytecode
diff --git a/tests/parser/functions/test_raw_call.py b/tests/parser/functions/test_raw_call.py
index 9c6fba79e7..81efe64a18 100644
--- a/tests/parser/functions/test_raw_call.py
+++ b/tests/parser/functions/test_raw_call.py
@@ -426,6 +426,164 @@ def baz(_addr: address, should_raise: bool) -> uint256:
     assert caller.baz(target.address, False) == 3
 
 
+# XXX: these test_raw_call_clean_mem* tests depend on variables and
+# calling convention writing to memory. think of ways to make more
+# robust to changes to calling convention and memory layout.
+
+
+def test_raw_call_msg_data_clean_mem(get_contract):
+    # test msize uses clean memory and does not get overwritten by
+    # any raw_call() arguments
+    code = """
+identity: constant(address) = 0x0000000000000000000000000000000000000004
+
+@external
+def foo():
+    pass
+
+@internal
+@view
+def get_address()->address:
+    a:uint256 = 121 # 0x79
+    return identity
+@external
+def bar(f: uint256, u: uint256) -> Bytes[100]:
+    # embed an internal call in the calculation of address
+    a: Bytes[100] = raw_call(self.get_address(), msg.data, max_outsize=100)
+    return a
+    """
+
+    c = get_contract(code)
+    assert (
+        c.bar(1, 2).hex() == "ae42e951"
+        "0000000000000000000000000000000000000000000000000000000000000001"
+        "0000000000000000000000000000000000000000000000000000000000000002"
+    )
+
+
+def test_raw_call_clean_mem2(get_contract):
+    # test msize uses clean memory and does not get overwritten by
+    # any raw_call() arguments, another way
+    code = """
+buf: Bytes[100]
+
+@external
+def bar(f: uint256, g: uint256, h: uint256) -> Bytes[100]:
+    # embed a memory modifying expression in the calculation of address
+    self.buf = raw_call(
+        [0x0000000000000000000000000000000000000004,][f-1],
+        msg.data,
+        max_outsize=100
+    )
+    return self.buf
+    """
+    c = get_contract(code)
+
+    assert (
+        c.bar(1, 2, 3).hex() == "9309b76e"
+        "0000000000000000000000000000000000000000000000000000000000000001"
+        "0000000000000000000000000000000000000000000000000000000000000002"
+        "0000000000000000000000000000000000000000000000000000000000000003"
+    )
+
+
+def test_raw_call_clean_mem3(get_contract):
+    # test msize uses clean memory and does not get overwritten by
+    # any raw_call() arguments, and also test order of evaluation for
+    # scope_multi
+    code = """
+buf: Bytes[100]
+canary: String[32]
+
+@internal
+def bar() -> address:
+    self.canary = "bar"
+    return 0x0000000000000000000000000000000000000004
+
+@internal
+def goo() -> uint256:
+    self.canary = "goo"
+    return 0
+
+@external
+def foo() -> String[32]:
+    self.buf = raw_call(self.bar(), msg.data, value = self.goo(), max_outsize=100)
+    return self.canary
+    """
+    c = get_contract(code)
+    assert c.foo() == "goo"
+
+
+def test_raw_call_clean_mem_kwargs_value(get_contract):
+    # test msize uses clean memory and does not get overwritten by
+    # any raw_call() kwargs
+    code = """
+buf: Bytes[100]
+
+# add a dummy function to trigger memory expansion in the selector table routine
+@external
+def foo():
+    pass
+
+@internal
+def _value() -> uint256:
+    x: uint256 = 1
+    return x
+
+@external
+def bar(f: uint256) -> Bytes[100]:
+    # embed a memory modifying expression in the calculation of address
+    self.buf = raw_call(
+        0x0000000000000000000000000000000000000004,
+        msg.data,
+        max_outsize=100,
+        value=self._value()
+    )
+    return self.buf
+    """
+    c = get_contract(code, value=1)
+
+    assert (
+        c.bar(13).hex() == "0423a132"
+        "000000000000000000000000000000000000000000000000000000000000000d"
+    )
+
+
+def test_raw_call_clean_mem_kwargs_gas(get_contract):
+    # test msize uses clean memory and does not get overwritten by
+    # any raw_call() kwargs
+    code = """
+buf: Bytes[100]
+
+# add a dummy function to trigger memory expansion in the selector table routine
+@external
+def foo():
+    pass
+
+@internal
+def _gas() -> uint256:
+    x: uint256 = msg.gas
+    return x
+
+@external
+def bar(f: uint256) -> Bytes[100]:
+    # embed a memory modifying expression in the calculation of address
+    self.buf = raw_call(
+        0x0000000000000000000000000000000000000004,
+        msg.data,
+        max_outsize=100,
+        gas=self._gas()
+    )
+    return self.buf
+    """
+    c = get_contract(code, value=1)
+
+    assert (
+        c.bar(15).hex() == "0423a132"
+        "000000000000000000000000000000000000000000000000000000000000000f"
+    )
+
+
 uncompilable_code = [
     (
         """
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 3ec8f69934..95759372a6 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -21,6 +21,7 @@
     clamp_basetype,
     clamp_nonzero,
     copy_bytes,
+    dummy_node_for_type,
     ensure_in_memory,
     eval_once_check,
     eval_seq,
@@ -36,7 +37,7 @@
     unwrap_location,
 )
 from vyper.codegen.expr import Expr
-from vyper.codegen.ir_node import Encoding
+from vyper.codegen.ir_node import Encoding, scope_multi
 from vyper.codegen.keccak256_helper import keccak256_helper
 from vyper.evm.address_space import MEMORY, STORAGE
 from vyper.exceptions import (
@@ -1155,14 +1156,17 @@ def build_IR(self, expr, args, kwargs, context):
             outsize,
         ]
 
-        if delegate_call:
-            call_op = ["delegatecall", gas, to, *common_call_args]
-        elif static_call:
-            call_op = ["staticcall", gas, to, *common_call_args]
-        else:
-            call_op = ["call", gas, to, value, *common_call_args]
+        gas, value = IRnode.from_list(gas), IRnode.from_list(value)
+        with scope_multi((to, value, gas), ("_to", "_value", "_gas")) as (b1, (to, value, gas)):
+            if delegate_call:
+                call_op = ["delegatecall", gas, to, *common_call_args]
+            elif static_call:
+                call_op = ["staticcall", gas, to, *common_call_args]
+            else:
+                call_op = ["call", gas, to, value, *common_call_args]
 
-        call_ir += [call_op]
+            call_ir += [call_op]
+            call_ir = b1.resolve(call_ir)
 
         # build sequence IR
         if outsize:
@@ -1589,13 +1593,15 @@ def build_IR(self, expr, context):
 
 # CREATE* functions
 
+CREATE2_SENTINEL = dummy_node_for_type(BYTES32_T)
+
 
 # create helper functions
 # generates CREATE op sequence + zero check for result
-def _create_ir(value, buf, length, salt=None, checked=True):
+def _create_ir(value, buf, length, salt, checked=True):
     args = [value, buf, length]
     create_op = "create"
-    if salt is not None:
+    if salt is not CREATE2_SENTINEL:
         create_op = "create2"
         args.append(salt)
 
@@ -1713,8 +1719,9 @@ def build_IR(self, expr, args, kwargs, context):
         context.check_is_not_constant("use {self._id}", expr)
 
         should_use_create2 = "salt" in [kwarg.arg for kwarg in expr.keywords]
+
         if not should_use_create2:
-            kwargs["salt"] = None
+            kwargs["salt"] = CREATE2_SENTINEL
 
         ir_builder = self._build_create_IR(expr, args, context, **kwargs)
 
@@ -1794,13 +1801,16 @@ def _add_gas_estimate(self, args, should_use_create2):
     def _build_create_IR(self, expr, args, context, value, salt):
         target = args[0]
 
-        with target.cache_when_complex("create_target") as (b1, target):
+        # something we can pass to scope_multi
+        with scope_multi(
+            (target, value, salt), ("create_target", "create_value", "create_salt")
+        ) as (b1, (target, value, salt)):
             codesize = IRnode.from_list(["extcodesize", target])
             msize = IRnode.from_list(["msize"])
-            with codesize.cache_when_complex("target_codesize") as (
+            with scope_multi((codesize, msize), ("target_codesize", "mem_ofst")) as (
                 b2,
-                codesize,
-            ), msize.cache_when_complex("mem_ofst") as (b3, mem_ofst):
+                (codesize, mem_ofst),
+            ):
                 ir = ["seq"]
 
                 # make sure there is actually code at the target
@@ -1824,7 +1834,7 @@ def _build_create_IR(self, expr, args, context, value, salt):
 
                 ir.append(_create_ir(value, buf, buf_len, salt))
 
-                return b1.resolve(b2.resolve(b3.resolve(ir)))
+                return b1.resolve(b2.resolve(ir))
 
 
 class CreateFromBlueprint(_CreateBase):
@@ -1877,17 +1887,18 @@ def _build_create_IR(self, expr, args, context, value, salt, code_offset, raw_ar
         # (since the abi encoder could write to fresh memory).
         # it would be good to not require the memory copy, but need
         # to evaluate memory safety.
-        with target.cache_when_complex("create_target") as (b1, target), argslen.cache_when_complex(
-            "encoded_args_len"
-        ) as (b2, encoded_args_len), code_offset.cache_when_complex("code_ofst") as (b3, codeofst):
-            codesize = IRnode.from_list(["sub", ["extcodesize", target], codeofst])
+        with scope_multi(
+            (target, value, salt, argslen, code_offset),
+            ("create_target", "create_value", "create_salt", "encoded_args_len", "code_offset"),
+        ) as (b1, (target, value, salt, encoded_args_len, code_offset)):
+            codesize = IRnode.from_list(["sub", ["extcodesize", target], code_offset])
             # copy code to memory starting from msize. we are clobbering
             # unused memory so it's safe.
             msize = IRnode.from_list(["msize"], location=MEMORY)
-            with codesize.cache_when_complex("target_codesize") as (
-                b4,
-                codesize,
-            ), msize.cache_when_complex("mem_ofst") as (b5, mem_ofst):
+            with scope_multi((codesize, msize), ("target_codesize", "mem_ofst")) as (
+                b2,
+                (codesize, mem_ofst),
+            ):
                 ir = ["seq"]
 
                 # make sure there is code at the target, and that
@@ -1907,7 +1918,7 @@ def _build_create_IR(self, expr, args, context, value, salt, code_offset, raw_ar
                 # copy the target code into memory.
                 # layout starting from mem_ofst:
                 # 00...00 (22 0's) | preamble | bytecode
-                ir.append(["extcodecopy", target, mem_ofst, codeofst, codesize])
+                ir.append(["extcodecopy", target, mem_ofst, code_offset, codesize])
 
                 ir.append(copy_bytes(add_ofst(mem_ofst, codesize), argbuf, encoded_args_len, bufsz))
 
@@ -1922,7 +1933,7 @@ def _build_create_IR(self, expr, args, context, value, salt, code_offset, raw_ar
 
                 ir.append(_create_ir(value, mem_ofst, length, salt))
 
-                return b1.resolve(b2.resolve(b3.resolve(b4.resolve(b5.resolve(ir)))))
+                return b1.resolve(b2.resolve(ir))
 
 
 class _UnsafeMath(BuiltinFunction):
diff --git a/vyper/codegen/ir_node.py b/vyper/codegen/ir_node.py
index 6cb0a07281..ad4aa76437 100644
--- a/vyper/codegen/ir_node.py
+++ b/vyper/codegen/ir_node.py
@@ -1,3 +1,4 @@
+import contextlib
 import re
 from enum import Enum, auto
 from functools import cached_property
@@ -46,6 +47,77 @@ class Encoding(Enum):
     # future: packed
 
 
+# shortcut for chaining multiple cache_when_complex calls
+# CMC 2023-08-10 remove this and scope_together _as soon as_ we have
+# real variables in IR (that we can declare without explicit scoping -
+# needs liveness analysis).
+@contextlib.contextmanager
+def scope_multi(ir_nodes, names):
+    assert len(ir_nodes) == len(names)
+
+    builders = []
+    scoped_ir_nodes = []
+
+    class _MultiBuilder:
+        def resolve(self, body):
+            # sanity check that it's initialized properly
+            assert len(builders) == len(ir_nodes)
+            ret = body
+            for b in reversed(builders):
+                ret = b.resolve(ret)
+            return ret
+
+    mb = _MultiBuilder()
+
+    with contextlib.ExitStack() as stack:
+        for arg, name in zip(ir_nodes, names):
+            b, ir_node = stack.enter_context(arg.cache_when_complex(name))
+
+            builders.append(b)
+            scoped_ir_nodes.append(ir_node)
+
+        yield mb, scoped_ir_nodes
+
+
+# create multiple with scopes if any of the items are complex, to force
+# ordering of side effects.
+@contextlib.contextmanager
+def scope_together(ir_nodes, names):
+    assert len(ir_nodes) == len(names)
+
+    should_scope = any(s._optimized.is_complex_ir for s in ir_nodes)
+
+    class _Builder:
+        def resolve(self, body):
+            if not should_scope:
+                # uses of the variable have already been inlined
+                return body
+
+            ret = body
+            # build with scopes from inside-out (hence reversed)
+            for arg, name in reversed(list(zip(ir_nodes, names))):
+                ret = ["with", name, arg, ret]
+
+            if isinstance(body, IRnode):
+                return IRnode.from_list(
+                    ret, typ=body.typ, location=body.location, encoding=body.encoding
+                )
+            else:
+                return ret
+
+    b = _Builder()
+
+    if should_scope:
+        ir_vars = tuple(
+            IRnode.from_list(name, typ=arg.typ, location=arg.location, encoding=arg.encoding)
+            for (arg, name) in zip(ir_nodes, names)
+        )
+        yield b, ir_vars
+    else:
+        # inline them
+        yield b, ir_nodes
+
+
 # this creates a magical block which maps to IR `with`
 class _WithBuilder:
     def __init__(self, ir_node, name, should_inline=False):
@@ -326,14 +398,15 @@ def _check(condition, err):
     def gas(self):
         return self._gas + self.add_gas_estimate
 
-    # the IR should be cached.
-    # TODO make this private. turns out usages are all for the caching
-    # idiom that cache_when_complex addresses
+    # the IR should be cached and/or evaluated exactly once
     @property
     def is_complex_ir(self):
         # list of items not to cache. note can add other env variables
         # which do not change, e.g. calldatasize, coinbase, etc.
-        do_not_cache = {"~empty", "calldatasize"}
+        # reads (from memory or storage) should not be cached because
+        # they can have or be affected by side effects.
+        do_not_cache = {"~empty", "calldatasize", "callvalue"}
+
         return (
             isinstance(self.value, str)
             and (self.value.lower() in VALID_IR_MACROS or self.value.upper() in get_ir_opcodes())

From 1e9922d9f76bed2083ce2187e5be72912cfe2082 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 25 Sep 2023 09:59:56 -0700
Subject: [PATCH 134/161] chore: add notes to selector table implementation
 (#3618)

and a couple sanity checks
---
 vyper/codegen/function_definitions/common.py | 7 +++++++
 vyper/codegen/module.py                      | 5 ++++-
 2 files changed, 11 insertions(+), 1 deletion(-)

diff --git a/vyper/codegen/function_definitions/common.py b/vyper/codegen/function_definitions/common.py
index 3fd5ce0b29..1d24b6c6dd 100644
--- a/vyper/codegen/function_definitions/common.py
+++ b/vyper/codegen/function_definitions/common.py
@@ -73,6 +73,13 @@ class EntryPointInfo:
     min_calldatasize: int  # the min calldata required for this entry point
     ir_node: IRnode  # the ir for this entry point
 
+    def __post_init__(self):
+        # ABI v2 property guaranteed by the spec.
+        # https://docs.soliditylang.org/en/v0.8.21/abi-spec.html#formal-specification-of-the-encoding states:  # noqa: E501
+        # > Note that for any X, len(enc(X)) is a multiple of 32.
+        assert self.min_calldatasize >= 4
+        assert (self.min_calldatasize - 4) % 32 == 0
+
 
 @dataclass
 class ExternalFuncIR(FuncIR):
diff --git a/vyper/codegen/module.py b/vyper/codegen/module.py
index 6445a5e1e0..bfdafa8ba9 100644
--- a/vyper/codegen/module.py
+++ b/vyper/codegen/module.py
@@ -93,9 +93,12 @@ def _generate_external_entry_points(external_functions, global_ctx):
     for code in external_functions:
         func_ir = generate_ir_for_function(code, global_ctx)
         for abi_sig, entry_point in func_ir.entry_points.items():
+            method_id = method_id_int(abi_sig)
             assert abi_sig not in entry_points
+            assert method_id not in sig_of
+
             entry_points[abi_sig] = entry_point
-            sig_of[method_id_int(abi_sig)] = abi_sig
+            sig_of[method_id] = abi_sig
 
         # stick function common body into final entry point to save a jump
         ir_node = IRnode.from_list(["seq", entry_point.ir_node, func_ir.common_ir])

From 7b9d159b84c0e568378d53e753350e7f691c413a Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 25 Sep 2023 20:05:33 -0700
Subject: [PATCH 135/161] docs: mcopy is enabled with cancun target (#3620)

---
 docs/compiling-a-contract.rst | 1 +
 1 file changed, 1 insertion(+)

diff --git a/docs/compiling-a-contract.rst b/docs/compiling-a-contract.rst
index 6d1cdf98d7..b529d1efb1 100644
--- a/docs/compiling-a-contract.rst
+++ b/docs/compiling-a-contract.rst
@@ -197,6 +197,7 @@ The following is a list of supported EVM versions, and changes in the compiler i
 
    - The ``transient`` keyword allows declaration of variables which live in transient storage
    - Functions marked with ``@nonreentrant`` are protected with TLOAD/TSTORE instead of SLOAD/SSTORE
+   - The ``MCOPY`` opcode will be generated automatically by the compiler for most memory operations.
 
 
 

From e5c323afa4f61a2fc7a28bbfb824afd90ec86158 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 26 Sep 2023 11:24:32 -0700
Subject: [PATCH 136/161] chore: fix some documentation inconsistencies (#3624)

* raw_args kwarg to create_from_blueprint
* fix create_from_blueprint example
* clarify "all but one 64th" behavior when forwarding gas left=
* remove dead comment
* update internal documentation for generate_ir_for_external_function()
* update memory layout in create_from_blueprint comments
* fix warning for BitwiseNot
* fix error message about msg.data
* docs: extract32 can output any bytesM type
* remove dead variable in comment
---
 docs/built-in-functions.rst                         | 13 +++++++++----
 vyper/builtins/functions.py                         |  6 ++----
 .../function_definitions/external_function.py       | 11 ++++-------
 vyper/semantics/analysis/local.py                   |  2 +-
 vyper/semantics/analysis/module.py                  |  1 -
 5 files changed, 16 insertions(+), 17 deletions(-)

diff --git a/docs/built-in-functions.rst b/docs/built-in-functions.rst
index bfaa8fdd5e..45cf9ec8c2 100644
--- a/docs/built-in-functions.rst
+++ b/docs/built-in-functions.rst
@@ -184,13 +184,14 @@ Vyper has three built-ins for contract creation; all three contract creation bui
     The implementation of ``create_copy_of`` assumes that the code at ``target`` is smaller than 16MB. While this is much larger than the EIP-170 constraint of 24KB, it is a conservative size limit intended to future-proof deployer contracts in case the EIP-170 constraint is lifted. If the code at ``target`` is larger than 16MB, the behavior of ``create_copy_of`` is undefined.
 
 
-.. py:function:: create_from_blueprint(target: address, *args, value: uint256 = 0, code_offset=0, [, salt: bytes32]) -> address
+.. py:function:: create_from_blueprint(target: address, *args, value: uint256 = 0, raw_args: bool = False, code_offset: int = 0, [, salt: bytes32]) -> address
 
     Copy the code of ``target`` into memory and execute it as initcode. In other words, this operation interprets the code at ``target`` not as regular runtime code, but directly as initcode. The ``*args`` are interpreted as constructor arguments, and are ABI-encoded and included when executing the initcode.
 
     * ``target``: Address of the blueprint to invoke
     * ``*args``: Constructor arguments to forward to the initcode.
     * ``value``: The wei value to send to the new contract address (Optional, default 0)
+    * ``raw_args``: If ``True``, ``*args`` must be a single ``Bytes[...]`` argument, which will be interpreted as a raw bytes buffer to forward to the create operation (which is useful for instance, if pre- ABI-encoded data is passed in from elsewhere). (Optional, default ``False``)
     * ``code_offset``: The offset to start the ``EXTCODECOPY`` from (Optional, default 0)
     * ``salt``: A ``bytes32`` value utilized by the deterministic ``CREATE2`` opcode (Optional, if not supplied, ``CREATE`` is used)
 
@@ -201,7 +202,7 @@ Vyper has three built-ins for contract creation; all three contract creation bui
         @external
         def foo(blueprint: address) -> address:
             arg1: uint256 = 18
-            arg2: String = "some string"
+            arg2: String[32] = "some string"
             return create_from_blueprint(blueprint, arg1, arg2, code_offset=1)
 
 .. note::
@@ -226,7 +227,7 @@ Vyper has three built-ins for contract creation; all three contract creation bui
     * ``to``: Destination address to call to
     * ``data``: Data to send to the destination address
     * ``max_outsize``: Maximum length of the bytes array returned from the call. If the returned call data exceeds this length, only this number of bytes is returned. (Optional, default ``0``)
-    * ``gas``: The amount of gas to attach to the call. If not set, all remaining gas is forwarded.
+    * ``gas``: The amount of gas to attach to the call. (Optional, defaults to ``msg.gas``).
     * ``value``: The wei value to send to the address (Optional, default ``0``)
     * ``is_delegate_call``: If ``True``, the call will be sent as ``DELEGATECALL`` (Optional, default ``False``)
     * ``is_static_call``: If ``True``, the call will be sent as ``STATICCALL`` (Optional, default ``False``)
@@ -264,6 +265,10 @@ Vyper has three built-ins for contract creation; all three contract creation bui
             assert success
             return response
 
+    .. note::
+
+        Regarding "forwarding all gas", note that, while Vyper will provide ``msg.gas`` to the call, in practice, there are some subtleties around forwarding all remaining gas on the EVM which are out of scope of this documentation and could be subject to change. For instance, see the language in EIP-150 around "all but one 64th".
+
 .. py:function:: raw_log(topics: bytes32[4], data: Union[Bytes, bytes32]) -> None
 
     Provides low level access to the ``LOG`` opcodes, emitting a log without having to specify an ABI type.
@@ -500,7 +505,7 @@ Data Manipulation
 
     * ``b``: ``Bytes`` list to extract from
     * ``start``: Start point to extract from
-    * ``output_type``: Type of output (``bytes32``, ``integer``, or ``address``). Defaults to ``bytes32``.
+    * ``output_type``: Type of output (``bytesM``, ``integer``, or ``address``). Defaults to ``bytes32``.
 
     Returns a value of the type specified by ``output_type``.
 
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 95759372a6..a0936712b2 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -1418,7 +1418,7 @@ class BitwiseNot(BuiltinFunction):
 
     def evaluate(self, node):
         if not self.__class__._warned:
-            vyper_warn("`bitwise_not()` is deprecated! Please use the ^ operator instead.")
+            vyper_warn("`bitwise_not()` is deprecated! Please use the ~ operator instead.")
             self.__class__._warned = True
 
         validate_call_args(node, 1)
@@ -1917,9 +1917,8 @@ def _build_create_IR(self, expr, args, context, value, salt, code_offset, raw_ar
 
                 # copy the target code into memory.
                 # layout starting from mem_ofst:
-                # 00...00 (22 0's) | preamble | bytecode
+                # <target initcode> | <abi-encoded args OR arg buffer if raw_arg=True>
                 ir.append(["extcodecopy", target, mem_ofst, code_offset, codesize])
-
                 ir.append(copy_bytes(add_ofst(mem_ofst, codesize), argbuf, encoded_args_len, bufsz))
 
                 # theoretically, dst = "msize", but just be safe.
@@ -2586,7 +2585,6 @@ def evaluate(self, node):
         if isinstance(input_type, IntegerT):
             ret = vy_ast.Int.from_node(node, value=val)
 
-        # TODO: to change to known_type once #3213 is merged
         ret._metadata["type"] = input_type
         return ret
 
diff --git a/vyper/codegen/function_definitions/external_function.py b/vyper/codegen/function_definitions/external_function.py
index 32236e9aad..65276469e7 100644
--- a/vyper/codegen/function_definitions/external_function.py
+++ b/vyper/codegen/function_definitions/external_function.py
@@ -135,20 +135,17 @@ def handler_for(calldata_kwargs, default_kwargs):
     return ret
 
 
-# TODO it would be nice if this returned a data structure which were
-# amenable to generating a jump table instead of the linear search for
-# method_id we have now.
 def generate_ir_for_external_function(code, func_t, context):
     # TODO type hints:
     # def generate_ir_for_external_function(
     #    code: vy_ast.FunctionDef,
     #    func_t: ContractFunctionT,
     #    context: Context,
-    #    check_nonpayable: bool,
     # ) -> IRnode:
-    """Return the IR for an external function. Includes code to inspect the method_id,
-    enter the function (nonpayable and reentrancy checks), handle kwargs and exit
-    the function (clean up reentrancy storage variables)
+    """
+    Return the IR for an external function. Returns IR for the body
+    of the function, handle kwargs and exit the function. Also returns
+    metadata required for `module.py` to construct the selector table.
     """
     nonreentrant_pre, nonreentrant_post = get_nonreentrant_lock(func_t)
 
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index c10df3b8fd..b391b33953 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -150,7 +150,7 @@ def _validate_msg_data_attribute(node: vy_ast.Attribute) -> None:
         allowed_builtins = ("slice", "len", "raw_call")
         if not isinstance(parent, vy_ast.Call) or parent.get("func.id") not in allowed_builtins:
             raise StructureException(
-                "msg.data is only allowed inside of the slice or len functions", node
+                "msg.data is only allowed inside of the slice, len or raw_call functions", node
             )
         if parent.get("func.id") == "slice":
             ok_args = len(parent.args) == 3 and isinstance(parent.args[2], vy_ast.Int)
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index 02ae82faac..e59422294c 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -98,7 +98,6 @@ def __init__(
         _ns.update({k: namespace[k] for k in namespace._scopes[-1]})  # type: ignore
         module_node._metadata["namespace"] = _ns
 
-        # check for collisions between 4byte function selectors
         self_members = namespace["self"].typ.members
 
         # get list of internal function calls made by each function

From d438d927bed3b850fe4768a490f3acde5f51b475 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 26 Sep 2023 15:24:46 -0700
Subject: [PATCH 137/161] fix: `_abi_decode()` validation (#3626)

`_abi_decode()` does not validate input when it is nested in certain
expressions. the following example gets correctly validated (bounds
checked):

```vyper
    x: uint8 = _abi_decode(slice(msg.data, 4, 32), uint8)
```

however, the following example is not bounds checked:

```vyper
@external
def abi_decode(x: uint256) -> uint256:
    a: uint256 = convert(
        _abi_decode(
            slice(msg.data, 4, 32),
            (uint8)
        ),
        uint256
    )
    return a  # abi_decode(256) returns: 256
```

the issue is caused because the `ABIDecode()` builtin tags its output
with `encoding=Encoding.ABI`, but this does not result in validation
until that itself is passed to `make_setter` (which is called for
instance when generating an assignment or return statement).

the issue can be triggered by constructing an example where the output
of `ABIDecode()` is not internally passed to `make_setter` or other
input validating routine.

this commit fixes the issue by calling `make_setter` in `ABIDecode()`
before returning the output buffer, which causes validation to be
performed. note that this causes a performance regression in the common
(and majority of) cases where `make_setter` is immediately called on the
result of `ABIDecode()` because a redundant memory copy ends up being
generated (like in the aforementioned examples: in a plain assignment or
return statement). however, fixing this performance regression is left
to future work in the optimizer.
---
 tests/parser/functions/test_abi_decode.py | 28 ++++++++++++
 vyper/builtins/functions.py               | 52 +++++++++++------------
 2 files changed, 52 insertions(+), 28 deletions(-)

diff --git a/tests/parser/functions/test_abi_decode.py b/tests/parser/functions/test_abi_decode.py
index 2f9b93057d..2216a5bd76 100644
--- a/tests/parser/functions/test_abi_decode.py
+++ b/tests/parser/functions/test_abi_decode.py
@@ -344,6 +344,34 @@ def abi_decode(x: Bytes[96]) -> (uint256, uint256):
     assert_tx_failed(lambda: c.abi_decode(input_))
 
 
+def test_clamper_nested_uint8(get_contract, assert_tx_failed):
+    # check that _abi_decode clamps on word-types even when it is in a nested expression
+    # decode -> validate uint8 -> revert if input >= 256 -> cast back to uint256
+    contract = """
+@external
+def abi_decode(x: uint256) -> uint256:
+    a: uint256 = convert(_abi_decode(slice(msg.data, 4, 32), (uint8)), uint256)
+    return a
+    """
+    c = get_contract(contract)
+    assert c.abi_decode(255) == 255
+    assert_tx_failed(lambda: c.abi_decode(256))
+
+
+def test_clamper_nested_bytes(get_contract, assert_tx_failed):
+    # check that _abi_decode clamps dynamic even when it is in a nested expression
+    # decode -> validate Bytes[20] -> revert if len(input) > 20 -> convert back to -> add 1
+    contract = """
+@external
+def abi_decode(x: Bytes[96]) -> Bytes[21]:
+    a: Bytes[21] = concat(b"a", _abi_decode(x, Bytes[20]))
+    return a
+    """
+    c = get_contract(contract)
+    assert c.abi_decode(abi.encode("(bytes)", (b"bc",))) == b"abc"
+    assert_tx_failed(lambda: c.abi_decode(abi.encode("(bytes)", (b"a" * 22,))))
+
+
 @pytest.mark.parametrize(
     "output_typ,input_",
     [
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index a0936712b2..8cdd2a4b8b 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -29,7 +29,6 @@
     get_type_for_exact_size,
     ir_tuple_from_args,
     make_setter,
-    needs_external_call_wrap,
     promote_signed_int,
     sar,
     shl,
@@ -2367,8 +2366,6 @@ def build_IR(self, expr, args, kwargs, context):
 class ABIEncode(BuiltinFunction):
     _id = "_abi_encode"  # TODO prettier to rename this to abi.encode
     # signature: *, ensure_tuple=<literal_bool> -> Bytes[<calculated len>]
-    # (check the signature manually since we have no utility methods
-    # to handle varargs.)
     # explanation of ensure_tuple:
     # default is to force even a single value into a tuple,
     # e.g. _abi_encode(bytes) -> _abi_encode((bytes,))
@@ -2529,24 +2526,11 @@ def build_IR(self, expr, args, kwargs, context):
             )
 
         data = ensure_in_memory(data, context)
+
         with data.cache_when_complex("to_decode") as (b1, data):
             data_ptr = bytes_data_ptr(data)
             data_len = get_bytearray_length(data)
 
-            # Normally, ABI-encoded data assumes the argument is a tuple
-            # (See comments for `wrap_value_for_external_return`)
-            # However, we do not want to use `wrap_value_for_external_return`
-            # technique as used in external call codegen because in order to be
-            # type-safe we would need an extra memory copy. To avoid a copy,
-            # we manually add the ABI-dynamic offset so that it is
-            # re-interpreted in-place.
-            if (
-                unwrap_tuple is True
-                and needs_external_call_wrap(output_typ)
-                and output_typ.abi_type.is_dynamic()
-            ):
-                data_ptr = add_ofst(data_ptr, 32)
-
             ret = ["seq"]
 
             if abi_min_size == abi_size_bound:
@@ -2555,18 +2539,30 @@ def build_IR(self, expr, args, kwargs, context):
                 # runtime assert: abi_min_size <= data_len <= abi_size_bound
                 ret.append(clamp2(abi_min_size, data_len, abi_size_bound, signed=False))
 
-            # return pointer to the buffer
-            ret.append(data_ptr)
-
-            return b1.resolve(
-                IRnode.from_list(
-                    ret,
-                    typ=output_typ,
-                    location=data.location,
-                    encoding=Encoding.ABI,
-                    annotation=f"abi_decode({output_typ})",
-                )
+            to_decode = IRnode.from_list(
+                data_ptr,
+                typ=wrapped_typ,
+                location=data.location,
+                encoding=Encoding.ABI,
+                annotation=f"abi_decode({output_typ})",
             )
+            to_decode.encoding = Encoding.ABI
+
+            # TODO optimization: skip make_setter when we don't need
+            # input validation
+
+            output_buf = context.new_internal_variable(wrapped_typ)
+            output = IRnode.from_list(output_buf, typ=wrapped_typ, location=MEMORY)
+
+            # sanity check buffer size for wrapped output type will not buffer overflow
+            assert wrapped_typ.memory_bytes_required == output_typ.memory_bytes_required
+            ret.append(make_setter(output, to_decode))
+
+            ret.append(output)
+            # finalize. set the type and location for the return buffer.
+            # (note: unwraps the tuple type if necessary)
+            ret = IRnode.from_list(ret, typ=output_typ, location=MEMORY)
+            return b1.resolve(ret)
 
 
 class _MinMaxValue(TypenameFoldedFunction):

From 950a97ea0d16db9884ec2f09bc71f1fc52c20bb5 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 26 Sep 2023 16:19:34 -0700
Subject: [PATCH 138/161] fix: type check abi_decode arguments (#3623)

currently, the following code will trigger a compiler panic:

```vyper
@external
def foo(j: uint256) -> bool:
    s: bool = _abi_decode(j, bool, unwrap_tuple= False)
    return s
```

the following code will compile, even though it should not typecheck:

```vyper
@external
def foo(s: String[32]) -> bool:
    t: bool = _abi_decode(s, bool, unwrap_tuple=False)
    return t
```

this commit fixes the issue by typechecking the input to
`_abi_decode()`. it also adds syntax tests for `_abi_decode()`.
---
 tests/parser/syntax/test_abi_decode.py | 45 ++++++++++++++++++++++++++
 vyper/builtins/functions.py            |  2 ++
 2 files changed, 47 insertions(+)
 create mode 100644 tests/parser/syntax/test_abi_decode.py

diff --git a/tests/parser/syntax/test_abi_decode.py b/tests/parser/syntax/test_abi_decode.py
new file mode 100644
index 0000000000..f05ff429cd
--- /dev/null
+++ b/tests/parser/syntax/test_abi_decode.py
@@ -0,0 +1,45 @@
+import pytest
+
+from vyper import compiler
+from vyper.exceptions import TypeMismatch
+
+fail_list = [
+    (
+        """
+@external
+def foo(j: uint256) -> bool:
+    s: bool = _abi_decode(j, bool, unwrap_tuple= False)
+    return s
+    """,
+        TypeMismatch,
+    ),
+    (
+        """
+@external
+def bar(j: String[32]) -> bool:
+    s: bool = _abi_decode(j, bool, unwrap_tuple= False)
+    return s
+    """,
+        TypeMismatch,
+    ),
+]
+
+
+@pytest.mark.parametrize("bad_code,exc", fail_list)
+def test_abi_encode_fail(bad_code, exc):
+    with pytest.raises(exc):
+        compiler.compile_code(bad_code)
+
+
+valid_list = [
+    """
+@external
+def foo(x: Bytes[32]) -> uint256:
+    return _abi_decode(x, uint256)
+    """
+]
+
+
+@pytest.mark.parametrize("good_code", valid_list)
+def test_abi_encode_success(good_code):
+    assert compiler.compile_code(good_code) is not None
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index 8cdd2a4b8b..f07202831d 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -2490,6 +2490,8 @@ def fetch_call_return(self, node):
         return output_type.typedef
 
     def infer_arg_types(self, node):
+        self._validate_arg_types(node)
+
         validate_call_args(node, 2, ["unwrap_tuple"])
 
         data_type = get_exact_type_from_node(node.args[0])

From 2bdbd846b09c94f05739e1274e00825912404fe3 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Wed, 27 Sep 2023 21:06:03 +0800
Subject: [PATCH 139/161] chore: add metadata to vyper-json (#3622)

---
 tests/cli/vyper_json/test_output_selection.py | 6 ++++++
 vyper/cli/vyper_json.py                       | 2 +-
 vyper/compiler/output.py                      | 1 -
 3 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/tests/cli/vyper_json/test_output_selection.py b/tests/cli/vyper_json/test_output_selection.py
index c72f06f5a7..3b12e2b54a 100644
--- a/tests/cli/vyper_json/test_output_selection.py
+++ b/tests/cli/vyper_json/test_output_selection.py
@@ -52,3 +52,9 @@ def test_solc_style():
     input_json = {"settings": {"outputSelection": {"foo.vy": {"": ["abi"], "foo.vy": ["ir"]}}}}
     sources = {"foo.vy": ""}
     assert get_input_dict_output_formats(input_json, sources) == {"foo.vy": ["abi", "ir_dict"]}
+
+
+def test_metadata():
+    input_json = {"settings": {"outputSelection": {"*": ["metadata"]}}}
+    sources = {"foo.vy": ""}
+    assert get_input_dict_output_formats(input_json, sources) == {"foo.vy": ["metadata"]}
diff --git a/vyper/cli/vyper_json.py b/vyper/cli/vyper_json.py
index 4a1c91550e..f6d82c3fe0 100755
--- a/vyper/cli/vyper_json.py
+++ b/vyper/cli/vyper_json.py
@@ -29,7 +29,7 @@
     "interface": "interface",
     "ir": "ir_dict",
     "ir_runtime": "ir_runtime_dict",
-    # "metadata": "metadata",  # don't include  in "*" output for now
+    "metadata": "metadata",
     "layout": "layout",
     "userdoc": "userdoc",
 }
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 334c5ba613..9ef492c3e2 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -104,7 +104,6 @@ def build_ir_runtime_dict_output(compiler_data: CompilerData) -> dict:
 
 
 def build_metadata_output(compiler_data: CompilerData) -> dict:
-    warnings.warn("metadata output format is unstable!")
     sigs = compiler_data.function_signatures
 
     def _var_rec_dict(variable_record):

From aecd911347af5912a22540ff3dc513273e51c72d Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 28 Sep 2023 14:42:12 -0700
Subject: [PATCH 140/161] fix: metadata output interaction with natspec (#3627)

enabling the `-f metadata` output has an interaction with other outputs
because the metadata output format mutates some internal data structures
in-place. this is because `vars()` returns a reference to the object's
`__dict__` as opposed to a copy of it. the behavior can be seen by
trying to call the compiler with `-f metadata,devdoc,userdoc`. this
issue was revealed in (but not introduced by) 2bdbd846b0, because that
commit caused metadata and userdoc to be bundled together by default.

this commit fixes the issue by constructing a copy of the object during
metadata output formatting. it also modifies the test suite to include
more output formats, to test the interactions between these different
output formats. in doing so, it was also found that some examples have
invalid natspec, which has also been fixed.
---
 examples/tokens/ERC1155ownable.vy | 2 --
 tests/base_conftest.py            | 4 ++--
 vyper/compiler/output.py          | 6 +++---
 3 files changed, 5 insertions(+), 7 deletions(-)

diff --git a/examples/tokens/ERC1155ownable.vy b/examples/tokens/ERC1155ownable.vy
index 8094225f18..f1070b8f89 100644
--- a/examples/tokens/ERC1155ownable.vy
+++ b/examples/tokens/ERC1155ownable.vy
@@ -214,7 +214,6 @@ def mint(receiver: address, id: uint256, amount:uint256):
     @param receiver the account that will receive the minted token
     @param id the ID of the token
     @param amount of tokens for this ID
-    @param data the data associated with this mint. Usually stays empty
     """
     assert not self.paused, "The contract has been paused"
     assert self.owner == msg.sender, "Only the contract owner can mint"
@@ -232,7 +231,6 @@ def mintBatch(receiver: address, ids: DynArray[uint256, BATCH_SIZE], amounts: Dy
     @param receiver the account that will receive the minted token
     @param ids array of ids for the tokens
     @param amounts amounts of tokens for each ID in the ids array
-    @param data the data associated with this mint. Usually stays empty
     """
     assert not self.paused, "The contract has been paused"
     assert self.owner == msg.sender, "Only the contract owner can mint"
diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index 81e8dedc36..1c7c6f3aed 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -118,8 +118,8 @@ def _get_contract(w3, source_code, optimize, *args, override_opt_level=None, **k
     settings.optimize = override_opt_level or optimize
     out = compiler.compile_code(
         source_code,
-        # test that metadata gets generated
-        ["abi", "bytecode", "metadata"],
+        # test that metadata and natspecs get generated
+        ["abi", "bytecode", "metadata", "userdoc", "devdoc"],
         settings=settings,
         interface_codes=kwargs.pop("interface_codes", None),
         show_gas_estimates=True,  # Enable gas estimates for testing
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 9ef492c3e2..1c38fcff9b 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -107,7 +107,7 @@ def build_metadata_output(compiler_data: CompilerData) -> dict:
     sigs = compiler_data.function_signatures
 
     def _var_rec_dict(variable_record):
-        ret = vars(variable_record)
+        ret = vars(variable_record).copy()
         ret["typ"] = str(ret["typ"])
         if ret["data_offset"] is None:
             del ret["data_offset"]
@@ -117,7 +117,7 @@ def _var_rec_dict(variable_record):
         return ret
 
     def _to_dict(func_t):
-        ret = vars(func_t)
+        ret = vars(func_t).copy()
         ret["return_type"] = str(ret["return_type"])
         ret["_ir_identifier"] = func_t._ir_info.ir_identifier
 
@@ -133,7 +133,7 @@ def _to_dict(func_t):
             args = ret[attr]
             ret[attr] = {arg.name: str(arg.typ) for arg in args}
 
-        ret["frame_info"] = vars(func_t._ir_info.frame_info)
+        ret["frame_info"] = vars(func_t._ir_info.frame_info).copy()
         del ret["frame_info"]["frame_vars"]  # frame_var.pos might be IR, cannot serialize
 
         keep_keys = {

From 42817806cadaffefed7bf9c8edd64abf439be4de Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 28 Sep 2023 14:55:05 -0700
Subject: [PATCH 141/161] fix: improve test case inputs in selector table fuzz
 (#3625)

this commit improves the fuzz examples for the selector table. the
nested `@given` tests too many "dumb" examples (ex. 0, 1, max_value)
when `max_examples` is not large enough. the nested `@given` strategy
can find falsifying inputs, but it requires the inner `max_examples` to
be set much higher, and the shrinking takes much longer. this setting
of `max_examples=125` with a single `@given` using the `@composite`
strategy in this commit finds the selector table bug (that was fixed in
823675a8dc) after an average of 3 runs.
---
 tests/parser/test_selector_table.py | 98 +++++++++++++++--------------
 1 file changed, 52 insertions(+), 46 deletions(-)

diff --git a/tests/parser/test_selector_table.py b/tests/parser/test_selector_table.py
index 3ac50707c2..180c0266bf 100644
--- a/tests/parser/test_selector_table.py
+++ b/tests/parser/test_selector_table.py
@@ -478,66 +478,72 @@ def test_dense_jumptable_bucket_size(n_methods, seed):
     assert n_buckets / n < 0.4 or n < 10
 
 
+@st.composite
+def generate_methods(draw, max_calldata_bytes):
+    max_default_args = draw(st.integers(min_value=0, max_value=4))
+    default_fn_mutability = draw(st.sampled_from(["", "@pure", "@view", "@nonpayable", "@payable"]))
+
+    return (
+        max_default_args,
+        default_fn_mutability,
+        draw(
+            st.lists(
+                st.tuples(
+                    # function id:
+                    st.integers(min_value=0),
+                    # mutability:
+                    st.sampled_from(["@pure", "@view", "@nonpayable", "@payable"]),
+                    # n calldata words:
+                    st.integers(min_value=0, max_value=max_calldata_bytes // 32),
+                    # n bytes to strip from calldata
+                    st.integers(min_value=1, max_value=4),
+                    # n default args
+                    st.integers(min_value=0, max_value=max_default_args),
+                ),
+                unique_by=lambda x: x[0],
+                min_size=1,
+                max_size=100,
+            )
+        ),
+    )
+
+
 @pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 # dense selector table packing boundaries at 256 and 65336
 @pytest.mark.parametrize("max_calldata_bytes", [255, 256, 65336])
-@settings(max_examples=5, deadline=None)
-@given(
-    seed=st.integers(min_value=0, max_value=2**64 - 1),
-    max_default_args=st.integers(min_value=0, max_value=4),
-    default_fn_mutability=st.sampled_from(["", "@pure", "@view", "@nonpayable", "@payable"]),
-)
 @pytest.mark.fuzzing
 def test_selector_table_fuzz(
-    max_calldata_bytes,
-    seed,
-    max_default_args,
-    opt_level,
-    default_fn_mutability,
-    w3,
-    get_contract,
-    assert_tx_failed,
-    get_logs,
+    max_calldata_bytes, opt_level, w3, get_contract, assert_tx_failed, get_logs
 ):
-    def abi_sig(calldata_words, i, n_default_args):
-        args = [] if not calldata_words else [f"uint256[{calldata_words}]"]
-        args.extend(["uint256"] * n_default_args)
-        argstr = ",".join(args)
-        return f"foo{seed + i}({argstr})"
+    def abi_sig(func_id, calldata_words, n_default_args):
+        params = [] if not calldata_words else [f"uint256[{calldata_words}]"]
+        params.extend(["uint256"] * n_default_args)
+        paramstr = ",".join(params)
+        return f"foo{func_id}({paramstr})"
 
-    def generate_func_def(mutability, calldata_words, i, n_default_args):
+    def generate_func_def(func_id, mutability, calldata_words, n_default_args):
         arglist = [] if not calldata_words else [f"x: uint256[{calldata_words}]"]
         for j in range(n_default_args):
             arglist.append(f"x{j}: uint256 = 0")
         args = ", ".join(arglist)
-        _log_return = f"log _Return({i})" if mutability == "@payable" else ""
+        _log_return = f"log _Return({func_id})" if mutability == "@payable" else ""
 
         return f"""
 @external
 {mutability}
-def foo{seed + i}({args}) -> uint256:
+def foo{func_id}({args}) -> uint256:
     {_log_return}
-    return {i}
+    return {func_id}
     """
 
-    @given(
-        methods=st.lists(
-            st.tuples(
-                st.sampled_from(["@pure", "@view", "@nonpayable", "@payable"]),
-                st.integers(min_value=0, max_value=max_calldata_bytes // 32),
-                # n bytes to strip from calldata
-                st.integers(min_value=1, max_value=4),
-                # n default args
-                st.integers(min_value=0, max_value=max_default_args),
-            ),
-            min_size=1,
-            max_size=100,
-        )
-    )
-    @settings(max_examples=25)
-    def _test(methods):
+    @given(_input=generate_methods(max_calldata_bytes))
+    @settings(max_examples=125, deadline=None)
+    def _test(_input):
+        max_default_args, default_fn_mutability, methods = _input
+
         func_defs = "\n".join(
-            generate_func_def(m, s, i, d) for i, (m, s, _, d) in enumerate(methods)
+            generate_func_def(func_id, mutability, calldata_words, n_default_args)
+            for (func_id, mutability, calldata_words, _, n_default_args) in (methods)
         )
 
         if default_fn_mutability == "":
@@ -571,8 +577,8 @@ def __default__():
 
         c = get_contract(code, override_opt_level=opt_level)
 
-        for i, (mutability, n_calldata_words, n_strip_bytes, n_default_args) in enumerate(methods):
-            funcname = f"foo{seed + i}"
+        for func_id, mutability, n_calldata_words, n_strip_bytes, n_default_args in methods:
+            funcname = f"foo{func_id}"
             func = getattr(c, funcname)
 
             for j in range(n_default_args + 1):
@@ -580,9 +586,9 @@ def __default__():
                 args.extend([1] * j)
 
                 # check the function returns as expected
-                assert func(*args) == i
+                assert func(*args) == func_id
 
-                method_id = utils.method_id(abi_sig(n_calldata_words, i, j))
+                method_id = utils.method_id(abi_sig(func_id, n_calldata_words, j))
 
                 argsdata = b"\x00" * (n_calldata_words * 32 + j * 32)
 
@@ -590,7 +596,7 @@ def __default__():
                 if mutability == "@payable":
                     tx = func(*args, transact={"value": 1})
                     (event,) = get_logs(tx, c, "_Return")
-                    assert event.args.val == i
+                    assert event.args.val == func_id
                 else:
                     hexstr = (method_id + argsdata).hex()
                     txdata = {"to": c.address, "data": hexstr, "value": 1}

From 917959e3993ab0592d28bb5326e89a7a3ae0eb58 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 28 Sep 2023 18:25:39 -0700
Subject: [PATCH 142/161] docs: new for loop range syntax: `bound=` (#3540)

`for i in range(..., bound=...)`

---------

Co-authored-by: El De-dog-lo <3859395+fubuloubu@users.noreply.github.com>
---
 docs/control-structures.rst                       | 13 +++++++++++--
 tests/parser/features/iteration/test_for_range.py |  4 ++--
 vyper/codegen/stmt.py                             |  4 +++-
 vyper/ir/compile_ir.py                            |  2 +-
 4 files changed, 17 insertions(+), 6 deletions(-)

diff --git a/docs/control-structures.rst b/docs/control-structures.rst
index fc8a472ff6..873135709a 100644
--- a/docs/control-structures.rst
+++ b/docs/control-structures.rst
@@ -271,16 +271,25 @@ Ranges are created using the ``range`` function. The following examples are vali
 
 ``STOP`` is a literal integer greater than zero. ``i`` begins as zero and increments by one until it is equal to ``STOP``.
 
+.. code-block:: python
+
+    for i in range(stop, bound=N):
+        ...
+
+Here, ``stop`` can be a variable with integer type, greater than zero. ``N`` must be a compile-time constant. ``i`` begins as zero and increments by one until it is equal to ``stop``. If ``stop`` is larger than ``N``, execution will revert at runtime. In certain cases, you may not have a guarantee that ``stop`` is less than ``N``, but still want to avoid the possibility of runtime reversion. To accomplish this, use the ``bound=`` keyword in combination with ``min(stop, N)`` as the argument to ``range``, like ``range(min(stop, N), bound=N)``. This is helpful for use cases like chunking up operations on larger arrays across multiple transactions.
+
+Another use of range can be with ``START`` and ``STOP`` bounds.
+
 .. code-block:: python
 
     for i in range(START, STOP):
         ...
 
-``START`` and ``STOP`` are literal integers, with ``STOP`` being a greater value than ``START``. ``i`` begins as ``START`` and increments by one until it is equal to ``STOP``.
+Here, ``START`` and ``STOP`` are literal integers, with ``STOP`` being a greater value than ``START``. ``i`` begins as ``START`` and increments by one until it is equal to ``STOP``.
 
 .. code-block:: python
 
     for i in range(a, a + N):
         ...
 
-``a`` is a variable with an integer type and ``N`` is a literal integer greater than zero.  ``i`` begins as ``a`` and increments by one until it is equal to ``a + N``.
+``a`` is a variable with an integer type and ``N`` is a literal integer greater than zero.  ``i`` begins as ``a`` and increments by one until it is equal to ``a + N``. If ``a + N`` would overflow, execution will revert.
diff --git a/tests/parser/features/iteration/test_for_range.py b/tests/parser/features/iteration/test_for_range.py
index 395dd28231..ed6235d992 100644
--- a/tests/parser/features/iteration/test_for_range.py
+++ b/tests/parser/features/iteration/test_for_range.py
@@ -20,12 +20,12 @@ def test_range_bound(get_contract, assert_tx_failed):
 def repeat(n: uint256) -> uint256:
     x: uint256 = 0
     for i in range(n, bound=6):
-        x += i
+        x += i + 1
     return x
     """
     c = get_contract(code)
     for n in range(7):
-        assert c.repeat(n) == sum(range(n))
+        assert c.repeat(n) == sum(i + 1 for i in range(n))
 
     # check codegen inserts assertion for n greater than bound
     assert_tx_failed(lambda: c.repeat(7))
diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index 3ecb0afdc3..c2951986c8 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -302,7 +302,9 @@ def _parse_For_range(self):
         loop_body.append(["mstore", iptr, i])
         loop_body.append(parse_body(self.stmt.body, self.context))
 
-        # NOTE: codegen for `repeat` inserts an assertion that rounds <= rounds_bound.
+        # NOTE: codegen for `repeat` inserts an assertion that
+        # (gt rounds_bound rounds). note this also covers the case where
+        # rounds < 0.
         # if we ever want to remove that, we need to manually add the assertion
         # where it makes sense.
         ir_node = IRnode.from_list(
diff --git a/vyper/ir/compile_ir.py b/vyper/ir/compile_ir.py
index 7a3e97155b..1c4dc1ef7c 100644
--- a/vyper/ir/compile_ir.py
+++ b/vyper/ir/compile_ir.py
@@ -415,7 +415,7 @@ def _height_of(witharg):
                 )
             )
             # stack: i, rounds, rounds_bound
-            # assert rounds <= rounds_bound
+            # assert 0 <= rounds <= rounds_bound (for rounds_bound < 2**255)
             # TODO this runtime assertion shouldn't fail for
             # internally generated repeats.
             o.extend(["DUP2", "GT"] + _assert_false())

From c913b2db0881a6f4e1c70b7929b713a6aab05c62 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 28 Sep 2023 18:32:04 -0700
Subject: [PATCH 143/161] chore: remove deadlines and reruns (#3630)

for historical reasons, pytest ran with `--allow-reruns` when tests
failed because tests would usually fail due to deadline errors. deadline
errors have never indicated any meaningful issue with the compiler, they
are just a somewhat unavoidable byproduct of the fact that we are
running in a CI environment which has a lot of jitter.

this commit changes the hypothesis deadline to `None` for the whole test
suite, and removes the `--allow-reruns` parameter in the CI, which
should make the test suite much more efficient when there are failures.
---
 .github/workflows/test.yml                       | 6 +++---
 tests/ast/nodes/test_evaluate_binop_decimal.py   | 4 ++--
 tests/ast/nodes/test_evaluate_binop_int.py       | 8 ++++----
 tests/ast/nodes/test_evaluate_boolop.py          | 4 ++--
 tests/ast/nodes/test_evaluate_compare.py         | 8 ++++----
 tests/ast/nodes/test_evaluate_subscript.py       | 2 +-
 tests/builtins/folding/test_abs.py               | 4 ++--
 tests/builtins/folding/test_addmod_mulmod.py     | 2 +-
 tests/builtins/folding/test_bitwise.py           | 8 ++++----
 tests/builtins/folding/test_floor_ceil.py        | 2 +-
 tests/builtins/folding/test_fold_as_wei_value.py | 4 ++--
 tests/builtins/folding/test_keccak_sha.py        | 6 +++---
 tests/builtins/folding/test_min_max.py           | 6 +++---
 tests/builtins/folding/test_powmod.py            | 2 +-
 tests/conftest.py                                | 6 ++++++
 tests/fuzzing/test_exponents.py                  | 4 ++--
 tests/grammar/test_grammar.py                    | 4 ++--
 tests/parser/features/test_internal_call.py      | 2 +-
 tests/parser/functions/test_slice.py             | 4 ++--
 tests/parser/test_call_graph_stability.py        | 2 +-
 tests/parser/test_selector_table.py              | 6 +++---
 tests/parser/types/numbers/test_isqrt.py         | 1 -
 tests/parser/types/numbers/test_sqrt.py          | 2 --
 tests/parser/types/test_bytes_zero_padding.py    | 1 -
 24 files changed, 50 insertions(+), 48 deletions(-)

diff --git a/.github/workflows/test.yml b/.github/workflows/test.yml
index fd78e2fff8..8d23368eb0 100644
--- a/.github/workflows/test.yml
+++ b/.github/workflows/test.yml
@@ -104,7 +104,7 @@ jobs:
       run: pip install tox
 
     - name: Run Tox
-      run: TOXENV=py${{ matrix.python-version[1] }} tox -r -- --optimize ${{ matrix.opt-mode }} ${{ matrix.debug && '--enable-compiler-debug-mode' || '' }} --reruns 10 --reruns-delay 1 -r aR tests/
+      run: TOXENV=py${{ matrix.python-version[1] }} tox -r -- --optimize ${{ matrix.opt-mode }} ${{ matrix.debug && '--enable-compiler-debug-mode' || '' }} -r aR tests/
 
     - name: Upload Coverage
       uses: codecov/codecov-action@v1
@@ -148,12 +148,12 @@ jobs:
 
     # fetch test durations
     # NOTE: if the tests get poorly distributed, run this and commit the resulting `.test_durations` file to the `vyper-test-durations` repo.
-    # `TOXENV=fuzzing tox -r -- --store-durations --reruns 10 --reruns-delay 1 -r aR tests/`
+    # `TOXENV=fuzzing tox -r -- --store-durations -r aR tests/`
     - name: Fetch test-durations
       run: curl --location "https://raw.githubusercontent.com/vyperlang/vyper-test-durations/5982755ee8459f771f2e8622427c36494646e1dd/test_durations" -o .test_durations
 
     - name: Run Tox
-      run: TOXENV=fuzzing tox -r -- --splits 60 --group ${{ matrix.group }} --splitting-algorithm least_duration --reruns 10 --reruns-delay 1 -r aR tests/
+      run: TOXENV=fuzzing tox -r -- --splits 60 --group ${{ matrix.group }} --splitting-algorithm least_duration -r aR tests/
 
     - name: Upload Coverage
       uses: codecov/codecov-action@v1
diff --git a/tests/ast/nodes/test_evaluate_binop_decimal.py b/tests/ast/nodes/test_evaluate_binop_decimal.py
index 3c8ba0888c..5c9956caba 100644
--- a/tests/ast/nodes/test_evaluate_binop_decimal.py
+++ b/tests/ast/nodes/test_evaluate_binop_decimal.py
@@ -13,7 +13,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=None)
+@settings(max_examples=50)
 @given(left=st_decimals, right=st_decimals)
 @example(left=Decimal("0.9999999999"), right=Decimal("0.0000000001"))
 @example(left=Decimal("0.0000000001"), right=Decimal("0.9999999999"))
@@ -52,7 +52,7 @@ def test_binop_pow():
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=None)
+@settings(max_examples=50)
 @given(
     values=st.lists(st_decimals, min_size=2, max_size=10),
     ops=st.lists(st.sampled_from("+-*/%"), min_size=11, max_size=11),
diff --git a/tests/ast/nodes/test_evaluate_binop_int.py b/tests/ast/nodes/test_evaluate_binop_int.py
index d632a95461..80c9381c0f 100644
--- a/tests/ast/nodes/test_evaluate_binop_int.py
+++ b/tests/ast/nodes/test_evaluate_binop_int.py
@@ -9,7 +9,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st_int32, right=st_int32)
 @example(left=1, right=1)
 @example(left=1, right=-1)
@@ -42,7 +42,7 @@ def foo(a: int128, b: int128) -> int128:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st_uint64, right=st_uint64)
 @pytest.mark.parametrize("op", "+-*/%")
 def test_binop_uint256(get_contract, assert_tx_failed, op, left, right):
@@ -69,7 +69,7 @@ def foo(a: uint256, b: uint256) -> uint256:
 
 @pytest.mark.xfail(reason="need to implement safe exponentiation logic")
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st.integers(min_value=2, max_value=245), right=st.integers(min_value=0, max_value=16))
 @example(left=0, right=0)
 @example(left=0, right=1)
@@ -89,7 +89,7 @@ def foo(a: uint256, b: uint256) -> uint256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(
     values=st.lists(st.integers(min_value=-256, max_value=256), min_size=2, max_size=10),
     ops=st.lists(st.sampled_from("+-*/%"), min_size=11, max_size=11),
diff --git a/tests/ast/nodes/test_evaluate_boolop.py b/tests/ast/nodes/test_evaluate_boolop.py
index 6bd9ecc6cb..8b70537c39 100644
--- a/tests/ast/nodes/test_evaluate_boolop.py
+++ b/tests/ast/nodes/test_evaluate_boolop.py
@@ -8,7 +8,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(values=st.lists(st.booleans(), min_size=2, max_size=10))
 @pytest.mark.parametrize("comparator", ["and", "or"])
 def test_boolop_simple(get_contract, values, comparator):
@@ -32,7 +32,7 @@ def foo({input_value}) -> bool:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(
     values=st.lists(st.booleans(), min_size=2, max_size=10),
     comparators=st.lists(st.sampled_from(["and", "or"]), min_size=11, max_size=11),
diff --git a/tests/ast/nodes/test_evaluate_compare.py b/tests/ast/nodes/test_evaluate_compare.py
index 9ff5cea338..07f8e70de6 100644
--- a/tests/ast/nodes/test_evaluate_compare.py
+++ b/tests/ast/nodes/test_evaluate_compare.py
@@ -8,7 +8,7 @@
 
 # TODO expand to all signed types
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st.integers(), right=st.integers())
 @pytest.mark.parametrize("op", ["==", "!=", "<", "<=", ">=", ">"])
 def test_compare_eq_signed(get_contract, op, left, right):
@@ -28,7 +28,7 @@ def foo(a: int128, b: int128) -> bool:
 
 # TODO expand to all unsigned types
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st.integers(min_value=0), right=st.integers(min_value=0))
 @pytest.mark.parametrize("op", ["==", "!=", "<", "<=", ">=", ">"])
 def test_compare_eq_unsigned(get_contract, op, left, right):
@@ -47,7 +47,7 @@ def foo(a: uint128, b: uint128) -> bool:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=20, deadline=1000)
+@settings(max_examples=20)
 @given(left=st.integers(), right=st.lists(st.integers(), min_size=1, max_size=16))
 def test_compare_in(left, right, get_contract):
     source = f"""
@@ -76,7 +76,7 @@ def bar(a: int128) -> bool:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=20, deadline=1000)
+@settings(max_examples=20)
 @given(left=st.integers(), right=st.lists(st.integers(), min_size=1, max_size=16))
 def test_compare_not_in(left, right, get_contract):
     source = f"""
diff --git a/tests/ast/nodes/test_evaluate_subscript.py b/tests/ast/nodes/test_evaluate_subscript.py
index 3c0fa5d16d..ca50a076a5 100644
--- a/tests/ast/nodes/test_evaluate_subscript.py
+++ b/tests/ast/nodes/test_evaluate_subscript.py
@@ -6,7 +6,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(
     idx=st.integers(min_value=0, max_value=9),
     array=st.lists(st.integers(), min_size=10, max_size=10),
diff --git a/tests/builtins/folding/test_abs.py b/tests/builtins/folding/test_abs.py
index 58f861ed0c..1c919d7826 100644
--- a/tests/builtins/folding/test_abs.py
+++ b/tests/builtins/folding/test_abs.py
@@ -8,7 +8,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(a=st.integers(min_value=-(2**255) + 1, max_value=2**255 - 1))
 @example(a=0)
 def test_abs(get_contract, a):
@@ -27,7 +27,7 @@ def foo(a: int256) -> int256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(a=st.integers(min_value=2**255, max_value=2**256 - 1))
 def test_abs_upper_bound_folding(get_contract, a):
     source = f"""
diff --git a/tests/builtins/folding/test_addmod_mulmod.py b/tests/builtins/folding/test_addmod_mulmod.py
index 0514dea18a..33dcc62984 100644
--- a/tests/builtins/folding/test_addmod_mulmod.py
+++ b/tests/builtins/folding/test_addmod_mulmod.py
@@ -9,7 +9,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(a=st_uint256, b=st_uint256, c=st_uint256)
 @pytest.mark.parametrize("fn_name", ["uint256_addmod", "uint256_mulmod"])
 def test_modmath(get_contract, a, b, c, fn_name):
diff --git a/tests/builtins/folding/test_bitwise.py b/tests/builtins/folding/test_bitwise.py
index d28e482589..63e733644f 100644
--- a/tests/builtins/folding/test_bitwise.py
+++ b/tests/builtins/folding/test_bitwise.py
@@ -14,7 +14,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("op", ["&", "|", "^"])
 @given(a=st_uint256, b=st_uint256)
 def test_bitwise_ops(get_contract, a, b, op):
@@ -34,7 +34,7 @@ def foo(a: uint256, b: uint256) -> uint256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("op", ["<<", ">>"])
 @given(a=st_uint256, b=st.integers(min_value=0, max_value=256))
 def test_bitwise_shift_unsigned(get_contract, a, b, op):
@@ -64,7 +64,7 @@ def foo(a: uint256, b: uint256) -> uint256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("op", ["<<", ">>"])
 @given(a=st_sint256, b=st.integers(min_value=0, max_value=256))
 def test_bitwise_shift_signed(get_contract, a, b, op):
@@ -92,7 +92,7 @@ def foo(a: int256, b: uint256) -> int256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(value=st_uint256)
 def test_bitwise_not(get_contract, value):
     source = """
diff --git a/tests/builtins/folding/test_floor_ceil.py b/tests/builtins/folding/test_floor_ceil.py
index 763f8fec63..87db23889a 100644
--- a/tests/builtins/folding/test_floor_ceil.py
+++ b/tests/builtins/folding/test_floor_ceil.py
@@ -13,7 +13,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(value=st_decimals)
 @example(value=Decimal("0.9999999999"))
 @example(value=Decimal("0.0000000001"))
diff --git a/tests/builtins/folding/test_fold_as_wei_value.py b/tests/builtins/folding/test_fold_as_wei_value.py
index 11d23bd3bf..210ab51f0d 100644
--- a/tests/builtins/folding/test_fold_as_wei_value.py
+++ b/tests/builtins/folding/test_fold_as_wei_value.py
@@ -19,7 +19,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=10, deadline=1000)
+@settings(max_examples=10)
 @given(value=st_decimals)
 @pytest.mark.parametrize("denom", denoms)
 def test_decimal(get_contract, value, denom):
@@ -38,7 +38,7 @@ def foo(a: decimal) -> uint256:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=10, deadline=1000)
+@settings(max_examples=10)
 @given(value=st.integers(min_value=0, max_value=2**128))
 @pytest.mark.parametrize("denom", denoms)
 def test_integer(get_contract, value, denom):
diff --git a/tests/builtins/folding/test_keccak_sha.py b/tests/builtins/folding/test_keccak_sha.py
index 8e283566de..a2fe460dd1 100644
--- a/tests/builtins/folding/test_keccak_sha.py
+++ b/tests/builtins/folding/test_keccak_sha.py
@@ -10,7 +10,7 @@
 
 @pytest.mark.fuzzing
 @given(value=st.text(alphabet=alphabet, min_size=0, max_size=100))
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("fn_name", ["keccak256", "sha256"])
 def test_string(get_contract, value, fn_name):
     source = f"""
@@ -29,7 +29,7 @@ def foo(a: String[100]) -> bytes32:
 
 @pytest.mark.fuzzing
 @given(value=st.binary(min_size=0, max_size=100))
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("fn_name", ["keccak256", "sha256"])
 def test_bytes(get_contract, value, fn_name):
     source = f"""
@@ -48,7 +48,7 @@ def foo(a: Bytes[100]) -> bytes32:
 
 @pytest.mark.fuzzing
 @given(value=st.binary(min_size=1, max_size=100))
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @pytest.mark.parametrize("fn_name", ["keccak256", "sha256"])
 def test_hex(get_contract, value, fn_name):
     source = f"""
diff --git a/tests/builtins/folding/test_min_max.py b/tests/builtins/folding/test_min_max.py
index e2d33237ca..309f7519c0 100644
--- a/tests/builtins/folding/test_min_max.py
+++ b/tests/builtins/folding/test_min_max.py
@@ -18,7 +18,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st_decimals, right=st_decimals)
 @pytest.mark.parametrize("fn_name", ["min", "max"])
 def test_decimal(get_contract, left, right, fn_name):
@@ -37,7 +37,7 @@ def foo(a: decimal, b: decimal) -> decimal:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st_int128, right=st_int128)
 @pytest.mark.parametrize("fn_name", ["min", "max"])
 def test_int128(get_contract, left, right, fn_name):
@@ -56,7 +56,7 @@ def foo(a: int128, b: int128) -> int128:
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=50, deadline=1000)
+@settings(max_examples=50)
 @given(left=st_uint256, right=st_uint256)
 @pytest.mark.parametrize("fn_name", ["min", "max"])
 def test_min_uint256(get_contract, left, right, fn_name):
diff --git a/tests/builtins/folding/test_powmod.py b/tests/builtins/folding/test_powmod.py
index fdc0e300ab..8667ec93fd 100644
--- a/tests/builtins/folding/test_powmod.py
+++ b/tests/builtins/folding/test_powmod.py
@@ -9,7 +9,7 @@
 
 
 @pytest.mark.fuzzing
-@settings(max_examples=100, deadline=1000)
+@settings(max_examples=100)
 @given(a=st_uint256, b=st_uint256)
 def test_powmod_uint256(get_contract, a, b):
     source = """
diff --git a/tests/conftest.py b/tests/conftest.py
index d519ca3100..c9d3f794a0 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -1,6 +1,7 @@
 import logging
 from functools import wraps
 
+import hypothesis
 import pytest
 from eth_tester import EthereumTester, PyEVMBackend
 from eth_utils import setup_DEBUG2_logging
@@ -23,6 +24,11 @@
 ############
 
 
+# disable hypothesis deadline globally
+hypothesis.settings.register_profile("ci", deadline=None)
+hypothesis.settings.load_profile("ci")
+
+
 def set_evm_verbose_logging():
     logger = logging.getLogger("eth.vm.computation.Computation")
     setup_DEBUG2_logging()
diff --git a/tests/fuzzing/test_exponents.py b/tests/fuzzing/test_exponents.py
index 29c1f198ed..5726e4c1ca 100644
--- a/tests/fuzzing/test_exponents.py
+++ b/tests/fuzzing/test_exponents.py
@@ -92,7 +92,7 @@ def foo(a: int16) -> int16:
 @example(a=2**127 - 1)
 # 256 bits
 @example(a=2**256 - 1)
-@settings(max_examples=200, deadline=1000)
+@settings(max_examples=200)
 def test_max_exp(get_contract, assert_tx_failed, a):
     code = f"""
 @external
@@ -127,7 +127,7 @@ def foo(b: uint256) -> uint256:
 @example(a=2**63 - 1)
 # 128 bits
 @example(a=2**127 - 1)
-@settings(max_examples=200, deadline=1000)
+@settings(max_examples=200)
 def test_max_exp_int128(get_contract, assert_tx_failed, a):
     code = f"""
 @external
diff --git a/tests/grammar/test_grammar.py b/tests/grammar/test_grammar.py
index d665ca2544..aa0286cfa5 100644
--- a/tests/grammar/test_grammar.py
+++ b/tests/grammar/test_grammar.py
@@ -4,7 +4,7 @@
 import hypothesis
 import hypothesis.strategies as st
 import pytest
-from hypothesis import HealthCheck, assume, given
+from hypothesis import assume, given
 from hypothesis.extra.lark import LarkStrategy
 
 from vyper.ast import Module, parse_to_ast
@@ -103,7 +103,7 @@ def has_no_docstrings(c):
 
 @pytest.mark.fuzzing
 @given(code=from_grammar().filter(lambda c: utf8_encodable(c)))
-@hypothesis.settings(deadline=400, max_examples=500, suppress_health_check=(HealthCheck.too_slow,))
+@hypothesis.settings(max_examples=500)
 def test_grammar_bruteforce(code):
     if utf8_encodable(code):
         _, _, reformatted_code = pre_parse(code + "\n")
diff --git a/tests/parser/features/test_internal_call.py b/tests/parser/features/test_internal_call.py
index d7a41acbc0..f10d22ec99 100644
--- a/tests/parser/features/test_internal_call.py
+++ b/tests/parser/features/test_internal_call.py
@@ -669,7 +669,7 @@ def test_internal_call_kwargs(get_contract, typ1, strategy1, typ2, strategy2):
     # GHSA-ph9x-4vc9-m39g
 
     @given(kwarg1=strategy1, default1=strategy1, kwarg2=strategy2, default2=strategy2)
-    @settings(deadline=None, max_examples=5)  # len(cases) * len(cases) * 5 * 5
+    @settings(max_examples=5)  # len(cases) * len(cases) * 5 * 5
     def fuzz(kwarg1, kwarg2, default1, default2):
         code = f"""
 @internal
diff --git a/tests/parser/functions/test_slice.py b/tests/parser/functions/test_slice.py
index 6229b47921..3090dafda0 100644
--- a/tests/parser/functions/test_slice.py
+++ b/tests/parser/functions/test_slice.py
@@ -36,7 +36,7 @@ def slice_tower_test(inp1: Bytes[50]) -> Bytes[50]:
 @pytest.mark.parametrize("literal_length", (True, False))
 @pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
-@settings(max_examples=100, deadline=None)
+@settings(max_examples=100)
 @pytest.mark.fuzzing
 def test_slice_immutable(
     get_contract,
@@ -90,7 +90,7 @@ def _get_contract():
 @pytest.mark.parametrize("literal_length", (True, False))
 @pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
-@settings(max_examples=100, deadline=None)
+@settings(max_examples=100)
 @pytest.mark.fuzzing
 def test_slice_bytes(
     get_contract,
diff --git a/tests/parser/test_call_graph_stability.py b/tests/parser/test_call_graph_stability.py
index a6193610e2..4c85c330f3 100644
--- a/tests/parser/test_call_graph_stability.py
+++ b/tests/parser/test_call_graph_stability.py
@@ -15,7 +15,7 @@ def _valid_identifier(attr):
 
 
 # random names for functions
-@settings(max_examples=20, deadline=None)
+@settings(max_examples=20)
 @given(
     st.lists(
         st.tuples(
diff --git a/tests/parser/test_selector_table.py b/tests/parser/test_selector_table.py
index 180c0266bf..161cd480fd 100644
--- a/tests/parser/test_selector_table.py
+++ b/tests/parser/test_selector_table.py
@@ -446,7 +446,7 @@ def aILR4U1Z()->uint256:
     seed=st.integers(min_value=0, max_value=2**64 - 1),
 )
 @pytest.mark.fuzzing
-@settings(max_examples=10, deadline=None)
+@settings(max_examples=10)
 def test_sparse_jumptable_probe_depth(n_methods, seed):
     sigs = [f"foo{i + seed}()" for i in range(n_methods)]
     _, buckets = generate_sparse_jumptable_buckets(sigs)
@@ -466,7 +466,7 @@ def test_sparse_jumptable_probe_depth(n_methods, seed):
     seed=st.integers(min_value=0, max_value=2**64 - 1),
 )
 @pytest.mark.fuzzing
-@settings(max_examples=10, deadline=None)
+@settings(max_examples=10)
 def test_dense_jumptable_bucket_size(n_methods, seed):
     sigs = [f"foo{i + seed}()" for i in range(n_methods)]
     n = len(sigs)
@@ -537,7 +537,7 @@ def foo{func_id}({args}) -> uint256:
     """
 
     @given(_input=generate_methods(max_calldata_bytes))
-    @settings(max_examples=125, deadline=None)
+    @settings(max_examples=125)
     def _test(_input):
         max_default_args, default_fn_mutability, methods = _input
 
diff --git a/tests/parser/types/numbers/test_isqrt.py b/tests/parser/types/numbers/test_isqrt.py
index ce26d24d06..b734323a6e 100644
--- a/tests/parser/types/numbers/test_isqrt.py
+++ b/tests/parser/types/numbers/test_isqrt.py
@@ -119,7 +119,6 @@ def test(a: uint256) -> (uint256, uint256, uint256, uint256, uint256, String[100
 @hypothesis.example(2704)
 @hypothesis.example(110889)
 @hypothesis.example(32239684)
-@hypothesis.settings(deadline=1000)
 def test_isqrt_valid_range(isqrt_contract, value):
     vyper_isqrt = isqrt_contract.test(value)
     actual_isqrt = math.isqrt(value)
diff --git a/tests/parser/types/numbers/test_sqrt.py b/tests/parser/types/numbers/test_sqrt.py
index df1ed0539c..020a79e7ef 100644
--- a/tests/parser/types/numbers/test_sqrt.py
+++ b/tests/parser/types/numbers/test_sqrt.py
@@ -145,7 +145,6 @@ def test_sqrt_bounds(sqrt_contract, value):
 )
 @hypothesis.example(value=Decimal(SizeLimits.MAX_INT128))
 @hypothesis.example(value=Decimal(0))
-@hypothesis.settings(deadline=1000)
 def test_sqrt_valid_range(sqrt_contract, value):
     vyper_sqrt = sqrt_contract.test(value)
     actual_sqrt = decimal_sqrt(value)
@@ -158,7 +157,6 @@ def test_sqrt_valid_range(sqrt_contract, value):
         min_value=Decimal(SizeLimits.MIN_INT128), max_value=Decimal("-1E10"), places=DECIMAL_PLACES
     )
 )
-@hypothesis.settings(deadline=400)
 @hypothesis.example(value=Decimal(SizeLimits.MIN_INT128))
 @hypothesis.example(value=Decimal("-1E10"))
 def test_sqrt_invalid_range(sqrt_contract, value):
diff --git a/tests/parser/types/test_bytes_zero_padding.py b/tests/parser/types/test_bytes_zero_padding.py
index ee938fdffb..f9fcf37b25 100644
--- a/tests/parser/types/test_bytes_zero_padding.py
+++ b/tests/parser/types/test_bytes_zero_padding.py
@@ -26,7 +26,6 @@ def get_count(counter: uint256) -> Bytes[24]:
 
 @pytest.mark.fuzzing
 @hypothesis.given(value=hypothesis.strategies.integers(min_value=0, max_value=2**64))
-@hypothesis.settings(deadline=400)
 def test_zero_pad_range(little_endian_contract, value):
     actual_bytes = value.to_bytes(8, byteorder="little")
     contract_bytes = little_endian_contract.get_count(value)

From 8aae7cd6b86c15978bdfa16d5a6e3ca273121107 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 2 Oct 2023 19:20:19 -0700
Subject: [PATCH 144/161] feat: disallow invalid pragmas (#3634)

this commit prevents typos (ex. `# pragma evm-versionn ...`) from
getting unexpectedly ignored. it also fixes an issue with the
`evm_version` pragma getting properly propagated into
`CompilerData.settings`. it also fixes a misnamed test function, and
adds some unit tests to check that `evm_version` gets properly
propagated into `CompilerData.settings`.

commit summary:
* fix `evm_version` passing into compiler data
* fix `compile_code()`
* add tests for `CompilerData.settings`
* add tests for invalid pragmas
---
 tests/ast/test_pre_parser.py | 70 ++++++++++++++++++++++++++++++++----
 vyper/ast/pre_parser.py      |  7 ++--
 vyper/compiler/README.md     |  6 ++--
 vyper/compiler/__init__.py   | 22 ++++++------
 vyper/compiler/phases.py     |  5 +++
 5 files changed, 87 insertions(+), 23 deletions(-)

diff --git a/tests/ast/test_pre_parser.py b/tests/ast/test_pre_parser.py
index 5427532c16..3d072674f6 100644
--- a/tests/ast/test_pre_parser.py
+++ b/tests/ast/test_pre_parser.py
@@ -1,8 +1,9 @@
 import pytest
 
 from vyper.ast.pre_parser import pre_parse, validate_version_pragma
+from vyper.compiler.phases import CompilerData
 from vyper.compiler.settings import OptimizationLevel, Settings
-from vyper.exceptions import VersionException
+from vyper.exceptions import StructureException, VersionException
 
 SRC_LINE = (1, 0)  # Dummy source line
 COMPILER_VERSION = "0.1.1"
@@ -96,43 +97,50 @@ def test_prerelease_invalid_version_pragma(file_version, mock_version):
         """
     """,
         Settings(),
+        Settings(optimize=OptimizationLevel.GAS),
     ),
     (
         """
     #pragma optimize codesize
     """,
         Settings(optimize=OptimizationLevel.CODESIZE),
+        None,
     ),
     (
         """
     #pragma optimize none
     """,
         Settings(optimize=OptimizationLevel.NONE),
+        None,
     ),
     (
         """
     #pragma optimize gas
     """,
         Settings(optimize=OptimizationLevel.GAS),
+        None,
     ),
     (
         """
     #pragma version 0.3.10
     """,
         Settings(compiler_version="0.3.10"),
+        Settings(optimize=OptimizationLevel.GAS),
     ),
     (
         """
     #pragma evm-version shanghai
     """,
         Settings(evm_version="shanghai"),
+        Settings(evm_version="shanghai", optimize=OptimizationLevel.GAS),
     ),
     (
         """
     #pragma optimize codesize
     #pragma evm-version shanghai
     """,
-        Settings(evm_version="shanghai", optimize=OptimizationLevel.GAS),
+        Settings(evm_version="shanghai", optimize=OptimizationLevel.CODESIZE),
+        None,
     ),
     (
         """
@@ -140,6 +148,7 @@ def test_prerelease_invalid_version_pragma(file_version, mock_version):
     #pragma evm-version shanghai
     """,
         Settings(evm_version="shanghai", compiler_version="0.3.10"),
+        Settings(evm_version="shanghai", optimize=OptimizationLevel.GAS),
     ),
     (
         """
@@ -147,6 +156,7 @@ def test_prerelease_invalid_version_pragma(file_version, mock_version):
     #pragma optimize gas
     """,
         Settings(compiler_version="0.3.10", optimize=OptimizationLevel.GAS),
+        Settings(optimize=OptimizationLevel.GAS),
     ),
     (
         """
@@ -155,11 +165,59 @@ def test_prerelease_invalid_version_pragma(file_version, mock_version):
     #pragma optimize gas
     """,
         Settings(compiler_version="0.3.10", optimize=OptimizationLevel.GAS, evm_version="shanghai"),
+        Settings(optimize=OptimizationLevel.GAS, evm_version="shanghai"),
     ),
 ]
 
 
-@pytest.mark.parametrize("code, expected_pragmas", pragma_examples)
-def parse_pragmas(code, expected_pragmas):
-    pragmas, _, _ = pre_parse(code)
-    assert pragmas == expected_pragmas
+@pytest.mark.parametrize("code, pre_parse_settings, compiler_data_settings", pragma_examples)
+def test_parse_pragmas(code, pre_parse_settings, compiler_data_settings, mock_version):
+    mock_version("0.3.10")
+    settings, _, _ = pre_parse(code)
+
+    assert settings == pre_parse_settings
+
+    compiler_data = CompilerData(code)
+
+    # check what happens after CompilerData constructor
+    if compiler_data_settings is None:
+        # None is sentinel here meaning that nothing changed
+        compiler_data_settings = pre_parse_settings
+
+    assert compiler_data.settings == compiler_data_settings
+
+
+invalid_pragmas = [
+    # evm-versionnn
+    """
+# pragma evm-versionnn cancun
+    """,
+    # bad fork name
+    """
+# pragma evm-version cancunn
+    """,
+    # oppptimize
+    """
+# pragma oppptimize codesize
+    """,
+    # ggas
+    """
+# pragma optimize ggas
+    """,
+    # double specified
+    """
+# pragma optimize gas
+# pragma optimize codesize
+    """,
+    # double specified
+    """
+# pragma evm-version cancun
+# pragma evm-version shanghai
+    """,
+]
+
+
+@pytest.mark.parametrize("code", invalid_pragmas)
+def test_invalid_pragma(code):
+    with pytest.raises(StructureException):
+        pre_parse(code)
diff --git a/vyper/ast/pre_parser.py b/vyper/ast/pre_parser.py
index 0ead889787..9d96efea5e 100644
--- a/vyper/ast/pre_parser.py
+++ b/vyper/ast/pre_parser.py
@@ -111,7 +111,7 @@ def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
                         validate_version_pragma(compiler_version, start)
                         settings.compiler_version = compiler_version
 
-                    if pragma.startswith("optimize "):
+                    elif pragma.startswith("optimize "):
                         if settings.optimize is not None:
                             raise StructureException("pragma optimize specified twice!", start)
                         try:
@@ -119,7 +119,7 @@ def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
                             settings.optimize = OptimizationLevel.from_string(mode)
                         except ValueError:
                             raise StructureException(f"Invalid optimization mode `{mode}`", start)
-                    if pragma.startswith("evm-version "):
+                    elif pragma.startswith("evm-version "):
                         if settings.evm_version is not None:
                             raise StructureException("pragma evm-version specified twice!", start)
                         evm_version = pragma.removeprefix("evm-version").strip()
@@ -127,6 +127,9 @@ def pre_parse(code: str) -> tuple[Settings, ModificationOffsets, str]:
                             raise StructureException("Invalid evm version: `{evm_version}`", start)
                         settings.evm_version = evm_version
 
+                    else:
+                        raise StructureException(f"Unknown pragma `{pragma.split()[0]}`")
+
             if typ == NAME and string in ("class", "yield"):
                 raise SyntaxException(
                     f"The `{string}` keyword is not allowed. ", code, start[0], start[1]
diff --git a/vyper/compiler/README.md b/vyper/compiler/README.md
index d6b55fdd82..eb70750a2b 100644
--- a/vyper/compiler/README.md
+++ b/vyper/compiler/README.md
@@ -51,11 +51,9 @@ for specific implementation details.
 [`vyper.compiler.compile_codes`](__init__.py) is the main user-facing function for
 generating compiler output from Vyper source. The process is as follows:
 
-1. The `@evm_wrapper` decorator sets the target EVM version in
-[`opcodes.py`](../evm/opcodes.py).
-2. A [`CompilerData`](phases.py) object is created for each contract to be compiled.
+1. A [`CompilerData`](phases.py) object is created for each contract to be compiled.
 This object uses `@property` methods to trigger phases of the compiler as required.
-3. Functions in [`output.py`](output.py) generate the requested outputs from the
+2. Functions in [`output.py`](output.py) generate the requested outputs from the
 compiler data.
 
 ## Design
diff --git a/vyper/compiler/__init__.py b/vyper/compiler/__init__.py
index 0b3c0d8191..b1c4201361 100644
--- a/vyper/compiler/__init__.py
+++ b/vyper/compiler/__init__.py
@@ -120,17 +120,17 @@ def compile_codes(
         # make IR output the same between runs
         codegen.reset_names()
 
-        with anchor_evm_version(settings.evm_version):
-            compiler_data = CompilerData(
-                source_code,
-                contract_name,
-                interfaces,
-                source_id,
-                settings,
-                storage_layout_override,
-                show_gas_estimates,
-                no_bytecode_metadata,
-            )
+        compiler_data = CompilerData(
+            source_code,
+            contract_name,
+            interfaces,
+            source_id,
+            settings,
+            storage_layout_override,
+            show_gas_estimates,
+            no_bytecode_metadata,
+        )
+        with anchor_evm_version(compiler_data.settings.evm_version):
             for output_format in output_formats[contract_name]:
                 if output_format not in OUTPUT_FORMATS:
                     raise ValueError(f"Unsupported format type {repr(output_format)}")
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index a1c7342320..5ddf071caf 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -88,9 +88,12 @@ def __init__(
         self.no_bytecode_metadata = no_bytecode_metadata
         self.settings = settings or Settings()
 
+        _ = self._generate_ast  # force settings to be calculated
+
     @cached_property
     def _generate_ast(self):
         settings, ast = generate_ast(self.source_code, self.source_id, self.contract_name)
+
         # validate the compiler settings
         # XXX: this is a bit ugly, clean up later
         if settings.evm_version is not None:
@@ -117,6 +120,8 @@ def _generate_ast(self):
         if self.settings.optimize is None:
             self.settings.optimize = OptimizationLevel.default()
 
+        # note self.settings.compiler_version is erased here as it is
+        # not used after pre-parsing
         return ast
 
     @cached_property

From e9c16e40dd11ba21ba817ff0da78eaeab744fd39 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 3 Oct 2023 16:36:58 -0700
Subject: [PATCH 145/161] fix: block `mload` merging when src and dst overlap
 (#3635)

this commit fixes an optimization bug when the target architecture has
the `mcopy` instruction (i.e. `cancun` or later). the bug was introduced
in 5dc3ac7. specifically, the `merge_mload` step can incorrectly merge
`mload`/`mstore` sequences (into `mcopy`) when the source and
destination buffers overlap, and the destination buffer is "ahead of"
(i.e. greater than) the source buffer. this commit fixes the issue by
blocking the optimization in these cases, and adds unit and functional
tests demonstrating the correct behavior.

---------

Co-authored-by: Robert Chen <me@robertchen.cc>
---
 tests/compiler/ir/test_optimize_ir.py    | 107 +++++++++++++++++++++++
 tests/parser/features/test_assignment.py |  60 +++++++++++++
 vyper/ir/optimizer.py                    |   9 +-
 3 files changed, 174 insertions(+), 2 deletions(-)

diff --git a/tests/compiler/ir/test_optimize_ir.py b/tests/compiler/ir/test_optimize_ir.py
index 1466166501..cb46ba238d 100644
--- a/tests/compiler/ir/test_optimize_ir.py
+++ b/tests/compiler/ir/test_optimize_ir.py
@@ -1,9 +1,13 @@
 import pytest
 
 from vyper.codegen.ir_node import IRnode
+from vyper.evm.opcodes import EVM_VERSIONS, anchor_evm_version
 from vyper.exceptions import StaticAssertionException
 from vyper.ir import optimizer
 
+POST_CANCUN = {k: v for k, v in EVM_VERSIONS.items() if v >= EVM_VERSIONS["cancun"]}
+
+
 optimize_list = [
     (["eq", 1, 2], [0]),
     (["lt", 1, 2], [1]),
@@ -272,3 +276,106 @@ def test_operator_set_values():
     assert optimizer.COMPARISON_OPS == {"lt", "gt", "le", "ge", "slt", "sgt", "sle", "sge"}
     assert optimizer.STRICT_COMPARISON_OPS == {"lt", "gt", "slt", "sgt"}
     assert optimizer.UNSTRICT_COMPARISON_OPS == {"le", "ge", "sle", "sge"}
+
+
+mload_merge_list = [
+    # copy "backward" with no overlap between src and dst buffers,
+    # OK to become mcopy
+    (
+        ["seq", ["mstore", 32, ["mload", 128]], ["mstore", 64, ["mload", 160]]],
+        ["mcopy", 32, 128, 64],
+    ),
+    # copy with overlap "backwards", OK to become mcopy
+    (["seq", ["mstore", 32, ["mload", 64]], ["mstore", 64, ["mload", 96]]], ["mcopy", 32, 64, 64]),
+    # "stationary" overlap (i.e. a no-op mcopy), OK to become mcopy
+    (["seq", ["mstore", 32, ["mload", 32]], ["mstore", 64, ["mload", 64]]], ["mcopy", 32, 32, 64]),
+    # copy "forward" with no overlap, OK to become mcopy
+    (["seq", ["mstore", 64, ["mload", 0]], ["mstore", 96, ["mload", 32]]], ["mcopy", 64, 0, 64]),
+    # copy "forwards" with overlap by one word, must NOT become mcopy
+    (["seq", ["mstore", 64, ["mload", 32]], ["mstore", 96, ["mload", 64]]], None),
+    # check "forward" overlap by one byte, must NOT become mcopy
+    (["seq", ["mstore", 64, ["mload", 1]], ["mstore", 96, ["mload", 33]]], None),
+    # check "forward" overlap by one byte again, must NOT become mcopy
+    (["seq", ["mstore", 63, ["mload", 0]], ["mstore", 95, ["mload", 32]]], None),
+    # copy 3 words with partial overlap "forwards", partially becomes mcopy
+    # (2 words are mcopied and 1 word is mload/mstored
+    (
+        [
+            "seq",
+            ["mstore", 96, ["mload", 32]],
+            ["mstore", 128, ["mload", 64]],
+            ["mstore", 160, ["mload", 96]],
+        ],
+        ["seq", ["mcopy", 96, 32, 64], ["mstore", 160, ["mload", 96]]],
+    ),
+    # copy 4 words with partial overlap "forwards", becomes 2 mcopies of 2 words each
+    (
+        [
+            "seq",
+            ["mstore", 96, ["mload", 32]],
+            ["mstore", 128, ["mload", 64]],
+            ["mstore", 160, ["mload", 96]],
+            ["mstore", 192, ["mload", 128]],
+        ],
+        ["seq", ["mcopy", 96, 32, 64], ["mcopy", 160, 96, 64]],
+    ),
+    # copy 4 words with 1 byte of overlap, must NOT become mcopy
+    (
+        [
+            "seq",
+            ["mstore", 96, ["mload", 33]],
+            ["mstore", 128, ["mload", 65]],
+            ["mstore", 160, ["mload", 97]],
+            ["mstore", 192, ["mload", 129]],
+        ],
+        None,
+    ),
+    # Ensure only sequential mstore + mload sequences are optimized
+    (
+        [
+            "seq",
+            ["mstore", 0, ["mload", 32]],
+            ["sstore", 0, ["calldataload", 4]],
+            ["mstore", 32, ["mload", 64]],
+        ],
+        None,
+    ),
+    # not-word aligned optimizations (not overlap)
+    (["seq", ["mstore", 0, ["mload", 1]], ["mstore", 32, ["mload", 33]]], ["mcopy", 0, 1, 64]),
+    # not-word aligned optimizations (overlap)
+    (["seq", ["mstore", 1, ["mload", 0]], ["mstore", 33, ["mload", 32]]], None),
+    # not-word aligned optimizations (overlap and not-overlap)
+    (
+        [
+            "seq",
+            ["mstore", 0, ["mload", 1]],
+            ["mstore", 32, ["mload", 33]],
+            ["mstore", 1, ["mload", 0]],
+            ["mstore", 33, ["mload", 32]],
+        ],
+        ["seq", ["mcopy", 0, 1, 64], ["mstore", 1, ["mload", 0]], ["mstore", 33, ["mload", 32]]],
+    ),
+    # overflow test
+    (
+        [
+            "seq",
+            ["mstore", 2**256 - 1 - 31 - 32, ["mload", 0]],
+            ["mstore", 2**256 - 1 - 31, ["mload", 32]],
+        ],
+        ["mcopy", 2**256 - 1 - 31 - 32, 0, 64],
+    ),
+]
+
+
+@pytest.mark.parametrize("ir", mload_merge_list)
+@pytest.mark.parametrize("evm_version", list(POST_CANCUN.keys()))
+def test_mload_merge(ir, evm_version):
+    with anchor_evm_version(evm_version):
+        optimized = optimizer.optimize(IRnode.from_list(ir[0]))
+        if ir[1] is None:
+            # no-op, assert optimizer does nothing
+            expected = IRnode.from_list(ir[0])
+        else:
+            expected = IRnode.from_list(ir[1])
+
+        assert optimized == expected
diff --git a/tests/parser/features/test_assignment.py b/tests/parser/features/test_assignment.py
index e550f60541..35b008a8ba 100644
--- a/tests/parser/features/test_assignment.py
+++ b/tests/parser/features/test_assignment.py
@@ -442,3 +442,63 @@ def bug(p: Point) -> Point:
     """
     c = get_contract(code)
     assert c.bug((1, 2)) == (2, 1)
+
+
+mload_merge_codes = [
+    (
+        """
+@external
+def foo() -> uint256[4]:
+    # copy "backwards"
+    xs: uint256[4] = [1, 2, 3, 4]
+
+# dst < src
+    xs[0] = xs[1]
+    xs[1] = xs[2]
+    xs[2] = xs[3]
+
+    return xs
+    """,
+        [2, 3, 4, 4],
+    ),
+    (
+        """
+@external
+def foo() -> uint256[4]:
+    # copy "forwards"
+    xs: uint256[4] = [1, 2, 3, 4]
+
+# src < dst
+    xs[1] = xs[0]
+    xs[2] = xs[1]
+    xs[3] = xs[2]
+
+    return xs
+    """,
+        [1, 1, 1, 1],
+    ),
+    (
+        """
+@external
+def foo() -> uint256[5]:
+    # partial "forward" copy
+    xs: uint256[5] = [1, 2, 3, 4, 5]
+
+# src < dst
+    xs[2] = xs[0]
+    xs[3] = xs[1]
+    xs[4] = xs[2]
+
+    return xs
+    """,
+        [1, 2, 1, 2, 1],
+    ),
+]
+
+
+# functional test that mload merging does not occur when source and dest
+# buffers overlap. (note: mload merging only applies after cancun)
+@pytest.mark.parametrize("code,expected_result", mload_merge_codes)
+def test_mcopy_overlap(get_contract, code, expected_result):
+    c = get_contract(code)
+    assert c.foo() == expected_result
diff --git a/vyper/ir/optimizer.py b/vyper/ir/optimizer.py
index 08c2168381..8df4bbac2d 100644
--- a/vyper/ir/optimizer.py
+++ b/vyper/ir/optimizer.py
@@ -662,10 +662,10 @@ def _rewrite_mstore_dload(argz):
 def _merge_mload(argz):
     if not version_check(begin="cancun"):
         return False
-    return _merge_load(argz, "mload", "mcopy")
+    return _merge_load(argz, "mload", "mcopy", allow_overlap=False)
 
 
-def _merge_load(argz, _LOAD, _COPY):
+def _merge_load(argz, _LOAD, _COPY, allow_overlap=True):
     # look for sequential operations copying from X to Y
     # and merge them into a single copy operation
     changed = False
@@ -689,9 +689,14 @@ def _merge_load(argz, _LOAD, _COPY):
                 initial_dst_offset = dst_offset
                 initial_src_offset = src_offset
                 idx = i
+
+            # dst and src overlap, discontinue the optimization
+            has_overlap = initial_src_offset < initial_dst_offset < src_offset + 32
+
             if (
                 initial_dst_offset + total_length == dst_offset
                 and initial_src_offset + total_length == src_offset
+                and (allow_overlap or not has_overlap)
             ):
                 mstore_nodes.append(ir_node)
                 total_length += 32

From 9136169468f317a53b4e7448389aa315f90b95ba Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 4 Oct 2023 06:16:44 -0700
Subject: [PATCH 146/161] docs: v0.3.10 release (#3629)

---
 docs/release-notes.rst | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index da86c5c0ce..64199bc860 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -14,14 +14,10 @@ Release Notes
     for advisory links:
     :'<,'>s/\v(https:\/\/github.com\/vyperlang\/vyper\/security\/advisories\/)([-A-Za-z0-9]+)/(`\2 <\1\2>`_)/g
 
-..
-    v0.3.10 ("Black Adder")
-    ***********************
-
-v0.3.10rc1
-**********
+v0.3.10 ("Black Adder")
+***********************
 
-Date released: 2023-09-06
+Date released: 2023-10-04
 =========================
 
 v0.3.10 is a performance focused release. It adds a ``codesize`` optimization mode (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), adds new vyper-specific ``#pragma`` directives  (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), uses Cancun's ``MCOPY`` opcode for some compiler generated code (`#3483 <https://github.com/vyperlang/vyper/pull/3483>`_), and generates selector tables which now feature O(1) performance (`#3496 <https://github.com/vyperlang/vyper/pull/3496>`_).
@@ -32,6 +28,7 @@ Breaking changes:
 - add runtime code layout to initcode (`#3584 <https://github.com/vyperlang/vyper/pull/3584>`_)
 - drop evm versions through istanbul (`#3470 <https://github.com/vyperlang/vyper/pull/3470>`_)
 - remove vyper signature from runtime (`#3471 <https://github.com/vyperlang/vyper/pull/3471>`_)
+- only allow valid identifiers to be nonreentrant keys (`#3605 <https://github.com/vyperlang/vyper/pull/3605>`_)
 
 Non-breaking changes and improvements:
 --------------------------------------
@@ -46,12 +43,15 @@ Notable fixes:
 
 - fix ``ecrecover()`` behavior when signature is invalid (`GHSA-f5x6-7qgp-jhf3 <https://github.com/vyperlang/vyper/security/advisories/GHSA-f5x6-7qgp-jhf3>`_, `#3586 <https://github.com/vyperlang/vyper/pull/3586>`_)
 - fix: order of evaluation for some builtins (`#3583 <https://github.com/vyperlang/vyper/pull/3583>`_, `#3587 <https://github.com/vyperlang/vyper/pull/3587>`_)
+- fix: memory allocation in certain builtins using ``msize`` (`#3610 <https://github.com/vyperlang/vyper/pull/3610>`_)
+- fix: ``_abi_decode()`` input validation in certain complex expressions (`#3626 <https://github.com/vyperlang/vyper/pull/3626>`_)
 - fix: pycryptodome for arm builds (`#3485 <https://github.com/vyperlang/vyper/pull/3485>`_)
 - let params of internal functions be mutable (`#3473 <https://github.com/vyperlang/vyper/pull/3473>`_)
 - typechecking of folded builtins in (`#3490 <https://github.com/vyperlang/vyper/pull/3490>`_)
 - update tload/tstore opcodes per latest 1153 EIP spec (`#3484 <https://github.com/vyperlang/vyper/pull/3484>`_)
 - fix: raw_call type when max_outsize=0 is set (`#3572 <https://github.com/vyperlang/vyper/pull/3572>`_)
 - fix: implements check for indexed event arguments (`#3570 <https://github.com/vyperlang/vyper/pull/3570>`_)
+- fix: type-checking for ``_abi_decode()`` arguments (`#3626 <https://github.com/vyperlang/vyper/pull/3623>`_)
 
 Other docs updates, chores and fixes:
 -------------------------------------

From b8b4610a46379558367ba60f94ac2813eec056d4 Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Wed, 4 Oct 2023 20:25:09 +0200
Subject: [PATCH 147/161] chore: update `FUNDING.yml` to point directly at
 wallet (#3636)

Add link to the Vyper multisig address.
---
 FUNDING.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/FUNDING.yml b/FUNDING.yml
index 81e82160d0..efb9eb01b7 100644
--- a/FUNDING.yml
+++ b/FUNDING.yml
@@ -1 +1 @@
-custom: https://gitcoin.co/grants/200/vyper-smart-contract-language-2
+custom: https://etherscan.io/address/0x70CCBE10F980d80b7eBaab7D2E3A73e87D67B775

From 5ca0cbfa4064a5577347bca8377bc9bea1cebca5 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 4 Oct 2023 12:17:36 -0700
Subject: [PATCH 148/161] docs: fix nit in v0.3.10 release notes (#3638)

---
 docs/release-notes.rst | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/docs/release-notes.rst b/docs/release-notes.rst
index 64199bc860..3db11dc451 100644
--- a/docs/release-notes.rst
+++ b/docs/release-notes.rst
@@ -20,7 +20,7 @@ v0.3.10 ("Black Adder")
 Date released: 2023-10-04
 =========================
 
-v0.3.10 is a performance focused release. It adds a ``codesize`` optimization mode (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), adds new vyper-specific ``#pragma`` directives  (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), uses Cancun's ``MCOPY`` opcode for some compiler generated code (`#3483 <https://github.com/vyperlang/vyper/pull/3483>`_), and generates selector tables which now feature O(1) performance (`#3496 <https://github.com/vyperlang/vyper/pull/3496>`_).
+v0.3.10 is a performance focused release that additionally ships numerous bugfixes. It adds a ``codesize`` optimization mode (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), adds new vyper-specific ``#pragma`` directives  (`#3493 <https://github.com/vyperlang/vyper/pull/3493>`_), uses Cancun's ``MCOPY`` opcode for some compiler generated code (`#3483 <https://github.com/vyperlang/vyper/pull/3483>`_), and generates selector tables which now feature O(1) performance (`#3496 <https://github.com/vyperlang/vyper/pull/3496>`_).
 
 Breaking changes:
 -----------------

From 435754dd1db3e1b0b4608569e003f060e6e9eb40 Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Thu, 5 Oct 2023 16:54:29 +0200
Subject: [PATCH 149/161] docs: add note on `pragma` parsing (#3640)

* Fix broken link in `structure-of-a-contract.rst`
* Add note on `pragma` version parsing
---
 docs/structure-of-a-contract.rst | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/docs/structure-of-a-contract.rst b/docs/structure-of-a-contract.rst
index d2c5d48d96..3861bf4380 100644
--- a/docs/structure-of-a-contract.rst
+++ b/docs/structure-of-a-contract.rst
@@ -17,7 +17,7 @@ Vyper supports several source code directives to control compiler modes and help
 Version Pragma
 --------------
 
-The version pragma ensures that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax. Starting from v0.4.0 and up, version strings will use `PEP440 version specifiers <https://peps.python.org/pep-0440/#version-specifiers>_`.
+The version pragma ensures that a contract is only compiled by the intended compiler version, or range of versions. Version strings use `NPM <https://docs.npmjs.com/about-semantic-versioning>`_ style syntax. Starting from v0.4.0 and up, version strings will use `PEP440 version specifiers <https://peps.python.org/pep-0440/#version-specifiers>`_.
 
 As of 0.3.10, the recommended way to specify the version pragma is as follows:
 
@@ -25,6 +25,10 @@ As of 0.3.10, the recommended way to specify the version pragma is as follows:
 
     #pragma version ^0.3.0
 
+.. note::
+
+    Both pragma directive versions ``#pragma`` and ``# pragma`` are supported.
+
 The following declaration is equivalent, and, prior to 0.3.10, was the only supported method to specify the compiler version:
 
 .. code-block:: python

From 68da04b2e9e010c2e4da288a80eeeb9c8e076025 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Thu, 5 Oct 2023 09:04:18 -0700
Subject: [PATCH 150/161] fix: block memory allocation overflow (#3639)

this fixes potential overflow bugs in pointer calculation by blocking
memory allocation above a certain size. the size limit is set at
`2**64`, which is the size of addressable memory on physical machines.

practically, for EVM use cases, we could limit at a much smaller number
(like `2**24`), but we want to allow for "exotic" targets which may
allow much more addressable memory.
---
 vyper/codegen/memory_allocator.py | 12 +++++++++++-
 vyper/exceptions.py               |  4 ++++
 2 files changed, 15 insertions(+), 1 deletion(-)

diff --git a/vyper/codegen/memory_allocator.py b/vyper/codegen/memory_allocator.py
index 582d4b9c54..b5e1212917 100644
--- a/vyper/codegen/memory_allocator.py
+++ b/vyper/codegen/memory_allocator.py
@@ -1,6 +1,6 @@
 from typing import List
 
-from vyper.exceptions import CompilerPanic
+from vyper.exceptions import CompilerPanic, MemoryAllocationException
 from vyper.utils import MemoryPositions
 
 
@@ -46,6 +46,8 @@ class MemoryAllocator:
 
     next_mem: int
 
+    _ALLOCATION_LIMIT: int = 2**64
+
     def __init__(self, start_position: int = MemoryPositions.RESERVED_MEMORY):
         """
         Initializer.
@@ -110,6 +112,14 @@ def _expand_memory(self, size: int) -> int:
         before_value = self.next_mem
         self.next_mem += size
         self.size_of_mem = max(self.size_of_mem, self.next_mem)
+
+        if self.size_of_mem >= self._ALLOCATION_LIMIT:
+            # this should not be caught
+            raise MemoryAllocationException(
+                f"Tried to allocate {self.size_of_mem} bytes! "
+                f"(limit is {self._ALLOCATION_LIMIT} (2**64) bytes)"
+            )
+
         return before_value
 
     def deallocate_memory(self, pos: int, size: int) -> None:
diff --git a/vyper/exceptions.py b/vyper/exceptions.py
index defca7cc53..8b2020285a 100644
--- a/vyper/exceptions.py
+++ b/vyper/exceptions.py
@@ -269,6 +269,10 @@ class StorageLayoutException(VyperException):
     """Invalid slot for the storage layout overrides"""
 
 
+class MemoryAllocationException(VyperException):
+    """Tried to allocate too much memory"""
+
+
 class JSONError(Exception):
 
     """Invalid compiler input JSON."""

From 74a8e0254461119af9a5d504f326877d7aed4134 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Tue, 17 Oct 2023 09:23:40 -0700
Subject: [PATCH 151/161] chore: reorder compilation of branches in stmt.py
 (#3603)

the if and else branches were being allocated out-of-source-order. this
commit switches the order of compilation of the if and else branches to
be in source order. this is a hygienic fix, right now the only thing
that should be affected is the memory allocator (but if more side
effects are ever introduced in codegen, the existing code might compile
the side effects out of order).
---
 vyper/codegen/stmt.py | 14 ++++++--------
 1 file changed, 6 insertions(+), 8 deletions(-)

diff --git a/vyper/codegen/stmt.py b/vyper/codegen/stmt.py
index c2951986c8..254cad32e6 100644
--- a/vyper/codegen/stmt.py
+++ b/vyper/codegen/stmt.py
@@ -91,17 +91,15 @@ def parse_Assign(self):
         return IRnode.from_list(ret)
 
     def parse_If(self):
+        with self.context.block_scope():
+            test_expr = Expr.parse_value_expr(self.stmt.test, self.context)
+            body = ["if", test_expr, parse_body(self.stmt.body, self.context)]
+
         if self.stmt.orelse:
             with self.context.block_scope():
-                add_on = [parse_body(self.stmt.orelse, self.context)]
-        else:
-            add_on = []
+                body.extend([parse_body(self.stmt.orelse, self.context)])
 
-        with self.context.block_scope():
-            test_expr = Expr.parse_value_expr(self.stmt.test, self.context)
-            body = ["if", test_expr, parse_body(self.stmt.body, self.context)] + add_on
-            ir_node = IRnode.from_list(body)
-        return ir_node
+        return IRnode.from_list(body)
 
     def parse_Log(self):
         event = self.stmt._metadata["type"]

From 5482bbcbed22b856bec6e57c06aeb7e0bee9a1ab Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Wed, 18 Oct 2023 00:26:56 +0800
Subject: [PATCH 152/161] feat: remove builtin constants (#3350)

Builtin constants like `MAX_INT128`, `MIN_INT128`, `MIN_DECIMAL`,
`MAX_DECIMAL` and `MAX_UINT256` have been deprecated since v0.3.4 with
the introduction of the `min_value` and `max_value` builtins, and
further back for `ZERO_ADDRESS` and `EMPTY_BYTES32` with the `empty`
builtin.

This PR removes them from the language entirely, and will be a breaking
change.
---
 tests/ast/test_folding.py                     | 43 -------------------
 .../features/decorators/test_private.py       |  2 +-
 .../test_external_contract_calls.py           | 14 +++---
 .../features/iteration/test_for_in_list.py    |  2 +-
 tests/parser/features/test_assignment.py      |  4 +-
 tests/parser/features/test_memory_dealloc.py  |  2 +-
 tests/parser/functions/test_abi_decode.py     |  4 +-
 tests/parser/functions/test_convert.py        | 18 --------
 .../parser/functions/test_default_function.py |  2 +-
 tests/parser/functions/test_empty.py          | 20 ++++-----
 tests/parser/functions/test_return_tuple.py   |  4 +-
 tests/parser/integration/test_escrow.py       |  4 +-
 tests/parser/syntax/test_bool.py              |  4 +-
 tests/parser/syntax/test_interfaces.py        |  4 +-
 tests/parser/syntax/test_no_none.py           | 12 +++---
 tests/parser/syntax/test_tuple_assign.py      |  2 +-
 tests/parser/syntax/test_unbalanced_return.py |  4 +-
 tests/parser/types/numbers/test_constants.py  |  8 ++--
 tests/parser/types/test_identifier_naming.py  |  8 +---
 tests/parser/types/test_string.py             |  2 +-
 vyper/ast/folding.py                          | 33 --------------
 vyper/compiler/phases.py                      |  1 -
 22 files changed, 49 insertions(+), 148 deletions(-)

diff --git a/tests/ast/test_folding.py b/tests/ast/test_folding.py
index 22d5f58222..62a7140e97 100644
--- a/tests/ast/test_folding.py
+++ b/tests/ast/test_folding.py
@@ -132,49 +132,6 @@ def test_replace_constant_no(source):
     assert vy_ast.compare_nodes(unmodified_ast, folded_ast)
 
 
-builtins_modified = [
-    "ZERO_ADDRESS",
-    "foo = ZERO_ADDRESS",
-    "foo: int128[ZERO_ADDRESS] = 42",
-    "foo = [ZERO_ADDRESS]",
-    "def foo(bar: address = ZERO_ADDRESS): pass",
-    "def foo(): bar = ZERO_ADDRESS",
-    "def foo(): return ZERO_ADDRESS",
-    "log foo(ZERO_ADDRESS)",
-    "log foo(42, ZERO_ADDRESS)",
-]
-
-
-@pytest.mark.parametrize("source", builtins_modified)
-def test_replace_builtin_constant(source):
-    unmodified_ast = vy_ast.parse_to_ast(source)
-    folded_ast = vy_ast.parse_to_ast(source)
-
-    folding.replace_builtin_constants(folded_ast)
-
-    assert not vy_ast.compare_nodes(unmodified_ast, folded_ast)
-
-
-builtins_unmodified = [
-    "ZERO_ADDRESS = 2",
-    "ZERO_ADDRESS()",
-    "def foo(ZERO_ADDRESS: int128 = 42): pass",
-    "def foo(): ZERO_ADDRESS = 42",
-    "def ZERO_ADDRESS(): pass",
-    "log ZERO_ADDRESS(42)",
-]
-
-
-@pytest.mark.parametrize("source", builtins_unmodified)
-def test_replace_builtin_constant_no(source):
-    unmodified_ast = vy_ast.parse_to_ast(source)
-    folded_ast = vy_ast.parse_to_ast(source)
-
-    folding.replace_builtin_constants(folded_ast)
-
-    assert vy_ast.compare_nodes(unmodified_ast, folded_ast)
-
-
 userdefined_modified = [
     "FOO",
     "foo = FOO",
diff --git a/tests/parser/features/decorators/test_private.py b/tests/parser/features/decorators/test_private.py
index 7c92f72af9..51e6d90ee1 100644
--- a/tests/parser/features/decorators/test_private.py
+++ b/tests/parser/features/decorators/test_private.py
@@ -304,7 +304,7 @@ def test(a: bytes32) -> (bytes32, uint256, int128):
     b: uint256 = 1
     c: int128 = 1
     d: int128 = 123
-    f: bytes32 = EMPTY_BYTES32
+    f: bytes32 = empty(bytes32)
     f, b, c = self._test(a)
     assert d == 123
     return f, b, c
diff --git a/tests/parser/features/external_contracts/test_external_contract_calls.py b/tests/parser/features/external_contracts/test_external_contract_calls.py
index b3cc6f5576..12fcde2f4f 100644
--- a/tests/parser/features/external_contracts/test_external_contract_calls.py
+++ b/tests/parser/features/external_contracts/test_external_contract_calls.py
@@ -775,9 +775,9 @@ def foo() -> (address, Bytes[3], address): view
 
 @external
 def bar(arg1: address) -> (address, Bytes[3], address):
-    a: address = ZERO_ADDRESS
+    a: address = empty(address)
     b: Bytes[3] = b""
-    c: address = ZERO_ADDRESS
+    c: address = empty(address)
     a, b, c = Foo(arg1).foo()
     return a, b, c
 """
@@ -808,9 +808,9 @@ def foo() -> (address, Bytes[3], address): view
 
 @external
 def bar(arg1: address) -> (address, Bytes[3], address):
-    a: address = ZERO_ADDRESS
+    a: address = empty(address)
     b: Bytes[3] = b""
-    c: address = ZERO_ADDRESS
+    c: address = empty(address)
     a, b, c = Foo(arg1).foo()
     return a, b, c
 """
@@ -841,9 +841,9 @@ def foo() -> (address, Bytes[3], address): view
 
 @external
 def bar(arg1: address) -> (address, Bytes[3], address):
-    a: address = ZERO_ADDRESS
+    a: address = empty(address)
     b: Bytes[3] = b""
-    c: address = ZERO_ADDRESS
+    c: address = empty(address)
     a, b, c = Foo(arg1).foo()
     return a, b, c
 """
@@ -1538,7 +1538,7 @@ def out_literals() -> (int128, address, Bytes[10]) : view
 @external
 def test(addr: address) -> (int128, address, Bytes[10]):
     a: int128 = 0
-    b: address = ZERO_ADDRESS
+    b: address = empty(address)
     c: Bytes[10] = b""
     (a, b, c) = Test(addr).out_literals()
     return a, b,c
diff --git a/tests/parser/features/iteration/test_for_in_list.py b/tests/parser/features/iteration/test_for_in_list.py
index bfd960a787..fb01cc98eb 100644
--- a/tests/parser/features/iteration/test_for_in_list.py
+++ b/tests/parser/features/iteration/test_for_in_list.py
@@ -230,7 +230,7 @@ def iterate_return_second() -> address:
         count += 1
         if count == 2:
             return i
-    return ZERO_ADDRESS
+    return empty(address)
     """
 
     c = get_contract_with_gas_estimation(code)
diff --git a/tests/parser/features/test_assignment.py b/tests/parser/features/test_assignment.py
index 35b008a8ba..cd26659a5c 100644
--- a/tests/parser/features/test_assignment.py
+++ b/tests/parser/features/test_assignment.py
@@ -331,7 +331,7 @@ def foo():
 @external
 def foo():
     y: int128 = 1
-    z: bytes32 = EMPTY_BYTES32
+    z: bytes32 = empty(bytes32)
     z = y
     """,
         """
@@ -344,7 +344,7 @@ def foo():
 @external
 def foo():
     y: uint256 = 1
-    z: bytes32 = EMPTY_BYTES32
+    z: bytes32 = empty(bytes32)
     z = y
     """,
     ],
diff --git a/tests/parser/features/test_memory_dealloc.py b/tests/parser/features/test_memory_dealloc.py
index de82f03296..814bf0d3bb 100644
--- a/tests/parser/features/test_memory_dealloc.py
+++ b/tests/parser/features/test_memory_dealloc.py
@@ -9,7 +9,7 @@ def sendit(): nonpayable
 
 @external
 def foo(target: address) -> uint256[2]:
-    log Shimmy(ZERO_ADDRESS, 3)
+    log Shimmy(empty(address), 3)
     amount: uint256 = 1
     flargen: uint256 = 42
     Other(target).sendit()
diff --git a/tests/parser/functions/test_abi_decode.py b/tests/parser/functions/test_abi_decode.py
index 2216a5bd76..242841e1cf 100644
--- a/tests/parser/functions/test_abi_decode.py
+++ b/tests/parser/functions/test_abi_decode.py
@@ -25,7 +25,7 @@ def test_abi_decode_complex(get_contract):
 
 @external
 def abi_decode(x: Bytes[160]) -> (address, int128, bool, decimal, bytes32):
-    a: address = ZERO_ADDRESS
+    a: address = empty(address)
     b: int128 = 0
     c: bool = False
     d: decimal = 0.0
@@ -39,7 +39,7 @@ def abi_decode_struct(x: Bytes[544]) -> Human:
         name: "",
         pet: Animal({
             name: "",
-            address_: ZERO_ADDRESS,
+            address_: empty(address),
             id_: 0,
             is_furry: False,
             price: 0.0,
diff --git a/tests/parser/functions/test_convert.py b/tests/parser/functions/test_convert.py
index eb8449447c..b5ce613235 100644
--- a/tests/parser/functions/test_convert.py
+++ b/tests/parser/functions/test_convert.py
@@ -534,24 +534,6 @@ def foo(a: {typ}) -> Status:
         assert_compile_failed(lambda: get_contract_with_gas_estimation(contract), TypeMismatch)
 
 
-# TODO CMC 2022-04-06 I think this test is somewhat unnecessary.
-@pytest.mark.parametrize(
-    "builtin_constant,out_type,out_value",
-    [("ZERO_ADDRESS", "bool", False), ("msg.sender", "bool", True)],
-)
-def test_convert_builtin_constant(
-    get_contract_with_gas_estimation, builtin_constant, out_type, out_value
-):
-    contract = f"""
-@external
-def convert_builtin_constant() -> {out_type}:
-    return convert({builtin_constant}, {out_type})
-    """
-
-    c = get_contract_with_gas_estimation(contract)
-    assert c.convert_builtin_constant() == out_value
-
-
 # uint256 conversion is currently valid due to type inference on literals
 # not quite working yet
 same_type_conversion_blocked = sorted(TEST_TYPES - {UINT256_T})
diff --git a/tests/parser/functions/test_default_function.py b/tests/parser/functions/test_default_function.py
index 4aa0b04a77..4ad68697ac 100644
--- a/tests/parser/functions/test_default_function.py
+++ b/tests/parser/functions/test_default_function.py
@@ -41,7 +41,7 @@ def test_basic_default_default_param_function(w3, get_logs, get_contract_with_ga
 @external
 @payable
 def fooBar(a: int128 = 12345) -> int128:
-    log Sent(ZERO_ADDRESS)
+    log Sent(empty(address))
     return a
 
 @external
diff --git a/tests/parser/functions/test_empty.py b/tests/parser/functions/test_empty.py
index c10d03550a..c3627785dc 100644
--- a/tests/parser/functions/test_empty.py
+++ b/tests/parser/functions/test_empty.py
@@ -87,8 +87,8 @@ def foo():
     self.foobar = empty(address)
     bar = empty(address)
 
-    assert self.foobar == ZERO_ADDRESS
-    assert bar == ZERO_ADDRESS
+    assert self.foobar == empty(address)
+    assert bar == empty(address)
     """,
         """
 @external
@@ -214,12 +214,12 @@ def foo():
     self.foobar = empty(address[3])
     bar = empty(address[3])
 
-    assert self.foobar[0] == ZERO_ADDRESS
-    assert self.foobar[1] == ZERO_ADDRESS
-    assert self.foobar[2] == ZERO_ADDRESS
-    assert bar[0] == ZERO_ADDRESS
-    assert bar[1] == ZERO_ADDRESS
-    assert bar[2] == ZERO_ADDRESS
+    assert self.foobar[0] == empty(address)
+    assert self.foobar[1] == empty(address)
+    assert self.foobar[2] == empty(address)
+    assert bar[0] == empty(address)
+    assert bar[1] == empty(address)
+    assert bar[2] == empty(address)
     """,
     ],
 )
@@ -376,14 +376,14 @@ def foo():
     assert self.foobar.c == False
     assert self.foobar.d == 0.0
     assert self.foobar.e == 0x0000000000000000000000000000000000000000000000000000000000000000
-    assert self.foobar.f == ZERO_ADDRESS
+    assert self.foobar.f == empty(address)
 
     assert bar.a == 0
     assert bar.b == 0
     assert bar.c == False
     assert bar.d == 0.0
     assert bar.e == 0x0000000000000000000000000000000000000000000000000000000000000000
-    assert bar.f == ZERO_ADDRESS
+    assert bar.f == empty(address)
     """
 
     c = get_contract_with_gas_estimation(code)
diff --git a/tests/parser/functions/test_return_tuple.py b/tests/parser/functions/test_return_tuple.py
index 87b7cdcde3..b375839147 100644
--- a/tests/parser/functions/test_return_tuple.py
+++ b/tests/parser/functions/test_return_tuple.py
@@ -99,7 +99,7 @@ def out_literals() -> (int128, address, Bytes[10]):
 @external
 def test() -> (int128, address, Bytes[10]):
     a: int128 = 0
-    b: address = ZERO_ADDRESS
+    b: address = empty(address)
     c: Bytes[10] = b""
     (a, b, c) = self._out_literals()
     return a, b, c
@@ -138,7 +138,7 @@ def test2() -> (int128, address):
 
 @external
 def test3() -> (address, int128):
-    x: address = ZERO_ADDRESS
+    x: address = empty(address)
     self.a, self.c, x, self.d = self._out_literals()
     return x, self.a
     """
diff --git a/tests/parser/integration/test_escrow.py b/tests/parser/integration/test_escrow.py
index 2982ff9eae..1578f5a418 100644
--- a/tests/parser/integration/test_escrow.py
+++ b/tests/parser/integration/test_escrow.py
@@ -9,7 +9,7 @@ def test_arbitration_code(w3, get_contract_with_gas_estimation, assert_tx_failed
 
 @external
 def setup(_seller: address, _arbitrator: address):
-    if self.buyer == ZERO_ADDRESS:
+    if self.buyer == empty(address):
         self.buyer = msg.sender
         self.seller = _seller
         self.arbitrator = _arbitrator
@@ -43,7 +43,7 @@ def test_arbitration_code_with_init(w3, assert_tx_failed, get_contract_with_gas_
 @external
 @payable
 def __init__(_seller: address, _arbitrator: address):
-    if self.buyer == ZERO_ADDRESS:
+    if self.buyer == empty(address):
         self.buyer = msg.sender
         self.seller = _seller
         self.arbitrator = _arbitrator
diff --git a/tests/parser/syntax/test_bool.py b/tests/parser/syntax/test_bool.py
index 09f799d91c..48ed37321a 100644
--- a/tests/parser/syntax/test_bool.py
+++ b/tests/parser/syntax/test_bool.py
@@ -52,7 +52,7 @@ def foo() -> bool:
     """
 @external
 def foo() -> bool:
-    a: address = ZERO_ADDRESS
+    a: address = empty(address)
     return a == 1
     """,
     (
@@ -137,7 +137,7 @@ def foo() -> bool:
     """
 @external
 def foo2(a: address) -> bool:
-    return a != ZERO_ADDRESS
+    return a != empty(address)
     """,
 ]
 
diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index 5afb34e6bd..498f1363d8 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -47,7 +47,7 @@ def test():
 
 @external
 def test():
-    a: address(ERC20) = ZERO_ADDRESS
+    a: address(ERC20) = empty(address)
     """,
         InvalidType,
     ),
@@ -306,7 +306,7 @@ def some_func(): nonpayable
 
 @external
 def __init__():
-    self.my_interface[self.idx] = MyInterface(ZERO_ADDRESS)
+    self.my_interface[self.idx] = MyInterface(empty(address))
     """,
     """
 interface MyInterface:
diff --git a/tests/parser/syntax/test_no_none.py b/tests/parser/syntax/test_no_none.py
index 7030a56b18..24c32a46a4 100644
--- a/tests/parser/syntax/test_no_none.py
+++ b/tests/parser/syntax/test_no_none.py
@@ -30,13 +30,13 @@ def foo():
         """
 @external
 def foo():
-    bar: bytes32 = EMPTY_BYTES32
+    bar: bytes32 = empty(bytes32)
     bar = None
     """,
         """
 @external
 def foo():
-    bar: address = ZERO_ADDRESS
+    bar: address = empty(address)
     bar = None
     """,
         """
@@ -104,13 +104,13 @@ def foo():
         """
 @external
 def foo():
-    bar: bytes32 = EMPTY_BYTES32
+    bar: bytes32 = empty(bytes32)
     assert bar is None
     """,
         """
 @external
 def foo():
-    bar: address = ZERO_ADDRESS
+    bar: address = empty(address)
     assert bar is None
     """,
     ]
@@ -148,13 +148,13 @@ def foo():
         """
 @external
 def foo():
-    bar: bytes32 = EMPTY_BYTES32
+    bar: bytes32 = empty(bytes32)
     assert bar == None
     """,
         """
 @external
 def foo():
-    bar: address = ZERO_ADDRESS
+    bar: address = empty(address)
     assert bar == None
     """,
     ]
diff --git a/tests/parser/syntax/test_tuple_assign.py b/tests/parser/syntax/test_tuple_assign.py
index 115499ce8b..49b63ee614 100644
--- a/tests/parser/syntax/test_tuple_assign.py
+++ b/tests/parser/syntax/test_tuple_assign.py
@@ -41,7 +41,7 @@ def out_literals() -> (int128, int128, Bytes[10]):
 @external
 def test() -> (int128, address, Bytes[10]):
     a: int128 = 0
-    b: address = ZERO_ADDRESS
+    b: address = empty(address)
     a, b = self.out_literals()  # tuple count mismatch
     return
     """,
diff --git a/tests/parser/syntax/test_unbalanced_return.py b/tests/parser/syntax/test_unbalanced_return.py
index 5337b4b677..d1d9732777 100644
--- a/tests/parser/syntax/test_unbalanced_return.py
+++ b/tests/parser/syntax/test_unbalanced_return.py
@@ -56,7 +56,7 @@ def valid_address(sender: address) -> bool:
         """
 @internal
 def valid_address(sender: address) -> bool:
-    if sender == ZERO_ADDRESS:
+    if sender == empty(address):
         selfdestruct(sender)
         _sender: address = sender
     else:
@@ -144,7 +144,7 @@ def test() -> int128:
     """
 @external
 def test() -> int128:
-    x: bytes32 = EMPTY_BYTES32
+    x: bytes32 = empty(bytes32)
     if False:
         if False:
             return 0
diff --git a/tests/parser/types/numbers/test_constants.py b/tests/parser/types/numbers/test_constants.py
index 0d5e386dad..652c8e8bd9 100644
--- a/tests/parser/types/numbers/test_constants.py
+++ b/tests/parser/types/numbers/test_constants.py
@@ -12,12 +12,12 @@ def test_builtin_constants(get_contract_with_gas_estimation):
     code = """
 @external
 def test_zaddress(a: address) -> bool:
-    return a == ZERO_ADDRESS
+    return a == empty(address)
 
 
 @external
 def test_empty_bytes32(a: bytes32) -> bool:
-    return a == EMPTY_BYTES32
+    return a == empty(bytes32)
 
 
 @external
@@ -81,12 +81,12 @@ def goo() -> int128:
 
 @external
 def hoo() -> bytes32:
-    bar: bytes32 = EMPTY_BYTES32
+    bar: bytes32 = empty(bytes32)
     return bar
 
 @external
 def joo() -> address:
-    bar: address = ZERO_ADDRESS
+    bar: address = empty(address)
     return bar
 
 @external
diff --git a/tests/parser/types/test_identifier_naming.py b/tests/parser/types/test_identifier_naming.py
index 5cfc7e8ed7..0a93329848 100755
--- a/tests/parser/types/test_identifier_naming.py
+++ b/tests/parser/types/test_identifier_naming.py
@@ -1,16 +1,12 @@
 import pytest
 
-from vyper.ast.folding import BUILTIN_CONSTANTS
 from vyper.ast.identifiers import RESERVED_KEYWORDS
 from vyper.builtins.functions import BUILTIN_FUNCTIONS
 from vyper.codegen.expr import ENVIRONMENT_VARIABLES
 from vyper.exceptions import NamespaceCollision, StructureException, SyntaxException
 from vyper.semantics.types.primitives import AddressT
 
-BUILTIN_CONSTANTS = set(BUILTIN_CONSTANTS.keys())
-ALL_RESERVED_KEYWORDS = (
-    BUILTIN_CONSTANTS | BUILTIN_FUNCTIONS | RESERVED_KEYWORDS | ENVIRONMENT_VARIABLES
-)
+ALL_RESERVED_KEYWORDS = BUILTIN_FUNCTIONS | RESERVED_KEYWORDS | ENVIRONMENT_VARIABLES
 
 
 @pytest.mark.parametrize("constant", sorted(ALL_RESERVED_KEYWORDS))
@@ -46,7 +42,7 @@ def test({constant}: int128):
 
 
 SELF_NAMESPACE_MEMBERS = set(AddressT._type_members.keys())
-DISALLOWED_FN_NAMES = SELF_NAMESPACE_MEMBERS | RESERVED_KEYWORDS | BUILTIN_CONSTANTS
+DISALLOWED_FN_NAMES = SELF_NAMESPACE_MEMBERS | RESERVED_KEYWORDS
 ALLOWED_FN_NAMES = ALL_RESERVED_KEYWORDS - DISALLOWED_FN_NAMES
 
 
diff --git a/tests/parser/types/test_string.py b/tests/parser/types/test_string.py
index a5eef66dae..7f1fa71329 100644
--- a/tests/parser/types/test_string.py
+++ b/tests/parser/types/test_string.py
@@ -139,7 +139,7 @@ def out_literals() -> (int128, address, String[10]) : view
 @external
 def test(addr: address) -> (int128, address, String[10]):
     a: int128 = 0
-    b: address = ZERO_ADDRESS
+    b: address = empty(address)
     c: String[10] = ""
     (a, b, c) = Test(addr).out_literals()
     return a, b,c
diff --git a/vyper/ast/folding.py b/vyper/ast/folding.py
index fbd1dfc2f4..38d58f6fd0 100644
--- a/vyper/ast/folding.py
+++ b/vyper/ast/folding.py
@@ -1,4 +1,3 @@
-import warnings
 from typing import Optional, Union
 
 from vyper.ast import nodes as vy_ast
@@ -6,21 +5,6 @@
 from vyper.exceptions import UnfoldableNode, UnknownType
 from vyper.semantics.types.base import VyperType
 from vyper.semantics.types.utils import type_from_annotation
-from vyper.utils import SizeLimits
-
-BUILTIN_CONSTANTS = {
-    "EMPTY_BYTES32": (
-        vy_ast.Hex,
-        "0x0000000000000000000000000000000000000000000000000000000000000000",
-        "empty(bytes32)",
-    ),  # NOQA: E501
-    "ZERO_ADDRESS": (vy_ast.Hex, "0x0000000000000000000000000000000000000000", "empty(address)"),
-    "MAX_INT128": (vy_ast.Int, 2**127 - 1, "max_value(int128)"),
-    "MIN_INT128": (vy_ast.Int, -(2**127), "min_value(int128)"),
-    "MAX_DECIMAL": (vy_ast.Decimal, SizeLimits.MAX_AST_DECIMAL, "max_value(decimal)"),
-    "MIN_DECIMAL": (vy_ast.Decimal, SizeLimits.MIN_AST_DECIMAL, "min_value(decimal)"),
-    "MAX_UINT256": (vy_ast.Int, 2**256 - 1, "max_value(uint256)"),
-}
 
 
 def fold(vyper_module: vy_ast.Module) -> None:
@@ -32,8 +16,6 @@ def fold(vyper_module: vy_ast.Module) -> None:
     vyper_module : Module
         Top-level Vyper AST node.
     """
-    replace_builtin_constants(vyper_module)
-
     changed_nodes = 1
     while changed_nodes:
         changed_nodes = 0
@@ -138,21 +120,6 @@ def replace_builtin_functions(vyper_module: vy_ast.Module) -> int:
     return changed_nodes
 
 
-def replace_builtin_constants(vyper_module: vy_ast.Module) -> None:
-    """
-    Replace references to builtin constants with their literal values.
-
-    Arguments
-    ---------
-    vyper_module : Module
-        Top-level Vyper AST node.
-    """
-    for name, (node, value, replacement) in BUILTIN_CONSTANTS.items():
-        found = replace_constant(vyper_module, name, node(value=value), True)
-        if found > 0:
-            warnings.warn(f"{name} is deprecated. Please use `{replacement}` instead.")
-
-
 def replace_user_defined_constants(vyper_module: vy_ast.Module) -> int:
     """
     Find user-defined constant assignments, and replace references
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 5ddf071caf..72be4396e4 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -235,7 +235,6 @@ def generate_unfolded_ast(
     vyper_module: vy_ast.Module, interface_codes: Optional[InterfaceImports]
 ) -> vy_ast.Module:
     vy_ast.validation.validate_literal_nodes(vyper_module)
-    vy_ast.folding.replace_builtin_constants(vyper_module)
     vy_ast.folding.replace_builtin_functions(vyper_module)
     # note: validate_semantics does type inference on the AST
     validate_semantics(vyper_module, interface_codes)

From 3ba14124602b673d45b86bae7ff90a01d782acb5 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Fri, 20 Oct 2023 01:26:40 +0800
Subject: [PATCH 153/161] refactor: merge `annotation.py` and `local.py`
 (#3456)

This commit merges two phases of analysis: typechecking
(`vyper/semantics/analysis/local.py`) and annotation of ast nodes with
types (`vyper/semantics/analysis/annotation.py`). This is both for
consistency with how it is done for `analysis/module.py`, and also
because it increases internal consistency, as some typechecking was
being done in `annotation.py`. It is also easier to maintain this way,
since bugfixes or modifications to typechecking need to only be done in
one place, rather than two passes. Lastly, it also probably improves
performance, because it collapses two passes into one (and calls
`get_*_type_from_node` less often).

This commit also fixes a bug with accessing the iterator when the
iterator is an empty list literal.
---
 tests/parser/syntax/test_list.py       |   3 +-
 vyper/ast/nodes.pyi                    |   5 +
 vyper/builtins/_signatures.py          |   2 +-
 vyper/builtins/functions.py            |   6 +
 vyper/semantics/analysis/annotation.py | 283 ------------
 vyper/semantics/analysis/common.py     |  19 +-
 vyper/semantics/analysis/local.py      | 607 ++++++++++++++++---------
 vyper/semantics/analysis/utils.py      |  13 +-
 8 files changed, 420 insertions(+), 518 deletions(-)
 delete mode 100644 vyper/semantics/analysis/annotation.py

diff --git a/tests/parser/syntax/test_list.py b/tests/parser/syntax/test_list.py
index 3f81b911c8..db41de5526 100644
--- a/tests/parser/syntax/test_list.py
+++ b/tests/parser/syntax/test_list.py
@@ -305,8 +305,9 @@ def foo():
     """
 @external
 def foo():
+    x: DynArray[uint256, 3] = [1, 2, 3]
     for i in [[], []]:
-        pass
+        x = i
     """,
 ]
 
diff --git a/vyper/ast/nodes.pyi b/vyper/ast/nodes.pyi
index 0d59a2fa63..47c9af8526 100644
--- a/vyper/ast/nodes.pyi
+++ b/vyper/ast/nodes.pyi
@@ -142,6 +142,7 @@ class Expr(VyperNode):
 
 class UnaryOp(ExprNode):
     op: VyperNode = ...
+    operand: VyperNode = ...
 
 class USub(VyperNode): ...
 class Not(VyperNode): ...
@@ -165,12 +166,15 @@ class BitXor(VyperNode): ...
 
 class BoolOp(ExprNode):
     op: VyperNode = ...
+    values: list[VyperNode] = ...
 
 class And(VyperNode): ...
 class Or(VyperNode): ...
 
 class Compare(ExprNode):
     op: VyperNode = ...
+    left: VyperNode = ...
+    right: VyperNode = ...
 
 class Eq(VyperNode): ...
 class NotEq(VyperNode): ...
@@ -179,6 +183,7 @@ class LtE(VyperNode): ...
 class Gt(VyperNode): ...
 class GtE(VyperNode): ...
 class In(VyperNode): ...
+class NotIn(VyperNode): ...
 
 class Call(ExprNode):
     args: list = ...
diff --git a/vyper/builtins/_signatures.py b/vyper/builtins/_signatures.py
index d39a4a085f..2802421129 100644
--- a/vyper/builtins/_signatures.py
+++ b/vyper/builtins/_signatures.py
@@ -74,7 +74,7 @@ def decorator_fn(self, node, context):
     return decorator_fn
 
 
-class BuiltinFunction:
+class BuiltinFunction(VyperType):
     _has_varargs = False
     _kwargs: Dict[str, KwargSettings] = {}
 
diff --git a/vyper/builtins/functions.py b/vyper/builtins/functions.py
index f07202831d..001939638b 100644
--- a/vyper/builtins/functions.py
+++ b/vyper/builtins/functions.py
@@ -475,6 +475,12 @@ def evaluate(self, node):
 
         return vy_ast.Int.from_node(node, value=length)
 
+    def infer_arg_types(self, node):
+        self._validate_arg_types(node)
+        # return a concrete type
+        typ = get_possible_types_from_node(node.args[0]).pop()
+        return [typ]
+
     def build_IR(self, node, context):
         arg = Expr(node.args[0], context).ir_node
         if arg.value == "~calldata":
diff --git a/vyper/semantics/analysis/annotation.py b/vyper/semantics/analysis/annotation.py
deleted file mode 100644
index 01ca51d7f4..0000000000
--- a/vyper/semantics/analysis/annotation.py
+++ /dev/null
@@ -1,283 +0,0 @@
-from vyper import ast as vy_ast
-from vyper.exceptions import StructureException, TypeCheckFailure
-from vyper.semantics.analysis.utils import (
-    get_common_types,
-    get_exact_type_from_node,
-    get_possible_types_from_node,
-)
-from vyper.semantics.types import TYPE_T, BoolT, EnumT, EventT, SArrayT, StructT, is_type_t
-from vyper.semantics.types.function import ContractFunctionT, MemberFunctionT
-
-
-class _AnnotationVisitorBase:
-
-    """
-    Annotation visitor base class.
-
-    Annotation visitors apply metadata (such as type information) to vyper AST objects.
-    Immediately after type checking a statement-level node, that node is passed to
-    `StatementAnnotationVisitor`. Some expression nodes are then passed onward to
-    `ExpressionAnnotationVisitor` for additional annotation.
-    """
-
-    def visit(self, node, *args):
-        if isinstance(node, self.ignored_types):
-            return
-        # iterate over the MRO until we find a matching visitor function
-        # this lets us use a single function to broadly target several
-        # node types with a shared parent
-        for class_ in node.__class__.mro():
-            ast_type = class_.__name__
-            visitor_fn = getattr(self, f"visit_{ast_type}", None)
-            if visitor_fn:
-                visitor_fn(node, *args)
-                return
-        raise StructureException(f"Cannot annotate: {node.ast_type}", node)
-
-
-class StatementAnnotationVisitor(_AnnotationVisitorBase):
-    ignored_types = (vy_ast.Break, vy_ast.Continue, vy_ast.Pass, vy_ast.Raise)
-
-    def __init__(self, fn_node: vy_ast.FunctionDef, namespace: dict) -> None:
-        self.func = fn_node._metadata["type"]
-        self.namespace = namespace
-        self.expr_visitor = ExpressionAnnotationVisitor(self.func)
-
-        assert self.func.n_keyword_args == len(fn_node.args.defaults)
-        for kwarg in self.func.keyword_args:
-            self.expr_visitor.visit(kwarg.default_value, kwarg.typ)
-
-    def visit(self, node):
-        super().visit(node)
-
-    def visit_AnnAssign(self, node):
-        type_ = get_exact_type_from_node(node.target)
-        self.expr_visitor.visit(node.target, type_)
-        self.expr_visitor.visit(node.value, type_)
-
-    def visit_Assert(self, node):
-        self.expr_visitor.visit(node.test)
-
-    def visit_Assign(self, node):
-        type_ = get_exact_type_from_node(node.target)
-        self.expr_visitor.visit(node.target, type_)
-        self.expr_visitor.visit(node.value, type_)
-
-    def visit_AugAssign(self, node):
-        type_ = get_exact_type_from_node(node.target)
-        self.expr_visitor.visit(node.target, type_)
-        self.expr_visitor.visit(node.value, type_)
-
-    def visit_Expr(self, node):
-        self.expr_visitor.visit(node.value)
-
-    def visit_If(self, node):
-        self.expr_visitor.visit(node.test)
-
-    def visit_Log(self, node):
-        node._metadata["type"] = self.namespace[node.value.func.id]
-        self.expr_visitor.visit(node.value)
-
-    def visit_Return(self, node):
-        if node.value is not None:
-            self.expr_visitor.visit(node.value, self.func.return_type)
-
-    def visit_For(self, node):
-        if isinstance(node.iter, (vy_ast.Name, vy_ast.Attribute)):
-            self.expr_visitor.visit(node.iter)
-
-        iter_type = node.target._metadata["type"]
-        if isinstance(node.iter, vy_ast.List):
-            # typecheck list literal as static array
-            len_ = len(node.iter.elements)
-            self.expr_visitor.visit(node.iter, SArrayT(iter_type, len_))
-
-        if isinstance(node.iter, vy_ast.Call) and node.iter.func.id == "range":
-            for a in node.iter.args:
-                self.expr_visitor.visit(a, iter_type)
-            for a in node.iter.keywords:
-                if a.arg == "bound":
-                    self.expr_visitor.visit(a.value, iter_type)
-
-
-class ExpressionAnnotationVisitor(_AnnotationVisitorBase):
-    ignored_types = ()
-
-    def __init__(self, fn_node: ContractFunctionT):
-        self.func = fn_node
-
-    def visit(self, node, type_=None):
-        # the statement visitor sometimes passes type information about expressions
-        super().visit(node, type_)
-
-    def visit_Attribute(self, node, type_):
-        type_ = get_exact_type_from_node(node)
-        node._metadata["type"] = type_
-        self.visit(node.value, None)
-
-    def visit_BinOp(self, node, type_):
-        if type_ is None:
-            type_ = get_common_types(node.left, node.right)
-            if len(type_) == 1:
-                type_ = type_.pop()
-        node._metadata["type"] = type_
-
-        self.visit(node.left, type_)
-        self.visit(node.right, type_)
-
-    def visit_BoolOp(self, node, type_):
-        for value in node.values:
-            self.visit(value)
-
-    def visit_Call(self, node, type_):
-        call_type = get_exact_type_from_node(node.func)
-        node_type = type_ or call_type.fetch_call_return(node)
-        node._metadata["type"] = node_type
-        self.visit(node.func)
-
-        if isinstance(call_type, ContractFunctionT):
-            # function calls
-            if call_type.is_internal:
-                self.func.called_functions.add(call_type)
-            for arg, typ in zip(node.args, call_type.argument_types):
-                self.visit(arg, typ)
-            for kwarg in node.keywords:
-                # We should only see special kwargs
-                self.visit(kwarg.value, call_type.call_site_kwargs[kwarg.arg].typ)
-
-        elif is_type_t(call_type, EventT):
-            # events have no kwargs
-            for arg, typ in zip(node.args, list(call_type.typedef.arguments.values())):
-                self.visit(arg, typ)
-        elif is_type_t(call_type, StructT):
-            # struct ctors
-            # ctors have no kwargs
-            for value, arg_type in zip(
-                node.args[0].values, list(call_type.typedef.members.values())
-            ):
-                self.visit(value, arg_type)
-        elif isinstance(call_type, MemberFunctionT):
-            assert len(node.args) == len(call_type.arg_types)
-            for arg, arg_type in zip(node.args, call_type.arg_types):
-                self.visit(arg, arg_type)
-        else:
-            # builtin functions
-            arg_types = call_type.infer_arg_types(node)
-            for arg, arg_type in zip(node.args, arg_types):
-                self.visit(arg, arg_type)
-            kwarg_types = call_type.infer_kwarg_types(node)
-            for kwarg in node.keywords:
-                self.visit(kwarg.value, kwarg_types[kwarg.arg])
-
-    def visit_Compare(self, node, type_):
-        if isinstance(node.op, (vy_ast.In, vy_ast.NotIn)):
-            if isinstance(node.right, vy_ast.List):
-                type_ = get_common_types(node.left, *node.right.elements).pop()
-                self.visit(node.left, type_)
-                rlen = len(node.right.elements)
-                self.visit(node.right, SArrayT(type_, rlen))
-            else:
-                type_ = get_exact_type_from_node(node.right)
-                self.visit(node.right, type_)
-                if isinstance(type_, EnumT):
-                    self.visit(node.left, type_)
-                else:
-                    # array membership
-                    self.visit(node.left, type_.value_type)
-        else:
-            type_ = get_common_types(node.left, node.right).pop()
-            self.visit(node.left, type_)
-            self.visit(node.right, type_)
-
-    def visit_Constant(self, node, type_):
-        if type_ is None:
-            possible_types = get_possible_types_from_node(node)
-            if len(possible_types) == 1:
-                type_ = possible_types.pop()
-        node._metadata["type"] = type_
-
-    def visit_Dict(self, node, type_):
-        node._metadata["type"] = type_
-
-    def visit_Index(self, node, type_):
-        self.visit(node.value, type_)
-
-    def visit_List(self, node, type_):
-        if type_ is None:
-            type_ = get_possible_types_from_node(node)
-            # CMC 2022-04-14 this seems sus. try to only annotate
-            # if get_possible_types only returns 1 type
-            if len(type_) >= 1:
-                type_ = type_.pop()
-        node._metadata["type"] = type_
-        for element in node.elements:
-            self.visit(element, type_.value_type)
-
-    def visit_Name(self, node, type_):
-        if isinstance(type_, TYPE_T):
-            node._metadata["type"] = type_
-        else:
-            node._metadata["type"] = get_exact_type_from_node(node)
-
-    def visit_Subscript(self, node, type_):
-        node._metadata["type"] = type_
-
-        if isinstance(type_, TYPE_T):
-            # don't recurse; can't annotate AST children of type definition
-            return
-
-        if isinstance(node.value, vy_ast.List):
-            possible_base_types = get_possible_types_from_node(node.value)
-
-            if len(possible_base_types) == 1:
-                base_type = possible_base_types.pop()
-
-            elif type_ is not None and len(possible_base_types) > 1:
-                for possible_type in possible_base_types:
-                    if type_.compare_type(possible_type.value_type):
-                        base_type = possible_type
-                        break
-                else:
-                    # this should have been caught in
-                    # `get_possible_types_from_node` but wasn't.
-                    raise TypeCheckFailure(f"Expected {type_} but it is not a possible type", node)
-
-        else:
-            base_type = get_exact_type_from_node(node.value)
-
-        # get the correct type for the index, it might
-        # not be base_type.key_type
-        index_types = get_possible_types_from_node(node.slice.value)
-        index_type = index_types.pop()
-
-        self.visit(node.slice, index_type)
-        self.visit(node.value, base_type)
-
-    def visit_Tuple(self, node, type_):
-        node._metadata["type"] = type_
-
-        if isinstance(type_, TYPE_T):
-            # don't recurse; can't annotate AST children of type definition
-            return
-
-        for element, subtype in zip(node.elements, type_.member_types):
-            self.visit(element, subtype)
-
-    def visit_UnaryOp(self, node, type_):
-        if type_ is None:
-            type_ = get_possible_types_from_node(node.operand)
-            if len(type_) == 1:
-                type_ = type_.pop()
-        node._metadata["type"] = type_
-        self.visit(node.operand, type_)
-
-    def visit_IfExp(self, node, type_):
-        if type_ is None:
-            ts = get_common_types(node.body, node.orelse)
-            if len(ts) == 1:
-                type_ = ts.pop()
-
-        node._metadata["type"] = type_
-        self.visit(node.test, BoolT())
-        self.visit(node.body, type_)
-        self.visit(node.orelse, type_)
diff --git a/vyper/semantics/analysis/common.py b/vyper/semantics/analysis/common.py
index 193d1892e1..507eb0a570 100644
--- a/vyper/semantics/analysis/common.py
+++ b/vyper/semantics/analysis/common.py
@@ -10,10 +10,17 @@ class VyperNodeVisitorBase:
     def visit(self, node, *args):
         if isinstance(node, self.ignored_types):
             return
+
+        # iterate over the MRO until we find a matching visitor function
+        # this lets us use a single function to broadly target several
+        # node types with a shared parent
+        for class_ in node.__class__.mro():
+            ast_type = class_.__name__
+            visitor_fn = getattr(self, f"visit_{ast_type}", None)
+            if visitor_fn:
+                return visitor_fn(node, *args)
+
         node_type = type(node).__name__
-        visitor_fn = getattr(self, f"visit_{node_type}", None)
-        if visitor_fn is None:
-            raise StructureException(
-                f"Unsupported syntax for {self.scope_name} namespace: {node_type}", node
-            )
-        visitor_fn(node, *args)
+        raise StructureException(
+            f"Unsupported syntax for {self.scope_name} namespace: {node_type}", node
+        )
diff --git a/vyper/semantics/analysis/local.py b/vyper/semantics/analysis/local.py
index b391b33953..647f01c299 100644
--- a/vyper/semantics/analysis/local.py
+++ b/vyper/semantics/analysis/local.py
@@ -14,11 +14,11 @@
     NonPayableViolation,
     StateAccessViolation,
     StructureException,
+    TypeCheckFailure,
     TypeMismatch,
     VariableDeclarationException,
     VyperException,
 )
-from vyper.semantics.analysis.annotation import StatementAnnotationVisitor
 from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.common import VyperNodeVisitorBase
 from vyper.semantics.analysis.utils import (
@@ -34,9 +34,11 @@
 from vyper.semantics.environment import CONSTANT_ENVIRONMENT_VARS, MUTABLE_ENVIRONMENT_VARS
 from vyper.semantics.namespace import get_namespace
 from vyper.semantics.types import (
+    TYPE_T,
     AddressT,
     BoolT,
     DArrayT,
+    EnumT,
     EventT,
     HashMapT,
     IntegerT,
@@ -44,6 +46,8 @@
     StringT,
     StructT,
     TupleT,
+    VyperType,
+    _BytestringT,
     is_type_t,
 )
 from vyper.semantics.types.function import ContractFunctionT, MemberFunctionT, StateMutability
@@ -117,20 +121,8 @@ def _check_iterator_modification(
     return None
 
 
-def _validate_revert_reason(msg_node: vy_ast.VyperNode) -> None:
-    if msg_node:
-        if isinstance(msg_node, vy_ast.Str):
-            if not msg_node.value.strip():
-                raise StructureException("Reason string cannot be empty", msg_node)
-        elif not (isinstance(msg_node, vy_ast.Name) and msg_node.id == "UNREACHABLE"):
-            try:
-                validate_expected_type(msg_node, StringT(1024))
-            except TypeMismatch as e:
-                raise InvalidType("revert reason must fit within String[1024]") from e
-
-
-def _validate_address_code_attribute(node: vy_ast.Attribute) -> None:
-    value_type = get_exact_type_from_node(node.value)
+# helpers
+def _validate_address_code(node: vy_ast.Attribute, value_type: VyperType) -> None:
     if isinstance(value_type, AddressT) and node.attr == "code":
         # Validate `slice(<address>.code, start, length)` where `length` is constant
         parent = node.get_ancestor()
@@ -139,6 +131,7 @@ def _validate_address_code_attribute(node: vy_ast.Attribute) -> None:
             ok_args = len(parent.args) == 3 and isinstance(parent.args[2], vy_ast.Int)
             if ok_func and ok_args:
                 return
+
         raise StructureException(
             "(address).code is only allowed inside of a slice function with a constant length", node
         )
@@ -160,8 +153,30 @@ def _validate_msg_data_attribute(node: vy_ast.Attribute) -> None:
                 )
 
 
+def _validate_msg_value_access(node: vy_ast.Attribute) -> None:
+    if isinstance(node.value, vy_ast.Name) and node.attr == "value" and node.value.id == "msg":
+        raise NonPayableViolation("msg.value is not allowed in non-payable functions", node)
+
+
+def _validate_pure_access(node: vy_ast.Attribute, typ: VyperType) -> None:
+    env_vars = set(CONSTANT_ENVIRONMENT_VARS.keys()) | set(MUTABLE_ENVIRONMENT_VARS.keys())
+    if isinstance(node.value, vy_ast.Name) and node.value.id in env_vars:
+        if isinstance(typ, ContractFunctionT) and typ.mutability == StateMutability.PURE:
+            return
+
+        raise StateAccessViolation(
+            "not allowed to query contract or environment variables in pure functions", node
+        )
+
+
+def _validate_self_reference(node: vy_ast.Name) -> None:
+    # CMC 2023-10-19 this detector seems sus, things like `a.b(self)` could slip through
+    if node.id == "self" and not isinstance(node.get_ancestor(), vy_ast.Attribute):
+        raise StateAccessViolation("not allowed to query self in pure functions", node)
+
+
 class FunctionNodeVisitor(VyperNodeVisitorBase):
-    ignored_types = (vy_ast.Constant, vy_ast.Pass)
+    ignored_types = (vy_ast.Pass,)
     scope_name = "function"
 
     def __init__(
@@ -171,8 +186,7 @@ def __init__(
         self.fn_node = fn_node
         self.namespace = namespace
         self.func = fn_node._metadata["type"]
-        self.annotation_visitor = StatementAnnotationVisitor(fn_node, namespace)
-        self.expr_visitor = _LocalExpressionVisitor()
+        self.expr_visitor = _ExprVisitor(self.func)
 
         # allow internal function params to be mutable
         location, is_immutable = (
@@ -189,44 +203,13 @@ def __init__(
                     f"Missing or unmatched return statements in function '{fn_node.name}'", fn_node
                 )
 
-        if self.func.mutability == StateMutability.PURE:
-            node_list = fn_node.get_descendants(
-                vy_ast.Attribute,
-                {
-                    "value.id": set(CONSTANT_ENVIRONMENT_VARS.keys()).union(
-                        set(MUTABLE_ENVIRONMENT_VARS.keys())
-                    )
-                },
-            )
-
-            # Add references to `self` as standalone address
-            self_references = fn_node.get_descendants(vy_ast.Name, {"id": "self"})
-            standalone_self = [
-                n for n in self_references if not isinstance(n.get_ancestor(), vy_ast.Attribute)
-            ]
-            node_list.extend(standalone_self)  # type: ignore
-
-            for node in node_list:
-                t = node._metadata.get("type")
-                if isinstance(t, ContractFunctionT) and t.mutability == StateMutability.PURE:
-                    # allowed
-                    continue
-                raise StateAccessViolation(
-                    "not allowed to query contract or environment variables in pure functions",
-                    node_list[0],
-                )
-        if self.func.mutability is not StateMutability.PAYABLE:
-            node_list = fn_node.get_descendants(
-                vy_ast.Attribute, {"value.id": "msg", "attr": "value"}
-            )
-            if node_list:
-                raise NonPayableViolation(
-                    "msg.value is not allowed in non-payable functions", node_list[0]
-                )
+        # visit default args
+        assert self.func.n_keyword_args == len(fn_node.args.defaults)
+        for kwarg in self.func.keyword_args:
+            self.expr_visitor.visit(kwarg.default_value, kwarg.typ)
 
     def visit(self, node):
         super().visit(node)
-        self.annotation_visitor.visit(node)
 
     def visit_AnnAssign(self, node):
         name = node.get("target.id")
@@ -238,16 +221,42 @@ def visit_AnnAssign(self, node):
                 "Memory variables must be declared with an initial value", node
             )
 
-        type_ = type_from_annotation(node.annotation, DataLocation.MEMORY)
-        validate_expected_type(node.value, type_)
+        typ = type_from_annotation(node.annotation, DataLocation.MEMORY)
+        validate_expected_type(node.value, typ)
 
         try:
-            self.namespace[name] = VarInfo(type_, location=DataLocation.MEMORY)
+            self.namespace[name] = VarInfo(typ, location=DataLocation.MEMORY)
         except VyperException as exc:
             raise exc.with_annotation(node) from None
-        self.expr_visitor.visit(node.value)
 
-    def visit_Assign(self, node):
+        self.expr_visitor.visit(node.target, typ)
+        self.expr_visitor.visit(node.value, typ)
+
+    def _validate_revert_reason(self, msg_node: vy_ast.VyperNode) -> None:
+        if isinstance(msg_node, vy_ast.Str):
+            if not msg_node.value.strip():
+                raise StructureException("Reason string cannot be empty", msg_node)
+            self.expr_visitor.visit(msg_node, get_exact_type_from_node(msg_node))
+        elif not (isinstance(msg_node, vy_ast.Name) and msg_node.id == "UNREACHABLE"):
+            try:
+                validate_expected_type(msg_node, StringT(1024))
+            except TypeMismatch as e:
+                raise InvalidType("revert reason must fit within String[1024]") from e
+            self.expr_visitor.visit(msg_node, get_exact_type_from_node(msg_node))
+        # CMC 2023-10-19 nice to have: tag UNREACHABLE nodes with a special type
+
+    def visit_Assert(self, node):
+        if node.msg:
+            self._validate_revert_reason(node.msg)
+
+        try:
+            validate_expected_type(node.test, BoolT())
+        except InvalidType:
+            raise InvalidType("Assertion test value must be a boolean", node.test)
+        self.expr_visitor.visit(node.test, BoolT())
+
+    # repeated code for Assign and AugAssign
+    def _assign_helper(self, node):
         if isinstance(node.value, vy_ast.Tuple):
             raise StructureException("Right-hand side of assignment cannot be a tuple", node.value)
 
@@ -260,81 +269,71 @@ def visit_Assign(self, node):
         validate_expected_type(node.value, target.typ)
         target.validate_modification(node, self.func.mutability)
 
-        self.expr_visitor.visit(node.value)
-        self.expr_visitor.visit(node.target)
+        self.expr_visitor.visit(node.value, target.typ)
+        self.expr_visitor.visit(node.target, target.typ)
 
-    def visit_AugAssign(self, node):
-        if isinstance(node.value, vy_ast.Tuple):
-            raise StructureException("Right-hand side of assignment cannot be a tuple", node.value)
-
-        lhs_info = get_expr_info(node.target)
-
-        validate_expected_type(node.value, lhs_info.typ)
-        lhs_info.validate_modification(node, self.func.mutability)
-
-        self.expr_visitor.visit(node.value)
-        self.expr_visitor.visit(node.target)
-
-    def visit_Raise(self, node):
-        if node.exc:
-            _validate_revert_reason(node.exc)
-            self.expr_visitor.visit(node.exc)
+    def visit_Assign(self, node):
+        self._assign_helper(node)
 
-    def visit_Assert(self, node):
-        if node.msg:
-            _validate_revert_reason(node.msg)
-            self.expr_visitor.visit(node.msg)
+    def visit_AugAssign(self, node):
+        self._assign_helper(node)
 
-        try:
-            validate_expected_type(node.test, BoolT())
-        except InvalidType:
-            raise InvalidType("Assertion test value must be a boolean", node.test)
-        self.expr_visitor.visit(node.test)
+    def visit_Break(self, node):
+        for_node = node.get_ancestor(vy_ast.For)
+        if for_node is None:
+            raise StructureException("`break` must be enclosed in a `for` loop", node)
 
     def visit_Continue(self, node):
+        # TODO: use context/state instead of ast search
         for_node = node.get_ancestor(vy_ast.For)
         if for_node is None:
             raise StructureException("`continue` must be enclosed in a `for` loop", node)
 
-    def visit_Break(self, node):
-        for_node = node.get_ancestor(vy_ast.For)
-        if for_node is None:
-            raise StructureException("`break` must be enclosed in a `for` loop", node)
+    def visit_Expr(self, node):
+        if not isinstance(node.value, vy_ast.Call):
+            raise StructureException("Expressions without assignment are disallowed", node)
 
-    def visit_Return(self, node):
-        values = node.value
-        if values is None:
-            if self.func.return_type:
-                raise FunctionDeclarationException("Return statement is missing a value", node)
-            return
-        elif self.func.return_type is None:
-            raise FunctionDeclarationException("Function does not return any values", node)
+        fn_type = get_exact_type_from_node(node.value.func)
+        if is_type_t(fn_type, EventT):
+            raise StructureException("To call an event you must use the `log` statement", node)
 
-        if isinstance(values, vy_ast.Tuple):
-            values = values.elements
-            if not isinstance(self.func.return_type, TupleT):
-                raise FunctionDeclarationException("Function only returns a single value", node)
-            if self.func.return_type.length != len(values):
-                raise FunctionDeclarationException(
-                    f"Incorrect number of return values: "
-                    f"expected {self.func.return_type.length}, got {len(values)}",
+        if is_type_t(fn_type, StructT):
+            raise StructureException("Struct creation without assignment is disallowed", node)
+
+        if isinstance(fn_type, ContractFunctionT):
+            if (
+                fn_type.mutability > StateMutability.VIEW
+                and self.func.mutability <= StateMutability.VIEW
+            ):
+                raise StateAccessViolation(
+                    f"Cannot call a mutating function from a {self.func.mutability.value} function",
                     node,
                 )
-            for given, expected in zip(values, self.func.return_type.member_types):
-                validate_expected_type(given, expected)
-        else:
-            validate_expected_type(values, self.func.return_type)
-        self.expr_visitor.visit(node.value)
 
-    def visit_If(self, node):
-        validate_expected_type(node.test, BoolT())
-        self.expr_visitor.visit(node.test)
-        with self.namespace.enter_scope():
-            for n in node.body:
-                self.visit(n)
-        with self.namespace.enter_scope():
-            for n in node.orelse:
-                self.visit(n)
+            if (
+                self.func.mutability == StateMutability.PURE
+                and fn_type.mutability != StateMutability.PURE
+            ):
+                raise StateAccessViolation(
+                    "Cannot call non-pure function from a pure function", node
+                )
+
+        if isinstance(fn_type, MemberFunctionT) and fn_type.is_modifying:
+            # it's a dotted function call like dynarray.pop()
+            expr_info = get_expr_info(node.value.func.value)
+            expr_info.validate_modification(node, self.func.mutability)
+
+        # NOTE: fetch_call_return validates call args.
+        return_value = fn_type.fetch_call_return(node.value)
+        if (
+            return_value
+            and not isinstance(fn_type, MemberFunctionT)
+            and not isinstance(fn_type, ContractFunctionT)
+        ):
+            raise StructureException(
+                f"Function '{fn_type._id}' cannot be called without assigning the result", node
+            )
+        self.expr_visitor.visit(node.value, fn_type)
 
     def visit_For(self, node):
         if isinstance(node.iter, vy_ast.Subscript):
@@ -463,19 +462,18 @@ def visit_For(self, node):
                             f"which potentially modifies iterated storage variable '{iter_name}'",
                             call_node,
                         )
-        self.expr_visitor.visit(node.iter)
 
         if not isinstance(node.target, vy_ast.Name):
             raise StructureException("Invalid syntax for loop iterator", node.target)
 
         for_loop_exceptions = []
         iter_name = node.target.id
-        for type_ in type_list:
+        for possible_target_type in type_list:
             # type check the for loop body using each possible type for iterator value
 
             with self.namespace.enter_scope():
                 try:
-                    self.namespace[iter_name] = VarInfo(type_, is_constant=True)
+                    self.namespace[iter_name] = VarInfo(possible_target_type, is_constant=True)
                 except VyperException as exc:
                     raise exc.with_annotation(node) from None
 
@@ -486,17 +484,27 @@ def visit_For(self, node):
                 except (TypeMismatch, InvalidOperation) as exc:
                     for_loop_exceptions.append(exc)
                 else:
-                    # type information is applied directly here because the
-                    # scope is closed prior to the call to
-                    # `StatementAnnotationVisitor`
-                    node.target._metadata["type"] = type_
-
-                    # success -- bail out instead of error handling.
+                    self.expr_visitor.visit(node.target, possible_target_type)
+
+                    if isinstance(node.iter, (vy_ast.Name, vy_ast.Attribute)):
+                        iter_type = get_exact_type_from_node(node.iter)
+                        # note CMC 2023-10-23: slightly redundant with how type_list is computed
+                        validate_expected_type(node.target, iter_type.value_type)
+                        self.expr_visitor.visit(node.iter, iter_type)
+                    if isinstance(node.iter, vy_ast.List):
+                        len_ = len(node.iter.elements)
+                        self.expr_visitor.visit(node.iter, SArrayT(possible_target_type, len_))
+                    if isinstance(node.iter, vy_ast.Call) and node.iter.func.id == "range":
+                        for a in node.iter.args:
+                            self.expr_visitor.visit(a, possible_target_type)
+                        for a in node.iter.keywords:
+                            if a.arg == "bound":
+                                self.expr_visitor.visit(a.value, possible_target_type)
+
+                    # success -- do not enter error handling section
                     return
 
-        # if we have gotten here, there was an error for
-        # every type tried for the iterator
-
+        # failed to find a good type. bail out
         if len(set(str(i) for i in for_loop_exceptions)) == 1:
             # if every attempt at type checking raised the same exception
             raise for_loop_exceptions[0]
@@ -510,56 +518,20 @@ def visit_For(self, node):
             "but type checking fails with all possible types:",
             node,
             *(
-                (f"Casting '{iter_name}' as {type_}: {exc.message}", exc.annotations[0])
-                for type_, exc in zip(type_list, for_loop_exceptions)
+                (f"Casting '{iter_name}' as {typ}: {exc.message}", exc.annotations[0])
+                for typ, exc in zip(type_list, for_loop_exceptions)
             ),
         )
 
-    def visit_Expr(self, node):
-        if not isinstance(node.value, vy_ast.Call):
-            raise StructureException("Expressions without assignment are disallowed", node)
-
-        fn_type = get_exact_type_from_node(node.value.func)
-        if is_type_t(fn_type, EventT):
-            raise StructureException("To call an event you must use the `log` statement", node)
-
-        if is_type_t(fn_type, StructT):
-            raise StructureException("Struct creation without assignment is disallowed", node)
-
-        if isinstance(fn_type, ContractFunctionT):
-            if (
-                fn_type.mutability > StateMutability.VIEW
-                and self.func.mutability <= StateMutability.VIEW
-            ):
-                raise StateAccessViolation(
-                    f"Cannot call a mutating function from a {self.func.mutability.value} function",
-                    node,
-                )
-
-            if (
-                self.func.mutability == StateMutability.PURE
-                and fn_type.mutability != StateMutability.PURE
-            ):
-                raise StateAccessViolation(
-                    "Cannot call non-pure function from a pure function", node
-                )
-
-        if isinstance(fn_type, MemberFunctionT) and fn_type.is_modifying:
-            # it's a dotted function call like dynarray.pop()
-            expr_info = get_expr_info(node.value.func.value)
-            expr_info.validate_modification(node, self.func.mutability)
-
-        # NOTE: fetch_call_return validates call args.
-        return_value = fn_type.fetch_call_return(node.value)
-        if (
-            return_value
-            and not isinstance(fn_type, MemberFunctionT)
-            and not isinstance(fn_type, ContractFunctionT)
-        ):
-            raise StructureException(
-                f"Function '{fn_type._id}' cannot be called without assigning the result", node
-            )
-        self.expr_visitor.visit(node.value)
+    def visit_If(self, node):
+        validate_expected_type(node.test, BoolT())
+        self.expr_visitor.visit(node.test, BoolT())
+        with self.namespace.enter_scope():
+            for n in node.body:
+                self.visit(n)
+        with self.namespace.enter_scope():
+            for n in node.orelse:
+                self.visit(n)
 
     def visit_Log(self, node):
         if not isinstance(node.value, vy_ast.Call):
@@ -572,62 +544,249 @@ def visit_Log(self, node):
                 f"Cannot emit logs from {self.func.mutability.value.lower()} functions", node
             )
         f.fetch_call_return(node.value)
-        self.expr_visitor.visit(node.value)
+        node._metadata["type"] = f.typedef
+        self.expr_visitor.visit(node.value, f.typedef)
+
+    def visit_Raise(self, node):
+        if node.exc:
+            self._validate_revert_reason(node.exc)
 
+    def visit_Return(self, node):
+        values = node.value
+        if values is None:
+            if self.func.return_type:
+                raise FunctionDeclarationException("Return statement is missing a value", node)
+            return
+        elif self.func.return_type is None:
+            raise FunctionDeclarationException("Function does not return any values", node)
 
-class _LocalExpressionVisitor(VyperNodeVisitorBase):
-    ignored_types = (vy_ast.Constant, vy_ast.Name)
+        if isinstance(values, vy_ast.Tuple):
+            values = values.elements
+            if not isinstance(self.func.return_type, TupleT):
+                raise FunctionDeclarationException("Function only returns a single value", node)
+            if self.func.return_type.length != len(values):
+                raise FunctionDeclarationException(
+                    f"Incorrect number of return values: "
+                    f"expected {self.func.return_type.length}, got {len(values)}",
+                    node,
+                )
+            for given, expected in zip(values, self.func.return_type.member_types):
+                validate_expected_type(given, expected)
+        else:
+            validate_expected_type(values, self.func.return_type)
+        self.expr_visitor.visit(node.value, self.func.return_type)
+
+
+class _ExprVisitor(VyperNodeVisitorBase):
     scope_name = "function"
 
-    def visit_Attribute(self, node: vy_ast.Attribute) -> None:
-        self.visit(node.value)
+    def __init__(self, fn_node: ContractFunctionT):
+        self.func = fn_node
+
+    def visit(self, node, typ):
+        # recurse and typecheck in case we are being fed the wrong type for
+        # some reason. note that `validate_expected_type` is unnecessary
+        # for nodes that already call `get_exact_type_from_node` and
+        # `get_possible_types_from_node` because `validate_expected_type`
+        # would be calling the same function again.
+        # CMC 2023-06-27 would be cleanest to call validate_expected_type()
+        # before recursing but maybe needs some refactoring before that
+        # can happen.
+        super().visit(node, typ)
+
+        # annotate
+        node._metadata["type"] = typ
+
+    def visit_Attribute(self, node: vy_ast.Attribute, typ: VyperType) -> None:
         _validate_msg_data_attribute(node)
-        _validate_address_code_attribute(node)
-
-    def visit_BinOp(self, node: vy_ast.BinOp) -> None:
-        self.visit(node.left)
-        self.visit(node.right)
-
-    def visit_BoolOp(self, node: vy_ast.BoolOp) -> None:
-        for value in node.values:  # type: ignore[attr-defined]
-            self.visit(value)
-
-    def visit_Call(self, node: vy_ast.Call) -> None:
-        self.visit(node.func)
-        for arg in node.args:
-            self.visit(arg)
-        for kwarg in node.keywords:
-            self.visit(kwarg.value)
-
-    def visit_Compare(self, node: vy_ast.Compare) -> None:
-        self.visit(node.left)  # type: ignore[attr-defined]
-        self.visit(node.right)  # type: ignore[attr-defined]
-
-    def visit_Dict(self, node: vy_ast.Dict) -> None:
-        for key in node.keys:
-            self.visit(key)
+
+        # CMC 2023-10-19 TODO generalize this to mutability check on every node.
+        # something like,
+        # if self.func.mutability < expr_info.mutability:
+        #    raise ...
+
+        if self.func.mutability != StateMutability.PAYABLE:
+            _validate_msg_value_access(node)
+
+        if self.func.mutability == StateMutability.PURE:
+            _validate_pure_access(node, typ)
+
+        value_type = get_exact_type_from_node(node.value)
+        _validate_address_code(node, value_type)
+
+        self.visit(node.value, value_type)
+
+    def visit_BinOp(self, node: vy_ast.BinOp, typ: VyperType) -> None:
+        validate_expected_type(node.left, typ)
+        self.visit(node.left, typ)
+
+        rtyp = typ
+        if isinstance(node.op, (vy_ast.LShift, vy_ast.RShift)):
+            rtyp = get_possible_types_from_node(node.right).pop()
+
+        validate_expected_type(node.right, rtyp)
+
+        self.visit(node.right, rtyp)
+
+    def visit_BoolOp(self, node: vy_ast.BoolOp, typ: VyperType) -> None:
+        assert typ == BoolT()  # sanity check
         for value in node.values:
-            self.visit(value)
+            validate_expected_type(value, BoolT())
+            self.visit(value, BoolT())
+
+    def visit_Call(self, node: vy_ast.Call, typ: VyperType) -> None:
+        call_type = get_exact_type_from_node(node.func)
+        # except for builtin functions, `get_exact_type_from_node`
+        # already calls `validate_expected_type` on the call args
+        # and kwargs via `call_type.fetch_call_return`
+        self.visit(node.func, call_type)
+
+        if isinstance(call_type, ContractFunctionT):
+            # function calls
+            if call_type.is_internal:
+                self.func.called_functions.add(call_type)
+            for arg, typ in zip(node.args, call_type.argument_types):
+                self.visit(arg, typ)
+            for kwarg in node.keywords:
+                # We should only see special kwargs
+                typ = call_type.call_site_kwargs[kwarg.arg].typ
+                self.visit(kwarg.value, typ)
+
+        elif is_type_t(call_type, EventT):
+            # events have no kwargs
+            expected_types = call_type.typedef.arguments.values()
+            for arg, typ in zip(node.args, expected_types):
+                self.visit(arg, typ)
+        elif is_type_t(call_type, StructT):
+            # struct ctors
+            # ctors have no kwargs
+            expected_types = call_type.typedef.members.values()
+            for value, arg_type in zip(node.args[0].values, expected_types):
+                self.visit(value, arg_type)
+        elif isinstance(call_type, MemberFunctionT):
+            assert len(node.args) == len(call_type.arg_types)
+            for arg, arg_type in zip(node.args, call_type.arg_types):
+                self.visit(arg, arg_type)
+        else:
+            # builtin functions
+            arg_types = call_type.infer_arg_types(node)
+            # `infer_arg_types` already calls `validate_expected_type`
+            for arg, arg_type in zip(node.args, arg_types):
+                self.visit(arg, arg_type)
+            kwarg_types = call_type.infer_kwarg_types(node)
+            for kwarg in node.keywords:
+                self.visit(kwarg.value, kwarg_types[kwarg.arg])
+
+    def visit_Compare(self, node: vy_ast.Compare, typ: VyperType) -> None:
+        if isinstance(node.op, (vy_ast.In, vy_ast.NotIn)):
+            # membership in list literal - `x in [a, b, c]`
+            # needle: ltyp, haystack: rtyp
+            if isinstance(node.right, vy_ast.List):
+                ltyp = get_common_types(node.left, *node.right.elements).pop()
+
+                rlen = len(node.right.elements)
+                rtyp = SArrayT(ltyp, rlen)
+                validate_expected_type(node.right, rtyp)
+            else:
+                rtyp = get_exact_type_from_node(node.right)
+                if isinstance(rtyp, EnumT):
+                    # enum membership - `some_enum in other_enum`
+                    ltyp = rtyp
+                else:
+                    # array membership - `x in my_list_variable`
+                    assert isinstance(rtyp, (SArrayT, DArrayT))
+                    ltyp = rtyp.value_type
 
-    def visit_Index(self, node: vy_ast.Index) -> None:
-        self.visit(node.value)
+            validate_expected_type(node.left, ltyp)
 
-    def visit_List(self, node: vy_ast.List) -> None:
-        for element in node.elements:
-            self.visit(element)
+            self.visit(node.left, ltyp)
+            self.visit(node.right, rtyp)
+
+        else:
+            # ex. a < b
+            cmp_typ = get_common_types(node.left, node.right).pop()
+            if isinstance(cmp_typ, _BytestringT):
+                # for bytestrings, get_common_types automatically downcasts
+                # to the smaller common type - that will annotate with the
+                # wrong type, instead use get_exact_type_from_node (which
+                # resolves to the right type for bytestrings anyways).
+                ltyp = get_exact_type_from_node(node.left)
+                rtyp = get_exact_type_from_node(node.right)
+            else:
+                ltyp = rtyp = cmp_typ
+                validate_expected_type(node.left, ltyp)
+                validate_expected_type(node.right, rtyp)
+
+            self.visit(node.left, ltyp)
+            self.visit(node.right, rtyp)
+
+    def visit_Constant(self, node: vy_ast.Constant, typ: VyperType) -> None:
+        validate_expected_type(node, typ)
 
-    def visit_Subscript(self, node: vy_ast.Subscript) -> None:
-        self.visit(node.value)
-        self.visit(node.slice)
+    def visit_Index(self, node: vy_ast.Index, typ: VyperType) -> None:
+        validate_expected_type(node.value, typ)
+        self.visit(node.value, typ)
 
-    def visit_Tuple(self, node: vy_ast.Tuple) -> None:
+    def visit_List(self, node: vy_ast.List, typ: VyperType) -> None:
+        assert isinstance(typ, (SArrayT, DArrayT))
         for element in node.elements:
-            self.visit(element)
+            validate_expected_type(element, typ.value_type)
+            self.visit(element, typ.value_type)
 
-    def visit_UnaryOp(self, node: vy_ast.UnaryOp) -> None:
-        self.visit(node.operand)  # type: ignore[attr-defined]
+    def visit_Name(self, node: vy_ast.Name, typ: VyperType) -> None:
+        if self.func.mutability == StateMutability.PURE:
+            _validate_self_reference(node)
+
+        if not isinstance(typ, TYPE_T):
+            validate_expected_type(node, typ)
+
+    def visit_Subscript(self, node: vy_ast.Subscript, typ: VyperType) -> None:
+        if isinstance(typ, TYPE_T):
+            # don't recurse; can't annotate AST children of type definition
+            return
+
+        if isinstance(node.value, vy_ast.List):
+            possible_base_types = get_possible_types_from_node(node.value)
+
+            for possible_type in possible_base_types:
+                if typ.compare_type(possible_type.value_type):
+                    base_type = possible_type
+                    break
+            else:
+                # this should have been caught in
+                # `get_possible_types_from_node` but wasn't.
+                raise TypeCheckFailure(f"Expected {typ} but it is not a possible type", node)
+
+        else:
+            base_type = get_exact_type_from_node(node.value)
+
+        # get the correct type for the index, it might
+        # not be exactly base_type.key_type
+        # note: index_type is validated in types_from_Subscript
+        index_types = get_possible_types_from_node(node.slice.value)
+        index_type = index_types.pop()
+
+        self.visit(node.slice, index_type)
+        self.visit(node.value, base_type)
+
+    def visit_Tuple(self, node: vy_ast.Tuple, typ: VyperType) -> None:
+        if isinstance(typ, TYPE_T):
+            # don't recurse; can't annotate AST children of type definition
+            return
+
+        assert isinstance(typ, TupleT)
+        for element, subtype in zip(node.elements, typ.member_types):
+            validate_expected_type(element, subtype)
+            self.visit(element, subtype)
 
-    def visit_IfExp(self, node: vy_ast.IfExp) -> None:
-        self.visit(node.test)
-        self.visit(node.body)
-        self.visit(node.orelse)
+    def visit_UnaryOp(self, node: vy_ast.UnaryOp, typ: VyperType) -> None:
+        validate_expected_type(node.operand, typ)
+        self.visit(node.operand, typ)
+
+    def visit_IfExp(self, node: vy_ast.IfExp, typ: VyperType) -> None:
+        validate_expected_type(node.test, BoolT())
+        self.visit(node.test, BoolT())
+        validate_expected_type(node.body, typ)
+        self.visit(node.body, typ)
+        validate_expected_type(node.orelse, typ)
+        self.visit(node.orelse, typ)
diff --git a/vyper/semantics/analysis/utils.py b/vyper/semantics/analysis/utils.py
index 4f911764e0..afa6b56838 100644
--- a/vyper/semantics/analysis/utils.py
+++ b/vyper/semantics/analysis/utils.py
@@ -312,10 +312,17 @@ def types_from_Constant(self, node):
     def types_from_List(self, node):
         # literal array
         if _is_empty_list(node):
-            # empty list literal `[]`
             ret = []
-            # subtype can be anything
-            for t in types.PRIMITIVE_TYPES.values():
+
+            if len(node.elements) > 0:
+                # empty nested list literals `[[], []]`
+                subtypes = self.get_possible_types_from_node(node.elements[0])
+            else:
+                # empty list literal `[]`
+                # subtype can be anything
+                subtypes = types.PRIMITIVE_TYPES.values()
+
+            for t in subtypes:
                 # 1 is minimum possible length for dynarray,
                 # can be assigned to anything
                 if isinstance(t, VyperType):

From ed0b1e0ac8ddb47019efcff4b692ff6470fc6a04 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Fri, 20 Oct 2023 07:52:04 -0700
Subject: [PATCH 154/161] fix: add missing test for memory allocation overflow
 (#3650)

should have been added in 68da04b2e9e0 but the file was not committed
---
 tests/parser/features/test_memory_alloc.py | 16 ++++++++++++++++
 1 file changed, 16 insertions(+)
 create mode 100644 tests/parser/features/test_memory_alloc.py

diff --git a/tests/parser/features/test_memory_alloc.py b/tests/parser/features/test_memory_alloc.py
new file mode 100644
index 0000000000..ee6d15c67c
--- /dev/null
+++ b/tests/parser/features/test_memory_alloc.py
@@ -0,0 +1,16 @@
+import pytest
+
+from vyper.compiler import compile_code
+from vyper.exceptions import MemoryAllocationException
+
+
+def test_memory_overflow():
+    code = """
+@external
+def zzz(x: DynArray[uint256, 2**59]):  # 2**64 / 32 bytes per word == 2**59
+    y: uint256[7] = [0,0,0,0,0,0,0]
+
+    y[6] = y[5]
+    """
+    with pytest.raises(MemoryAllocationException):
+        compile_code(code)

From b01cd686aa567b32498fefd76bd96b0597c6f099 Mon Sep 17 00:00:00 2001
From: engn33r <engn33r@users.noreply.github.com>
Date: Mon, 23 Oct 2023 02:00:08 +0000
Subject: [PATCH 155/161] docs: fix link to style guide (#3658)

---
 .github/PULL_REQUEST_TEMPLATE.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.github/PULL_REQUEST_TEMPLATE.md b/.github/PULL_REQUEST_TEMPLATE.md
index 94eb5ec04c..baa8decacc 100644
--- a/.github/PULL_REQUEST_TEMPLATE.md
+++ b/.github/PULL_REQUEST_TEMPLATE.md
@@ -6,7 +6,7 @@
 
 ### Commit message
 
-Commit message for the final, squashed PR. (Optional, but reviewers will appreciate it! Please see [our commit message style guide](../../blob/master/docs/style-guide.rst#best-practices-1) for what we would ideally like to see in a commit message.)
+Commit message for the final, squashed PR. (Optional, but reviewers will appreciate it! Please see [our commit message style guide](../../master/docs/style-guide.rst#best-practices-1) for what we would ideally like to see in a commit message.)
 
 ### Description for the changelog
 

From 52dc413c684532d5c4d6cdd91e3b058957cfcba0 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Wed, 1 Nov 2023 15:03:51 -0400
Subject: [PATCH 156/161] docs: retire security@vyperlang.org (#3660)

now that private vulnerability reporting is available on github, the
security inbox is no longer required (or regularly monitored)

cf. https://docs.github.com/en/code-security/security-advisories/working-with-repository-security-advisories/configuring-private-vulnerability-reporting-for-a-repository
---
 SECURITY.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/SECURITY.md b/SECURITY.md
index c7bdad4ee7..0a054b2c93 100644
--- a/SECURITY.md
+++ b/SECURITY.md
@@ -48,7 +48,7 @@ https://github.com/vyperlang/vyper/security/advisories
 
 If you think you have found a security vulnerability with a project that has used Vyper,
 please report the vulnerability to the relevant project's security disclosure program prior
-to reporting to us. If one is not available, please email your vulnerability to security@vyperlang.org.
+to reporting to us. If one is not available, submit it at https://github.com/vyperlang/vyper/security/advisories.
 
 **Please Do Not Log An Issue** mentioning the vulnerability.
 

From 9ce56e7d8b0196a5d51d706a8d2376b98d3e8ad7 Mon Sep 17 00:00:00 2001
From: tserg <8017125+tserg@users.noreply.github.com>
Date: Fri, 3 Nov 2023 00:33:20 +0800
Subject: [PATCH 157/161] chore: fix test for `slice` (#3633)

fix some test cases for `slice` and simplify the test logic

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/parser/functions/test_slice.py | 88 +++++++++++++++++-----------
 1 file changed, 55 insertions(+), 33 deletions(-)

diff --git a/tests/parser/functions/test_slice.py b/tests/parser/functions/test_slice.py
index 3090dafda0..53e092019f 100644
--- a/tests/parser/functions/test_slice.py
+++ b/tests/parser/functions/test_slice.py
@@ -32,8 +32,8 @@ def slice_tower_test(inp1: Bytes[50]) -> Bytes[50]:
 _bytes_1024 = st.binary(min_size=0, max_size=1024)
 
 
-@pytest.mark.parametrize("literal_start", (True, False))
-@pytest.mark.parametrize("literal_length", (True, False))
+@pytest.mark.parametrize("use_literal_start", (True, False))
+@pytest.mark.parametrize("use_literal_length", (True, False))
 @pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
 @settings(max_examples=100)
@@ -45,13 +45,13 @@ def test_slice_immutable(
     opt_level,
     bytesdata,
     start,
-    literal_start,
+    use_literal_start,
     length,
-    literal_length,
+    use_literal_length,
     length_bound,
 ):
-    _start = start if literal_start else "start"
-    _length = length if literal_length else "length"
+    _start = start if use_literal_start else "start"
+    _length = length if use_literal_length else "length"
 
     code = f"""
 IMMUTABLE_BYTES: immutable(Bytes[{length_bound}])
@@ -71,10 +71,10 @@ def _get_contract():
         return get_contract(code, bytesdata, start, length, override_opt_level=opt_level)
 
     if (
-        (start + length > length_bound and literal_start and literal_length)
-        or (literal_length and length > length_bound)
-        or (literal_start and start > length_bound)
-        or (literal_length and length < 1)
+        (start + length > length_bound and use_literal_start and use_literal_length)
+        or (use_literal_length and length > length_bound)
+        or (use_literal_start and start > length_bound)
+        or (use_literal_length and length == 0)
     ):
         assert_compile_failed(lambda: _get_contract(), ArgumentException)
     elif start + length > len(bytesdata) or (len(bytesdata) > length_bound):
@@ -86,13 +86,13 @@ def _get_contract():
 
 
 @pytest.mark.parametrize("location", ("storage", "calldata", "memory", "literal", "code"))
-@pytest.mark.parametrize("literal_start", (True, False))
-@pytest.mark.parametrize("literal_length", (True, False))
+@pytest.mark.parametrize("use_literal_start", (True, False))
+@pytest.mark.parametrize("use_literal_length", (True, False))
 @pytest.mark.parametrize("opt_level", list(OptimizationLevel))
 @given(start=_draw_1024, length=_draw_1024, length_bound=_draw_1024_1, bytesdata=_bytes_1024)
 @settings(max_examples=100)
 @pytest.mark.fuzzing
-def test_slice_bytes(
+def test_slice_bytes_fuzz(
     get_contract,
     assert_compile_failed,
     assert_tx_failed,
@@ -100,18 +100,28 @@ def test_slice_bytes(
     location,
     bytesdata,
     start,
-    literal_start,
+    use_literal_start,
     length,
-    literal_length,
+    use_literal_length,
     length_bound,
 ):
+    preamble = ""
     if location == "memory":
         spliced_code = f"foo: Bytes[{length_bound}] = inp"
         foo = "foo"
     elif location == "storage":
+        preamble = f"""
+foo: Bytes[{length_bound}]
+        """
         spliced_code = "self.foo = inp"
         foo = "self.foo"
     elif location == "code":
+        preamble = f"""
+IMMUTABLE_BYTES: immutable(Bytes[{length_bound}])
+@external
+def __init__(foo: Bytes[{length_bound}]):
+    IMMUTABLE_BYTES = foo
+    """
         spliced_code = ""
         foo = "IMMUTABLE_BYTES"
     elif location == "literal":
@@ -123,15 +133,11 @@ def test_slice_bytes(
     else:
         raise Exception("unreachable")
 
-    _start = start if literal_start else "start"
-    _length = length if literal_length else "length"
+    _start = start if use_literal_start else "start"
+    _length = length if use_literal_length else "length"
 
     code = f"""
-foo: Bytes[{length_bound}]
-IMMUTABLE_BYTES: immutable(Bytes[{length_bound}])
-@external
-def __init__(foo: Bytes[{length_bound}]):
-    IMMUTABLE_BYTES = foo
+{preamble}
 
 @external
 def do_slice(inp: Bytes[{length_bound}], start: uint256, length: uint256) -> Bytes[{length_bound}]:
@@ -142,24 +148,40 @@ def do_slice(inp: Bytes[{length_bound}], start: uint256, length: uint256) -> Byt
     def _get_contract():
         return get_contract(code, bytesdata, override_opt_level=opt_level)
 
-    data_length = len(bytesdata) if location == "literal" else length_bound
-    if (
-        (start + length > data_length and literal_start and literal_length)
-        or (literal_length and length > data_length)
-        or (location == "literal" and len(bytesdata) > length_bound)
-        or (literal_start and start > data_length)
-        or (literal_length and length < 1)
-    ):
+    # length bound is the container size; input_bound is the bound on the input
+    # (which can be different, if the input is a literal)
+    input_bound = length_bound
+    slice_output_too_large = False
+
+    if location == "literal":
+        input_bound = len(bytesdata)
+
+        # ex.:
+        # @external
+        # def do_slice(inp: Bytes[1], start: uint256, length: uint256) -> Bytes[1]:
+        #    return slice(b'\x00\x00', 0, length)
+        output_length = length if use_literal_length else input_bound
+        slice_output_too_large = output_length > length_bound
+
+    end = start + length
+
+    compile_time_oob = (
+        (use_literal_length and (length > input_bound or length == 0))
+        or (use_literal_start and start > input_bound)
+        or (use_literal_start and use_literal_length and start + length > input_bound)
+    )
+
+    if compile_time_oob or slice_output_too_large:
         assert_compile_failed(lambda: _get_contract(), (ArgumentException, TypeMismatch))
-    elif len(bytesdata) > data_length:
+    elif location == "code" and len(bytesdata) > length_bound:
         # deploy fail
         assert_tx_failed(lambda: _get_contract())
-    elif start + length > len(bytesdata):
+    elif end > len(bytesdata) or len(bytesdata) > length_bound:
         c = _get_contract()
         assert_tx_failed(lambda: c.do_slice(bytesdata, start, length))
     else:
         c = _get_contract()
-        assert c.do_slice(bytesdata, start, length) == bytesdata[start : start + length], code
+        assert c.do_slice(bytesdata, start, length) == bytesdata[start:end], code
 
 
 def test_slice_private(get_contract):

From 5d10ea0d2a26ab0c58beab4b0b9a4a3d90c9c439 Mon Sep 17 00:00:00 2001
From: Charles Cooper <cooper.charles.m@gmail.com>
Date: Mon, 6 Nov 2023 15:33:31 -0500
Subject: [PATCH 158/161] refactor: internal handling of imports (#3655)

this commit refactors how imports are handled internally.

historically, vyper handled imports by using a preprocessing step
(`extract_file_interface_imports`) which resolved imports to files and
provided them to the compiler pipeline as pure inputs. however, this
causes problems once the module system gets more complicated:
- it mixes passes. resolving imports and loading the files should
  essentially be resolved during analysis, but instead they are being
  resolved before the compiler is even entered into(!)
- it produces slightly different code paths into the main compiler entry
  point which introduces subtle bugs over time from scaffolding
  differences
- relatedly, each entry point into the compiler has to maintain its own
  mechanism for resolving different kinds of inputs to the compiler
  (JSON interfaces vs .vy files at the moment).

this commit replaces the external scaffolding with an "InputBundle"
abstraction which essentially models how the compiler interacts with its
inputs (depending on whether it is using the filesystem or JSON inputs).
this makes the entry points to the compiler overall simpler, and have
more consistent behavior.

this commit also:
- changes builtin interfaces so they are represented in the codebase as
  `.vy` files which are imported similarly to how regular (non-builtin)
  files are imported
- simplifies the `compile_files` and `compile_json` pipelines
- removes the `compile_codes` API, which was not actually more useful
  than the `compile_code` API (which is kept).
- cleans up tests by introducing a `make_file` and `make_input_bundle`
  abstraction
- simplifies and merges several files in the tests/cli/ directories
- adds a test for multiple output selections in the standard json pipeline
---
 tests/base_conftest.py                        |  15 +-
 tests/cli/vyper_compile/test_compile_files.py | 205 +++++++++++-
 tests/cli/vyper_compile/test_import_paths.py  | 260 ---------------
 tests/cli/vyper_compile/test_parse_args.py    |   2 +
 .../test_compile_from_input_dict.py           | 132 --------
 tests/cli/vyper_json/test_compile_json.py     | 190 +++++++++--
 tests/cli/vyper_json/test_get_contracts.py    |  71 ----
 tests/cli/vyper_json/test_get_inputs.py       | 142 ++++++++
 tests/cli/vyper_json/test_get_settings.py     |   2 -
 tests/cli/vyper_json/test_interfaces.py       | 126 -------
 tests/cli/vyper_json/test_output_dict.py      |  38 ---
 tests/cli/vyper_json/test_output_selection.py |  38 +--
 .../vyper_json/test_parse_args_vyperjson.py   |   3 +-
 tests/compiler/test_bytecode_runtime.py       |  14 +-
 tests/compiler/test_compile_code.py           |   2 +-
 tests/compiler/test_input_bundle.py           | 208 ++++++++++++
 tests/compiler/test_opcodes.py                |   2 +-
 tests/compiler/test_source_map.py             |   6 +-
 tests/conftest.py                             |  29 ++
 tests/parser/ast_utils/test_ast_dict.py       |   8 +-
 tests/parser/features/test_init.py            |   2 +-
 tests/parser/functions/test_bitwise.py        |   2 +-
 tests/parser/functions/test_interfaces.py     | 201 ++++++------
 tests/parser/functions/test_raw_call.py       |   8 +-
 tests/parser/functions/test_return_struct.py  |   4 +-
 tests/parser/syntax/test_codehash.py          |   2 +-
 tests/parser/syntax/test_interfaces.py        |  11 +-
 tests/parser/syntax/test_self_balance.py      |   2 +-
 tests/parser/test_selector_table_stability.py |   4 +-
 tests/parser/types/numbers/test_constants.py  |   2 +-
 vyper/__init__.py                             |   2 +-
 .../interfaces/{ERC165.py => ERC165.vy}       |   2 -
 .../interfaces/{ERC20.py => ERC20.vy}         |   2 -
 vyper/builtins/interfaces/ERC20Detailed.py    |  22 --
 vyper/builtins/interfaces/ERC20Detailed.vy    |  18 +
 .../interfaces/{ERC4626.py => ERC4626.vy}     |   2 -
 .../interfaces/{ERC721.py => ERC721.vy}       |   3 -
 vyper/builtins/interfaces/__init__.py         |   0
 vyper/cli/utils.py                            |  58 ----
 vyper/cli/vyper_compile.py                    | 137 +++-----
 vyper/cli/vyper_json.py                       | 307 ++++++------------
 vyper/cli/vyper_serve.py                      |   6 +-
 vyper/compiler/__init__.py                    | 177 +++-------
 vyper/compiler/input_bundle.py                | 180 ++++++++++
 vyper/compiler/output.py                      |   5 +-
 vyper/compiler/phases.py                      |  52 +--
 vyper/semantics/analysis/__init__.py          |   4 +-
 vyper/semantics/analysis/module.py            | 155 +++++----
 vyper/typing.py                               |   8 -
 49 files changed, 1448 insertions(+), 1423 deletions(-)
 delete mode 100644 tests/cli/vyper_compile/test_import_paths.py
 delete mode 100644 tests/cli/vyper_json/test_compile_from_input_dict.py
 delete mode 100644 tests/cli/vyper_json/test_get_contracts.py
 create mode 100644 tests/cli/vyper_json/test_get_inputs.py
 delete mode 100644 tests/cli/vyper_json/test_interfaces.py
 delete mode 100644 tests/cli/vyper_json/test_output_dict.py
 create mode 100644 tests/compiler/test_input_bundle.py
 rename vyper/builtins/interfaces/{ERC165.py => ERC165.vy} (75%)
 rename vyper/builtins/interfaces/{ERC20.py => ERC20.vy} (96%)
 delete mode 100644 vyper/builtins/interfaces/ERC20Detailed.py
 create mode 100644 vyper/builtins/interfaces/ERC20Detailed.vy
 rename vyper/builtins/interfaces/{ERC4626.py => ERC4626.vy} (98%)
 rename vyper/builtins/interfaces/{ERC721.py => ERC721.vy} (97%)
 delete mode 100644 vyper/builtins/interfaces/__init__.py
 delete mode 100644 vyper/cli/utils.py
 create mode 100644 vyper/compiler/input_bundle.py

diff --git a/tests/base_conftest.py b/tests/base_conftest.py
index 1c7c6f3aed..f613ad0f47 100644
--- a/tests/base_conftest.py
+++ b/tests/base_conftest.py
@@ -112,16 +112,18 @@ def w3(tester):
     return w3
 
 
-def _get_contract(w3, source_code, optimize, *args, override_opt_level=None, **kwargs):
+def _get_contract(
+    w3, source_code, optimize, *args, override_opt_level=None, input_bundle=None, **kwargs
+):
     settings = Settings()
     settings.evm_version = kwargs.pop("evm_version", None)
     settings.optimize = override_opt_level or optimize
     out = compiler.compile_code(
         source_code,
         # test that metadata and natspecs get generated
-        ["abi", "bytecode", "metadata", "userdoc", "devdoc"],
+        output_formats=["abi", "bytecode", "metadata", "userdoc", "devdoc"],
         settings=settings,
-        interface_codes=kwargs.pop("interface_codes", None),
+        input_bundle=input_bundle,
         show_gas_estimates=True,  # Enable gas estimates for testing
     )
     parse_vyper_source(source_code)  # Test grammar.
@@ -144,8 +146,7 @@ def _deploy_blueprint_for(w3, source_code, optimize, initcode_prefix=b"", **kwar
     settings.optimize = optimize
     out = compiler.compile_code(
         source_code,
-        ["abi", "bytecode"],
-        interface_codes=kwargs.pop("interface_codes", None),
+        output_formats=["abi", "bytecode", "metadata", "userdoc", "devdoc"],
         settings=settings,
         show_gas_estimates=True,  # Enable gas estimates for testing
     )
@@ -187,10 +188,10 @@ def deploy_blueprint_for(source_code, *args, **kwargs):
 
 @pytest.fixture(scope="module")
 def get_contract(w3, optimize):
-    def get_contract(source_code, *args, **kwargs):
+    def fn(source_code, *args, **kwargs):
         return _get_contract(w3, source_code, optimize, *args, **kwargs)
 
-    return get_contract
+    return fn
 
 
 @pytest.fixture
diff --git a/tests/cli/vyper_compile/test_compile_files.py b/tests/cli/vyper_compile/test_compile_files.py
index 31cf622658..2a16efa777 100644
--- a/tests/cli/vyper_compile/test_compile_files.py
+++ b/tests/cli/vyper_compile/test_compile_files.py
@@ -1,12 +1,12 @@
+from pathlib import Path
+
 import pytest
 
 from vyper.cli.vyper_compile import compile_files
 
 
-def test_combined_json_keys(tmp_path):
-    bar_path = tmp_path.joinpath("bar.vy")
-    with bar_path.open("w") as fp:
-        fp.write("")
+def test_combined_json_keys(tmp_path, make_file):
+    make_file("bar.vy", "")
 
     combined_keys = {
         "bytecode",
@@ -19,12 +19,203 @@ def test_combined_json_keys(tmp_path):
         "userdoc",
         "devdoc",
     }
-    compile_data = compile_files([bar_path], ["combined_json"], root_folder=tmp_path)
+    compile_data = compile_files(["bar.vy"], ["combined_json"], root_folder=tmp_path)
 
-    assert set(compile_data.keys()) == {"bar.vy", "version"}
-    assert set(compile_data["bar.vy"].keys()) == combined_keys
+    assert set(compile_data.keys()) == {Path("bar.vy"), "version"}
+    assert set(compile_data[Path("bar.vy")].keys()) == combined_keys
 
 
 def test_invalid_root_path():
     with pytest.raises(FileNotFoundError):
         compile_files([], [], root_folder="path/that/does/not/exist")
+
+
+FOO_CODE = """
+{}
+
+struct FooStruct:
+    foo_: uint256
+
+@external
+def foo() -> FooStruct:
+    return FooStruct({{foo_: 13}})
+
+@external
+def bar(a: address) -> FooStruct:
+    return {}(a).bar()
+"""
+
+BAR_CODE = """
+struct FooStruct:
+    foo_: uint256
+@external
+def bar() -> FooStruct:
+    return FooStruct({foo_: 13})
+"""
+
+
+SAME_FOLDER_IMPORT_STMT = [
+    ("import Bar as Bar", "Bar"),
+    ("import contracts.Bar as Bar", "Bar"),
+    ("from . import Bar", "Bar"),
+    ("from contracts import Bar", "Bar"),
+    ("from ..contracts import Bar", "Bar"),
+    ("from . import Bar as FooBar", "FooBar"),
+    ("from contracts import Bar as FooBar", "FooBar"),
+    ("from ..contracts import Bar as FooBar", "FooBar"),
+]
+
+
+@pytest.mark.parametrize("import_stmt,alias", SAME_FOLDER_IMPORT_STMT)
+def test_import_same_folder(import_stmt, alias, tmp_path, make_file):
+    foo = "contracts/foo.vy"
+    make_file("contracts/foo.vy", FOO_CODE.format(import_stmt, alias))
+    make_file("contracts/Bar.vy", BAR_CODE)
+
+    assert compile_files([foo], ["combined_json"], root_folder=tmp_path)
+
+
+SUBFOLDER_IMPORT_STMT = [
+    ("import other.Bar as Bar", "Bar"),
+    ("import contracts.other.Bar as Bar", "Bar"),
+    ("from other import Bar", "Bar"),
+    ("from contracts.other import Bar", "Bar"),
+    ("from .other import Bar", "Bar"),
+    ("from ..contracts.other import Bar", "Bar"),
+    ("from other import Bar as FooBar", "FooBar"),
+    ("from contracts.other import Bar as FooBar", "FooBar"),
+    ("from .other import Bar as FooBar", "FooBar"),
+    ("from ..contracts.other import Bar as FooBar", "FooBar"),
+]
+
+
+@pytest.mark.parametrize("import_stmt, alias", SUBFOLDER_IMPORT_STMT)
+def test_import_subfolder(import_stmt, alias, tmp_path, make_file):
+    foo = make_file("contracts/foo.vy", (FOO_CODE.format(import_stmt, alias)))
+    make_file("contracts/other/Bar.vy", BAR_CODE)
+
+    assert compile_files([foo], ["combined_json"], root_folder=tmp_path)
+
+
+OTHER_FOLDER_IMPORT_STMT = [
+    ("import interfaces.Bar as Bar", "Bar"),
+    ("from interfaces import Bar", "Bar"),
+    ("from ..interfaces import Bar", "Bar"),
+    ("from interfaces import Bar as FooBar", "FooBar"),
+    ("from ..interfaces import Bar as FooBar", "FooBar"),
+]
+
+
+@pytest.mark.parametrize("import_stmt, alias", OTHER_FOLDER_IMPORT_STMT)
+def test_import_other_folder(import_stmt, alias, tmp_path, make_file):
+    foo = make_file("contracts/foo.vy", FOO_CODE.format(import_stmt, alias))
+    make_file("interfaces/Bar.vy", BAR_CODE)
+
+    assert compile_files([foo], ["combined_json"], root_folder=tmp_path)
+
+
+def test_import_parent_folder(tmp_path, make_file):
+    foo = make_file("contracts/baz/foo.vy", FOO_CODE.format("from ... import Bar", "Bar"))
+    make_file("Bar.vy", BAR_CODE)
+
+    assert compile_files([foo], ["combined_json"], root_folder=tmp_path)
+
+    # perform relative import outside of base folder
+    compile_files([foo], ["combined_json"], root_folder=tmp_path / "contracts")
+
+
+META_IMPORT_STMT = [
+    "import Meta as Meta",
+    "import contracts.Meta as Meta",
+    "from . import Meta",
+    "from contracts import Meta",
+]
+
+
+@pytest.mark.parametrize("import_stmt", META_IMPORT_STMT)
+def test_import_self_interface(import_stmt, tmp_path, make_file):
+    # a contract can access its derived interface by importing itself
+    code = f"""
+{import_stmt}
+
+struct FooStruct:
+    foo_: uint256
+
+@external
+def know_thyself(a: address) -> FooStruct:
+    return Meta(a).be_known()
+
+@external
+def be_known() -> FooStruct:
+    return FooStruct({{foo_: 42}})
+    """
+    meta = make_file("contracts/Meta.vy", code)
+
+    assert compile_files([meta], ["combined_json"], root_folder=tmp_path)
+
+
+DERIVED_IMPORT_STMT_BAZ = ["import Foo as Foo", "from . import Foo"]
+
+DERIVED_IMPORT_STMT_FOO = ["import Bar as Bar", "from . import Bar"]
+
+
+@pytest.mark.parametrize("import_stmt_baz", DERIVED_IMPORT_STMT_BAZ)
+@pytest.mark.parametrize("import_stmt_foo", DERIVED_IMPORT_STMT_FOO)
+def test_derived_interface_imports(import_stmt_baz, import_stmt_foo, tmp_path, make_file):
+    # contracts-as-interfaces should be able to contain import statements
+    baz_code = f"""
+{import_stmt_baz}
+
+struct FooStruct:
+    foo_: uint256
+
+@external
+def foo(a: address) -> FooStruct:
+    return Foo(a).foo()
+
+@external
+def bar(_foo: address, _bar: address) -> FooStruct:
+    return Foo(_foo).bar(_bar)
+    """
+
+    make_file("Foo.vy", FOO_CODE.format(import_stmt_foo, "Bar"))
+    make_file("Bar.vy", BAR_CODE)
+    baz = make_file("Baz.vy", baz_code)
+
+    assert compile_files([baz], ["combined_json"], root_folder=tmp_path)
+
+
+def test_local_namespace(make_file, tmp_path):
+    # interface code namespaces should be isolated
+    # all of these contract should be able to compile together
+    codes = [
+        "import foo as FooBar",
+        "import bar as FooBar",
+        "import foo as BarFoo",
+        "import bar as BarFoo",
+    ]
+    struct_def = """
+struct FooStruct:
+    foo_: uint256
+
+    """
+
+    paths = []
+    for i, code in enumerate(codes):
+        code += struct_def
+        filename = f"code{i}.vy"
+        make_file(filename, code)
+        paths.append(filename)
+
+    for file_name in ("foo.vy", "bar.vy"):
+        make_file(file_name, BAR_CODE)
+
+    assert compile_files(paths, ["combined_json"], root_folder=tmp_path)
+
+
+def test_compile_outside_root_path(tmp_path, make_file):
+    # absolute paths relative to "."
+    foo = make_file("foo.vy", FOO_CODE.format("import bar as Bar", "Bar"))
+    bar = make_file("bar.vy", BAR_CODE)
+
+    assert compile_files([foo, bar], ["combined_json"], root_folder=".")
diff --git a/tests/cli/vyper_compile/test_import_paths.py b/tests/cli/vyper_compile/test_import_paths.py
deleted file mode 100644
index 81f209113f..0000000000
--- a/tests/cli/vyper_compile/test_import_paths.py
+++ /dev/null
@@ -1,260 +0,0 @@
-import pytest
-
-from vyper.cli.vyper_compile import compile_files, get_interface_file_path
-
-FOO_CODE = """
-{}
-
-struct FooStruct:
-    foo_: uint256
-
-@external
-def foo() -> FooStruct:
-    return FooStruct({{foo_: 13}})
-
-@external
-def bar(a: address) -> FooStruct:
-    return {}(a).bar()
-"""
-
-BAR_CODE = """
-struct FooStruct:
-    foo_: uint256
-@external
-def bar() -> FooStruct:
-    return FooStruct({foo_: 13})
-"""
-
-
-SAME_FOLDER_IMPORT_STMT = [
-    ("import Bar as Bar", "Bar"),
-    ("import contracts.Bar as Bar", "Bar"),
-    ("from . import Bar", "Bar"),
-    ("from contracts import Bar", "Bar"),
-    ("from ..contracts import Bar", "Bar"),
-    ("from . import Bar as FooBar", "FooBar"),
-    ("from contracts import Bar as FooBar", "FooBar"),
-    ("from ..contracts import Bar as FooBar", "FooBar"),
-]
-
-
-@pytest.mark.parametrize("import_stmt,alias", SAME_FOLDER_IMPORT_STMT)
-def test_import_same_folder(import_stmt, alias, tmp_path):
-    tmp_path.joinpath("contracts").mkdir()
-
-    foo_path = tmp_path.joinpath("contracts/foo.vy")
-    with foo_path.open("w") as fp:
-        fp.write(FOO_CODE.format(import_stmt, alias))
-
-    with tmp_path.joinpath("contracts/Bar.vy").open("w") as fp:
-        fp.write(BAR_CODE)
-
-    assert compile_files([foo_path], ["combined_json"], root_folder=tmp_path)
-
-
-SUBFOLDER_IMPORT_STMT = [
-    ("import other.Bar as Bar", "Bar"),
-    ("import contracts.other.Bar as Bar", "Bar"),
-    ("from other import Bar", "Bar"),
-    ("from contracts.other import Bar", "Bar"),
-    ("from .other import Bar", "Bar"),
-    ("from ..contracts.other import Bar", "Bar"),
-    ("from other import Bar as FooBar", "FooBar"),
-    ("from contracts.other import Bar as FooBar", "FooBar"),
-    ("from .other import Bar as FooBar", "FooBar"),
-    ("from ..contracts.other import Bar as FooBar", "FooBar"),
-]
-
-
-@pytest.mark.parametrize("import_stmt, alias", SUBFOLDER_IMPORT_STMT)
-def test_import_subfolder(import_stmt, alias, tmp_path):
-    tmp_path.joinpath("contracts").mkdir()
-
-    foo_path = tmp_path.joinpath("contracts/foo.vy")
-    with foo_path.open("w") as fp:
-        fp.write(FOO_CODE.format(import_stmt, alias))
-
-    tmp_path.joinpath("contracts/other").mkdir()
-    with tmp_path.joinpath("contracts/other/Bar.vy").open("w") as fp:
-        fp.write(BAR_CODE)
-
-    assert compile_files([foo_path], ["combined_json"], root_folder=tmp_path)
-
-
-OTHER_FOLDER_IMPORT_STMT = [
-    ("import interfaces.Bar as Bar", "Bar"),
-    ("from interfaces import Bar", "Bar"),
-    ("from ..interfaces import Bar", "Bar"),
-    ("from interfaces import Bar as FooBar", "FooBar"),
-    ("from ..interfaces import Bar as FooBar", "FooBar"),
-]
-
-
-@pytest.mark.parametrize("import_stmt, alias", OTHER_FOLDER_IMPORT_STMT)
-def test_import_other_folder(import_stmt, alias, tmp_path):
-    tmp_path.joinpath("contracts").mkdir()
-
-    foo_path = tmp_path.joinpath("contracts/foo.vy")
-    with foo_path.open("w") as fp:
-        fp.write(FOO_CODE.format(import_stmt, alias))
-
-    tmp_path.joinpath("interfaces").mkdir()
-    with tmp_path.joinpath("interfaces/Bar.vy").open("w") as fp:
-        fp.write(BAR_CODE)
-
-    assert compile_files([foo_path], ["combined_json"], root_folder=tmp_path)
-
-
-def test_import_parent_folder(tmp_path, assert_compile_failed):
-    tmp_path.joinpath("contracts").mkdir()
-    tmp_path.joinpath("contracts/baz").mkdir()
-
-    foo_path = tmp_path.joinpath("contracts/baz/foo.vy")
-    with foo_path.open("w") as fp:
-        fp.write(FOO_CODE.format("from ... import Bar", "Bar"))
-
-    with tmp_path.joinpath("Bar.vy").open("w") as fp:
-        fp.write(BAR_CODE)
-
-    assert compile_files([foo_path], ["combined_json"], root_folder=tmp_path)
-    # Cannot perform relative import outside of base folder
-    with pytest.raises(FileNotFoundError):
-        compile_files([foo_path], ["combined_json"], root_folder=tmp_path.joinpath("contracts"))
-
-
-META_IMPORT_STMT = [
-    "import Meta as Meta",
-    "import contracts.Meta as Meta",
-    "from . import Meta",
-    "from contracts import Meta",
-]
-
-
-@pytest.mark.parametrize("import_stmt", META_IMPORT_STMT)
-def test_import_self_interface(import_stmt, tmp_path):
-    # a contract can access its derived interface by importing itself
-    code = f"""
-{import_stmt}
-
-struct FooStruct:
-    foo_: uint256
-
-@external
-def know_thyself(a: address) -> FooStruct:
-    return Meta(a).be_known()
-
-@external
-def be_known() -> FooStruct:
-    return FooStruct({{foo_: 42}})
-    """
-
-    tmp_path.joinpath("contracts").mkdir()
-
-    meta_path = tmp_path.joinpath("contracts/Meta.vy")
-    with meta_path.open("w") as fp:
-        fp.write(code)
-
-    assert compile_files([meta_path], ["combined_json"], root_folder=tmp_path)
-
-
-DERIVED_IMPORT_STMT_BAZ = ["import Foo as Foo", "from . import Foo"]
-
-DERIVED_IMPORT_STMT_FOO = ["import Bar as Bar", "from . import Bar"]
-
-
-@pytest.mark.parametrize("import_stmt_baz", DERIVED_IMPORT_STMT_BAZ)
-@pytest.mark.parametrize("import_stmt_foo", DERIVED_IMPORT_STMT_FOO)
-def test_derived_interface_imports(import_stmt_baz, import_stmt_foo, tmp_path):
-    # contracts-as-interfaces should be able to contain import statements
-    baz_code = f"""
-{import_stmt_baz}
-
-struct FooStruct:
-    foo_: uint256
-
-@external
-def foo(a: address) -> FooStruct:
-    return Foo(a).foo()
-
-@external
-def bar(_foo: address, _bar: address) -> FooStruct:
-    return Foo(_foo).bar(_bar)
-    """
-
-    with tmp_path.joinpath("Foo.vy").open("w") as fp:
-        fp.write(FOO_CODE.format(import_stmt_foo, "Bar"))
-
-    with tmp_path.joinpath("Bar.vy").open("w") as fp:
-        fp.write(BAR_CODE)
-
-    baz_path = tmp_path.joinpath("Baz.vy")
-    with baz_path.open("w") as fp:
-        fp.write(baz_code)
-
-    assert compile_files([baz_path], ["combined_json"], root_folder=tmp_path)
-
-
-def test_local_namespace(tmp_path):
-    # interface code namespaces should be isolated
-    # all of these contract should be able to compile together
-    codes = [
-        "import foo as FooBar",
-        "import bar as FooBar",
-        "import foo as BarFoo",
-        "import bar as BarFoo",
-    ]
-    struct_def = """
-struct FooStruct:
-    foo_: uint256
-
-    """
-
-    compile_paths = []
-    for i, code in enumerate(codes):
-        code += struct_def
-        path = tmp_path.joinpath(f"code{i}.vy")
-        with path.open("w") as fp:
-            fp.write(code)
-        compile_paths.append(path)
-
-    for file_name in ("foo.vy", "bar.vy"):
-        with tmp_path.joinpath(file_name).open("w") as fp:
-            fp.write(BAR_CODE)
-
-    assert compile_files(compile_paths, ["combined_json"], root_folder=tmp_path)
-
-
-def test_get_interface_file_path(tmp_path):
-    for file_name in ("foo.vy", "foo.json", "bar.vy", "baz.json", "potato"):
-        with tmp_path.joinpath(file_name).open("w") as fp:
-            fp.write("")
-
-    tmp_path.joinpath("interfaces").mkdir()
-    for file_name in ("interfaces/foo.json", "interfaces/bar"):
-        with tmp_path.joinpath(file_name).open("w") as fp:
-            fp.write("")
-
-    base_paths = [tmp_path, tmp_path.joinpath("interfaces")]
-    assert get_interface_file_path(base_paths, "foo") == tmp_path.joinpath("foo.vy")
-    assert get_interface_file_path(base_paths, "bar") == tmp_path.joinpath("bar.vy")
-    assert get_interface_file_path(base_paths, "baz") == tmp_path.joinpath("baz.json")
-
-    base_paths = [tmp_path.joinpath("interfaces"), tmp_path]
-    assert get_interface_file_path(base_paths, "foo") == tmp_path.joinpath("interfaces/foo.json")
-    assert get_interface_file_path(base_paths, "bar") == tmp_path.joinpath("bar.vy")
-    assert get_interface_file_path(base_paths, "baz") == tmp_path.joinpath("baz.json")
-
-    with pytest.raises(Exception):
-        get_interface_file_path(base_paths, "potato")
-
-
-def test_compile_outside_root_path(tmp_path):
-    foo_path = tmp_path.joinpath("foo.vy")
-    with foo_path.open("w") as fp:
-        fp.write(FOO_CODE.format("import bar as Bar", "Bar"))
-
-    bar_path = tmp_path.joinpath("bar.vy")
-    with bar_path.open("w") as fp:
-        fp.write(BAR_CODE)
-
-    assert compile_files([foo_path, bar_path], ["combined_json"], root_folder=".")
diff --git a/tests/cli/vyper_compile/test_parse_args.py b/tests/cli/vyper_compile/test_parse_args.py
index a676a7836b..0e8c4e9605 100644
--- a/tests/cli/vyper_compile/test_parse_args.py
+++ b/tests/cli/vyper_compile/test_parse_args.py
@@ -21,7 +21,9 @@ def foo() -> bool:
     bar_path = chdir_path.joinpath("bar.vy")
     with bar_path.open("w") as fp:
         fp.write(code)
+
     _parse_args([str(bar_path)])  # absolute path
     os.chdir(chdir_path.parent)
+
     _parse_args([str(bar_path)])  # absolute path, subfolder of cwd
     _parse_args([str(bar_path.relative_to(chdir_path.parent))])  # relative path
diff --git a/tests/cli/vyper_json/test_compile_from_input_dict.py b/tests/cli/vyper_json/test_compile_from_input_dict.py
deleted file mode 100644
index a6d0a23100..0000000000
--- a/tests/cli/vyper_json/test_compile_from_input_dict.py
+++ /dev/null
@@ -1,132 +0,0 @@
-#!/usr/bin/env python3
-
-from copy import deepcopy
-
-import pytest
-
-import vyper
-from vyper.cli.vyper_json import (
-    TRANSLATE_MAP,
-    compile_from_input_dict,
-    exc_handler_raises,
-    exc_handler_to_dict,
-)
-from vyper.exceptions import InvalidType, JSONError, SyntaxException
-
-FOO_CODE = """
-import contracts.bar as Bar
-
-@external
-def foo(a: address) -> bool:
-    return Bar(a).bar(1)
-
-@external
-def baz() -> uint256:
-    return self.balance
-"""
-
-BAR_CODE = """
-@external
-def bar(a: uint256) -> bool:
-    return True
-"""
-
-BAD_SYNTAX_CODE = """
-def bar()>:
-"""
-
-BAD_COMPILER_CODE = """
-@external
-def oopsie(a: uint256) -> bool:
-    return 42
-"""
-
-BAR_ABI = [
-    {
-        "name": "bar",
-        "outputs": [{"type": "bool", "name": "out"}],
-        "inputs": [{"type": "uint256", "name": "a"}],
-        "stateMutability": "nonpayable",
-        "type": "function",
-        "gas": 313,
-    }
-]
-
-INPUT_JSON = {
-    "language": "Vyper",
-    "sources": {
-        "contracts/foo.vy": {"content": FOO_CODE},
-        "contracts/bar.vy": {"content": BAR_CODE},
-    },
-    "interfaces": {"contracts/bar.json": {"abi": BAR_ABI}},
-    "settings": {"outputSelection": {"*": ["*"]}},
-}
-
-
-def test_root_folder_not_exists():
-    with pytest.raises(FileNotFoundError):
-        compile_from_input_dict({}, root_folder="/path/that/does/not/exist")
-
-
-def test_wrong_language():
-    with pytest.raises(JSONError):
-        compile_from_input_dict({"language": "Solidity"})
-
-
-def test_exc_handler_raises_syntax():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["sources"]["badcode.vy"] = {"content": BAD_SYNTAX_CODE}
-    with pytest.raises(SyntaxException):
-        compile_from_input_dict(input_json, exc_handler_raises)
-
-
-def test_exc_handler_to_dict_syntax():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["sources"]["badcode.vy"] = {"content": BAD_SYNTAX_CODE}
-    result, _ = compile_from_input_dict(input_json, exc_handler_to_dict)
-    assert "errors" in result
-    assert len(result["errors"]) == 1
-    error = result["errors"][0]
-    assert error["component"] == "parser"
-    assert error["type"] == "SyntaxException"
-
-
-def test_exc_handler_raises_compiler():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["sources"]["badcode.vy"] = {"content": BAD_COMPILER_CODE}
-    with pytest.raises(InvalidType):
-        compile_from_input_dict(input_json, exc_handler_raises)
-
-
-def test_exc_handler_to_dict_compiler():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["sources"]["badcode.vy"] = {"content": BAD_COMPILER_CODE}
-    result, _ = compile_from_input_dict(input_json, exc_handler_to_dict)
-    assert sorted(result.keys()) == ["compiler", "errors"]
-    assert result["compiler"] == f"vyper-{vyper.__version__}"
-    assert len(result["errors"]) == 1
-    error = result["errors"][0]
-    assert error["component"] == "compiler"
-    assert error["type"] == "InvalidType"
-
-
-def test_source_ids_increment():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["settings"]["outputSelection"] = {"*": ["evm.deployedBytecode.sourceMap"]}
-    result, _ = compile_from_input_dict(input_json)
-    assert result["contracts/bar.vy"]["source_map"]["pc_pos_map_compressed"].startswith("-1:-1:0")
-    assert result["contracts/foo.vy"]["source_map"]["pc_pos_map_compressed"].startswith("-1:-1:1")
-
-
-def test_outputs():
-    result, _ = compile_from_input_dict(INPUT_JSON)
-    assert sorted(result.keys()) == ["contracts/bar.vy", "contracts/foo.vy"]
-    assert sorted(result["contracts/bar.vy"].keys()) == sorted(set(TRANSLATE_MAP.values()))
-
-
-def test_relative_import_paths():
-    input_json = deepcopy(INPUT_JSON)
-    input_json["sources"]["contracts/potato/baz/baz.vy"] = {"content": """from ... import foo"""}
-    input_json["sources"]["contracts/potato/baz/potato.vy"] = {"content": """from . import baz"""}
-    input_json["sources"]["contracts/potato/footato.vy"] = {"content": """from baz import baz"""}
-    compile_from_input_dict(input_json)
diff --git a/tests/cli/vyper_json/test_compile_json.py b/tests/cli/vyper_json/test_compile_json.py
index f03006c4ad..732762d72b 100644
--- a/tests/cli/vyper_json/test_compile_json.py
+++ b/tests/cli/vyper_json/test_compile_json.py
@@ -1,12 +1,11 @@
-#!/usr/bin/env python3
-
 import json
-from copy import deepcopy
 
 import pytest
 
-from vyper.cli.vyper_json import compile_from_input_dict, compile_json
-from vyper.exceptions import JSONError
+import vyper
+from vyper.cli.vyper_json import compile_from_input_dict, compile_json, exc_handler_to_dict
+from vyper.compiler import OUTPUT_FORMATS, compile_code
+from vyper.exceptions import InvalidType, JSONError, SyntaxException
 
 FOO_CODE = """
 import contracts.bar as Bar
@@ -14,6 +13,10 @@
 @external
 def foo(a: address) -> bool:
     return Bar(a).bar(1)
+
+@external
+def baz() -> uint256:
+    return self.balance
 """
 
 BAR_CODE = """
@@ -22,6 +25,16 @@ def bar(a: uint256) -> bool:
     return True
 """
 
+BAD_SYNTAX_CODE = """
+def bar()>:
+"""
+
+BAD_COMPILER_CODE = """
+@external
+def oopsie(a: uint256) -> bool:
+    return 42
+"""
+
 BAR_ABI = [
     {
         "name": "bar",
@@ -29,23 +42,26 @@ def bar(a: uint256) -> bool:
         "inputs": [{"type": "uint256", "name": "a"}],
         "stateMutability": "nonpayable",
         "type": "function",
-        "gas": 313,
     }
 ]
 
-INPUT_JSON = {
-    "language": "Vyper",
-    "sources": {
-        "contracts/foo.vy": {"content": FOO_CODE},
-        "contracts/bar.vy": {"content": BAR_CODE},
-    },
-    "interfaces": {"contracts/bar.json": {"abi": BAR_ABI}},
-    "settings": {"outputSelection": {"*": ["*"]}},
-}
+
+@pytest.fixture(scope="function")
+def input_json():
+    return {
+        "language": "Vyper",
+        "sources": {
+            "contracts/foo.vy": {"content": FOO_CODE},
+            "contracts/bar.vy": {"content": BAR_CODE},
+        },
+        "interfaces": {"contracts/ibar.json": {"abi": BAR_ABI}},
+        "settings": {"outputSelection": {"*": ["*"]}},
+    }
 
 
-def test_input_formats():
-    assert compile_json(INPUT_JSON) == compile_json(json.dumps(INPUT_JSON))
+# test string and dict inputs both work
+def test_string_input(input_json):
+    assert compile_json(input_json) == compile_json(json.dumps(input_json))
 
 
 def test_bad_json():
@@ -53,10 +69,146 @@ def test_bad_json():
         compile_json("this probably isn't valid JSON, is it")
 
 
-def test_keyerror_becomes_jsonerror():
-    input_json = deepcopy(INPUT_JSON)
+def test_keyerror_becomes_jsonerror(input_json):
     del input_json["sources"]
     with pytest.raises(KeyError):
         compile_from_input_dict(input_json)
     with pytest.raises(JSONError):
         compile_json(input_json)
+
+
+def test_compile_json(input_json, make_input_bundle):
+    input_bundle = make_input_bundle({"contracts/bar.vy": BAR_CODE})
+
+    foo = compile_code(
+        FOO_CODE,
+        source_id=0,
+        contract_name="contracts/foo.vy",
+        output_formats=OUTPUT_FORMATS,
+        input_bundle=input_bundle,
+    )
+    bar = compile_code(
+        BAR_CODE, source_id=1, contract_name="contracts/bar.vy", output_formats=OUTPUT_FORMATS
+    )
+
+    compile_code_results = {"contracts/bar.vy": bar, "contracts/foo.vy": foo}
+
+    output_json = compile_json(input_json)
+    assert list(output_json["contracts"].keys()) == ["contracts/foo.vy", "contracts/bar.vy"]
+
+    assert sorted(output_json.keys()) == ["compiler", "contracts", "sources"]
+    assert output_json["compiler"] == f"vyper-{vyper.__version__}"
+
+    for source_id, contract_name in enumerate(["foo", "bar"]):
+        path = f"contracts/{contract_name}.vy"
+        data = compile_code_results[path]
+        assert output_json["sources"][path] == {"id": source_id, "ast": data["ast_dict"]["ast"]}
+        assert output_json["contracts"][path][contract_name] == {
+            "abi": data["abi"],
+            "devdoc": data["devdoc"],
+            "interface": data["interface"],
+            "ir": data["ir_dict"],
+            "userdoc": data["userdoc"],
+            "metadata": data["metadata"],
+            "evm": {
+                "bytecode": {"object": data["bytecode"], "opcodes": data["opcodes"]},
+                "deployedBytecode": {
+                    "object": data["bytecode_runtime"],
+                    "opcodes": data["opcodes_runtime"],
+                    "sourceMap": data["source_map"]["pc_pos_map_compressed"],
+                    "sourceMapFull": data["source_map_full"],
+                },
+                "methodIdentifiers": data["method_identifiers"],
+            },
+        }
+
+
+def test_different_outputs(make_input_bundle, input_json):
+    input_json["settings"]["outputSelection"] = {
+        "contracts/bar.vy": "*",
+        "contracts/foo.vy": ["evm.methodIdentifiers"],
+    }
+    output_json = compile_json(input_json)
+    assert list(output_json["contracts"].keys()) == ["contracts/foo.vy", "contracts/bar.vy"]
+
+    assert sorted(output_json.keys()) == ["compiler", "contracts", "sources"]
+    assert output_json["compiler"] == f"vyper-{vyper.__version__}"
+
+    contracts = output_json["contracts"]
+
+    foo = contracts["contracts/foo.vy"]["foo"]
+    bar = contracts["contracts/bar.vy"]["bar"]
+    assert sorted(bar.keys()) == ["abi", "devdoc", "evm", "interface", "ir", "metadata", "userdoc"]
+
+    assert sorted(foo.keys()) == ["evm"]
+
+    # check method_identifiers
+    input_bundle = make_input_bundle({"contracts/bar.vy": BAR_CODE})
+    method_identifiers = compile_code(
+        FOO_CODE,
+        contract_name="contracts/foo.vy",
+        output_formats=["method_identifiers"],
+        input_bundle=input_bundle,
+    )["method_identifiers"]
+    assert foo["evm"]["methodIdentifiers"] == method_identifiers
+
+
+def test_root_folder_not_exists(input_json):
+    with pytest.raises(FileNotFoundError):
+        compile_json(input_json, root_folder="/path/that/does/not/exist")
+
+
+def test_wrong_language():
+    with pytest.raises(JSONError):
+        compile_json({"language": "Solidity"})
+
+
+def test_exc_handler_raises_syntax(input_json):
+    input_json["sources"]["badcode.vy"] = {"content": BAD_SYNTAX_CODE}
+    with pytest.raises(SyntaxException):
+        compile_json(input_json)
+
+
+def test_exc_handler_to_dict_syntax(input_json):
+    input_json["sources"]["badcode.vy"] = {"content": BAD_SYNTAX_CODE}
+    result = compile_json(input_json, exc_handler_to_dict)
+    assert "errors" in result
+    assert len(result["errors"]) == 1
+    error = result["errors"][0]
+    assert error["component"] == "compiler", error
+    assert error["type"] == "SyntaxException"
+
+
+def test_exc_handler_raises_compiler(input_json):
+    input_json["sources"]["badcode.vy"] = {"content": BAD_COMPILER_CODE}
+    with pytest.raises(InvalidType):
+        compile_json(input_json)
+
+
+def test_exc_handler_to_dict_compiler(input_json):
+    input_json["sources"]["badcode.vy"] = {"content": BAD_COMPILER_CODE}
+    result = compile_json(input_json, exc_handler_to_dict)
+    assert sorted(result.keys()) == ["compiler", "errors"]
+    assert result["compiler"] == f"vyper-{vyper.__version__}"
+    assert len(result["errors"]) == 1
+    error = result["errors"][0]
+    assert error["component"] == "compiler"
+    assert error["type"] == "InvalidType"
+
+
+def test_source_ids_increment(input_json):
+    input_json["settings"]["outputSelection"] = {"*": ["evm.deployedBytecode.sourceMap"]}
+    result = compile_json(input_json)
+
+    def get(filename, contractname):
+        return result["contracts"][filename][contractname]["evm"]["deployedBytecode"]["sourceMap"]
+
+    assert get("contracts/foo.vy", "foo").startswith("-1:-1:0")
+    assert get("contracts/bar.vy", "bar").startswith("-1:-1:1")
+
+
+def test_relative_import_paths(input_json):
+    input_json["sources"]["contracts/potato/baz/baz.vy"] = {"content": """from ... import foo"""}
+    input_json["sources"]["contracts/potato/baz/potato.vy"] = {"content": """from . import baz"""}
+    input_json["sources"]["contracts/potato/footato.vy"] = {"content": """from baz import baz"""}
+    compile_from_input_dict(input_json)
diff --git a/tests/cli/vyper_json/test_get_contracts.py b/tests/cli/vyper_json/test_get_contracts.py
deleted file mode 100644
index 86a5052f72..0000000000
--- a/tests/cli/vyper_json/test_get_contracts.py
+++ /dev/null
@@ -1,71 +0,0 @@
-#!/usr/bin/env python3
-
-import pytest
-
-from vyper.cli.vyper_json import get_input_dict_contracts
-from vyper.exceptions import JSONError
-from vyper.utils import keccak256
-
-FOO_CODE = """
-import contracts.bar as Bar
-
-@external
-def foo(a: address) -> bool:
-    return Bar(a).bar(1)
-"""
-
-BAR_CODE = """
-@external
-def bar(a: uint256) -> bool:
-    return True
-"""
-
-
-def test_no_sources():
-    with pytest.raises(KeyError):
-        get_input_dict_contracts({})
-
-
-def test_contracts_urls():
-    with pytest.raises(JSONError):
-        get_input_dict_contracts({"sources": {"foo.vy": {"urls": ["https://foo.code.com/"]}}})
-
-
-def test_contracts_no_content_key():
-    with pytest.raises(JSONError):
-        get_input_dict_contracts({"sources": {"foo.vy": FOO_CODE}})
-
-
-def test_contracts_keccak():
-    hash_ = keccak256(FOO_CODE.encode()).hex()
-
-    input_json = {"sources": {"foo.vy": {"content": FOO_CODE, "keccak256": hash_}}}
-    get_input_dict_contracts(input_json)
-
-    input_json["sources"]["foo.vy"]["keccak256"] = "0x" + hash_
-    get_input_dict_contracts(input_json)
-
-    input_json["sources"]["foo.vy"]["keccak256"] = "0x1234567890"
-    with pytest.raises(JSONError):
-        get_input_dict_contracts(input_json)
-
-
-def test_contracts_bad_path():
-    input_json = {"sources": {"../foo.vy": {"content": FOO_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_contracts(input_json)
-
-
-def test_contract_collision():
-    # ./foo.vy and foo.vy will resolve to the same path
-    input_json = {"sources": {"./foo.vy": {"content": FOO_CODE}, "foo.vy": {"content": FOO_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_contracts(input_json)
-
-
-def test_contracts_return_value():
-    input_json = {
-        "sources": {"foo.vy": {"content": FOO_CODE}, "contracts/bar.vy": {"content": BAR_CODE}}
-    }
-    result = get_input_dict_contracts(input_json)
-    assert result == {"foo.vy": FOO_CODE, "contracts/bar.vy": BAR_CODE}
diff --git a/tests/cli/vyper_json/test_get_inputs.py b/tests/cli/vyper_json/test_get_inputs.py
new file mode 100644
index 0000000000..6e323a91bd
--- /dev/null
+++ b/tests/cli/vyper_json/test_get_inputs.py
@@ -0,0 +1,142 @@
+from pathlib import PurePath
+
+import pytest
+
+from vyper.cli.vyper_json import get_compilation_targets, get_inputs
+from vyper.exceptions import JSONError
+from vyper.utils import keccak256
+
+FOO_CODE = """
+import contracts.bar as Bar
+
+@external
+def foo(a: address) -> bool:
+    return Bar(a).bar(1)
+"""
+
+BAR_CODE = """
+@external
+def bar(a: uint256) -> bool:
+    return True
+"""
+
+
+def test_no_sources():
+    with pytest.raises(KeyError):
+        get_inputs({})
+
+
+def test_contracts_urls():
+    with pytest.raises(JSONError):
+        get_inputs({"sources": {"foo.vy": {"urls": ["https://foo.code.com/"]}}})
+
+
+def test_contracts_no_content_key():
+    with pytest.raises(JSONError):
+        get_inputs({"sources": {"foo.vy": FOO_CODE}})
+
+
+def test_contracts_keccak():
+    hash_ = keccak256(FOO_CODE.encode()).hex()
+
+    input_json = {"sources": {"foo.vy": {"content": FOO_CODE, "keccak256": hash_}}}
+    get_inputs(input_json)
+
+    input_json["sources"]["foo.vy"]["keccak256"] = "0x" + hash_
+    get_inputs(input_json)
+
+    input_json["sources"]["foo.vy"]["keccak256"] = "0x1234567890"
+    with pytest.raises(JSONError):
+        get_inputs(input_json)
+
+
+def test_contracts_outside_pwd():
+    input_json = {"sources": {"../foo.vy": {"content": FOO_CODE}}}
+    get_inputs(input_json)
+
+
+def test_contract_collision():
+    # ./foo.vy and foo.vy will resolve to the same path
+    input_json = {"sources": {"./foo.vy": {"content": FOO_CODE}, "foo.vy": {"content": FOO_CODE}}}
+    with pytest.raises(JSONError):
+        get_inputs(input_json)
+
+
+def test_contracts_return_value():
+    input_json = {
+        "sources": {"foo.vy": {"content": FOO_CODE}, "contracts/bar.vy": {"content": BAR_CODE}}
+    }
+    result = get_inputs(input_json)
+    assert result == {
+        PurePath("foo.vy"): {"content": FOO_CODE},
+        PurePath("contracts/bar.vy"): {"content": BAR_CODE},
+    }
+
+
+BAR_ABI = [
+    {
+        "name": "bar",
+        "outputs": [{"type": "bool", "name": "out"}],
+        "inputs": [{"type": "uint256", "name": "a"}],
+        "stateMutability": "nonpayable",
+        "type": "function",
+    }
+]
+
+
+# tests to get interfaces from input dicts
+
+
+def test_interface_collision():
+    input_json = {
+        "sources": {"foo.vy": {"content": FOO_CODE}},
+        "interfaces": {"bar.json": {"abi": BAR_ABI}, "bar.vy": {"content": BAR_CODE}},
+    }
+    with pytest.raises(JSONError):
+        get_inputs(input_json)
+
+
+def test_json_no_abi():
+    input_json = {
+        "sources": {"foo.vy": {"content": FOO_CODE}},
+        "interfaces": {"bar.json": {"content": BAR_ABI}},
+    }
+    with pytest.raises(JSONError):
+        get_inputs(input_json)
+
+
+def test_vy_no_content():
+    input_json = {
+        "sources": {"foo.vy": {"content": FOO_CODE}},
+        "interfaces": {"bar.vy": {"abi": BAR_CODE}},
+    }
+    with pytest.raises(JSONError):
+        get_inputs(input_json)
+
+
+def test_interfaces_output():
+    input_json = {
+        "sources": {"foo.vy": {"content": FOO_CODE}},
+        "interfaces": {
+            "bar.json": {"abi": BAR_ABI},
+            "interface.folder/bar2.vy": {"content": BAR_CODE},
+        },
+    }
+    targets = get_compilation_targets(input_json)
+    assert targets == [PurePath("foo.vy")]
+
+    result = get_inputs(input_json)
+    assert result == {
+        PurePath("foo.vy"): {"content": FOO_CODE},
+        PurePath("bar.json"): {"abi": BAR_ABI},
+        PurePath("interface.folder/bar2.vy"): {"content": BAR_CODE},
+    }
+
+
+# EIP-2678 -- not currently supported
+@pytest.mark.xfail
+def test_manifest_output():
+    input_json = {"interfaces": {"bar.json": {"contractTypes": {"Bar": {"abi": BAR_ABI}}}}}
+    result = get_inputs(input_json)
+    assert isinstance(result, dict)
+    assert result == {"Bar": {"type": "json", "code": BAR_ABI}}
diff --git a/tests/cli/vyper_json/test_get_settings.py b/tests/cli/vyper_json/test_get_settings.py
index bbe5dab113..989d4565cd 100644
--- a/tests/cli/vyper_json/test_get_settings.py
+++ b/tests/cli/vyper_json/test_get_settings.py
@@ -1,5 +1,3 @@
-#!/usr/bin/env python3
-
 import pytest
 
 from vyper.cli.vyper_json import get_evm_version
diff --git a/tests/cli/vyper_json/test_interfaces.py b/tests/cli/vyper_json/test_interfaces.py
deleted file mode 100644
index 7804ae1c3d..0000000000
--- a/tests/cli/vyper_json/test_interfaces.py
+++ /dev/null
@@ -1,126 +0,0 @@
-#!/usr/bin/env python3
-
-import pytest
-
-from vyper.cli.vyper_json import get_input_dict_interfaces, get_interface_codes
-from vyper.exceptions import JSONError
-
-FOO_CODE = """
-import contracts.bar as Bar
-
-@external
-def foo(a: address) -> bool:
-    return Bar(a).bar(1)
-"""
-
-BAR_CODE = """
-@external
-def bar(a: uint256) -> bool:
-    return True
-"""
-
-BAR_ABI = [
-    {
-        "name": "bar",
-        "outputs": [{"type": "bool", "name": "out"}],
-        "inputs": [{"type": "uint256", "name": "a"}],
-        "stateMutability": "nonpayable",
-        "type": "function",
-        "gas": 313,
-    }
-]
-
-
-# get_input_dict_interfaces tests
-
-
-def test_no_interfaces():
-    result = get_input_dict_interfaces({})
-    assert isinstance(result, dict)
-    assert not result
-
-
-def test_interface_collision():
-    input_json = {"interfaces": {"bar.json": {"abi": BAR_ABI}, "bar.vy": {"content": BAR_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_interfaces(input_json)
-
-
-def test_interfaces_wrong_suffix():
-    input_json = {"interfaces": {"foo.abi": {"content": FOO_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_interfaces(input_json)
-
-    input_json = {"interfaces": {"interface.folder/foo": {"content": FOO_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_interfaces(input_json)
-
-
-def test_json_no_abi():
-    input_json = {"interfaces": {"bar.json": {"content": BAR_ABI}}}
-    with pytest.raises(JSONError):
-        get_input_dict_interfaces(input_json)
-
-
-def test_vy_no_content():
-    input_json = {"interfaces": {"bar.vy": {"abi": BAR_CODE}}}
-    with pytest.raises(JSONError):
-        get_input_dict_interfaces(input_json)
-
-
-def test_interfaces_output():
-    input_json = {
-        "interfaces": {
-            "bar.json": {"abi": BAR_ABI},
-            "interface.folder/bar2.vy": {"content": BAR_CODE},
-        }
-    }
-    result = get_input_dict_interfaces(input_json)
-    assert isinstance(result, dict)
-    assert result == {
-        "bar": {"type": "json", "code": BAR_ABI},
-        "interface.folder/bar2": {"type": "vyper", "code": BAR_CODE},
-    }
-
-
-def test_manifest_output():
-    input_json = {"interfaces": {"bar.json": {"contractTypes": {"Bar": {"abi": BAR_ABI}}}}}
-    result = get_input_dict_interfaces(input_json)
-    assert isinstance(result, dict)
-    assert result == {"Bar": {"type": "json", "code": BAR_ABI}}
-
-
-# get_interface_codes tests
-
-
-def test_interface_codes_from_contracts():
-    # interface should be generated from contract
-    assert get_interface_codes(
-        None, "foo.vy", {"foo.vy": FOO_CODE, "contracts/bar.vy": BAR_CODE}, {}
-    )
-    assert get_interface_codes(
-        None, "foo/foo.vy", {"foo/foo.vy": FOO_CODE, "contracts/bar.vy": BAR_CODE}, {}
-    )
-
-
-def test_interface_codes_from_interfaces():
-    # existing interface should be given preference over contract-as-interface
-    contracts = {"foo.vy": FOO_CODE, "contacts/bar.vy": BAR_CODE}
-    result = get_interface_codes(None, "foo.vy", contracts, {"contracts/bar": "bar"})
-    assert result["Bar"] == "bar"
-
-
-def test_root_path(tmp_path):
-    tmp_path.joinpath("contracts").mkdir()
-    with tmp_path.joinpath("contracts/bar.vy").open("w") as fp:
-        fp.write("bar")
-
-    with pytest.raises(FileNotFoundError):
-        get_interface_codes(None, "foo.vy", {"foo.vy": FOO_CODE}, {})
-
-    # interface from file system should take lowest priority
-    result = get_interface_codes(tmp_path, "foo.vy", {"foo.vy": FOO_CODE}, {})
-    assert result["Bar"] == {"code": "bar", "type": "vyper"}
-    contracts = {"foo.vy": FOO_CODE, "contracts/bar.vy": BAR_CODE}
-    result = get_interface_codes(None, "foo.vy", contracts, {})
-    assert result["Bar"] == {"code": BAR_CODE, "type": "vyper"}
diff --git a/tests/cli/vyper_json/test_output_dict.py b/tests/cli/vyper_json/test_output_dict.py
deleted file mode 100644
index e2a3466ccf..0000000000
--- a/tests/cli/vyper_json/test_output_dict.py
+++ /dev/null
@@ -1,38 +0,0 @@
-#!/usr/bin/env python3
-
-import vyper
-from vyper.cli.vyper_json import format_to_output_dict
-from vyper.compiler import OUTPUT_FORMATS, compile_codes
-
-FOO_CODE = """
-@external
-def foo() -> bool:
-    return True
-"""
-
-
-def test_keys():
-    compiler_data = compile_codes({"foo.vy": FOO_CODE}, output_formats=list(OUTPUT_FORMATS.keys()))
-    output_json = format_to_output_dict(compiler_data)
-    assert sorted(output_json.keys()) == ["compiler", "contracts", "sources"]
-    assert output_json["compiler"] == f"vyper-{vyper.__version__}"
-    data = compiler_data["foo.vy"]
-    assert output_json["sources"]["foo.vy"] == {"id": 0, "ast": data["ast_dict"]["ast"]}
-    assert output_json["contracts"]["foo.vy"]["foo"] == {
-        "abi": data["abi"],
-        "devdoc": data["devdoc"],
-        "interface": data["interface"],
-        "ir": data["ir_dict"],
-        "userdoc": data["userdoc"],
-        "metadata": data["metadata"],
-        "evm": {
-            "bytecode": {"object": data["bytecode"], "opcodes": data["opcodes"]},
-            "deployedBytecode": {
-                "object": data["bytecode_runtime"],
-                "opcodes": data["opcodes_runtime"],
-                "sourceMap": data["source_map"]["pc_pos_map_compressed"],
-                "sourceMapFull": data["source_map_full"],
-            },
-            "methodIdentifiers": data["method_identifiers"],
-        },
-    }
diff --git a/tests/cli/vyper_json/test_output_selection.py b/tests/cli/vyper_json/test_output_selection.py
index 3b12e2b54a..78ad7404f2 100644
--- a/tests/cli/vyper_json/test_output_selection.py
+++ b/tests/cli/vyper_json/test_output_selection.py
@@ -1,60 +1,60 @@
-#!/usr/bin/env python3
+from pathlib import PurePath
 
 import pytest
 
-from vyper.cli.vyper_json import TRANSLATE_MAP, get_input_dict_output_formats
+from vyper.cli.vyper_json import TRANSLATE_MAP, get_output_formats
 from vyper.exceptions import JSONError
 
 
 def test_no_outputs():
     with pytest.raises(KeyError):
-        get_input_dict_output_formats({}, {})
+        get_output_formats({}, {})
 
 
 def test_invalid_output():
     input_json = {"settings": {"outputSelection": {"foo.vy": ["abi", "foobar"]}}}
-    sources = {"foo.vy": ""}
+    targets = [PurePath("foo.vy")]
     with pytest.raises(JSONError):
-        get_input_dict_output_formats(input_json, sources)
+        get_output_formats(input_json, targets)
 
 
 def test_unknown_contract():
     input_json = {"settings": {"outputSelection": {"bar.vy": ["abi"]}}}
-    sources = {"foo.vy": ""}
+    targets = [PurePath("foo.vy")]
     with pytest.raises(JSONError):
-        get_input_dict_output_formats(input_json, sources)
+        get_output_formats(input_json, targets)
 
 
 @pytest.mark.parametrize("output", TRANSLATE_MAP.items())
 def test_translate_map(output):
     input_json = {"settings": {"outputSelection": {"foo.vy": [output[0]]}}}
-    sources = {"foo.vy": ""}
-    assert get_input_dict_output_formats(input_json, sources) == {"foo.vy": [output[1]]}
+    targets = [PurePath("foo.vy")]
+    assert get_output_formats(input_json, targets) == {PurePath("foo.vy"): [output[1]]}
 
 
 def test_star():
     input_json = {"settings": {"outputSelection": {"*": ["*"]}}}
-    sources = {"foo.vy": "", "bar.vy": ""}
+    targets = [PurePath("foo.vy"), PurePath("bar.vy")]
     expected = sorted(set(TRANSLATE_MAP.values()))
-    result = get_input_dict_output_formats(input_json, sources)
-    assert result == {"foo.vy": expected, "bar.vy": expected}
+    result = get_output_formats(input_json, targets)
+    assert result == {PurePath("foo.vy"): expected, PurePath("bar.vy"): expected}
 
 
 def test_evm():
     input_json = {"settings": {"outputSelection": {"foo.vy": ["abi", "evm"]}}}
-    sources = {"foo.vy": ""}
+    targets = [PurePath("foo.vy")]
     expected = ["abi"] + sorted(v for k, v in TRANSLATE_MAP.items() if k.startswith("evm"))
-    result = get_input_dict_output_formats(input_json, sources)
-    assert result == {"foo.vy": expected}
+    result = get_output_formats(input_json, targets)
+    assert result == {PurePath("foo.vy"): expected}
 
 
 def test_solc_style():
     input_json = {"settings": {"outputSelection": {"foo.vy": {"": ["abi"], "foo.vy": ["ir"]}}}}
-    sources = {"foo.vy": ""}
-    assert get_input_dict_output_formats(input_json, sources) == {"foo.vy": ["abi", "ir_dict"]}
+    targets = [PurePath("foo.vy")]
+    assert get_output_formats(input_json, targets) == {PurePath("foo.vy"): ["abi", "ir_dict"]}
 
 
 def test_metadata():
     input_json = {"settings": {"outputSelection": {"*": ["metadata"]}}}
-    sources = {"foo.vy": ""}
-    assert get_input_dict_output_formats(input_json, sources) == {"foo.vy": ["metadata"]}
+    targets = [PurePath("foo.vy")]
+    assert get_output_formats(input_json, targets) == {PurePath("foo.vy"): ["metadata"]}
diff --git a/tests/cli/vyper_json/test_parse_args_vyperjson.py b/tests/cli/vyper_json/test_parse_args_vyperjson.py
index 11e527843a..3b0f700c7e 100644
--- a/tests/cli/vyper_json/test_parse_args_vyperjson.py
+++ b/tests/cli/vyper_json/test_parse_args_vyperjson.py
@@ -29,7 +29,6 @@ def bar(a: uint256) -> bool:
         "inputs": [{"type": "uint256", "name": "a"}],
         "stateMutability": "nonpayable",
         "type": "function",
-        "gas": 313,
     }
 ]
 
@@ -39,7 +38,7 @@ def bar(a: uint256) -> bool:
         "contracts/foo.vy": {"content": FOO_CODE},
         "contracts/bar.vy": {"content": BAR_CODE},
     },
-    "interfaces": {"contracts/bar.json": {"abi": BAR_ABI}},
+    "interfaces": {"contracts/ibar.json": {"abi": BAR_ABI}},
     "settings": {"outputSelection": {"*": ["*"]}},
 }
 
diff --git a/tests/compiler/test_bytecode_runtime.py b/tests/compiler/test_bytecode_runtime.py
index 9519b03772..613ee4d2b8 100644
--- a/tests/compiler/test_bytecode_runtime.py
+++ b/tests/compiler/test_bytecode_runtime.py
@@ -48,14 +48,14 @@ def _parse_cbor_metadata(initcode):
 
 
 def test_bytecode_runtime():
-    out = vyper.compile_code(simple_contract_code, ["bytecode_runtime", "bytecode"])
+    out = vyper.compile_code(simple_contract_code, output_formats=["bytecode_runtime", "bytecode"])
 
     assert len(out["bytecode"]) > len(out["bytecode_runtime"])
     assert out["bytecode_runtime"].removeprefix("0x") in out["bytecode"].removeprefix("0x")
 
 
 def test_bytecode_signature():
-    out = vyper.compile_code(simple_contract_code, ["bytecode_runtime", "bytecode"])
+    out = vyper.compile_code(simple_contract_code, output_formats=["bytecode_runtime", "bytecode"])
 
     runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
     initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
@@ -72,7 +72,9 @@ def test_bytecode_signature():
 def test_bytecode_signature_dense_jumptable():
     settings = Settings(optimize=OptimizationLevel.CODESIZE)
 
-    out = vyper.compile_code(many_functions, ["bytecode_runtime", "bytecode"], settings=settings)
+    out = vyper.compile_code(
+        many_functions, output_formats=["bytecode_runtime", "bytecode"], settings=settings
+    )
 
     runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
     initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
@@ -89,7 +91,9 @@ def test_bytecode_signature_dense_jumptable():
 def test_bytecode_signature_sparse_jumptable():
     settings = Settings(optimize=OptimizationLevel.GAS)
 
-    out = vyper.compile_code(many_functions, ["bytecode_runtime", "bytecode"], settings=settings)
+    out = vyper.compile_code(
+        many_functions, output_formats=["bytecode_runtime", "bytecode"], settings=settings
+    )
 
     runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
     initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
@@ -104,7 +108,7 @@ def test_bytecode_signature_sparse_jumptable():
 
 
 def test_bytecode_signature_immutables():
-    out = vyper.compile_code(has_immutables, ["bytecode_runtime", "bytecode"])
+    out = vyper.compile_code(has_immutables, output_formats=["bytecode_runtime", "bytecode"])
 
     runtime_code = bytes.fromhex(out["bytecode_runtime"].removeprefix("0x"))
     initcode = bytes.fromhex(out["bytecode"].removeprefix("0x"))
diff --git a/tests/compiler/test_compile_code.py b/tests/compiler/test_compile_code.py
index cdbf9d1f52..7af133e362 100644
--- a/tests/compiler/test_compile_code.py
+++ b/tests/compiler/test_compile_code.py
@@ -11,4 +11,4 @@ def a() -> bool:
     return True
 """
     with pytest.warns(vyper.warnings.ContractSizeLimitWarning):
-        vyper.compile_code(code, ["bytecode_runtime"])
+        vyper.compile_code(code, output_formats=["bytecode_runtime"])
diff --git a/tests/compiler/test_input_bundle.py b/tests/compiler/test_input_bundle.py
new file mode 100644
index 0000000000..c49c81219b
--- /dev/null
+++ b/tests/compiler/test_input_bundle.py
@@ -0,0 +1,208 @@
+import json
+from pathlib import Path, PurePath
+
+import pytest
+
+from vyper.compiler.input_bundle import ABIInput, FileInput, FilesystemInputBundle, JSONInputBundle
+
+
+# FilesystemInputBundle which uses same search path as make_file
+@pytest.fixture
+def input_bundle(tmp_path):
+    return FilesystemInputBundle([tmp_path])
+
+
+def test_load_file(make_file, input_bundle, tmp_path):
+    make_file("foo.vy", "contents")
+
+    file = input_bundle.load_file(Path("foo.vy"))
+
+    assert isinstance(file, FileInput)
+    assert file == FileInput(0, tmp_path / Path("foo.vy"), "contents")
+
+
+def test_search_path_context_manager(make_file, tmp_path):
+    ib = FilesystemInputBundle([])
+
+    make_file("foo.vy", "contents")
+
+    with pytest.raises(FileNotFoundError):
+        # no search path given
+        ib.load_file(Path("foo.vy"))
+
+    with ib.search_path(tmp_path):
+        file = ib.load_file(Path("foo.vy"))
+
+    assert isinstance(file, FileInput)
+    assert file == FileInput(0, tmp_path / Path("foo.vy"), "contents")
+
+
+def test_search_path_precedence(make_file, tmp_path, tmp_path_factory, input_bundle):
+    # test search path precedence.
+    # most recent search path is the highest precedence
+    tmpdir = tmp_path_factory.mktemp("some_directory")
+    tmpdir2 = tmp_path_factory.mktemp("some_other_directory")
+
+    for i, directory in enumerate([tmp_path, tmpdir, tmpdir2]):
+        with (directory / "foo.vy").open("w") as f:
+            f.write(f"contents {i}")
+
+    ib = FilesystemInputBundle([tmp_path, tmpdir, tmpdir2])
+
+    file = ib.load_file("foo.vy")
+
+    assert isinstance(file, FileInput)
+    assert file == FileInput(0, tmpdir2 / "foo.vy", "contents 2")
+
+    with ib.search_path(tmpdir):
+        file = ib.load_file("foo.vy")
+
+        assert isinstance(file, FileInput)
+        assert file == FileInput(1, tmpdir / "foo.vy", "contents 1")
+
+
+# special rules for handling json files
+def test_load_abi(make_file, input_bundle, tmp_path):
+    contents = json.dumps("some string")
+
+    make_file("foo.json", contents)
+
+    file = input_bundle.load_file("foo.json")
+    assert isinstance(file, ABIInput)
+    assert file == ABIInput(0, tmp_path / "foo.json", "some string")
+
+    # suffix doesn't matter
+    make_file("foo.txt", contents)
+
+    file = input_bundle.load_file("foo.txt")
+    assert isinstance(file, ABIInput)
+    assert file == ABIInput(1, tmp_path / "foo.txt", "some string")
+
+
+# check that unique paths give unique source ids
+def test_source_id_file_input(make_file, input_bundle, tmp_path):
+    make_file("foo.vy", "contents")
+    make_file("bar.vy", "contents 2")
+
+    file = input_bundle.load_file("foo.vy")
+    assert file.source_id == 0
+    assert file == FileInput(0, tmp_path / "foo.vy", "contents")
+
+    file2 = input_bundle.load_file("bar.vy")
+    # source id increments
+    assert file2.source_id == 1
+    assert file2 == FileInput(1, tmp_path / "bar.vy", "contents 2")
+
+    file3 = input_bundle.load_file("foo.vy")
+    assert file3.source_id == 0
+    assert file3 == FileInput(0, tmp_path / "foo.vy", "contents")
+
+
+# check that unique paths give unique source ids
+def test_source_id_json_input(make_file, input_bundle, tmp_path):
+    contents = json.dumps("some string")
+    contents2 = json.dumps(["some list"])
+
+    make_file("foo.json", contents)
+
+    make_file("bar.json", contents2)
+
+    file = input_bundle.load_file("foo.json")
+    assert isinstance(file, ABIInput)
+    assert file == ABIInput(0, tmp_path / "foo.json", "some string")
+
+    file2 = input_bundle.load_file("bar.json")
+    assert isinstance(file2, ABIInput)
+    assert file2 == ABIInput(1, tmp_path / "bar.json", ["some list"])
+
+    file3 = input_bundle.load_file("foo.json")
+    assert isinstance(file3, ABIInput)
+    assert file3 == ABIInput(0, tmp_path / "foo.json", "some string")
+
+
+# test some pathological case where the file changes underneath
+def test_mutating_file_source_id(make_file, input_bundle, tmp_path):
+    make_file("foo.vy", "contents")
+
+    file = input_bundle.load_file("foo.vy")
+    assert file.source_id == 0
+    assert file == FileInput(0, tmp_path / "foo.vy", "contents")
+
+    make_file("foo.vy", "new contents")
+
+    file = input_bundle.load_file("foo.vy")
+    # source id hasn't changed, even though contents have
+    assert file.source_id == 0
+    assert file == FileInput(0, tmp_path / "foo.vy", "new contents")
+
+
+# test the os.normpath behavior of symlink
+# (slightly pathological, for illustration's sake)
+def test_load_file_symlink(make_file, input_bundle, tmp_path, tmp_path_factory):
+    dir1 = tmp_path / "first"
+    dir2 = tmp_path / "second"
+    symlink = tmp_path / "symlink"
+
+    dir1.mkdir()
+    dir2.mkdir()
+    symlink.symlink_to(dir2, target_is_directory=True)
+
+    with (tmp_path / "foo.vy").open("w") as f:
+        f.write("contents of the upper directory")
+
+    with (dir1 / "foo.vy").open("w") as f:
+        f.write("contents of the inner directory")
+
+    # symlink rules would be:
+    # base/symlink/../foo.vy =>
+    # base/first/second/../foo.vy =>
+    # base/first/foo.vy
+    # normpath would be base/symlink/../foo.vy =>
+    # base/foo.vy
+    file = input_bundle.load_file(symlink / ".." / "foo.vy")
+
+    assert file == FileInput(0, tmp_path / "foo.vy", "contents of the upper directory")
+
+
+def test_json_input_bundle_basic():
+    files = {PurePath("foo.vy"): {"content": "some text"}}
+    input_bundle = JSONInputBundle(files, [PurePath(".")])
+
+    file = input_bundle.load_file(PurePath("foo.vy"))
+    assert file == FileInput(0, PurePath("foo.vy"), "some text")
+
+
+def test_json_input_bundle_normpath():
+    files = {PurePath("foo/../bar.vy"): {"content": "some text"}}
+    input_bundle = JSONInputBundle(files, [PurePath(".")])
+
+    expected = FileInput(0, PurePath("bar.vy"), "some text")
+
+    file = input_bundle.load_file(PurePath("bar.vy"))
+    assert file == expected
+
+    file = input_bundle.load_file(PurePath("baz/../bar.vy"))
+    assert file == expected
+
+    file = input_bundle.load_file(PurePath("./bar.vy"))
+    assert file == expected
+
+    with input_bundle.search_path(PurePath("foo")):
+        file = input_bundle.load_file(PurePath("../bar.vy"))
+        assert file == expected
+
+
+def test_json_input_abi():
+    some_abi = ["some abi"]
+    some_abi_str = json.dumps(some_abi)
+    files = {
+        PurePath("foo.json"): {"abi": some_abi},
+        PurePath("bar.txt"): {"content": some_abi_str},
+    }
+    input_bundle = JSONInputBundle(files, [PurePath(".")])
+
+    file = input_bundle.load_file(PurePath("foo.json"))
+    assert file == ABIInput(0, PurePath("foo.json"), some_abi)
+
+    file = input_bundle.load_file(PurePath("bar.txt"))
+    assert file == ABIInput(1, PurePath("bar.txt"), some_abi)
diff --git a/tests/compiler/test_opcodes.py b/tests/compiler/test_opcodes.py
index 20f45ced6b..15d2a617ba 100644
--- a/tests/compiler/test_opcodes.py
+++ b/tests/compiler/test_opcodes.py
@@ -22,7 +22,7 @@ def a() -> bool:
     return True
     """
 
-    out = vyper.compile_code(code, ["opcodes_runtime", "opcodes"])
+    out = vyper.compile_code(code, output_formats=["opcodes_runtime", "opcodes"])
 
     assert len(out["opcodes"]) > len(out["opcodes_runtime"])
     assert out["opcodes_runtime"] in out["opcodes"]
diff --git a/tests/compiler/test_source_map.py b/tests/compiler/test_source_map.py
index 886596bb80..c9a152b09c 100644
--- a/tests/compiler/test_source_map.py
+++ b/tests/compiler/test_source_map.py
@@ -28,7 +28,7 @@ def foo(a: uint256) -> int128:
 
 
 def test_jump_map():
-    source_map = compile_code(TEST_CODE, ["source_map"])["source_map"]
+    source_map = compile_code(TEST_CODE, output_formats=["source_map"])["source_map"]
     pos_map = source_map["pc_pos_map"]
     jump_map = source_map["pc_jump_map"]
 
@@ -46,7 +46,7 @@ def test_jump_map():
 
 
 def test_pos_map_offsets():
-    source_map = compile_code(TEST_CODE, ["source_map"])["source_map"]
+    source_map = compile_code(TEST_CODE, output_formats=["source_map"])["source_map"]
     expanded = expand_source_map(source_map["pc_pos_map_compressed"])
 
     pc_iter = iter(source_map["pc_pos_map"][i] for i in sorted(source_map["pc_pos_map"]))
@@ -76,7 +76,7 @@ def test_error_map():
 def update_foo():
     self.foo += 1
     """
-    error_map = compile_code(code, ["source_map"])["source_map"]["error_map"]
+    error_map = compile_code(code, output_formats=["source_map"])["source_map"]["error_map"]
     assert "safeadd" in list(error_map.values())
     assert "fallback function" in list(error_map.values())
 
diff --git a/tests/conftest.py b/tests/conftest.py
index c9d3f794a0..9b10b7c51c 100644
--- a/tests/conftest.py
+++ b/tests/conftest.py
@@ -11,6 +11,7 @@
 
 from vyper import compiler
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.input_bundle import FilesystemInputBundle
 from vyper.compiler.settings import OptimizationLevel, _set_debug_mode
 from vyper.ir import compile_ir, optimizer
 
@@ -70,6 +71,34 @@ def keccak():
     return Web3.keccak
 
 
+@pytest.fixture
+def make_file(tmp_path):
+    # writes file_contents to file_name, creating it in the
+    # tmp_path directory. returns final path.
+    def fn(file_name, file_contents):
+        path = tmp_path / file_name
+        path.parent.mkdir(parents=True, exist_ok=True)
+        with path.open("w") as f:
+            f.write(file_contents)
+
+        return path
+
+    return fn
+
+
+# this can either be used for its side effects (to prepare a call
+# to get_contract), or the result can be provided directly to
+# compile_code / CompilerData.
+@pytest.fixture
+def make_input_bundle(tmp_path, make_file):
+    def fn(sources_dict):
+        for file_name, file_contents in sources_dict.items():
+            make_file(file_name, file_contents)
+        return FilesystemInputBundle([tmp_path])
+
+    return fn
+
+
 @pytest.fixture
 def bytes_helper():
     def bytes_helper(str, length):
diff --git a/tests/parser/ast_utils/test_ast_dict.py b/tests/parser/ast_utils/test_ast_dict.py
index f483d0cbe8..1f60c9ac8b 100644
--- a/tests/parser/ast_utils/test_ast_dict.py
+++ b/tests/parser/ast_utils/test_ast_dict.py
@@ -19,7 +19,7 @@ def get_node_ids(ast_struct, ids=None):
         elif v is None or isinstance(v, (str, int)):
             continue
         else:
-            raise Exception("Unknown ast_struct provided.")
+            raise Exception(f"Unknown ast_struct provided. {k}, {v}")
     return ids
 
 
@@ -30,7 +30,7 @@ def test() -> int128:
     a: uint256 = 100
     return 123
     """
-    dict_out = compiler.compile_code(code, ["ast_dict"])
+    dict_out = compiler.compile_code(code, output_formats=["ast_dict"])
     node_ids = get_node_ids(dict_out)
 
     assert len(node_ids) == len(set(node_ids))
@@ -40,7 +40,7 @@ def test_basic_ast():
     code = """
 a: int128
     """
-    dict_out = compiler.compile_code(code, ["ast_dict"])
+    dict_out = compiler.compile_code(code, output_formats=["ast_dict"])
     assert dict_out["ast_dict"]["ast"]["body"][0] == {
         "annotation": {
             "ast_type": "Name",
@@ -89,7 +89,7 @@ def foo() -> uint256: view
 def foo() -> uint256:
     return 1
     """
-    dict_out = compiler.compile_code(code, ["ast_dict"])
+    dict_out = compiler.compile_code(code, output_formats=["ast_dict"])
     assert dict_out["ast_dict"]["ast"]["body"][1] == {
         "col_offset": 0,
         "annotation": {
diff --git a/tests/parser/features/test_init.py b/tests/parser/features/test_init.py
index 83bcbc95ea..29a466e869 100644
--- a/tests/parser/features/test_init.py
+++ b/tests/parser/features/test_init.py
@@ -15,7 +15,7 @@ def __init__(a: uint256):
     assert c.val() == 123
 
     # Make sure the init code does not access calldata
-    assembly = vyper.compile_code(code, ["asm"])["asm"].split(" ")
+    assembly = vyper.compile_code(code, output_formats=["asm"])["asm"].split(" ")
     ir_return_idx_start = assembly.index("{")
     ir_return_idx_end = assembly.index("}")
 
diff --git a/tests/parser/functions/test_bitwise.py b/tests/parser/functions/test_bitwise.py
index 3ba74034ac..1d62a5be79 100644
--- a/tests/parser/functions/test_bitwise.py
+++ b/tests/parser/functions/test_bitwise.py
@@ -32,7 +32,7 @@ def _shr(x: uint256, y: uint256) -> uint256:
 
 
 def test_bitwise_opcodes():
-    opcodes = compile_code(code, ["opcodes"])["opcodes"]
+    opcodes = compile_code(code, output_formats=["opcodes"])["opcodes"]
     assert "SHL" in opcodes
     assert "SHR" in opcodes
 
diff --git a/tests/parser/functions/test_interfaces.py b/tests/parser/functions/test_interfaces.py
index c16e188cfd..8cb0124f29 100644
--- a/tests/parser/functions/test_interfaces.py
+++ b/tests/parser/functions/test_interfaces.py
@@ -1,10 +1,15 @@
+import json
 from decimal import Decimal
 
 import pytest
 
-from vyper.cli.utils import extract_file_interface_imports
-from vyper.compiler import compile_code, compile_codes
-from vyper.exceptions import ArgumentException, InterfaceViolation, StructureException
+from vyper.compiler import compile_code
+from vyper.exceptions import (
+    ArgumentException,
+    InterfaceViolation,
+    NamespaceCollision,
+    StructureException,
+)
 
 
 def test_basic_extract_interface():
@@ -24,7 +29,7 @@ def allowance(_owner: address, _spender: address) -> (uint256, uint256):
     return 1, 2
     """
 
-    out = compile_code(code, ["interface"])
+    out = compile_code(code, output_formats=["interface"])
     out = out["interface"]
     code_pass = "\n".join(code.split("\n")[:-2] + ["    pass"])  # replace with a pass statement.
 
@@ -55,8 +60,9 @@ def allowance(_owner: address, _spender: address) -> (uint256, uint256): view
     def test(_owner: address): nonpayable
     """
 
-    out = compile_codes({"one.vy": code}, ["external_interface"])["one.vy"]
-    out = out["external_interface"]
+    out = compile_code(code, contract_name="One.vy", output_formats=["external_interface"])[
+        "external_interface"
+    ]
 
     assert interface.strip() == out.strip()
 
@@ -75,7 +81,7 @@ def test() -> bool:
     assert_compile_failed(lambda: compile_code(code), InterfaceViolation)
 
 
-def test_external_interface_parsing(assert_compile_failed):
+def test_external_interface_parsing(make_input_bundle, assert_compile_failed):
     interface_code = """
 @external
 def foo() -> uint256:
@@ -86,7 +92,7 @@ def bar() -> uint256:
     pass
     """
 
-    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
     code = """
 import a as FooBarInterface
@@ -102,7 +108,7 @@ def bar() -> uint256:
     return 2
     """
 
-    assert compile_code(code, interface_codes=interface_codes)
+    assert compile_code(code, input_bundle=input_bundle)
 
     not_implemented_code = """
 import a as FooBarInterface
@@ -116,18 +122,17 @@ def foo() -> uint256:
     """
 
     assert_compile_failed(
-        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
-        InterfaceViolation,
+        lambda: compile_code(not_implemented_code, input_bundle=input_bundle), InterfaceViolation
     )
 
 
-def test_missing_event(assert_compile_failed):
+def test_missing_event(make_input_bundle, assert_compile_failed):
     interface_code = """
 event Foo:
     a: uint256
     """
 
-    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
     not_implemented_code = """
 import a as FooBarInterface
@@ -140,19 +145,18 @@ def bar() -> uint256:
     """
 
     assert_compile_failed(
-        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
-        InterfaceViolation,
+        lambda: compile_code(not_implemented_code, input_bundle=input_bundle), InterfaceViolation
     )
 
 
 # check that event types match
-def test_malformed_event(assert_compile_failed):
+def test_malformed_event(make_input_bundle, assert_compile_failed):
     interface_code = """
 event Foo:
     a: uint256
     """
 
-    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
     not_implemented_code = """
 import a as FooBarInterface
@@ -168,19 +172,18 @@ def bar() -> uint256:
     """
 
     assert_compile_failed(
-        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
-        InterfaceViolation,
+        lambda: compile_code(not_implemented_code, input_bundle=input_bundle), InterfaceViolation
     )
 
 
 # check that event non-indexed arg needs to match interface
-def test_malformed_events_indexed(assert_compile_failed):
+def test_malformed_events_indexed(make_input_bundle, assert_compile_failed):
     interface_code = """
 event Foo:
     a: uint256
     """
 
-    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
     not_implemented_code = """
 import a as FooBarInterface
@@ -197,19 +200,18 @@ def bar() -> uint256:
     """
 
     assert_compile_failed(
-        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
-        InterfaceViolation,
+        lambda: compile_code(not_implemented_code, input_bundle=input_bundle), InterfaceViolation
     )
 
 
 # check that event indexed arg needs to match interface
-def test_malformed_events_indexed2(assert_compile_failed):
+def test_malformed_events_indexed2(make_input_bundle, assert_compile_failed):
     interface_code = """
 event Foo:
     a: indexed(uint256)
     """
 
-    interface_codes = {"FooBarInterface": {"type": "vyper", "code": interface_code}}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
     not_implemented_code = """
 import a as FooBarInterface
@@ -226,43 +228,47 @@ def bar() -> uint256:
     """
 
     assert_compile_failed(
-        lambda: compile_code(not_implemented_code, interface_codes=interface_codes),
-        InterfaceViolation,
+        lambda: compile_code(not_implemented_code, input_bundle=input_bundle), InterfaceViolation
     )
 
 
 VALID_IMPORT_CODE = [
     # import statement, import path without suffix
-    ("import a as Foo", "a"),
-    ("import b.a as Foo", "b/a"),
-    ("import Foo as Foo", "Foo"),
-    ("from a import Foo", "a/Foo"),
-    ("from b.a import Foo", "b/a/Foo"),
-    ("from .a import Foo", "./a/Foo"),
-    ("from ..a import Foo", "../a/Foo"),
+    ("import a as Foo", "a.vy"),
+    ("import b.a as Foo", "b/a.vy"),
+    ("import Foo as Foo", "Foo.vy"),
+    ("from a import Foo", "a/Foo.vy"),
+    ("from b.a import Foo", "b/a/Foo.vy"),
+    ("from .a import Foo", "./a/Foo.vy"),
+    ("from ..a import Foo", "../a/Foo.vy"),
 ]
 
 
-@pytest.mark.parametrize("code", VALID_IMPORT_CODE)
-def test_extract_file_interface_imports(code):
-    assert extract_file_interface_imports(code[0]) == {"Foo": code[1]}
+@pytest.mark.parametrize("code,filename", VALID_IMPORT_CODE)
+def test_extract_file_interface_imports(code, filename, make_input_bundle):
+    input_bundle = make_input_bundle({filename: ""})
+
+    assert compile_code(code, input_bundle=input_bundle) is not None
 
 
 BAD_IMPORT_CODE = [
-    "import a",  # must alias absolute imports
-    "import a as A\nimport a as A",  # namespace collisions
-    "from b import a\nfrom a import a",
-    "from . import a\nimport a as a",
-    "import a as a\nfrom . import a",
+    ("import a", StructureException),  # must alias absolute imports
+    ("import a as A\nimport a as A", NamespaceCollision),
+    ("from b import a\nfrom . import a", NamespaceCollision),
+    ("from . import a\nimport a as a", NamespaceCollision),
+    ("import a as a\nfrom . import a", NamespaceCollision),
 ]
 
 
-@pytest.mark.parametrize("code", BAD_IMPORT_CODE)
-def test_extract_file_interface_imports_raises(code, assert_compile_failed):
-    assert_compile_failed(lambda: extract_file_interface_imports(code), StructureException)
+@pytest.mark.parametrize("code,exception_type", BAD_IMPORT_CODE)
+def test_extract_file_interface_imports_raises(
+    code, exception_type, assert_compile_failed, make_input_bundle
+):
+    input_bundle = make_input_bundle({"a.vy": "", "b/a.vy": ""})  # dummy
+    assert_compile_failed(lambda: compile_code(code, input_bundle=input_bundle), exception_type)
 
 
-def test_external_call_to_interface(w3, get_contract):
+def test_external_call_to_interface(w3, get_contract, make_input_bundle):
     token_code = """
 balanceOf: public(HashMap[address, uint256])
 
@@ -271,6 +277,8 @@ def transfer(to: address, _value: uint256):
     self.balanceOf[to] += _value
     """
 
+    input_bundle = make_input_bundle({"one.vy": token_code})
+
     code = """
 import one as TokenCode
 
@@ -292,9 +300,7 @@ def test():
     """
 
     erc20 = get_contract(token_code)
-    test_c = get_contract(
-        code, *[erc20.address], interface_codes={"TokenCode": {"type": "vyper", "code": token_code}}
-    )
+    test_c = get_contract(code, *[erc20.address], input_bundle=input_bundle)
 
     sender = w3.eth.accounts[0]
     assert erc20.balanceOf(sender) == 0
@@ -313,7 +319,7 @@ def test():
         ("epsilon(decimal)", "decimal", Decimal("1E-10")),
     ],
 )
-def test_external_call_to_interface_kwarg(get_contract, kwarg, typ, expected):
+def test_external_call_to_interface_kwarg(get_contract, kwarg, typ, expected, make_input_bundle):
     code_a = f"""
 @external
 @view
@@ -321,6 +327,8 @@ def foo(_max: {typ} = {kwarg}) -> {typ}:
     return _max
     """
 
+    input_bundle = make_input_bundle({"one.vy": code_a})
+
     code_b = f"""
 import one as ContractA
 
@@ -331,11 +339,7 @@ def bar(a_address: address) -> {typ}:
     """
 
     contract_a = get_contract(code_a)
-    contract_b = get_contract(
-        code_b,
-        *[contract_a.address],
-        interface_codes={"ContractA": {"type": "vyper", "code": code_a}},
-    )
+    contract_b = get_contract(code_b, *[contract_a.address], input_bundle=input_bundle)
 
     assert contract_b.bar(contract_a.address) == expected
 
@@ -368,9 +372,7 @@ def test():
     """
 
     erc20 = get_contract(token_code)
-    test_c = get_contract(
-        code, *[erc20.address], interface_codes={"TokenCode": {"type": "vyper", "code": token_code}}
-    )
+    test_c = get_contract(code, *[erc20.address])
 
     sender = w3.eth.accounts[0]
     assert erc20.balanceOf(sender) == 0
@@ -440,11 +442,7 @@ def test_fail3() -> int256:
     """
 
     bad_c = get_contract(external_contract)
-    c = get_contract(
-        code,
-        bad_c.address,
-        interface_codes={"BadCode": {"type": "vyper", "code": external_contract}},
-    )
+    c = get_contract(code, bad_c.address)
     assert bad_c.ok() == 1
     assert bad_c.should_fail() == -(2**255)
 
@@ -502,7 +500,9 @@ def test_fail2() -> Bytes[3]:
 
 
 # test data returned from external interface gets clamped
-def test_json_abi_bytes_clampers(get_contract, assert_tx_failed, assert_compile_failed):
+def test_json_abi_bytes_clampers(
+    get_contract, assert_tx_failed, assert_compile_failed, make_input_bundle
+):
     external_contract = """
 @external
 def returns_Bytes3() -> Bytes[3]:
@@ -546,18 +546,15 @@ def test_fail3() -> Bytes[3]:
     """
 
     bad_c = get_contract(external_contract)
-    bad_c_interface = {
-        "BadJSONInterface": {
-            "type": "json",
-            "code": compile_code(external_contract, ["abi"])["abi"],
-        }
-    }
+
+    bad_json_interface = json.dumps(compile_code(external_contract, output_formats=["abi"])["abi"])
+    input_bundle = make_input_bundle({"BadJSONInterface.json": bad_json_interface})
 
     assert_compile_failed(
-        lambda: get_contract(should_not_compile, interface_codes=bad_c_interface), ArgumentException
+        lambda: get_contract(should_not_compile, input_bundle=input_bundle), ArgumentException
     )
 
-    c = get_contract(code, bad_c.address, interface_codes=bad_c_interface)
+    c = get_contract(code, bad_c.address, input_bundle=input_bundle)
     assert bad_c.returns_Bytes3() == b"123"
 
     assert_tx_failed(lambda: c.test_fail1())
@@ -565,7 +562,7 @@ def test_fail3() -> Bytes[3]:
     assert_tx_failed(lambda: c.test_fail3())
 
 
-def test_units_interface(w3, get_contract):
+def test_units_interface(w3, get_contract, make_input_bundle):
     code = """
 import balanceof as BalanceOf
 
@@ -576,49 +573,41 @@ def test_units_interface(w3, get_contract):
 def balanceOf(owner: address) -> uint256:
     return as_wei_value(1, "ether")
     """
+
     interface_code = """
 @external
 @view
 def balanceOf(owner: address) -> uint256:
     pass
     """
-    interface_codes = {"BalanceOf": {"type": "vyper", "code": interface_code}}
-    c = get_contract(code, interface_codes=interface_codes)
+
+    input_bundle = make_input_bundle({"balanceof.vy": interface_code})
+
+    c = get_contract(code, input_bundle=input_bundle)
 
     assert c.balanceOf(w3.eth.accounts[0]) == w3.to_wei(1, "ether")
 
 
-def test_local_and_global_interface_namespaces():
+def test_simple_implements(make_input_bundle):
     interface_code = """
 @external
 def foo() -> uint256:
     pass
     """
 
-    global_interface_codes = {
-        "FooInterface": {"type": "vyper", "code": interface_code},
-        "BarInterface": {"type": "vyper", "code": interface_code},
-    }
-    local_interface_codes = {
-        "FooContract": {"FooInterface": {"type": "vyper", "code": interface_code}},
-        "BarContract": {"BarInterface": {"type": "vyper", "code": interface_code}},
-    }
-
     code = """
-import a as {0}
+import a as FooInterface
 
-implements: {0}
+implements: FooInterface
 
 @external
 def foo() -> uint256:
     return 1
     """
 
-    codes = {"FooContract": code.format("FooInterface"), "BarContract": code.format("BarInterface")}
+    input_bundle = make_input_bundle({"a.vy": interface_code})
 
-    global_compiled = compile_codes(codes, interface_codes=global_interface_codes)
-    local_compiled = compile_codes(codes, interface_codes=local_interface_codes)
-    assert global_compiled == local_compiled
+    assert compile_code(code, input_bundle=input_bundle) is not None
 
 
 def test_self_interface_is_allowed(get_contract):
@@ -724,20 +713,28 @@ def convert_v1_abi(abi):
 
 
 @pytest.mark.parametrize("type_str", [i[0] for i in type_str_params])
-def test_json_interface_implements(type_str):
+def test_json_interface_implements(type_str, make_input_bundle, make_file):
     code = interface_test_code.format(type_str)
 
-    abi = compile_code(code, ["abi"])["abi"]
+    abi = compile_code(code, output_formats=["abi"])["abi"]
+
     code = f"import jsonabi as jsonabi\nimplements: jsonabi\n{code}"
-    compile_code(code, interface_codes={"jsonabi": {"type": "json", "code": abi}})
-    compile_code(code, interface_codes={"jsonabi": {"type": "json", "code": convert_v1_abi(abi)}})
+
+    input_bundle = make_input_bundle({"jsonabi.json": json.dumps(abi)})
+
+    compile_code(code, input_bundle=input_bundle)
+
+    # !!! overwrite the file
+    make_file("jsonabi.json", json.dumps(convert_v1_abi(abi)))
+
+    compile_code(code, input_bundle=input_bundle)
 
 
 @pytest.mark.parametrize("type_str,value", type_str_params)
-def test_json_interface_calls(get_contract, type_str, value):
+def test_json_interface_calls(get_contract, type_str, value, make_input_bundle, make_file):
     code = interface_test_code.format(type_str)
 
-    abi = compile_code(code, ["abi"])["abi"]
+    abi = compile_code(code, output_formats=["abi"])["abi"]
     c1 = get_contract(code)
 
     code = f"""
@@ -748,9 +745,11 @@ def test_json_interface_calls(get_contract, type_str, value):
 def test_call(a: address, b: {type_str}) -> {type_str}:
     return jsonabi(a).test_json(b)
     """
-    c2 = get_contract(code, interface_codes={"jsonabi": {"type": "json", "code": abi}})
+    input_bundle = make_input_bundle({"jsonabi.json": json.dumps(abi)})
+
+    c2 = get_contract(code, input_bundle=input_bundle)
     assert c2.test_call(c1.address, value) == value
-    c3 = get_contract(
-        code, interface_codes={"jsonabi": {"type": "json", "code": convert_v1_abi(abi)}}
-    )
+
+    make_file("jsonabi.json", json.dumps(convert_v1_abi(abi)))
+    c3 = get_contract(code, input_bundle=input_bundle)
     assert c3.test_call(c1.address, value) == value
diff --git a/tests/parser/functions/test_raw_call.py b/tests/parser/functions/test_raw_call.py
index 81efe64a18..5bb23447e4 100644
--- a/tests/parser/functions/test_raw_call.py
+++ b/tests/parser/functions/test_raw_call.py
@@ -274,8 +274,8 @@ def test_raw_call(_target: address):
 def test_raw_call(_target: address):
     raw_call(_target, method_id("foo()"), max_outsize=0)
     """
-    output1 = compile_code(code1, ["bytecode", "bytecode_runtime"])
-    output2 = compile_code(code2, ["bytecode", "bytecode_runtime"])
+    output1 = compile_code(code1, output_formats=["bytecode", "bytecode_runtime"])
+    output2 = compile_code(code2, output_formats=["bytecode", "bytecode_runtime"])
     assert output1 == output2
 
 
@@ -296,8 +296,8 @@ def test_raw_call(_target: address) -> bool:
     a: bool = raw_call(_target, method_id("foo()"), max_outsize=0, revert_on_failure=False)
     return a
     """
-    output1 = compile_code(code1, ["bytecode", "bytecode_runtime"])
-    output2 = compile_code(code2, ["bytecode", "bytecode_runtime"])
+    output1 = compile_code(code1, output_formats=["bytecode", "bytecode_runtime"])
+    output2 = compile_code(code2, output_formats=["bytecode", "bytecode_runtime"])
     assert output1 == output2
 
 
diff --git a/tests/parser/functions/test_return_struct.py b/tests/parser/functions/test_return_struct.py
index 425caedb75..cdd8342d8a 100644
--- a/tests/parser/functions/test_return_struct.py
+++ b/tests/parser/functions/test_return_struct.py
@@ -17,7 +17,7 @@ def test() -> Voter:
     return a
     """
 
-    out = compile_code(code, ["abi"])
+    out = compile_code(code, output_formats=["abi"])
     abi = out["abi"][0]
 
     assert abi["name"] == "test"
@@ -38,7 +38,7 @@ def test() -> Voter:
     return a
     """
 
-    out = compile_code(code, ["abi"])
+    out = compile_code(code, output_formats=["abi"])
     abi = out["abi"][0]
 
     assert abi["name"] == "test"
diff --git a/tests/parser/syntax/test_codehash.py b/tests/parser/syntax/test_codehash.py
index 5074d14636..c2d9a2e274 100644
--- a/tests/parser/syntax/test_codehash.py
+++ b/tests/parser/syntax/test_codehash.py
@@ -33,7 +33,7 @@ def foo4() -> bytes32:
     return self.a.codehash
     """
     settings = Settings(evm_version=evm_version, optimize=optimize)
-    compiled = compile_code(code, ["bytecode_runtime"], settings=settings)
+    compiled = compile_code(code, output_formats=["bytecode_runtime"], settings=settings)
     bytecode = bytes.fromhex(compiled["bytecode_runtime"][2:])
     hash_ = keccak256(bytecode)
 
diff --git a/tests/parser/syntax/test_interfaces.py b/tests/parser/syntax/test_interfaces.py
index 498f1363d8..9100389dbd 100644
--- a/tests/parser/syntax/test_interfaces.py
+++ b/tests/parser/syntax/test_interfaces.py
@@ -374,7 +374,7 @@ def test_interfaces_success(good_code):
     assert compiler.compile_code(good_code) is not None
 
 
-def test_imports_and_implements_within_interface():
+def test_imports_and_implements_within_interface(make_input_bundle):
     interface_code = """
 from vyper.interfaces import ERC20
 import foo.bar as Baz
@@ -386,6 +386,8 @@ def foobar():
     pass
 """
 
+    input_bundle = make_input_bundle({"foo.vy": interface_code})
+
     code = """
 import foo as Foo
 
@@ -396,9 +398,4 @@ def foobar():
     pass
 """
 
-    assert (
-        compiler.compile_code(
-            code, interface_codes={"Foo": {"type": "vyper", "code": interface_code}}
-        )
-        is not None
-    )
+    assert compiler.compile_code(code, input_bundle=input_bundle) is not None
diff --git a/tests/parser/syntax/test_self_balance.py b/tests/parser/syntax/test_self_balance.py
index 63db58e347..d22d8a2750 100644
--- a/tests/parser/syntax/test_self_balance.py
+++ b/tests/parser/syntax/test_self_balance.py
@@ -20,7 +20,7 @@ def __default__():
     pass
     """
     settings = Settings(evm_version=evm_version)
-    opcodes = compiler.compile_code(code, ["opcodes"], settings=settings)["opcodes"]
+    opcodes = compiler.compile_code(code, output_formats=["opcodes"], settings=settings)["opcodes"]
     if EVM_VERSIONS[evm_version] >= EVM_VERSIONS["istanbul"]:
         assert "SELFBALANCE" in opcodes
     else:
diff --git a/tests/parser/test_selector_table_stability.py b/tests/parser/test_selector_table_stability.py
index abc2c17b8f..3302ff5009 100644
--- a/tests/parser/test_selector_table_stability.py
+++ b/tests/parser/test_selector_table_stability.py
@@ -8,7 +8,9 @@ def test_dense_jumptable_stability():
 
     code = "\n".join(f"@external\ndef {name}():\n  pass" for name in function_names)
 
-    output = compile_code(code, ["asm"], settings=Settings(optimize=OptimizationLevel.CODESIZE))
+    output = compile_code(
+        code, output_formats=["asm"], settings=Settings(optimize=OptimizationLevel.CODESIZE)
+    )
 
     # test that the selector table data is stable across different runs
     # (tox should provide different PYTHONHASHSEEDs).
diff --git a/tests/parser/types/numbers/test_constants.py b/tests/parser/types/numbers/test_constants.py
index 652c8e8bd9..25617651ec 100644
--- a/tests/parser/types/numbers/test_constants.py
+++ b/tests/parser/types/numbers/test_constants.py
@@ -206,7 +206,7 @@ def test() -> uint256:
     return ret
     """
 
-    ir = compile_code(code, ["ir"])["ir"]
+    ir = compile_code(code, output_formats=["ir"])["ir"]
     assert search_for_sublist(
         ir, ["mstore", [MemoryPositions.RESERVED_MEMORY], [2**12 * some_prime]]
     )
diff --git a/vyper/__init__.py b/vyper/__init__.py
index 35237bd044..482d5c3a60 100644
--- a/vyper/__init__.py
+++ b/vyper/__init__.py
@@ -1,6 +1,6 @@
 from pathlib import Path as _Path
 
-from vyper.compiler import compile_code, compile_codes  # noqa: F401
+from vyper.compiler import compile_code  # noqa: F401
 
 try:
     from importlib.metadata import PackageNotFoundError  # type: ignore
diff --git a/vyper/builtins/interfaces/ERC165.py b/vyper/builtins/interfaces/ERC165.vy
similarity index 75%
rename from vyper/builtins/interfaces/ERC165.py
rename to vyper/builtins/interfaces/ERC165.vy
index 0a75431f3c..a4ca451abd 100644
--- a/vyper/builtins/interfaces/ERC165.py
+++ b/vyper/builtins/interfaces/ERC165.vy
@@ -1,6 +1,4 @@
-interface_code = """
 @view
 @external
 def supportsInterface(interface_id: bytes4) -> bool:
     pass
-"""
diff --git a/vyper/builtins/interfaces/ERC20.py b/vyper/builtins/interfaces/ERC20.vy
similarity index 96%
rename from vyper/builtins/interfaces/ERC20.py
rename to vyper/builtins/interfaces/ERC20.vy
index a63408672b..065ca97a9b 100644
--- a/vyper/builtins/interfaces/ERC20.py
+++ b/vyper/builtins/interfaces/ERC20.vy
@@ -1,4 +1,3 @@
-interface_code = """
 # Events
 event Transfer:
     _from: indexed(address)
@@ -37,4 +36,3 @@ def transferFrom(_from: address, _to: address, _value: uint256) -> bool:
 @external
 def approve(_spender: address, _value: uint256) -> bool:
     pass
-"""
diff --git a/vyper/builtins/interfaces/ERC20Detailed.py b/vyper/builtins/interfaces/ERC20Detailed.py
deleted file mode 100644
index 03dd597e8a..0000000000
--- a/vyper/builtins/interfaces/ERC20Detailed.py
+++ /dev/null
@@ -1,22 +0,0 @@
-"""
-NOTE: interface uses `String[1]` where 1 is the lower bound of the string returned by the function.
-    For end-users this means they can't use `implements: ERC20Detailed` unless their implementation
-    uses a value n >= 1. Regardless this is fine as one can't do String[0] where n == 0.
-"""
-
-interface_code = """
-@view
-@external
-def name() -> String[1]:
-    pass
-
-@view
-@external
-def symbol() -> String[1]:
-    pass
-
-@view
-@external
-def decimals() -> uint8:
-    pass
-"""
diff --git a/vyper/builtins/interfaces/ERC20Detailed.vy b/vyper/builtins/interfaces/ERC20Detailed.vy
new file mode 100644
index 0000000000..7c4f546d45
--- /dev/null
+++ b/vyper/builtins/interfaces/ERC20Detailed.vy
@@ -0,0 +1,18 @@
+#NOTE: interface uses `String[1]` where 1 is the lower bound of the string returned by the function.
+#    For end-users this means they can't use `implements: ERC20Detailed` unless their implementation
+#    uses a value n >= 1. Regardless this is fine as one can't do String[0] where n == 0.
+
+@view
+@external
+def name() -> String[1]:
+    pass
+
+@view
+@external
+def symbol() -> String[1]:
+    pass
+
+@view
+@external
+def decimals() -> uint8:
+    pass
diff --git a/vyper/builtins/interfaces/ERC4626.py b/vyper/builtins/interfaces/ERC4626.vy
similarity index 98%
rename from vyper/builtins/interfaces/ERC4626.py
rename to vyper/builtins/interfaces/ERC4626.vy
index 21a9ce723a..05865406cf 100644
--- a/vyper/builtins/interfaces/ERC4626.py
+++ b/vyper/builtins/interfaces/ERC4626.vy
@@ -1,4 +1,3 @@
-interface_code = """
 # Events
 event Deposit:
     sender: indexed(address)
@@ -89,4 +88,3 @@ def previewRedeem(shares: uint256) -> uint256:
 @external
 def redeem(shares: uint256, receiver: address=msg.sender, owner: address=msg.sender) -> uint256:
     pass
-"""
diff --git a/vyper/builtins/interfaces/ERC721.py b/vyper/builtins/interfaces/ERC721.vy
similarity index 97%
rename from vyper/builtins/interfaces/ERC721.py
rename to vyper/builtins/interfaces/ERC721.vy
index 8dea4e4976..464c0e255b 100644
--- a/vyper/builtins/interfaces/ERC721.py
+++ b/vyper/builtins/interfaces/ERC721.vy
@@ -1,4 +1,3 @@
-interface_code = """
 # Events
 
 event Transfer:
@@ -66,5 +65,3 @@ def approve(_approved: address, _tokenId: uint256):
 @external
 def setApprovalForAll(_operator: address, _approved: bool):
     pass
-
-"""
diff --git a/vyper/builtins/interfaces/__init__.py b/vyper/builtins/interfaces/__init__.py
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/vyper/cli/utils.py b/vyper/cli/utils.py
deleted file mode 100644
index 1110ecdfdd..0000000000
--- a/vyper/cli/utils.py
+++ /dev/null
@@ -1,58 +0,0 @@
-from pathlib import Path
-from typing import Sequence
-
-from vyper import ast as vy_ast
-from vyper.exceptions import StructureException
-from vyper.typing import InterfaceImports, SourceCode
-
-
-def get_interface_file_path(base_paths: Sequence, import_path: str) -> Path:
-    relative_path = Path(import_path)
-    for path in base_paths:
-        # Find ABI JSON files
-        file_path = path.joinpath(relative_path)
-        suffix = next((i for i in (".vy", ".json") if file_path.with_suffix(i).exists()), None)
-        if suffix:
-            return file_path.with_suffix(suffix)
-
-        # Find ethPM Manifest files (`from path.to.Manifest import InterfaceName`)
-        # NOTE: Use file parent because this assumes that `file_path`
-        #       coincides with an ABI interface file
-        file_path = file_path.parent
-        suffix = next((i for i in (".vy", ".json") if file_path.with_suffix(i).exists()), None)
-        if suffix:
-            return file_path.with_suffix(suffix)
-
-    raise FileNotFoundError(f" Cannot locate interface '{import_path}{{.vy,.json}}'")
-
-
-def extract_file_interface_imports(code: SourceCode) -> InterfaceImports:
-    ast_tree = vy_ast.parse_to_ast(code)
-
-    imports_dict: InterfaceImports = {}
-    for node in ast_tree.get_children((vy_ast.Import, vy_ast.ImportFrom)):
-        if isinstance(node, vy_ast.Import):  # type: ignore
-            if not node.alias:
-                raise StructureException("Import requires an accompanying `as` statement", node)
-            if node.alias in imports_dict:
-                raise StructureException(f"Interface with alias {node.alias} already exists", node)
-            imports_dict[node.alias] = node.name.replace(".", "/")
-        elif isinstance(node, vy_ast.ImportFrom):  # type: ignore
-            level = node.level  # type: ignore
-            module = node.module or ""  # type: ignore
-            if not level and module == "vyper.interfaces":
-                # uses a builtin interface, so skip adding to imports
-                continue
-
-            base_path = ""
-            if level > 1:
-                base_path = "../" * (level - 1)
-            elif level == 1:
-                base_path = "./"
-            base_path = f"{base_path}{module.replace('.','/')}/"
-
-            if node.name in imports_dict and imports_dict[node.name] != f"{base_path}{node.name}":
-                raise StructureException(f"Interface with name {node.name} already exists", node)
-            imports_dict[node.name] = f"{base_path}{node.name}"
-
-    return imports_dict
diff --git a/vyper/cli/vyper_compile.py b/vyper/cli/vyper_compile.py
index bdd01eebbe..c4f60660cb 100755
--- a/vyper/cli/vyper_compile.py
+++ b/vyper/cli/vyper_compile.py
@@ -3,14 +3,13 @@
 import json
 import sys
 import warnings
-from collections import OrderedDict
 from pathlib import Path
-from typing import Dict, Iterable, Iterator, Optional, Set, TypeVar
+from typing import Any, Iterable, Iterator, Optional, Set, TypeVar
 
 import vyper
 import vyper.codegen.ir_node as ir_node
 from vyper.cli import vyper_json
-from vyper.cli.utils import extract_file_interface_imports, get_interface_file_path
+from vyper.compiler.input_bundle import FileInput, FilesystemInputBundle
 from vyper.compiler.settings import (
     VYPER_TRACEBACK_LIMIT,
     OptimizationLevel,
@@ -18,7 +17,7 @@
     _set_debug_mode,
 )
 from vyper.evm.opcodes import DEFAULT_EVM_VERSION, EVM_VERSIONS
-from vyper.typing import ContractCodes, ContractPath, OutputFormats
+from vyper.typing import ContractPath, OutputFormats
 
 T = TypeVar("T")
 
@@ -219,94 +218,20 @@ def exc_handler(contract_path: ContractPath, exception: Exception) -> None:
     raise exception
 
 
-def get_interface_codes(root_path: Path, contract_sources: ContractCodes) -> Dict:
-    interface_codes: Dict = {}
-    interfaces: Dict = {}
-
-    for file_path, code in contract_sources.items():
-        interfaces[file_path] = {}
-        parent_path = root_path.joinpath(file_path).parent
-
-        interface_codes = extract_file_interface_imports(code)
-        for interface_name, interface_path in interface_codes.items():
-            base_paths = [parent_path]
-            if not interface_path.startswith(".") and root_path.joinpath(file_path).exists():
-                base_paths.append(root_path)
-            elif interface_path.startswith("../") and len(Path(file_path).parent.parts) < Path(
-                interface_path
-            ).parts.count(".."):
-                raise FileNotFoundError(
-                    f"{file_path} - Cannot perform relative import outside of base folder"
-                )
-
-            valid_path = get_interface_file_path(base_paths, interface_path)
-            with valid_path.open() as fh:
-                code = fh.read()
-                if valid_path.suffix == ".json":
-                    contents = json.loads(code.encode())
-
-                    # EthPM Manifest (EIP-2678)
-                    if "contractTypes" in contents:
-                        if (
-                            interface_name not in contents["contractTypes"]
-                            or "abi" not in contents["contractTypes"][interface_name]
-                        ):
-                            raise ValueError(
-                                f"Could not find interface '{interface_name}'"
-                                f" in manifest '{valid_path}'."
-                            )
-
-                        interfaces[file_path][interface_name] = {
-                            "type": "json",
-                            "code": contents["contractTypes"][interface_name]["abi"],
-                        }
-
-                    # ABI JSON file (either `List[ABI]` or `{"abi": List[ABI]}`)
-                    elif isinstance(contents, list) or (
-                        "abi" in contents and isinstance(contents["abi"], list)
-                    ):
-                        interfaces[file_path][interface_name] = {"type": "json", "code": contents}
-
-                    else:
-                        raise ValueError(f"Corrupted file: '{valid_path}'")
-
-                else:
-                    interfaces[file_path][interface_name] = {"type": "vyper", "code": code}
-
-    return interfaces
-
-
 def compile_files(
-    input_files: Iterable[str],
+    input_files: list[str],
     output_formats: OutputFormats,
     root_folder: str = ".",
     show_gas_estimates: bool = False,
     settings: Optional[Settings] = None,
-    storage_layout: Optional[Iterable[str]] = None,
+    storage_layout_paths: list[str] = None,
     no_bytecode_metadata: bool = False,
-) -> OrderedDict:
+) -> dict:
     root_path = Path(root_folder).resolve()
     if not root_path.exists():
         raise FileNotFoundError(f"Invalid root path - '{root_path.as_posix()}' does not exist")
 
-    contract_sources: ContractCodes = OrderedDict()
-    for file_name in input_files:
-        file_path = Path(file_name)
-        try:
-            file_str = file_path.resolve().relative_to(root_path).as_posix()
-        except ValueError:
-            file_str = file_path.as_posix()
-        with file_path.open() as fh:
-            # trailing newline fixes python parsing bug when source ends in a comment
-            # https://bugs.python.org/issue35107
-            contract_sources[file_str] = fh.read() + "\n"
-
-    storage_layouts = OrderedDict()
-    if storage_layout:
-        for storage_file_name, contract_name in zip(storage_layout, contract_sources.keys()):
-            storage_file_path = Path(storage_file_name)
-            with storage_file_path.open() as sfh:
-                storage_layouts[contract_name] = json.load(sfh)
+    input_bundle = FilesystemInputBundle([root_path])
 
     show_version = False
     if "combined_json" in output_formats:
@@ -318,20 +243,44 @@ def compile_files(
     translate_map = {"abi_python": "abi", "json": "abi", "ast": "ast_dict", "ir_json": "ir_dict"}
     final_formats = [translate_map.get(i, i) for i in output_formats]
 
-    compiler_data = vyper.compile_codes(
-        contract_sources,
-        final_formats,
-        exc_handler=exc_handler,
-        interface_codes=get_interface_codes(root_path, contract_sources),
-        settings=settings,
-        storage_layouts=storage_layouts,
-        show_gas_estimates=show_gas_estimates,
-        no_bytecode_metadata=no_bytecode_metadata,
-    )
+    if storage_layout_paths:
+        if len(storage_layout_paths) != len(input_files):
+            raise ValueError(
+                "provided {len(storage_layout_paths)} storage "
+                "layouts, but {len(input_files)} source files"
+            )
+
+    ret: dict[Any, Any] = {}
     if show_version:
-        compiler_data["version"] = vyper.__version__
+        ret["version"] = vyper.__version__
 
-    return compiler_data
+    for file_name in input_files:
+        file_path = Path(file_name)
+        file = input_bundle.load_file(file_path)
+        assert isinstance(file, FileInput)  # mypy hint
+
+        storage_layout_override = None
+        if storage_layout_paths:
+            storage_file_path = storage_layout_paths.pop(0)
+            with open(storage_file_path) as sfh:
+                storage_layout_override = json.load(sfh)
+
+        output = vyper.compile_code(
+            file.source_code,
+            contract_name=str(file.path),
+            source_id=file.source_id,
+            input_bundle=input_bundle,
+            output_formats=final_formats,
+            exc_handler=exc_handler,
+            settings=settings,
+            storage_layout_override=storage_layout_override,
+            show_gas_estimates=show_gas_estimates,
+            no_bytecode_metadata=no_bytecode_metadata,
+        )
+
+        ret[file_path] = output
+
+    return ret
 
 
 if __name__ == "__main__":
diff --git a/vyper/cli/vyper_json.py b/vyper/cli/vyper_json.py
index f6d82c3fe0..2720f20d23 100755
--- a/vyper/cli/vyper_json.py
+++ b/vyper/cli/vyper_json.py
@@ -4,15 +4,14 @@
 import json
 import sys
 import warnings
-from pathlib import Path
-from typing import Any, Callable, Dict, Hashable, List, Optional, Tuple, Union
+from pathlib import Path, PurePath
+from typing import Any, Callable, Hashable, Optional
 
 import vyper
-from vyper.cli.utils import extract_file_interface_imports, get_interface_file_path
+from vyper.compiler.input_bundle import FileInput, JSONInputBundle
 from vyper.compiler.settings import OptimizationLevel, Settings
 from vyper.evm.opcodes import EVM_VERSIONS
 from vyper.exceptions import JSONError
-from vyper.typing import ContractCodes, ContractPath
 from vyper.utils import keccak256
 
 TRANSLATE_MAP = {
@@ -97,15 +96,15 @@ def _parse_args(argv):
         print(output_json)
 
 
-def exc_handler_raises(file_path: Union[str, None], exception: Exception, component: str) -> None:
+def exc_handler_raises(file_path: Optional[str], exception: Exception, component: str) -> None:
     if file_path:
         print(f"Unhandled exception in '{file_path}':")
     exception._exc_handler = True  # type: ignore
     raise exception
 
 
-def exc_handler_to_dict(file_path: Union[str, None], exception: Exception, component: str) -> Dict:
-    err_dict: Dict = {
+def exc_handler_to_dict(file_path: Optional[str], exception: Exception, component: str) -> dict:
+    err_dict: dict = {
         "type": type(exception).__name__,
         "component": component,
         "severity": "error",
@@ -129,23 +128,7 @@ def exc_handler_to_dict(file_path: Union[str, None], exception: Exception, compo
     return output_json
 
 
-def _standardize_path(path_str: str) -> str:
-    try:
-        path = Path(path_str)
-
-        if path.is_absolute():
-            path = path.resolve()
-        else:
-            pwd = Path(".").resolve()
-            path = path.resolve().relative_to(pwd)
-
-    except ValueError:
-        raise JSONError(f"{path_str} - path exists outside base folder")
-
-    return path.as_posix()
-
-
-def get_evm_version(input_dict: Dict) -> Optional[str]:
+def get_evm_version(input_dict: dict) -> Optional[str]:
     if "settings" not in input_dict:
         return None
 
@@ -168,76 +151,75 @@ def get_evm_version(input_dict: Dict) -> Optional[str]:
     return evm_version
 
 
-def get_input_dict_contracts(input_dict: Dict) -> ContractCodes:
-    contract_sources: ContractCodes = {}
+def get_compilation_targets(input_dict: dict) -> list[PurePath]:
+    # TODO: once we have modules, add optional "compilation_targets" key
+    # which specifies which sources we actually want to compile.
+
+    return [PurePath(p) for p in input_dict["sources"].keys()]
+
+
+def get_inputs(input_dict: dict) -> dict[PurePath, Any]:
+    ret = {}
+    seen = {}
+
     for path, value in input_dict["sources"].items():
+        path = PurePath(path)
         if "urls" in value:
             raise JSONError(f"{path} - 'urls' is not a supported field, use 'content' instead")
         if "content" not in value:
             raise JSONError(f"{path} missing required field - 'content'")
         if "keccak256" in value:
-            hash_ = value["keccak256"].lower()
-            if hash_.startswith("0x"):
-                hash_ = hash_[2:]
+            hash_ = value["keccak256"].lower().removeprefix("0x")
             if hash_ != keccak256(value["content"].encode("utf-8")).hex():
                 raise JSONError(
                     f"Calculated keccak of '{path}' does not match keccak given in input JSON"
                 )
-        key = _standardize_path(path)
-        if key in contract_sources:
-            raise JSONError(f"Contract namespace collision: {key}")
-        contract_sources[key] = value["content"]
-    return contract_sources
+        if path.stem in seen:
+            raise JSONError(f"Contract namespace collision: {path}")
 
-
-def get_input_dict_interfaces(input_dict: Dict) -> Dict:
-    interface_sources: Dict = {}
+        # value looks like {"content": <source code>}
+        # this will be interpreted by JSONInputBundle later
+        ret[path] = value
+        seen[path.stem] = True
 
     for path, value in input_dict.get("interfaces", {}).items():
-        key = _standardize_path(path)
-
-        if key.endswith(".json"):
-            # EthPM Manifest v3 (EIP-2678)
-            if "contractTypes" in value:
-                for name, ct in value["contractTypes"].items():
-                    if name in interface_sources:
-                        raise JSONError(f"Interface namespace collision: {name}")
-
-                    interface_sources[name] = {"type": "json", "code": ct["abi"]}
-
-                continue  # Skip to next interface
-
-            # ABI JSON file (`{"abi": List[ABI]}`)
-            elif "abi" in value:
-                interface = {"type": "json", "code": value["abi"]}
-
-            # ABI JSON file (`List[ABI]`)
-            elif isinstance(value, list):
-                interface = {"type": "json", "code": value}
-
-            else:
-                raise JSONError(f"Interface '{path}' must have 'abi' field")
-
-        elif key.endswith(".vy"):
-            if "content" not in value:
-                raise JSONError(f"Interface '{path}' must have 'content' field")
-
-            interface = {"type": "vyper", "code": value["content"]}
-
+        path = PurePath(path)
+        if path.stem in seen:
+            raise JSONError(f"Interface namespace collision: {path}")
+
+        if isinstance(value, list):
+            # backwards compatibility - straight ABI with no "abi" key.
+            # (should probably just reject these)
+            value = {"abi": value}
+
+        # some validation
+        if not isinstance(value, dict):
+            raise JSONError("invalid interface (must be a dictionary):\n{json.dumps(value)}")
+        if "content" in value:
+            if not isinstance(value["content"], str):
+                raise JSONError(f"invalid 'content' (expected string):\n{json.dumps(value)}")
+        elif "abi" in value:
+            if not isinstance(value["abi"], list):
+                raise JSONError(f"invalid 'abi' (expected list):\n{json.dumps(value)}")
         else:
-            raise JSONError(f"Interface '{path}' must have suffix '.vy' or '.json'")
-
-        key = key.rsplit(".", maxsplit=1)[0]
-        if key in interface_sources:
-            raise JSONError(f"Interface namespace collision: {key}")
+            raise JSONError(
+                "invalid interface (must contain either 'content' or 'abi'):\n{json.dumps(value)}"
+            )
+        if "content" in value and "abi" in value:
+            raise JSONError(
+                "invalid interface (found both 'content' and 'abi'):\n{json.dumps(value)}"
+            )
 
-        interface_sources[key] = interface
+        ret[path] = value
+        seen[path.stem] = True
 
-    return interface_sources
+    return ret
 
 
-def get_input_dict_output_formats(input_dict: Dict, contract_sources: ContractCodes) -> Dict:
-    output_formats = {}
+# get unique output formats for each contract, given the input_dict
+# NOTE: would maybe be nice to raise on duplicated output formats
+def get_output_formats(input_dict: dict, targets: list[PurePath]) -> dict[PurePath, list[str]]:
+    output_formats: dict[PurePath, list[str]] = {}
     for path, outputs in input_dict["settings"]["outputSelection"].items():
         if isinstance(outputs, dict):
             # if outputs are given in solc json format, collapse them into a single list
@@ -248,6 +230,7 @@ def get_input_dict_output_formats(input_dict: Dict, contract_sources: ContractCo
         for key in [i for i in ("evm", "evm.bytecode", "evm.deployedBytecode") if i in outputs]:
             outputs.remove(key)
             outputs.update([i for i in TRANSLATE_MAP if i.startswith(key)])
+
         if "*" in outputs:
             outputs = TRANSLATE_MAP.values()
         else:
@@ -259,107 +242,23 @@ def get_input_dict_output_formats(input_dict: Dict, contract_sources: ContractCo
         outputs = sorted(set(outputs))
 
         if path == "*":
-            output_keys = list(contract_sources.keys())
+            output_paths = targets
         else:
-            output_keys = [_standardize_path(path)]
-            if output_keys[0] not in contract_sources:
-                raise JSONError(f"outputSelection references unknown contract '{output_keys[0]}'")
+            output_paths = [PurePath(path)]
+            if output_paths[0] not in targets:
+                raise JSONError(f"outputSelection references unknown contract '{output_paths[0]}'")
 
-        for key in output_keys:
-            output_formats[key] = outputs
+        for output_path in output_paths:
+            output_formats[output_path] = outputs
 
     return output_formats
 
 
-def get_interface_codes(
-    root_path: Union[Path, None],
-    contract_path: ContractPath,
-    contract_sources: ContractCodes,
-    interface_sources: Dict,
-) -> Dict:
-    interface_codes: Dict = {}
-    interfaces: Dict = {}
-
-    code = contract_sources[contract_path]
-    interface_codes = extract_file_interface_imports(code)
-    for interface_name, interface_path in interface_codes.items():
-        # If we know the interfaces already (e.g. EthPM Manifest file)
-        if interface_name in interface_sources:
-            interfaces[interface_name] = interface_sources[interface_name]
-            continue
-
-        path = Path(contract_path).parent.joinpath(interface_path).as_posix()
-        keys = [_standardize_path(path)]
-        if not interface_path.startswith("."):
-            keys.append(interface_path)
-
-        key = next((i for i in keys if i in interface_sources), None)
-        if key:
-            interfaces[interface_name] = interface_sources[key]
-            continue
-
-        key = next((i + ".vy" for i in keys if i + ".vy" in contract_sources), None)
-        if key:
-            interfaces[interface_name] = {"type": "vyper", "code": contract_sources[key]}
-            continue
-
-        if root_path is None:
-            raise FileNotFoundError(f"Cannot locate interface '{interface_path}{{.vy,.json}}'")
-
-        parent_path = root_path.joinpath(contract_path).parent
-        base_paths = [parent_path]
-        if not interface_path.startswith("."):
-            base_paths.append(root_path)
-        elif interface_path.startswith("../") and len(Path(contract_path).parent.parts) < Path(
-            interface_path
-        ).parts.count(".."):
-            raise FileNotFoundError(
-                f"{contract_path} - Cannot perform relative import outside of base folder"
-            )
-
-        valid_path = get_interface_file_path(base_paths, interface_path)
-        with valid_path.open() as fh:
-            code = fh.read()
-        if valid_path.suffix == ".json":
-            code_dict = json.loads(code.encode())
-            # EthPM Manifest v3 (EIP-2678)
-            if "contractTypes" in code_dict:
-                if interface_name not in code_dict["contractTypes"]:
-                    raise JSONError(f"'{interface_name}' not found in '{valid_path}'")
-
-                if "abi" not in code_dict["contractTypes"][interface_name]:
-                    raise JSONError(f"Missing abi for '{interface_name}' in '{valid_path}'")
-
-                abi = code_dict["contractTypes"][interface_name]["abi"]
-                interfaces[interface_name] = {"type": "json", "code": abi}
-
-            # ABI JSON (`{"abi": List[ABI]}`)
-            elif "abi" in code_dict:
-                interfaces[interface_name] = {"type": "json", "code": code_dict["abi"]}
-
-            # ABI JSON (`List[ABI]`)
-            elif isinstance(code_dict, list):
-                interfaces[interface_name] = {"type": "json", "code": code_dict}
-
-            else:
-                raise JSONError(f"Unexpected type in file: '{valid_path}'")
-
-        else:
-            interfaces[interface_name] = {"type": "vyper", "code": code}
-
-    return interfaces
-
-
 def compile_from_input_dict(
-    input_dict: Dict,
-    exc_handler: Callable = exc_handler_raises,
-    root_folder: Union[str, None] = None,
-) -> Tuple[Dict, Dict]:
-    root_path = None
-    if root_folder is not None:
-        root_path = Path(root_folder).resolve()
-        if not root_path.exists():
-            raise FileNotFoundError(f"Invalid root path - '{root_path.as_posix()}' does not exist")
+    input_dict: dict, exc_handler: Callable = exc_handler_raises, root_folder: Optional[str] = None
+) -> tuple[dict, dict]:
+    if root_folder is None:
+        root_folder = "."
 
     if input_dict["language"] != "Vyper":
         raise JSONError(f"Invalid language '{input_dict['language']}' - Only Vyper is supported.")
@@ -382,46 +281,50 @@ def compile_from_input_dict(
 
     no_bytecode_metadata = not input_dict["settings"].get("bytecodeMetadata", True)
 
-    contract_sources: ContractCodes = get_input_dict_contracts(input_dict)
-    interface_sources = get_input_dict_interfaces(input_dict)
-    output_formats = get_input_dict_output_formats(input_dict, contract_sources)
+    compilation_targets = get_compilation_targets(input_dict)
+    sources = get_inputs(input_dict)
+    output_formats = get_output_formats(input_dict, compilation_targets)
 
-    compiler_data, warning_data = {}, {}
+    input_bundle = JSONInputBundle(sources, search_paths=[Path(root_folder)])
+
+    res, warnings_dict = {}, {}
     warnings.simplefilter("always")
-    for id_, contract_path in enumerate(sorted(contract_sources)):
+    for contract_path in compilation_targets:
         with warnings.catch_warnings(record=True) as caught_warnings:
             try:
-                interface_codes = get_interface_codes(
-                    root_path, contract_path, contract_sources, interface_sources
-                )
-            except Exception as exc:
-                return exc_handler(contract_path, exc, "parser"), {}
-            try:
-                data = vyper.compile_codes(
-                    {contract_path: contract_sources[contract_path]},
-                    output_formats[contract_path],
-                    interface_codes=interface_codes,
-                    initial_id=id_,
+                # use load_file to get a unique source_id
+                file = input_bundle.load_file(contract_path)
+                assert isinstance(file, FileInput)  # mypy hint
+                data = vyper.compile_code(
+                    file.source_code,
+                    contract_name=str(file.path),
+                    input_bundle=input_bundle,
+                    output_formats=output_formats[contract_path],
+                    source_id=file.source_id,
                     settings=settings,
                     no_bytecode_metadata=no_bytecode_metadata,
                 )
+                assert isinstance(data, dict)
+                data["source_id"] = file.source_id
             except Exception as exc:
                 return exc_handler(contract_path, exc, "compiler"), {}
-            compiler_data[contract_path] = data[contract_path]
+            res[contract_path] = data
             if caught_warnings:
-                warning_data[contract_path] = caught_warnings
+                warnings_dict[contract_path] = caught_warnings
 
-    return compiler_data, warning_data
+    return res, warnings_dict
 
 
-def format_to_output_dict(compiler_data: Dict) -> Dict:
-    output_dict: Dict = {"compiler": f"vyper-{vyper.__version__}", "contracts": {}, "sources": {}}
-    for id_, (path, data) in enumerate(compiler_data.items()):
-        output_dict["sources"][path] = {"id": id_}
+# convert output of compile_input_dict to final output format
+def format_to_output_dict(compiler_data: dict) -> dict:
+    output_dict: dict = {"compiler": f"vyper-{vyper.__version__}", "contracts": {}, "sources": {}}
+    for path, data in compiler_data.items():
+        path = str(path)  # Path breaks json serializability
+        output_dict["sources"][path] = {"id": data["source_id"]}
         if "ast_dict" in data:
             output_dict["sources"][path]["ast"] = data["ast_dict"]["ast"]
 
-        name = Path(path).stem
+        name = PurePath(path).stem
         output_dict["contracts"][path] = {name: {}}
         output_contracts = output_dict["contracts"][path][name]
 
@@ -459,7 +362,7 @@ def format_to_output_dict(compiler_data: Dict) -> Dict:
 
 
 # https://stackoverflow.com/a/49518779
-def _raise_on_duplicate_keys(ordered_pairs: List[Tuple[Hashable, Any]]) -> Dict:
+def _raise_on_duplicate_keys(ordered_pairs: list[tuple[Hashable, Any]]) -> dict:
     """
     Raise JSONError if a duplicate key exists in provided ordered list
     of pairs, otherwise return a dict.
@@ -474,17 +377,15 @@ def _raise_on_duplicate_keys(ordered_pairs: List[Tuple[Hashable, Any]]) -> Dict:
 
 
 def compile_json(
-    input_json: Union[Dict, str],
+    input_json: dict | str,
     exc_handler: Callable = exc_handler_raises,
-    root_path: Union[str, None] = None,
-    json_path: Union[str, None] = None,
-) -> Dict:
+    root_folder: Optional[str] = None,
+    json_path: Optional[str] = None,
+) -> dict:
     try:
         if isinstance(input_json, str):
             try:
-                input_dict: Dict = json.loads(
-                    input_json, object_pairs_hook=_raise_on_duplicate_keys
-                )
+                input_dict = json.loads(input_json, object_pairs_hook=_raise_on_duplicate_keys)
             except json.decoder.JSONDecodeError as exc:
                 new_exc = JSONError(str(exc), exc.lineno, exc.colno)
                 return exc_handler(json_path, new_exc, "json")
@@ -492,7 +393,7 @@ def compile_json(
             input_dict = input_json
 
         try:
-            compiler_data, warn_data = compile_from_input_dict(input_dict, exc_handler, root_path)
+            compiler_data, warn_data = compile_from_input_dict(input_dict, exc_handler, root_folder)
             if "errors" in compiler_data:
                 return compiler_data
         except KeyError as exc:
diff --git a/vyper/cli/vyper_serve.py b/vyper/cli/vyper_serve.py
index 401e59e7ba..9771dc922d 100755
--- a/vyper/cli/vyper_serve.py
+++ b/vyper/cli/vyper_serve.py
@@ -91,11 +91,11 @@ def _compile(self, data):
 
         try:
             code = data["code"]
-            out_dict = vyper.compile_codes(
-                {"": code},
+            out_dict = vyper.compile_code(
+                code,
                 list(vyper.compiler.OUTPUT_FORMATS.keys()),
                 evm_version=data.get("evm_version", DEFAULT_EVM_VERSION),
-            )[""]
+            )
             out_dict["ir"] = str(out_dict["ir"])
             out_dict["ir_runtime"] = str(out_dict["ir_runtime"])
         except VyperException as e:
diff --git a/vyper/compiler/__init__.py b/vyper/compiler/__init__.py
index b1c4201361..62ea05b243 100644
--- a/vyper/compiler/__init__.py
+++ b/vyper/compiler/__init__.py
@@ -1,21 +1,15 @@
 from collections import OrderedDict
+from pathlib import Path
 from typing import Any, Callable, Dict, Optional, Sequence, Union
 
 import vyper.ast as vy_ast  # break an import cycle
 import vyper.codegen.core as codegen
 import vyper.compiler.output as output
+from vyper.compiler.input_bundle import InputBundle, PathLike
 from vyper.compiler.phases import CompilerData
 from vyper.compiler.settings import Settings
 from vyper.evm.opcodes import DEFAULT_EVM_VERSION, anchor_evm_version
-from vyper.typing import (
-    ContractCodes,
-    ContractPath,
-    InterfaceDict,
-    InterfaceImports,
-    OutputDict,
-    OutputFormats,
-    StorageLayout,
-)
+from vyper.typing import ContractPath, OutputFormats, StorageLayout
 
 OUTPUT_FORMATS = {
     # requires vyper_module
@@ -47,119 +41,25 @@
 }
 
 
-def compile_codes(
-    contract_sources: ContractCodes,
-    output_formats: Union[OutputDict, OutputFormats, None] = None,
-    exc_handler: Union[Callable, None] = None,
-    interface_codes: Union[InterfaceDict, InterfaceImports, None] = None,
-    initial_id: int = 0,
-    settings: Settings = None,
-    storage_layouts: Optional[dict[ContractPath, Optional[StorageLayout]]] = None,
-    show_gas_estimates: bool = False,
-    no_bytecode_metadata: bool = False,
-) -> OrderedDict:
-    """
-    Generate compiler output(s) from one or more contract source codes.
-
-    Arguments
-    ---------
-    contract_sources: Dict[str, str]
-        Vyper source codes to be compiled. Formatted as `{"contract name": "source code"}`
-    output_formats: List, optional
-        List of compiler outputs to generate. Possible options are all the keys
-        in `OUTPUT_FORMATS`. If not given, the deployment bytecode is generated.
-    exc_handler: Callable, optional
-        Callable used to handle exceptions if the compilation fails. Should accept
-        two arguments - the name of the contract, and the exception that was raised
-    initial_id: int, optional
-        The lowest source ID value to be used when generating the source map.
-    settings: Settings, optional
-        Compiler settings
-    show_gas_estimates: bool, optional
-        Show gas estimates for abi and ir output modes
-    interface_codes: Dict, optional
-        Interfaces that may be imported by the contracts during compilation.
-
-        * May be a singular dictionary shared across all sources to be compiled,
-          i.e. `{'interface name': "definition"}`
-        * or may be organized according to contracts that are being compiled, i.e.
-          `{'contract name': {'interface name': "definition"}`
-
-        * Interface definitions are formatted as: `{'type': "json/vyper", 'code': "interface code"}`
-        * JSON interfaces are given as lists, vyper interfaces as strings
-    no_bytecode_metadata: bool, optional
-        Do not add metadata to bytecode. Defaults to False
-
-    Returns
-    -------
-    Dict
-        Compiler output as `{'contract name': {'output key': "output data"}}`
-    """
-    settings = settings or Settings()
-
-    if output_formats is None:
-        output_formats = ("bytecode",)
-    if isinstance(output_formats, Sequence):
-        output_formats = dict((k, output_formats) for k in contract_sources.keys())
-
-    out: OrderedDict = OrderedDict()
-    for source_id, contract_name in enumerate(sorted(contract_sources), start=initial_id):
-        source_code = contract_sources[contract_name]
-        interfaces: Any = interface_codes
-        storage_layout_override = None
-        if storage_layouts and contract_name in storage_layouts:
-            storage_layout_override = storage_layouts[contract_name]
-
-        if (
-            isinstance(interfaces, dict)
-            and contract_name in interfaces
-            and isinstance(interfaces[contract_name], dict)
-        ):
-            interfaces = interfaces[contract_name]
-
-        # make IR output the same between runs
-        codegen.reset_names()
-
-        compiler_data = CompilerData(
-            source_code,
-            contract_name,
-            interfaces,
-            source_id,
-            settings,
-            storage_layout_override,
-            show_gas_estimates,
-            no_bytecode_metadata,
-        )
-        with anchor_evm_version(compiler_data.settings.evm_version):
-            for output_format in output_formats[contract_name]:
-                if output_format not in OUTPUT_FORMATS:
-                    raise ValueError(f"Unsupported format type {repr(output_format)}")
-                try:
-                    out.setdefault(contract_name, {})
-                    formatter = OUTPUT_FORMATS[output_format]
-                    out[contract_name][output_format] = formatter(compiler_data)
-                except Exception as exc:
-                    if exc_handler is not None:
-                        exc_handler(contract_name, exc)
-                    else:
-                        raise exc
-
-    return out
-
-
 UNKNOWN_CONTRACT_NAME = "<unknown>"
 
 
 def compile_code(
     contract_source: str,
-    output_formats: Optional[OutputFormats] = None,
-    interface_codes: Optional[InterfaceImports] = None,
+    contract_name: str = UNKNOWN_CONTRACT_NAME,
+    source_id: int = 0,
+    input_bundle: InputBundle = None,
     settings: Settings = None,
+    output_formats: Optional[OutputFormats] = None,
     storage_layout_override: Optional[StorageLayout] = None,
+    no_bytecode_metadata: bool = False,
     show_gas_estimates: bool = False,
+    exc_handler: Optional[Callable] = None,
 ) -> dict:
     """
-    Generate compiler output(s) from a single contract source code.
+    Generate consumable compiler output(s) from a single contract source code.
+    Basically, a wrapper around CompilerData which munges the output
+    data into the requested output formats.
 
     Arguments
     ---------
@@ -175,11 +75,11 @@ def compile_code(
         Compiler settings.
     show_gas_estimates: bool, optional
         Show gas estimates for abi and ir output modes
-    interface_codes: Dict, optional
-        Interfaces that may be imported by the contracts during compilation.
-
-        * Formatted as as `{'interface name': {'type': "json/vyper", 'code': "interface code"}}`
-        * JSON interfaces are given as lists, vyper interfaces as strings
+    exc_handler: Callable, optional
+        Callable used to handle exceptions if the compilation fails. Should accept
+        two arguments - the name of the contract, and the exception that was raised
+    no_bytecode_metadata: bool, optional
+        Do not add metadata to bytecode. Defaults to False
 
     Returns
     -------
@@ -187,14 +87,37 @@ def compile_code(
         Compiler output as `{'output key': "output data"}`
     """
 
-    contract_sources = {UNKNOWN_CONTRACT_NAME: contract_source}
-    storage_layouts = {UNKNOWN_CONTRACT_NAME: storage_layout_override}
+    settings = settings or Settings()
+
+    if output_formats is None:
+        output_formats = ("bytecode",)
 
-    return compile_codes(
-        contract_sources,
-        output_formats,
-        interface_codes=interface_codes,
-        settings=settings,
-        storage_layouts=storage_layouts,
-        show_gas_estimates=show_gas_estimates,
-    )[UNKNOWN_CONTRACT_NAME]
+    # make IR output the same between runs
+    codegen.reset_names()
+
+    compiler_data = CompilerData(
+        contract_source,
+        input_bundle,
+        Path(contract_name),
+        source_id,
+        settings,
+        storage_layout_override,
+        show_gas_estimates,
+        no_bytecode_metadata,
+    )
+
+    ret = {}
+    with anchor_evm_version(compiler_data.settings.evm_version):
+        for output_format in output_formats:
+            if output_format not in OUTPUT_FORMATS:
+                raise ValueError(f"Unsupported format type {repr(output_format)}")
+            try:
+                formatter = OUTPUT_FORMATS[output_format]
+                ret[output_format] = formatter(compiler_data)
+            except Exception as exc:
+                if exc_handler is not None:
+                    exc_handler(contract_name, exc)
+                else:
+                    raise exc
+
+    return ret
diff --git a/vyper/compiler/input_bundle.py b/vyper/compiler/input_bundle.py
new file mode 100644
index 0000000000..1e41c3f137
--- /dev/null
+++ b/vyper/compiler/input_bundle.py
@@ -0,0 +1,180 @@
+import contextlib
+import json
+import os
+from dataclasses import dataclass
+from pathlib import Path, PurePath
+from typing import Any, Iterator, Optional
+
+from vyper.exceptions import JSONError
+
+# a type to make mypy happy
+PathLike = Path | PurePath
+
+
+@dataclass
+class CompilerInput:
+    # an input to the compiler, basically an abstraction for file contents
+    source_id: int
+    path: PathLike
+
+    @staticmethod
+    def from_string(source_id: int, path: PathLike, file_contents: str) -> "CompilerInput":
+        try:
+            s = json.loads(file_contents)
+            return ABIInput(source_id, path, s)
+        except (ValueError, TypeError):
+            return FileInput(source_id, path, file_contents)
+
+
+@dataclass
+class FileInput(CompilerInput):
+    source_code: str
+
+
+@dataclass
+class ABIInput(CompilerInput):
+    # some json input, which has already been parsed into a dict or list
+    # this is needed because json inputs present json interfaces as json
+    # objects, not as strings. this class helps us avoid round-tripping
+    # back to a string to pretend it's a file.
+    abi: Any  # something that json.load() returns
+
+
+class _NotFound(Exception):
+    pass
+
+
+# wrap os.path.normpath, but return the same type as the input
+def _normpath(path):
+    return path.__class__(os.path.normpath(path))
+
+
+# an "input bundle" to the compiler, representing the files which are
+# available to the compiler. it is useful because it parametrizes I/O
+# operations over different possible input types. you can think of it
+# as a virtual filesystem which models the compiler's interactions
+# with the outside world. it exposes a "load_file" operation which
+# searches for a file from a set of search paths, and also provides
+# id generation service to get a unique source id per file.
+class InputBundle:
+    # a list of search paths
+    search_paths: list[PathLike]
+
+    def __init__(self, search_paths):
+        self.search_paths = search_paths
+        self._source_id_counter = 0
+        self._source_ids: dict[PathLike, int] = {}
+
+    def _load_from_path(self, path):
+        raise NotImplementedError(f"not implemented! {self.__class__}._load_from_path()")
+
+    def _generate_source_id(self, path: PathLike) -> int:
+        if path not in self._source_ids:
+            self._source_ids[path] = self._source_id_counter
+            self._source_id_counter += 1
+
+        return self._source_ids[path]
+
+    def load_file(self, path: PathLike | str) -> CompilerInput:
+        # search path precedence
+        tried = []
+        for sp in reversed(self.search_paths):
+            # note from pathlib docs:
+            # > If the argument is an absolute path, the previous path is ignored.
+            # Path("/a") / Path("/b") => Path("/b")
+            to_try = sp / path
+
+            # normalize the path with os.path.normpath, to break down
+            # things like "foo/bar/../x.vy" => "foo/x.vy", with all
+            # the caveats around symlinks that os.path.normpath comes with.
+            to_try = _normpath(to_try)
+            try:
+                res = self._load_from_path(to_try)
+                break
+            except _NotFound:
+                tried.append(to_try)
+
+        else:
+            formatted_search_paths = "\n".join(["  " + str(p) for p in tried])
+            raise FileNotFoundError(
+                f"could not find {path} in any of the following locations:\n"
+                f"{formatted_search_paths}"
+            )
+
+        # try to parse from json, so that return types are consistent
+        # across FilesystemInputBundle and JSONInputBundle.
+        if isinstance(res, FileInput):
+            return CompilerInput.from_string(res.source_id, res.path, res.source_code)
+
+        return res
+
+    def add_search_path(self, path: PathLike) -> None:
+        self.search_paths.append(path)
+
+    # temporarily add something to the search path (within the
+    # scope of the context manager) with highest precedence.
+    # if `path` is None, do nothing
+    @contextlib.contextmanager
+    def search_path(self, path: Optional[PathLike]) -> Iterator[None]:
+        if path is None:
+            yield  # convenience, so caller does not have to handle null path
+
+        else:
+            self.search_paths.append(path)
+            try:
+                yield
+            finally:
+                self.search_paths.pop()
+
+
+# regular input. takes a search path(s), and `load_file()` will search all
+# search paths for the file and read it from the filesystem
+class FilesystemInputBundle(InputBundle):
+    def _load_from_path(self, path: Path) -> CompilerInput:
+        try:
+            with path.open() as f:
+                code = f.read()
+        except FileNotFoundError:
+            raise _NotFound(path)
+
+        source_id = super()._generate_source_id(path)
+
+        return FileInput(source_id, path, code)
+
+
+# fake filesystem for JSON inputs. takes a base path, and `load_file()`
+# "reads" the file from the JSON input. Note that this input bundle type
+# never actually interacts with the filesystem -- it is guaranteed to be pure!
+class JSONInputBundle(InputBundle):
+    input_json: dict[PurePath, Any]
+
+    def __init__(self, input_json, search_paths):
+        super().__init__(search_paths)
+        self.input_json = {}
+        for path, item in input_json.items():
+            path = _normpath(path)
+
+            # should be checked by caller
+            assert path not in self.input_json
+            self.input_json[_normpath(path)] = item
+
+    def _load_from_path(self, path: PurePath) -> CompilerInput:
+        try:
+            value = self.input_json[path]
+        except KeyError:
+            raise _NotFound(path)
+
+        source_id = super()._generate_source_id(path)
+
+        if "content" in value:
+            return FileInput(source_id, path, value["content"])
+
+        if "abi" in value:
+            return ABIInput(source_id, path, value["abi"])
+
+        # TODO: ethPM support
+        # if isinstance(contents, dict) and "contractTypes" in contents:
+
+        # unreachable, based on how JSONInputBundle is constructed in
+        # the codebase.
+        raise JSONError(f"Unexpected type in file: '{path}'")  # pragma: nocover
diff --git a/vyper/compiler/output.py b/vyper/compiler/output.py
index 1c38fcff9b..e47f300ba9 100644
--- a/vyper/compiler/output.py
+++ b/vyper/compiler/output.py
@@ -1,6 +1,5 @@
 import warnings
 from collections import OrderedDict, deque
-from pathlib import Path
 
 import asttokens
 
@@ -17,7 +16,7 @@
 
 def build_ast_dict(compiler_data: CompilerData) -> dict:
     ast_dict = {
-        "contract_name": compiler_data.contract_name,
+        "contract_name": str(compiler_data.contract_path),
         "ast": ast_to_dict(compiler_data.vyper_module),
     }
     return ast_dict
@@ -35,7 +34,7 @@ def build_userdoc(compiler_data: CompilerData) -> dict:
 
 def build_external_interface_output(compiler_data: CompilerData) -> str:
     interface = compiler_data.vyper_module_folded._metadata["type"]
-    stem = Path(compiler_data.contract_name).stem
+    stem = compiler_data.contract_path.stem
     # capitalize words separated by '_'
     # ex: test_interface.vy -> TestInterface
     name = "".join([x.capitalize() for x in stem.split("_")])
diff --git a/vyper/compiler/phases.py b/vyper/compiler/phases.py
index 72be4396e4..bfbb336d54 100644
--- a/vyper/compiler/phases.py
+++ b/vyper/compiler/phases.py
@@ -1,6 +1,7 @@
 import copy
 import warnings
 from functools import cached_property
+from pathlib import Path, PurePath
 from typing import Optional, Tuple
 
 from vyper import ast as vy_ast
@@ -8,12 +9,15 @@
 from vyper.codegen.core import anchor_opt_level
 from vyper.codegen.global_context import GlobalContext
 from vyper.codegen.ir_node import IRnode
+from vyper.compiler.input_bundle import FilesystemInputBundle, InputBundle
 from vyper.compiler.settings import OptimizationLevel, Settings
 from vyper.exceptions import StructureException
 from vyper.ir import compile_ir, optimizer
 from vyper.semantics import set_data_positions, validate_semantics
 from vyper.semantics.types.function import ContractFunctionT
-from vyper.typing import InterfaceImports, StorageLayout
+from vyper.typing import StorageLayout
+
+DEFAULT_CONTRACT_NAME = PurePath("VyperContract.vy")
 
 
 class CompilerData:
@@ -49,8 +53,8 @@ class CompilerData:
     def __init__(
         self,
         source_code: str,
-        contract_name: str = "VyperContract",
-        interface_codes: Optional[InterfaceImports] = None,
+        input_bundle: InputBundle = None,
+        contract_path: Path | PurePath = DEFAULT_CONTRACT_NAME,
         source_id: int = 0,
         settings: Settings = None,
         storage_layout: StorageLayout = None,
@@ -62,15 +66,11 @@ def __init__(
 
         Arguments
         ---------
-        source_code : str
+        source_code: str
             Vyper source code.
-        contract_name : str, optional
+        contract_path: Path, optional
             The name of the contract being compiled.
-        interface_codes: Dict, optional
-            Interfaces that may be imported by the contracts during compilation.
-            * Formatted as as `{'interface name': {'type': "json/vyper", 'code': "interface code"}}`
-            * JSON interfaces are given as lists, vyper interfaces as strings
-        source_id : int, optional
+        source_id: int, optional
             ID number used to identify this contract in the source map.
         settings: Settings
             Set optimization mode.
@@ -79,20 +79,22 @@ def __init__(
         no_bytecode_metadata: bool, optional
             Do not add metadata to bytecode. Defaults to False
         """
-        self.contract_name = contract_name
+        self.contract_path = contract_path
         self.source_code = source_code
-        self.interface_codes = interface_codes
         self.source_id = source_id
         self.storage_layout_override = storage_layout
         self.show_gas_estimates = show_gas_estimates
         self.no_bytecode_metadata = no_bytecode_metadata
+
         self.settings = settings or Settings()
+        self.input_bundle = input_bundle or FilesystemInputBundle([Path(".")])
 
         _ = self._generate_ast  # force settings to be calculated
 
     @cached_property
     def _generate_ast(self):
-        settings, ast = generate_ast(self.source_code, self.source_id, self.contract_name)
+        contract_name = str(self.contract_path)
+        settings, ast = generate_ast(self.source_code, self.source_id, contract_name)
 
         # validate the compiler settings
         # XXX: this is a bit ugly, clean up later
@@ -133,12 +135,12 @@ def vyper_module_unfolded(self) -> vy_ast.Module:
         # This phase is intended to generate an AST for tooling use, and is not
         # used in the compilation process.
 
-        return generate_unfolded_ast(self.vyper_module, self.interface_codes)
+        return generate_unfolded_ast(self.contract_path, self.vyper_module, self.input_bundle)
 
     @cached_property
     def _folded_module(self):
         return generate_folded_ast(
-            self.vyper_module, self.interface_codes, self.storage_layout_override
+            self.contract_path, self.vyper_module, self.input_bundle, self.storage_layout_override
         )
 
     @property
@@ -220,7 +222,7 @@ def generate_ast(
         Vyper source code.
     source_id : int
         ID number used to identify this contract in the source map.
-    contract_name : str
+    contract_name: str
         Name of the contract.
 
     Returns
@@ -231,20 +233,24 @@ def generate_ast(
     return vy_ast.parse_to_ast_with_settings(source_code, source_id, contract_name)
 
 
+# destructive -- mutates module in place!
 def generate_unfolded_ast(
-    vyper_module: vy_ast.Module, interface_codes: Optional[InterfaceImports]
+    contract_path: Path | PurePath, vyper_module: vy_ast.Module, input_bundle: InputBundle
 ) -> vy_ast.Module:
     vy_ast.validation.validate_literal_nodes(vyper_module)
     vy_ast.folding.replace_builtin_functions(vyper_module)
-    # note: validate_semantics does type inference on the AST
-    validate_semantics(vyper_module, interface_codes)
+
+    with input_bundle.search_path(contract_path.parent):
+        # note: validate_semantics does type inference on the AST
+        validate_semantics(vyper_module, input_bundle)
 
     return vyper_module
 
 
 def generate_folded_ast(
+    contract_path: Path,
     vyper_module: vy_ast.Module,
-    interface_codes: Optional[InterfaceImports],
+    input_bundle: InputBundle,
     storage_layout_overrides: StorageLayout = None,
 ) -> Tuple[vy_ast.Module, StorageLayout]:
     """
@@ -262,11 +268,15 @@ def generate_folded_ast(
     StorageLayout
         Layout of variables in storage
     """
+
     vy_ast.validation.validate_literal_nodes(vyper_module)
 
     vyper_module_folded = copy.deepcopy(vyper_module)
     vy_ast.folding.fold(vyper_module_folded)
-    validate_semantics(vyper_module_folded, interface_codes)
+
+    with input_bundle.search_path(contract_path.parent):
+        validate_semantics(vyper_module_folded, input_bundle)
+
     symbol_tables = set_data_positions(vyper_module_folded, storage_layout_overrides)
 
     return vyper_module_folded, symbol_tables
diff --git a/vyper/semantics/analysis/__init__.py b/vyper/semantics/analysis/__init__.py
index 9e987d1cd0..7db230167e 100644
--- a/vyper/semantics/analysis/__init__.py
+++ b/vyper/semantics/analysis/__init__.py
@@ -7,11 +7,11 @@
 from .utils import _ExprAnalyser
 
 
-def validate_semantics(vyper_ast, interface_codes):
+def validate_semantics(vyper_ast, input_bundle):
     # validate semantics and annotate AST with type/semantics information
     namespace = get_namespace()
 
     with namespace.enter_scope():
-        add_module_namespace(vyper_ast, interface_codes)
+        add_module_namespace(vyper_ast, input_bundle)
         vy_ast.expansion.expand_annotated_ast(vyper_ast)
         validate_functions(vyper_ast)
diff --git a/vyper/semantics/analysis/module.py b/vyper/semantics/analysis/module.py
index e59422294c..239438f35b 100644
--- a/vyper/semantics/analysis/module.py
+++ b/vyper/semantics/analysis/module.py
@@ -1,13 +1,13 @@
-import importlib
-import pkgutil
-from typing import Optional, Union
+import os
+from pathlib import Path, PurePath
+from typing import Optional
 
 import vyper.builtins.interfaces
 from vyper import ast as vy_ast
+from vyper.compiler.input_bundle import ABIInput, FileInput, FilesystemInputBundle, InputBundle
 from vyper.evm.opcodes import version_check
 from vyper.exceptions import (
     CallViolation,
-    CompilerPanic,
     ExceptionList,
     InvalidLiteral,
     InvalidType,
@@ -15,30 +15,27 @@
     StateAccessViolation,
     StructureException,
     SyntaxException,
-    UndeclaredDefinition,
     VariableDeclarationException,
     VyperException,
 )
 from vyper.semantics.analysis.base import VarInfo
 from vyper.semantics.analysis.common import VyperNodeVisitorBase
-from vyper.semantics.analysis.levenshtein_utils import get_levenshtein_error_suggestions
 from vyper.semantics.analysis.utils import check_constant, validate_expected_type
 from vyper.semantics.data_locations import DataLocation
 from vyper.semantics.namespace import Namespace, get_namespace
 from vyper.semantics.types import EnumT, EventT, InterfaceT, StructT
 from vyper.semantics.types.function import ContractFunctionT
 from vyper.semantics.types.utils import type_from_annotation
-from vyper.typing import InterfaceDict
 
 
-def add_module_namespace(vy_module: vy_ast.Module, interface_codes: InterfaceDict) -> None:
+def add_module_namespace(vy_module: vy_ast.Module, input_bundle: InputBundle) -> None:
     """
     Analyze a Vyper module AST node, add all module-level objects to the
     namespace and validate top-level correctness
     """
 
     namespace = get_namespace()
-    ModuleAnalyzer(vy_module, interface_codes, namespace)
+    ModuleAnalyzer(vy_module, input_bundle, namespace)
 
 
 def _find_cyclic_call(fn_names: list, self_members: dict) -> Optional[list]:
@@ -58,10 +55,10 @@ class ModuleAnalyzer(VyperNodeVisitorBase):
     scope_name = "module"
 
     def __init__(
-        self, module_node: vy_ast.Module, interface_codes: InterfaceDict, namespace: Namespace
+        self, module_node: vy_ast.Module, input_bundle: InputBundle, namespace: Namespace
     ) -> None:
         self.ast = module_node
-        self.interface_codes = interface_codes or {}
+        self.input_bundle = input_bundle
         self.namespace = namespace
 
         # TODO: Move computation out of constructor
@@ -287,17 +284,19 @@ def visit_FunctionDef(self, node):
     def visit_Import(self, node):
         if not node.alias:
             raise StructureException("Import requires an accompanying `as` statement", node)
-        _add_import(node, node.name, node.alias, node.alias, self.interface_codes, self.namespace)
+        # import x.y[name] as y[alias]
+        self._add_import(node, 0, node.name, node.alias)
 
     def visit_ImportFrom(self, node):
-        _add_import(
-            node,
-            node.module,
-            node.name,
-            node.alias or node.name,
-            self.interface_codes,
-            self.namespace,
-        )
+        # from m.n[module] import x[name] as y[alias]
+        alias = node.alias or node.name
+
+        module = node.module or ""
+        if module:
+            module += "."
+
+        qualified_module_name = module + node.name
+        self._add_import(node, node.level, qualified_module_name, alias)
 
     def visit_InterfaceDef(self, node):
         obj = InterfaceT.from_ast(node)
@@ -313,41 +312,87 @@ def visit_StructDef(self, node):
         except VyperException as exc:
             raise exc.with_annotation(node) from None
 
+    def _add_import(
+        self, node: vy_ast.VyperNode, level: int, qualified_module_name: str, alias: str
+    ) -> None:
+        type_ = self._load_import(level, qualified_module_name)
+
+        try:
+            self.namespace[alias] = type_
+        except VyperException as exc:
+            raise exc.with_annotation(node) from None
+
+    # load an InterfaceT from an import.
+    # raises FileNotFoundError
+    def _load_import(self, level: int, module_str: str) -> InterfaceT:
+        if _is_builtin(module_str):
+            return _load_builtin_import(level, module_str)
+
+        path = _import_to_path(level, module_str)
+
+        try:
+            file = self.input_bundle.load_file(path.with_suffix(".vy"))
+            assert isinstance(file, FileInput)  # mypy hint
+            interface_ast = vy_ast.parse_to_ast(file.source_code, contract_name=str(file.path))
+            return InterfaceT.from_ast(interface_ast)
+        except FileNotFoundError:
+            pass
+
+        try:
+            file = self.input_bundle.load_file(path.with_suffix(".json"))
+            assert isinstance(file, ABIInput)  # mypy hint
+            return InterfaceT.from_json_abi(str(file.path), file.abi)
+        except FileNotFoundError:
+            raise ModuleNotFoundError(module_str)
+
+
+# convert an import to a path (without suffix)
+def _import_to_path(level: int, module_str: str) -> PurePath:
+    base_path = ""
+    if level > 1:
+        base_path = "../" * (level - 1)
+    elif level == 1:
+        base_path = "./"
+    return PurePath(f"{base_path}{module_str.replace('.','/')}/")
+
+
+# can add more, e.g. "vyper.builtins.interfaces", etc.
+BUILTIN_PREFIXES = ["vyper.interfaces"]
+
+
+def _is_builtin(module_str):
+    return any(module_str.startswith(prefix) for prefix in BUILTIN_PREFIXES)
+
+
+def _load_builtin_import(level: int, module_str: str) -> InterfaceT:
+    if not _is_builtin(module_str):
+        raise ModuleNotFoundError(f"Not a builtin: {module_str}") from None
+
+    builtins_path = vyper.builtins.interfaces.__path__[0]
+    # hygiene: convert to relpath to avoid leaking user directory info
+    # (note Path.relative_to cannot handle absolute to relative path
+    # conversion, so we must use the `os` module).
+    builtins_path = os.path.relpath(builtins_path)
+
+    search_path = Path(builtins_path).parent.parent.parent
+    # generate an input bundle just because it knows how to build paths.
+    input_bundle = FilesystemInputBundle([search_path])
+
+    # remap builtins directory --
+    # vyper/interfaces => vyper/builtins/interfaces
+    remapped_module = module_str
+    if remapped_module.startswith("vyper.interfaces"):
+        remapped_module = remapped_module.removeprefix("vyper.interfaces")
+        remapped_module = vyper.builtins.interfaces.__package__ + remapped_module
 
-def _add_import(
-    node: Union[vy_ast.Import, vy_ast.ImportFrom],
-    module: str,
-    name: str,
-    alias: str,
-    interface_codes: InterfaceDict,
-    namespace: dict,
-) -> None:
-    if module == "vyper.interfaces":
-        interface_codes = _get_builtin_interfaces()
-    if name not in interface_codes:
-        suggestions_str = get_levenshtein_error_suggestions(name, _get_builtin_interfaces(), 1.0)
-        raise UndeclaredDefinition(f"Unknown interface: {name}. {suggestions_str}", node)
-
-    if interface_codes[name]["type"] == "vyper":
-        interface_ast = vy_ast.parse_to_ast(interface_codes[name]["code"], contract_name=name)
-        type_ = InterfaceT.from_ast(interface_ast)
-    elif interface_codes[name]["type"] == "json":
-        type_ = InterfaceT.from_json_abi(name, interface_codes[name]["code"])  # type: ignore
-    else:
-        raise CompilerPanic(f"Unknown interface format: {interface_codes[name]['type']}")
+    path = _import_to_path(level, remapped_module).with_suffix(".vy")
 
     try:
-        namespace[alias] = type_
-    except VyperException as exc:
-        raise exc.with_annotation(node) from None
-
-
-def _get_builtin_interfaces():
-    interface_names = [i.name for i in pkgutil.iter_modules(vyper.builtins.interfaces.__path__)]
-    return {
-        name: {
-            "type": "vyper",
-            "code": importlib.import_module(f"vyper.builtins.interfaces.{name}").interface_code,
-        }
-        for name in interface_names
-    }
+        file = input_bundle.load_file(path)
+        assert isinstance(file, FileInput)  # mypy hint
+    except FileNotFoundError:
+        raise ModuleNotFoundError(f"Not a builtin: {module_str}") from None
+
+    # TODO: it might be good to cache this computation
+    interface_ast = vy_ast.parse_to_ast(file.source_code, contract_name=module_str)
+    return InterfaceT.from_ast(interface_ast)
diff --git a/vyper/typing.py b/vyper/typing.py
index 18e201e814..ad3964dff9 100644
--- a/vyper/typing.py
+++ b/vyper/typing.py
@@ -7,17 +7,9 @@
 # Compiler
 ContractPath = str
 SourceCode = str
-ContractCodes = Dict[ContractPath, SourceCode]
 OutputFormats = Sequence[str]
-OutputDict = Dict[ContractPath, OutputFormats]
 StorageLayout = Dict
 
-# Interfaces
-InterfaceAsName = str
-InterfaceImportPath = str
-InterfaceImports = Dict[InterfaceAsName, InterfaceImportPath]
-InterfaceDict = Dict[ContractPath, InterfaceImports]
-
 # Opcodes
 OpcodeGasCost = Union[int, Tuple]
 OpcodeValue = Tuple[Optional[int], int, int, OpcodeGasCost]

From 4f7661478d01b4f5e67d8e964c702f8b1973af16 Mon Sep 17 00:00:00 2001
From: sudo rm -rf --no-preserve-root / <pcaversaccio@users.noreply.github.com>
Date: Tue, 7 Nov 2023 23:22:33 +0100
Subject: [PATCH 159/161] docs: update resources section (#3656)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

* docs: update `resources.rst` file
* correct 🐍 snekmate branding
* We like longer hyphens :)
* Add `Foundry-Vyper` to bottom
* Add titanoboa reference
---
 docs/resources.rst | 42 ++++++++++++++++++++++--------------------
 1 file changed, 22 insertions(+), 20 deletions(-)

diff --git a/docs/resources.rst b/docs/resources.rst
index 7f0d0600a9..a3dfa480ed 100644
--- a/docs/resources.rst
+++ b/docs/resources.rst
@@ -3,45 +3,47 @@
 Other resources and learning material
 #####################################
 
-Vyper has an active community. You can find third party tutorials,
-examples, courses and other learning material.
+Vyper has an active community. You can find third-party tutorials, examples, courses, and other learning material.
 
 General
 -------
 
-- `Ape Academy - Learn how to build vyper projects <https://academy.apeworx.io/>`__ by ApeWorX
-- `More Vyper by Example <https://vyper-by-example.org/>`__ by Smart Contract Engineer
-- `Vyper cheat Sheet <https://reference.auditless.com/cheatsheet>`__
-- `Vyper Hub for development <https://github.com/zcor/vyper-dev>`__
-- `Vyper greatest hits smart contract examples <https://github.com/pynchmeister/vyper-greatest-hits/tree/main/contracts>`__
+- `Ape Academy – Learn how to build Vyper projects <https://academy.apeworx.io/>`_ by ApeWorX
+- `More Vyper by Example <https://vyper-by-example.org/>`_ by Smart Contract Engineer
+- `Vyper cheat Sheet <https://reference.auditless.com/cheatsheet>`_
+- `Vyper Hub for development <https://github.com/zcor/vyper-dev>`_
+- `Vyper greatest hits smart contract examples <https://github.com/pynchmeister/vyper-greatest-hits/tree/main/contracts>`_
+- `A curated list of Vyper resources, libraries, tools, and more <https://github.com/stars/pcaversaccio/lists/vyper>`_
 
 Frameworks and tooling
 ----------------------
 
-- `ApeWorX - The Ethereum development framework for Python Developers, Data Scientists, and Security Professionals <https://www.apeworx.io/>`__
-- `Foundry x Vyper - Foundry template to compile Vyper contracts <https://github.com/0xKitsune/Foundry-Vyper>`__
-- `Snekmate - Vyper smart contract building blocks <https://github.com/pcaversaccio/snekmate>`__
-- `Serpentor - A set of smart contracts tools for governance <https://github.com/yearn/serpentor>`__
-- `Smart contract development frameworks and tools for Vyper on Ethreum.org <https://ethereum.org/en/developers/docs/programming-languages/python/>`__
+- `Titanoboa – An experimental Vyper interpreter with pretty tracebacks, forking, debugging features and more <https://github.com/vyperlang/titanoboa/>`_
+- `ApeWorX – The Ethereum development framework for Python Developers, Data Scientists, and Security Professionals <https://www.apeworx.io/>`_
+- `VyperDeployer – A helper smart contract to compile and test Vyper contracts in Foundry <https://github.com/pcaversaccio/snekmate/blob/main/lib/utils/VyperDeployer.sol>`_
+- `🐍 snekmate – Vyper smart contract building blocks <https://github.com/pcaversaccio/snekmate>`_
+- `Serpentor – A set of smart contracts tools for governance <https://github.com/yearn/serpentor>`_
+- `Smart contract development frameworks and tools for Vyper on Ethreum.org <https://ethereum.org/en/developers/docs/programming-languages/python/>`_
 
 Security
 --------
 
-- `VyperPunk - learn to secure and hack Vyper smart contracts <https://github.com/SupremacyTeam/VyperPunk>`__
-- `VyperExamples - Vyper vulnerability examples <https://www.vyperexamples.com/reentrancy>`__
+- `VyperPunk – learn to secure and hack Vyper smart contracts <https://github.com/SupremacyTeam/VyperPunk>`_
+- `VyperExamples – Vyper vulnerability examples <https://www.vyperexamples.com/reentrancy>`_
 
 Conference presentations
 ------------------------
 
-- `Vyper Smart Contract Programming Language by Patrick Collins (2022, 30 mins) <https://www.youtube.com/watch?v=b-sOMNF9quo&t=1444s>`__
-- `Python and DeFi by Curve Finance (2022, 15 mins) <https://www.youtube.com/watch?v=4HOU3z0LoDg>`__
-- `My experience with Vyper over the years by Benjamin Scherrey (2022, 15 mins) <https://www.youtube.com/watch?v=_j7qF_GlyWE>`__
-- `Short introduction to Vyper by Edison Que (3 mins) <https://www.youtube.com/watch?v=dXqln-keyHw&t=4s>`__
+- `Vyper Smart Contract Programming Language by Patrick Collins (2022, 30 mins) <https://www.youtube.com/watch?v=b-sOMNF9quo&t=1444s>`_
+- `Python and DeFi by Curve Finance (2022, 15 mins) <https://www.youtube.com/watch?v=4HOU3z0LoDg>`_
+- `My experience with Vyper over the years by Benjamin Scherrey (2022, 15 mins) <https://www.youtube.com/watch?v=_j7qF_GlyWE>`_
+- `Short introduction to Vyper by Edison Que (3 mins) <https://www.youtube.com/watch?v=dXqln-keyHw&t=4s>`_
 
 Unmaintained
 ------------
 
 These resources have not been updated for a while, but may still offer interesting content.
 
-- `Awesome Vyper curated resources <https://github.com/spadebuilders/awesome-vyper>`__
-- `Brownie - Python framework for developing smart contracts (deprecated) <https://eth-brownie.readthedocs.io/en/stable/>`__
+- `Awesome Vyper curated resources <https://github.com/spadebuilders/awesome-vyper>`_
+- `Brownie – Python framework for developing smart contracts (deprecated) <https://eth-brownie.readthedocs.io/en/stable/>`_
+- `Foundry x Vyper – Foundry template to compile Vyper contracts <https://github.com/0xKitsune/Foundry-Vyper>`_

From a87fb8c42c74f418b230003bcc66766a6c374f86 Mon Sep 17 00:00:00 2001
From: nfwsncked <75267395+nfwsncked@users.noreply.github.com>
Date: Wed, 8 Nov 2023 00:41:08 +0100
Subject: [PATCH 160/161] chore: improve assert descriptions in crowdfund.vy
 (#3064)

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
Co-authored-by: El De-dog-lo <3859395+fubuloubu@users.noreply.github.com>
---
 examples/crowdfund.vy | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/examples/crowdfund.vy b/examples/crowdfund.vy
index 3891ad0b74..56b34308f1 100644
--- a/examples/crowdfund.vy
+++ b/examples/crowdfund.vy
@@ -18,15 +18,15 @@ def __init__(_beneficiary: address, _goal: uint256, _timelimit: uint256):
 @external
 @payable
 def participate():
-    assert block.timestamp < self.deadline, "deadline not met (yet)"
+    assert block.timestamp < self.deadline, "deadline has expired"
 
     self.funders[msg.sender] += msg.value
 
 # Enough money was raised! Send funds to the beneficiary
 @external
 def finalize():
-    assert block.timestamp >= self.deadline, "deadline has passed"
-    assert self.balance >= self.goal, "the goal has not been reached"
+    assert block.timestamp >= self.deadline, "deadline has not expired yet"
+    assert self.balance >= self.goal, "goal has not been reached"
 
     selfdestruct(self.beneficiary)
 

From 806dd9075e83eaabbfbaa397c48c9703317b6154 Mon Sep 17 00:00:00 2001
From: Franfran <51274081+iFrostizz@users.noreply.github.com>
Date: Wed, 8 Nov 2023 00:50:41 +0100
Subject: [PATCH 161/161] test: add unit tests for internal abi type
 construction (#3662)

specifically test some internal sanity checks/validation

---------

Co-authored-by: Charles Cooper <cooper.charles.m@gmail.com>
---
 tests/abi_types/test_invalid_abi_types.py | 26 +++++++++++++++++++++++
 vyper/abi_types.py                        | 16 +++++++-------
 vyper/exceptions.py                       |  4 ++++
 3 files changed, 38 insertions(+), 8 deletions(-)
 create mode 100644 tests/abi_types/test_invalid_abi_types.py

diff --git a/tests/abi_types/test_invalid_abi_types.py b/tests/abi_types/test_invalid_abi_types.py
new file mode 100644
index 0000000000..c8566e066f
--- /dev/null
+++ b/tests/abi_types/test_invalid_abi_types.py
@@ -0,0 +1,26 @@
+import pytest
+
+from vyper.abi_types import (
+    ABI_Bytes,
+    ABI_BytesM,
+    ABI_DynamicArray,
+    ABI_FixedMxN,
+    ABI_GIntM,
+    ABI_String,
+)
+from vyper.exceptions import InvalidABIType
+
+cases_invalid_types = [
+    (ABI_GIntM, ((0, False), (7, False), (300, True), (300, False))),
+    (ABI_FixedMxN, ((0, 0, False), (8, 0, False), (256, 81, True), (300, 80, False))),
+    (ABI_BytesM, ((0,), (33,), (-10,))),
+    (ABI_Bytes, ((-1,), (-69,))),
+    (ABI_DynamicArray, ((ABI_GIntM(256, False), -1), (ABI_String(256), -10))),
+]
+
+
+@pytest.mark.parametrize("typ,params_variants", cases_invalid_types)
+def test_invalid_abi_types(assert_compile_failed, typ, params_variants):
+    # double parametrization cannot work because the 2nd dimension is variable
+    for params in params_variants:
+        assert_compile_failed(lambda: typ(*params), InvalidABIType)
diff --git a/vyper/abi_types.py b/vyper/abi_types.py
index b272996aed..051f8db19f 100644
--- a/vyper/abi_types.py
+++ b/vyper/abi_types.py
@@ -1,4 +1,4 @@
-from vyper.exceptions import CompilerPanic
+from vyper.exceptions import InvalidABIType
 from vyper.utils import ceil32
 
 
@@ -69,7 +69,7 @@ def __repr__(self):
 class ABI_GIntM(ABIType):
     def __init__(self, m_bits, signed):
         if not (0 < m_bits <= 256 and 0 == m_bits % 8):
-            raise CompilerPanic("Invalid M provided for GIntM")
+            raise InvalidABIType("Invalid M provided for GIntM")
 
         self.m_bits = m_bits
         self.signed = signed
@@ -117,9 +117,9 @@ def selector_name(self):
 class ABI_FixedMxN(ABIType):
     def __init__(self, m_bits, n_places, signed):
         if not (0 < m_bits <= 256 and 0 == m_bits % 8):
-            raise CompilerPanic("Invalid M for FixedMxN")
+            raise InvalidABIType("Invalid M for FixedMxN")
         if not (0 < n_places and n_places <= 80):
-            raise CompilerPanic("Invalid N for FixedMxN")
+            raise InvalidABIType("Invalid N for FixedMxN")
 
         self.m_bits = m_bits
         self.n_places = n_places
@@ -142,7 +142,7 @@ def is_complex_type(self):
 class ABI_BytesM(ABIType):
     def __init__(self, m_bytes):
         if not 0 < m_bytes <= 32:
-            raise CompilerPanic("Invalid M for BytesM")
+            raise InvalidABIType("Invalid M for BytesM")
 
         self.m_bytes = m_bytes
 
@@ -173,7 +173,7 @@ def selector_name(self):
 class ABI_StaticArray(ABIType):
     def __init__(self, subtyp, m_elems):
         if not m_elems >= 0:
-            raise CompilerPanic("Invalid M")
+            raise InvalidABIType("Invalid M")
 
         self.subtyp = subtyp
         self.m_elems = m_elems
@@ -200,7 +200,7 @@ def is_complex_type(self):
 class ABI_Bytes(ABIType):
     def __init__(self, bytes_bound):
         if not bytes_bound >= 0:
-            raise CompilerPanic("Negative bytes_bound provided to ABI_Bytes")
+            raise InvalidABIType("Negative bytes_bound provided to ABI_Bytes")
 
         self.bytes_bound = bytes_bound
 
@@ -234,7 +234,7 @@ def selector_name(self):
 class ABI_DynamicArray(ABIType):
     def __init__(self, subtyp, elems_bound):
         if not elems_bound >= 0:
-            raise CompilerPanic("Negative bound provided to DynamicArray")
+            raise InvalidABIType("Negative bound provided to DynamicArray")
 
         self.subtyp = subtyp
         self.elems_bound = elems_bound
diff --git a/vyper/exceptions.py b/vyper/exceptions.py
index 8b2020285a..3bde20356e 100644
--- a/vyper/exceptions.py
+++ b/vyper/exceptions.py
@@ -336,3 +336,7 @@ class UnfoldableNode(VyperInternalException):
 
 class TypeCheckFailure(VyperInternalException):
     """An issue was not caught during type checking that should have been."""
+
+
+class InvalidABIType(VyperInternalException):
+    """An internal routine constructed an invalid ABI type"""