From db6698b68b364f5ca6924e0debb8f97211c40867 Mon Sep 17 00:00:00 2001 From: Mark Koch Date: Wed, 28 Aug 2024 11:15:58 +0100 Subject: [PATCH 1/2] feat: Type check array subscripts --- guppylang/checker/core.py | 43 +++++++++- guppylang/checker/expr_checker.py | 82 +++++++++++++++++-- guppylang/checker/linearity_checker.py | 2 + guppylang/nodes.py | 16 +++- guppylang/prelude/builtins.py | 10 ++- tests/error/array_errors/linear_index.err | 7 -- tests/error/array_errors/linear_index.py | 17 ---- .../inout_errors/subscript_not_setable.err | 7 ++ .../inout_errors/subscript_not_setable.py | 28 +++++++ tests/error/type_errors/not_subscriptable.err | 7 ++ tests/error/type_errors/not_subscriptable.py | 12 +++ .../error/type_errors/subscript_bad_item.err | 7 ++ tests/error/type_errors/subscript_bad_item.py | 13 +++ tests/integration/test_array.py | 2 + tests/integration/test_list.py | 3 + 15 files changed, 220 insertions(+), 36 deletions(-) delete mode 100644 tests/error/array_errors/linear_index.err delete mode 100644 tests/error/array_errors/linear_index.py create mode 100644 tests/error/inout_errors/subscript_not_setable.err create mode 100644 tests/error/inout_errors/subscript_not_setable.py create mode 100644 tests/error/type_errors/not_subscriptable.err create mode 100644 tests/error/type_errors/not_subscriptable.py create mode 100644 tests/error/type_errors/subscript_bad_item.err create mode 100644 tests/error/type_errors/subscript_bad_item.py diff --git a/guppylang/checker/core.py b/guppylang/checker/core.py index 3a03dd31..60ec1c4d 100644 --- a/guppylang/checker/core.py +++ b/guppylang/checker/core.py @@ -60,10 +60,10 @@ #: #: All places are equipped with a unique id, a type and an optional definition AST #: location. During linearity checking, they are tracked separately. -Place: TypeAlias = "Variable | FieldAccess" +Place: TypeAlias = "Variable | FieldAccess | SubscriptAccess" #: Unique identifier for a `Place`. -PlaceId: TypeAlias = "Variable.Id | FieldAccess.Id" +PlaceId: TypeAlias = "Variable.Id | FieldAccess.Id | SubscriptAccess.Id" @dataclass(frozen=True) @@ -154,6 +154,45 @@ def replace_defined_at(self, node: AstNode | None) -> "FieldAccess": return replace(self, exact_defined_at=node) +@dataclass(frozen=True) +class SubscriptAccess: + """A place identifying a subscript `place[item]` access.""" + + parent: Place + item: Variable + ty: Type + item_expr: ast.expr + getitem_call: ast.expr + #: Only populated if this place occurs in an inout position + setitem_call: ast.expr | None = None + + @dataclass(frozen=True) + class Id: + """Identifier for subscript places.""" + + parent: PlaceId + item: Variable.Id + + @cached_property + def id(self) -> "SubscriptAccess.Id": + """The unique `PlaceId` identifier for this place.""" + return SubscriptAccess.Id(self.parent.id, self.item.id) + + @cached_property + def defined_at(self) -> AstNode | None: + """Optional location where this place was last assigned to.""" + return self.parent.defined_at + + @property + def describe(self) -> str: + """A human-readable description of this place for error messages.""" + return f"Subscript `{self}`" + + def __str__(self) -> str: + """String representation of this place.""" + return f"{self.parent}[...]" + + PyScope = dict[str, Any] diff --git a/guppylang/checker/expr_checker.py b/guppylang/checker/expr_checker.py index cef50fb4..7ed7ee02 100644 --- a/guppylang/checker/expr_checker.py +++ b/guppylang/checker/expr_checker.py @@ -24,6 +24,7 @@ import sys import traceback from contextlib import suppress +from dataclasses import replace from typing import Any, NoReturn, cast from guppylang.ast_util import ( @@ -35,12 +36,15 @@ with_loc, with_type, ) +from guppylang.cfg.builder import tmp_vars from guppylang.checker.core import ( Context, DummyEvalDict, FieldAccess, Globals, Locals, + Place, + SubscriptAccess, Variable, ) from guppylang.definition.ty import TypeDef @@ -56,6 +60,7 @@ DesugaredListComp, FieldAccessAndDrop, GlobalName, + InoutReturnSentinel, IterEnd, IterHasNext, IterNext, @@ -63,6 +68,7 @@ MakeIter, PlaceNode, PyExpr, + SubscriptAccessAndDrop, TensorCall, TypeApply, ) @@ -447,7 +453,7 @@ def _synthesize_binary( node, ) - def _synthesize_instance_func( + def synthesize_instance_func( self, node: ast.expr, args: list[ast.expr], @@ -495,16 +501,37 @@ def visit_Compare(self, node: ast.Compare) -> tuple[ast.expr, Type]: def visit_Subscript(self, node: ast.Subscript) -> tuple[ast.expr, Type]: node.value, ty = self.synthesize(node.value) + item_expr, item_ty = self.synthesize(node.slice) + # Give the item a unique name so we can refer to it later in case we also want + # to compile a call to `__setitem__` + item = Variable(next(tmp_vars), item_ty, item_expr) + item_node = with_type(item_ty, with_loc(item_expr, PlaceNode(place=item))) + # Check a call to the `__getitem__` instance function exp_sig = FunctionType( [ - FuncInput(ty, InputFlags.NoFlags), + FuncInput(ty, InputFlags.Inout), FuncInput(ExistentialTypeVar.fresh("Key", False), InputFlags.NoFlags), ], ExistentialTypeVar.fresh("Val", False), ) - return self._synthesize_instance_func( - node.value, [node.slice], "__getitem__", "not subscriptable", exp_sig + getitem_expr, result_ty = self.synthesize_instance_func( + node.value, [item_node], "__getitem__", "not subscriptable", exp_sig ) + # Subscripting a place is itself a place + expr: ast.expr + if isinstance(node.value, PlaceNode): + place = SubscriptAccess( + node.value.place, item, result_ty, item_expr, getitem_expr + ) + expr = PlaceNode(place=place) + else: + # If the subscript is not on a place, then there is no way to address the + # other indices after this one has been projected out (e.g. `f()[0]` makes + # you loose access to all elements besides 0). + expr = SubscriptAccessAndDrop( + item=item, item_expr=item_expr, getitem_expr=getitem_expr + ) + return with_loc(node, expr), result_ty def visit_Call(self, node: ast.Call) -> tuple[ast.expr, Type]: if len(node.keywords) > 0: @@ -550,7 +577,7 @@ def visit_MakeIter(self, node: MakeIter) -> tuple[ast.expr, Type]: exp_sig = FunctionType( [FuncInput(ty, InputFlags.NoFlags)], ExistentialTypeVar.fresh("Iter", False) ) - expr, ty = self._synthesize_instance_func( + expr, ty = self.synthesize_instance_func( node.value, [], "__iter__", "not iterable", exp_sig ) @@ -574,7 +601,7 @@ def visit_IterHasNext(self, node: IterHasNext) -> tuple[ast.expr, Type]: exp_sig = FunctionType( [FuncInput(ty, InputFlags.NoFlags)], TupleType([bool_type(), ty]) ) - return self._synthesize_instance_func( + return self.synthesize_instance_func( node.value, [], "__hasnext__", "not an iterator", exp_sig, True ) @@ -584,14 +611,14 @@ def visit_IterNext(self, node: IterNext) -> tuple[ast.expr, Type]: [FuncInput(ty, InputFlags.NoFlags)], TupleType([ExistentialTypeVar.fresh("T", False), ty]), ) - return self._synthesize_instance_func( + return self.synthesize_instance_func( node.value, [], "__next__", "not an iterator", exp_sig, True ) def visit_IterEnd(self, node: IterEnd) -> tuple[ast.expr, Type]: node.value, ty = self.synthesize(node.value) exp_sig = FunctionType([FuncInput(ty, InputFlags.NoFlags)], NoneType()) - return self._synthesize_instance_func( + return self.synthesize_instance_func( node.value, [], "__end__", "not an iterator", exp_sig, True ) @@ -714,6 +741,8 @@ def type_check_args( new_args: list[ast.expr] = [] for inp, func_inp in zip(inputs, func_ty.inputs, strict=True): a, s = ExprChecker(ctx).check(inp, func_inp.ty.substitute(subst), "argument") + if InputFlags.Inout in func_inp.flags and isinstance(a, PlaceNode): + a.place = check_inout_arg_place(a.place, ctx, a) new_args.append(a) subst |= s @@ -734,6 +763,43 @@ def type_check_args( return new_args, subst +def check_inout_arg_place(place: Place, ctx: Context, node: PlaceNode) -> Place: + """Performs additional checks for place arguments in @inout position. + + In particular, we need to check that places involving `place[item]` subscripts + implement the corresponding `__setitem__` method. + """ + match place: + case Variable(): + return place + case FieldAccess(parent=parent): + return replace(place, parent=check_inout_arg_place(parent, ctx, node)) + case SubscriptAccess(parent=parent, item=item, ty=ty): + # Check a call to the `__setitem__` instance function + exp_sig = FunctionType( + [ + FuncInput(parent.ty, InputFlags.Inout), + FuncInput(item.ty, InputFlags.NoFlags), + FuncInput(ty, InputFlags.NoFlags), + ], + NoneType(), + ) + setitem_args = [ + with_type(parent.ty, with_loc(node, PlaceNode(parent))), + with_type(item.ty, with_loc(node, PlaceNode(item))), + with_type(ty, with_loc(node, InoutReturnSentinel(var=place))), + ] + setitem_call, _ = ExprSynthesizer(ctx).synthesize_instance_func( + setitem_args[0], + setitem_args[1:], + "__setitem__", + "not assignable", + exp_sig, + True, + ) + return replace(place, setitem_call=setitem_call) + + def synthesize_call( func_ty: FunctionType, args: list[ast.expr], node: AstNode, ctx: Context ) -> tuple[list[ast.expr], Type, Inst]: diff --git a/guppylang/checker/linearity_checker.py b/guppylang/checker/linearity_checker.py index 534246c3..7a518646 100644 --- a/guppylang/checker/linearity_checker.py +++ b/guppylang/checker/linearity_checker.py @@ -18,6 +18,7 @@ Locals, Place, PlaceId, + SubscriptAccess, Variable, ) from guppylang.definition.value import CallableDef @@ -169,6 +170,7 @@ def _reassign_inout_args(self, func_ty: FunctionType, args: list[ast.expr]) -> N match arg: case PlaceNode(place=place): for leaf in leaf_places(place): + assert not isinstance(leaf, SubscriptAccess) leaf = leaf.replace_defined_at(arg) self.scope.assign(leaf) case arg if inp.ty.linear: diff --git a/guppylang/nodes.py b/guppylang/nodes.py index a79b41d4..6b3394d2 100644 --- a/guppylang/nodes.py +++ b/guppylang/nodes.py @@ -94,6 +94,20 @@ class FieldAccessAndDrop(ast.expr): ) +class SubscriptAccessAndDrop(ast.expr): + """A subscript element access on an object, dropping all the remaining items.""" + + item: "Variable" + item_expr: ast.expr + getitem_expr: ast.expr + + _fields = ( + "item", + "item_expr", + "getitem_expr", + ) + + class MakeIter(ast.expr): """Creates an iterator using the `__iter__` magic method. @@ -205,7 +219,7 @@ class InoutReturnSentinel(ast.expr): """An invisible expression corresponding to an implicit use of @inout vars whenever a function returns.""" - var: "Variable | str" + var: "Place | str" _fields = ("var",) diff --git a/guppylang/prelude/builtins.py b/guppylang/prelude/builtins.py index d3303323..56c2f818 100644 --- a/guppylang/prelude/builtins.py +++ b/guppylang/prelude/builtins.py @@ -655,7 +655,15 @@ class Array: "ArrayGet", args=[int_arg(), type_arg()], variable_remap={0: 1, 1: 0} ), ) - def __getitem__(self: array[T, n], idx: int) -> T: ... + def __getitem__(self: array[L, n] @ inout, idx: int) -> L: ... + + @guppy.hugr_op( + builtins, + custom_op( + "ArraySet", args=[int_arg(), type_arg()], variable_remap={0: 1, 1: 0} + ), + ) + def __setitem__(self: array[L, n] @ inout, idx: int, value: L) -> None: ... @guppy.custom(builtins, checker=ArrayLenChecker()) def __len__(self: array[T, n]) -> int: ... diff --git a/tests/error/array_errors/linear_index.err b/tests/error/array_errors/linear_index.err deleted file mode 100644 index dfa0a247..00000000 --- a/tests/error/array_errors/linear_index.err +++ /dev/null @@ -1,7 +0,0 @@ -Guppy compilation failed. Error in file $FILE:14 - -12: @guppy(module) -13: def main(qs: array[qubit, 42]) -> int: -14: return qs[0] - ^^ -GuppyTypeError: Cannot instantiate non-linear type variable `T` in type `forall n, T: nat. (array[T, n], int) -> T` with linear type `qubit` diff --git a/tests/error/array_errors/linear_index.py b/tests/error/array_errors/linear_index.py deleted file mode 100644 index 79a6bc02..00000000 --- a/tests/error/array_errors/linear_index.py +++ /dev/null @@ -1,17 +0,0 @@ -import guppylang.prelude.quantum as quantum -from guppylang.decorator import guppy -from guppylang.module import GuppyModule -from guppylang.prelude.builtins import array -from guppylang.prelude.quantum import qubit - - -module = GuppyModule("test") -module.load(quantum) - - -@guppy(module) -def main(qs: array[qubit, 42]) -> int: - return qs[0] - - -module.compile() \ No newline at end of file diff --git a/tests/error/inout_errors/subscript_not_setable.err b/tests/error/inout_errors/subscript_not_setable.err new file mode 100644 index 00000000..9d8fe387 --- /dev/null +++ b/tests/error/inout_errors/subscript_not_setable.err @@ -0,0 +1,7 @@ +Guppy compilation failed. Error in file $FILE:24 + +22: @guppy(module) +23: def test(c: MyImmutableContainer) -> MyImmutableContainer: +24: foo(c[0]) + ^^^^ +GuppyTypeError: Expression of type `MyImmutableContainer` is not assignable since it does not implement the `__setitem__` method diff --git a/tests/error/inout_errors/subscript_not_setable.py b/tests/error/inout_errors/subscript_not_setable.py new file mode 100644 index 00000000..7a1323fc --- /dev/null +++ b/tests/error/inout_errors/subscript_not_setable.py @@ -0,0 +1,28 @@ +from guppylang.decorator import guppy +from guppylang.module import GuppyModule +from guppylang.prelude.builtins import inout +from guppylang.prelude.quantum import qubit, quantum + +module = GuppyModule("test") +module.load(quantum) + + +@guppy.declare(module) +def foo(q: qubit @inout) -> None: ... + + +@guppy.struct(module) +class MyImmutableContainer: + q: qubit + + @guppy.declare(module) + def __getitem__(self: "MyImmutableContainer" @inout, idx: int) -> qubit: ... + + +@guppy(module) +def test(c: MyImmutableContainer) -> MyImmutableContainer: + foo(c[0]) + return c + + +module.compile() diff --git a/tests/error/type_errors/not_subscriptable.err b/tests/error/type_errors/not_subscriptable.err new file mode 100644 index 00000000..0611a3bf --- /dev/null +++ b/tests/error/type_errors/not_subscriptable.err @@ -0,0 +1,7 @@ +Guppy compilation failed. Error in file $FILE:9 + +7: @guppy(module) +8: def foo(x: int) -> None: +9: x[0] + ^ +GuppyTypeError: Expression of type `int` is not subscriptable diff --git a/tests/error/type_errors/not_subscriptable.py b/tests/error/type_errors/not_subscriptable.py new file mode 100644 index 00000000..a93e2961 --- /dev/null +++ b/tests/error/type_errors/not_subscriptable.py @@ -0,0 +1,12 @@ +from guppylang.decorator import guppy +from guppylang.module import GuppyModule + +module = GuppyModule("test") + + +@guppy(module) +def foo(x: int) -> None: + x[0] + + +module.compile() diff --git a/tests/error/type_errors/subscript_bad_item.err b/tests/error/type_errors/subscript_bad_item.err new file mode 100644 index 00000000..7337c3b0 --- /dev/null +++ b/tests/error/type_errors/subscript_bad_item.err @@ -0,0 +1,7 @@ +Guppy compilation failed. Error in file $FILE:10 + +8: @guppy(module) +9: def foo(xs: array[int, 42]) -> int: +10: return xs[1.0] + ^^^ +GuppyTypeError: Expected argument of type `int`, got `float` diff --git a/tests/error/type_errors/subscript_bad_item.py b/tests/error/type_errors/subscript_bad_item.py new file mode 100644 index 00000000..ee4e0a6e --- /dev/null +++ b/tests/error/type_errors/subscript_bad_item.py @@ -0,0 +1,13 @@ +from guppylang.decorator import guppy +from guppylang.module import GuppyModule +from guppylang.prelude.builtins import array + +module = GuppyModule("test") + + +@guppy(module) +def foo(xs: array[int, 42]) -> int: + return xs[1.0] + + +module.compile() diff --git a/tests/integration/test_array.py b/tests/integration/test_array.py index 49ac3fc7..1ce01107 100644 --- a/tests/integration/test_array.py +++ b/tests/integration/test_array.py @@ -1,3 +1,4 @@ +import pytest from hugr import ops from hugr.std.int import IntVal @@ -23,6 +24,7 @@ def main(xs: array[float, 42]) -> int: assert val.val.v == 42 +@pytest.mark.skip("Skipped until Hugr lowering is updated") def test_index(validate): @compile_guppy def main(xs: array[int, 5], i: int) -> int: diff --git a/tests/integration/test_list.py b/tests/integration/test_list.py index e90f1bfe..30a1a6d5 100644 --- a/tests/integration/test_list.py +++ b/tests/integration/test_list.py @@ -1,3 +1,5 @@ +import pytest + from tests.util import compile_guppy @@ -37,6 +39,7 @@ def test(xs: list[int]) -> list[int]: validate(test) +@pytest.mark.skip("Requires updating lists to use inout") def test_subscript(validate): @compile_guppy def test(xs: list[float], i: int) -> float: From be4e452e6b9f7a2d48fb3246ef6eae68b309d522 Mon Sep 17 00:00:00 2001 From: Mark Koch Date: Fri, 30 Aug 2024 15:39:15 +0100 Subject: [PATCH 2/2] Improve error message --- guppylang/checker/expr_checker.py | 2 +- tests/error/inout_errors/subscript_not_setable.err | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/guppylang/checker/expr_checker.py b/guppylang/checker/expr_checker.py index 7ed7ee02..1242baa5 100644 --- a/guppylang/checker/expr_checker.py +++ b/guppylang/checker/expr_checker.py @@ -793,7 +793,7 @@ def check_inout_arg_place(place: Place, ctx: Context, node: PlaceNode) -> Place: setitem_args[0], setitem_args[1:], "__setitem__", - "not assignable", + "not allowed in a subscripted `@inout` position", exp_sig, True, ) diff --git a/tests/error/inout_errors/subscript_not_setable.err b/tests/error/inout_errors/subscript_not_setable.err index 9d8fe387..510cfca5 100644 --- a/tests/error/inout_errors/subscript_not_setable.err +++ b/tests/error/inout_errors/subscript_not_setable.err @@ -4,4 +4,4 @@ Guppy compilation failed. Error in file $FILE:24 23: def test(c: MyImmutableContainer) -> MyImmutableContainer: 24: foo(c[0]) ^^^^ -GuppyTypeError: Expression of type `MyImmutableContainer` is not assignable since it does not implement the `__setitem__` method +GuppyTypeError: Expression of type `MyImmutableContainer` is not allowed in a subscripted `@inout` position since it does not implement the `__setitem__` method