From f60f34209815d30be753519825e0253b946221dd Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 08:38:30 -0400 Subject: [PATCH 1/9] refactor: extract _is_valid_samplesheet_parameter_type --- latch/resources/workflow.py | 29 +++++++++++++++++++---------- 1 file changed, 19 insertions(+), 10 deletions(-) diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index 14f84a22..239c3f29 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -81,16 +81,7 @@ def decorator(f: Callable): if meta_param.samplesheet is not True: continue - annotation = wf_params[name].annotation - - origin = get_origin(annotation) - args = get_args(annotation) - valid = ( - origin is not None - and issubclass(origin, list) - and is_dataclass(args[0]) - ) - if not valid: + if not _is_valid_samplesheet_parameter_type(wf_param[name]): click.secho( f"parameter marked as samplesheet is not valid: {name} " f"in workflow {f.__name__} must be a list of dataclasses", @@ -108,3 +99,21 @@ def decorator(f: Callable): return _workflow(f, wf_name_override=wf_name_override) return decorator + + +def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: + """ + Check if a parameter in the workflow function's signature is annotated with a valid type for a + samplesheet LatchParameter. + """ + annotation = parameter.annotation + + origin = get_origin(annotation) + args = get_args(annotation) + valid = ( + origin is not None + and issubclass(origin, list) + and is_dataclass(args[0]) + ) + + return valid From 939d3e116a7461a1400b156e91154966fe9b766f Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 10:25:31 -0400 Subject: [PATCH 2/9] feat: Support Optional samplesheet types --- latch/resources/workflow.py | 164 +++++++++++++++++++++++++++++-- tests/resources/test_workflow.py | 124 +++++++++++++++++++++++ 2 files changed, 282 insertions(+), 6 deletions(-) create mode 100644 tests/resources/test_workflow.py diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index 239c3f29..a835d3c0 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -1,7 +1,10 @@ import inspect +import sys +import typing from dataclasses import is_dataclass from textwrap import dedent -from typing import Callable, Dict, Union, get_args, get_origin +from types import UnionType +from typing import Any, Callable, Dict, Union, get_args, get_origin import click import os @@ -12,6 +15,42 @@ from latch_cli.utils import best_effort_display_name +if sys.version_info >= (3, 10): + from typing import TypeAlias + from typing import TypeGuard + from types import UnionType +else: + from typing_extensions import TypeAlias + from typing_extensions import TypeGuard + + # NB: `types.UnionType`, available since Python 3.10, is **not** a `type`, but is a class. + # We declare an empty class here to use in the instance checks below. + class UnionType: + pass + + +# NB: since `_GenericAlias` is a private attribute of the `typing` module, mypy doesn't find it +TypeAnnotation: TypeAlias = Union[type, typing._GenericAlias, UnionType] # type: ignore[name-defined] +""" +A function parameter's type annotation may be any of the following: + 1) `type`, when declaring any of the built-in Python types + 2) `typing._GenericAlias`, when declaring generic collection types or union types using pre-PEP + 585 and pre-PEP 604 syntax (e.g. `List[int]`, `Optional[int]`, or `Union[int, None]`) + 3) `types.UnionType`, when declaring union types using PEP604 syntax (e.g. `int | None`) + 4) `types.GenericAlias`, when declaring generic collection types using PEP 585 syntax (e.g. + `list[int]`) + +`types.GenericAlias` is a subclass of `type`, but `typing._GenericAlias` and `types.UnionType` are +not and must be considered explicitly. +""" + +# TODO When dropping support for Python 3.9, deprecate this in favor of performing instance checks +# directly on the `TypeAnnotation` union type. +# NB: since `_GenericAlias` is a private attribute of the `typing` module, mypy doesn't find it +TYPE_ANNOTATION_TYPES = (type, typing._GenericAlias, UnionType) # type: ignore[attr-defined] + + + def _generate_metadata(f: Callable) -> LatchMetadata: signature = inspect.signature(f) metadata = LatchMetadata(f.__name__, LatchAuthor()) @@ -108,12 +147,125 @@ def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: """ annotation = parameter.annotation - origin = get_origin(annotation) - args = get_args(annotation) - valid = ( - origin is not None + # If the parameter did not have a type annotation, short-circuit and return False + if not _is_type_annotation(annotation): + return False + + return ( + _is_list_of_dataclasses_type(annotation) + or (_is_optional_type(annotation) and _is_list_of_dataclasses_type(_unpack_optional_type(annotation))) + ) + + +def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: + """ + Check if the type is a list of dataclasses. + + Args: + dtype: A type. + + Returns: + True if the type is a list of dataclasses. + False otherwise. + + Raises: + TypeError: If the input is not a `type`. + """ + if not isinstance(dtype, TYPE_ANNOTATION_TYPES): + raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + + origin = get_origin(dtype) + args = get_args(dtype) + + return ( + not _is_optional_type(dtype) + and origin is not None and issubclass(origin, list) + and len(args) == 1 and is_dataclass(args[0]) ) - return valid + +def _is_optional_type(dtype: TypeAnnotation) -> bool: + """ + Check if a type is `Optional`. + + An optional type may be declared using three syntaxes: `Optional[T]`, `Union[T, None]`, or `T | + None`. All of these syntaxes is supported by this function. + + Args: + dtype: A type. + + Returns: + True if the type is a union type with exactly two elements, one of which is `None`. + False otherwise. + + Raises: + TypeError: If the input is not a `type`. + """ + if not isinstance(dtype, TYPE_ANNOTATION_TYPES): + raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + + origin = get_origin(dtype) + args = get_args(dtype) + + # Optional[T] has `typing.Union` as its origin, but PEP604 syntax (e.g. `int | None`) has + # `types.UnionType` as its origin. + return (origin is Union or origin is UnionType) and len(args) == 2 and type(None) in args + + +def _unpack_optional_type(dtype: TypeAnnotation) -> type: + """ + Given a type of `Optional[T]`, return `T`. + + Args: + dtype: A type of `Optional[T]`, `T | None`, or `Union[T, None]`. + + Returns: + The type `T`. + + Raises: + TypeError: If the input is not a `type`. + ValueError: If the input type is not `Optional[T]`. + """ + if not isinstance(dtype, TYPE_ANNOTATION_TYPES): + raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + + if not _is_optional_type(dtype): + raise ValueError(f"Expected Optional[T], got {type(dtype)}: {dtype}") + + args = get_args(dtype) + + # Types declared as `Optional[T]` or `T | None` should have the non-None type as the first + # argument. However, it is technically correct for someone to write `None | T`, so we shouldn't + # make assumptions about the argument ordering. (And I'm not certain the ordering is guaranteed + # anywhere by Python spec.) + base_type = [arg for arg in args if arg is not type(None)][0] + + return base_type + + +def _is_type_annotation(annotation: Any) -> TypeGuard[TypeAnnotation]: + """ + Check if the annotation on an `inspect.Parameter` instance is a type annotation. + + If the corresponding parameter **did not** have a type annotation, `annotation` is set to the + special class variable `Parameter.empty`. + + NB: `Parameter.empty` itself is a subclass of `type` + Otherwise, the annotation is assumed to be a type. + + Args: + annotation: The annotation on an `inspect.Parameter` instance. + + Returns: + True if the annotation is not `Parameter.empty`. + False otherwise. + + Raises: + TypeError: If the annotation is neither a type nor `Parameter.empty`. + """ + if not isinstance(annotation, TYPE_ANNOTATION_TYPES): + raise TypeError(f"Annotation must be a type, not {type(annotation).__name__}") + + return annotation is not inspect.Parameter.empty diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py new file mode 100644 index 00000000..d99e2bd8 --- /dev/null +++ b/tests/resources/test_workflow.py @@ -0,0 +1,124 @@ +import inspect +import sys +import typing +from dataclasses import dataclass +from typing import List +from typing import Any +from typing import Collection, Iterable, Optional, Union, Mapping, Dict, Set, Tuple + +import pytest + +from anno import _is_list_of_dataclasses_type +from anno import _is_valid_samplesheet_parameter_type +from anno import _is_optional_type +from anno import _is_type_annotation +from anno import _unpack_optional_type +from anno import TypeAnnotation + +PRIMITIVE_TYPES = [int, float, bool, str] +COLLECTION_TYPES = [List[int], Dict[str, int], Set[int], Tuple[int], Mapping[str, int], Iterable[int], Collection[int]] + +if sys.version_info >= (3, 10): + COLLECTION_TYPES += [list[int], dict[str, int], set[int], tuple[int]] + +OPTIONAL_TYPES = [Optional[T] for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] +OPTIONAL_TYPES += [Union[T, None] for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] + + +@dataclass +class FakeDataclass: + """A dataclass for testing.""" + foo: str + bar: int + + +@pytest.mark.parametrize( + "dtype", + [ + List[FakeDataclass], + Optional[List[FakeDataclass]], + Union[List[FakeDataclass], None], + ] +) +def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: + """ + `_is_valid_samplesheet_parameter_type` should accept a type that is a list of dataclasses, or an + `Optional` list of dataclasses. + """ + parameter = inspect.Parameter("foo", kind=inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=dtype) + assert _is_valid_samplesheet_parameter_type(parameter) is True + + +def test_is_list_of_dataclasses_type() -> None: + """ + `_is_list_of_dataclasses_type` should accept a type that is a list of dataclasses. + """ + assert _is_list_of_dataclasses_type(List[FakeDataclass]) is True + + +@pytest.mark.parametrize("bad_type", [ + str, # Not a list + int, # Not a list + List[str], # Not a list of dataclasses + List[int], # Not a list of dataclasses + FakeDataclass, # Not a list +]) +def test_is_list_of_dataclasses_type_rejects_bad_type(bad_type: type) -> None: + """ + `_is_list_of_dataclasses_type` should reject anything else. + """ + assert _is_list_of_dataclasses_type(bad_type) is False + + +def test_is_list_of_dataclasses_type_raises_if_not_a_type() -> None: + """ + `is_list_of_dataclasses_type` should raise a `TypeError` if the input is not a type. + """ + with pytest.raises(TypeError): + _is_list_of_dataclasses_type([FakeDataclass("hello", 1)]) + + +@pytest.mark.parametrize("dtype", OPTIONAL_TYPES) +def test_is_optional_type(dtype: TypeAnnotation) -> None: + """`_is_optional_type` should return True for `Optional[T]` types.""" + assert _is_optional_type(dtype) is True + + +@pytest.mark.parametrize("dtype", PRIMITIVE_TYPES + COLLECTION_TYPES) +def test_is_optional_type_returns_false_if_not_optional(dtype: TypeAnnotation) -> None: + """`_is_optional_type` should return False for non-Optional types.""" + assert _is_optional_type(dtype) is False + + +@pytest.mark.parametrize("dtype", PRIMITIVE_TYPES + COLLECTION_TYPES) +def test_unpack_optional_type(dtype: TypeAnnotation) -> None: + """`_unpack_optional_type()` should return the base type of `Optional[T]` types.""" + assert _unpack_optional_type(Optional[dtype]) is dtype + assert _unpack_optional_type(Union[dtype, None]) is dtype + if sys.version_info >= (3, 10): + assert _unpack_optional_type(dtype | None) is dtype + + + +@pytest.mark.parametrize("annotation", PRIMITIVE_TYPES + COLLECTION_TYPES + OPTIONAL_TYPES) +def test_is_type_annotation(annotation: TypeAnnotation) -> None: + """ + `_is_type_annotation()` should return True for any valid type annotation. + """ + assert _is_type_annotation(annotation) is True + + +def test_is_type_annotation_returns_false_if_empty() -> None: + """ + `_is_type_annotation()` should only return False if the annotation is `Parameter.empty`. + """ + assert _is_type_annotation(inspect.Parameter.empty) is False + + +@pytest.mark.parametrize("bad_annotation", [1, "abc", [1, 2], {"foo": 1}, FakeDataclass("hello", 1)]) +def test_is_type_annotation_raises_if_annotation_is_not_a_type(bad_annotation: Any) -> None: + """ + `_is_type_annotation()` should raise `TypeError` for any non-type object. + """ + with pytest.raises(TypeError): + _is_type_annotation(bad_annotation) \ No newline at end of file From 21590f99eb2d6f73af7541669e59c51ca9c8883e Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 10:28:00 -0400 Subject: [PATCH 3/9] chore: clean-up doc: add docs doc: fix TypeError messages fix: remove unguarded UnionType import test: fix imports --- latch/resources/workflow.py | 71 ++++++++++++++++++-------------- tests/resources/__init__.py | 0 tests/resources/test_workflow.py | 13 +++--- 3 files changed, 46 insertions(+), 38 deletions(-) create mode 100644 tests/resources/__init__.py diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index a835d3c0..37f83adc 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -3,7 +3,6 @@ import typing from dataclasses import is_dataclass from textwrap import dedent -from types import UnionType from typing import Any, Callable, Dict, Union, get_args, get_origin import click @@ -50,7 +49,6 @@ class UnionType: TYPE_ANNOTATION_TYPES = (type, typing._GenericAlias, UnionType) # type: ignore[attr-defined] - def _generate_metadata(f: Callable) -> LatchMetadata: signature = inspect.signature(f) metadata = LatchMetadata(f.__name__, LatchAuthor()) @@ -72,7 +70,7 @@ def _inject_metadata(f: Callable, metadata: LatchMetadata) -> None: # so that when users call @workflow without any arguments or # parentheses, the workflow still serializes as expected def workflow( - metadata: Union[LatchMetadata, Callable] + metadata: Union[LatchMetadata, Callable], ) -> Union[PythonFunctionWorkflow, Callable]: if isinstance(metadata, Callable): f = metadata @@ -141,9 +139,18 @@ def decorator(f: Callable): def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: - """ - Check if a parameter in the workflow function's signature is annotated with a valid type for a - samplesheet LatchParameter. + """Check if a workflow parameter is hinted with a valid type for a samplesheet LatchParameter. + + Currently, a samplesheet LatchParameter must be defined as a list of dataclasses, or as an + `Optional` list of dataclasses when the parameter is part of a `ForkBranch`. + + Args: + parameter: A parameter from the workflow function's signature. + + Returns: + True if the parameter is annotated as a list of dataclasses, or as an `Optional` list of + dataclasses. + False otherwise. """ annotation = parameter.annotation @@ -151,15 +158,14 @@ def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: if not _is_type_annotation(annotation): return False - return ( - _is_list_of_dataclasses_type(annotation) - or (_is_optional_type(annotation) and _is_list_of_dataclasses_type(_unpack_optional_type(annotation))) + return _is_list_of_dataclasses_type(annotation) or ( + _is_optional_type(annotation) + and _is_list_of_dataclasses_type(_unpack_optional_type(annotation)) ) def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: - """ - Check if the type is a list of dataclasses. + """Check if the type is a list of dataclasses. Args: dtype: A type. @@ -169,10 +175,10 @@ def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: False otherwise. Raises: - TypeError: If the input is not a `type`. + TypeError: If the input is not a valid `TypeAnnotation` type (see above). """ if not isinstance(dtype, TYPE_ANNOTATION_TYPES): - raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + raise TypeError(f"Expected type annotation, got {type(dtype)}: {dtype}") origin = get_origin(dtype) args = get_args(dtype) @@ -187,8 +193,7 @@ def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: def _is_optional_type(dtype: TypeAnnotation) -> bool: - """ - Check if a type is `Optional`. + """Check if a type is `Optional`. An optional type may be declared using three syntaxes: `Optional[T]`, `Union[T, None]`, or `T | None`. All of these syntaxes is supported by this function. @@ -201,22 +206,25 @@ def _is_optional_type(dtype: TypeAnnotation) -> bool: False otherwise. Raises: - TypeError: If the input is not a `type`. + TypeError: If the input is not a valid `TypeAnnotation` type (see above). """ if not isinstance(dtype, TYPE_ANNOTATION_TYPES): - raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + raise TypeError(f"Expected type annotation, got {type(dtype)}: {dtype}") origin = get_origin(dtype) args = get_args(dtype) # Optional[T] has `typing.Union` as its origin, but PEP604 syntax (e.g. `int | None`) has # `types.UnionType` as its origin. - return (origin is Union or origin is UnionType) and len(args) == 2 and type(None) in args + return ( + (origin is Union or origin is UnionType) + and len(args) == 2 + and type(None) in args + ) def _unpack_optional_type(dtype: TypeAnnotation) -> type: - """ - Given a type of `Optional[T]`, return `T`. + """Given a type of `Optional[T]`, return `T`. Args: dtype: A type of `Optional[T]`, `T | None`, or `Union[T, None]`. @@ -225,14 +233,14 @@ def _unpack_optional_type(dtype: TypeAnnotation) -> type: The type `T`. Raises: - TypeError: If the input is not a `type`. + TypeError: If the input is not a valid `TypeAnnotation` type (see above). ValueError: If the input type is not `Optional[T]`. """ if not isinstance(dtype, TYPE_ANNOTATION_TYPES): - raise TypeError(f"Expected `type`, got {type(dtype)}: {dtype}") + raise TypeError(f"Expected type annotation, got {type(dtype)}: {dtype}") if not _is_optional_type(dtype): - raise ValueError(f"Expected Optional[T], got {type(dtype)}: {dtype}") + raise ValueError(f"Expected `Optional[T]`, got {type(dtype)}: {dtype}") args = get_args(dtype) @@ -245,26 +253,27 @@ def _unpack_optional_type(dtype: TypeAnnotation) -> type: return base_type +# NB: `inspect.Parameter.annotation` is typed as `Any`, so here we narrow the type. def _is_type_annotation(annotation: Any) -> TypeGuard[TypeAnnotation]: - """ - Check if the annotation on an `inspect.Parameter` instance is a type annotation. + """Check if the annotation on an `inspect.Parameter` instance is a type annotation. If the corresponding parameter **did not** have a type annotation, `annotation` is set to the - special class variable `Parameter.empty`. - - NB: `Parameter.empty` itself is a subclass of `type` - Otherwise, the annotation is assumed to be a type. + special class variable `inspect.Parameter.empty`. Otherwise, the annotation should be a valid + type annotation. Args: annotation: The annotation on an `inspect.Parameter` instance. Returns: - True if the annotation is not `Parameter.empty`. + True if the type annotation is not `inspect.Parameter.empty`. False otherwise. Raises: - TypeError: If the annotation is neither a type nor `Parameter.empty`. + TypeError: If the annotation is neither a valid `TypeAnnotation` type (see above) nor + `inspect.Parameter.empty`. """ + # NB: `inspect.Parameter.empty` is a subclass of `type`, so this check passes for unannotated + # parameters. if not isinstance(annotation, TYPE_ANNOTATION_TYPES): raise TypeError(f"Annotation must be a type, not {type(annotation).__name__}") diff --git a/tests/resources/__init__.py b/tests/resources/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index d99e2bd8..e0b25761 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -1,6 +1,5 @@ import inspect import sys -import typing from dataclasses import dataclass from typing import List from typing import Any @@ -8,12 +7,12 @@ import pytest -from anno import _is_list_of_dataclasses_type -from anno import _is_valid_samplesheet_parameter_type -from anno import _is_optional_type -from anno import _is_type_annotation -from anno import _unpack_optional_type -from anno import TypeAnnotation +from latch.resources.workflow import _is_list_of_dataclasses_type +from latch.resources.workflow import _is_valid_samplesheet_parameter_type +from latch.resources.workflow import _is_optional_type +from latch.resources.workflow import _is_type_annotation +from latch.resources.workflow import _unpack_optional_type +from latch.resources.workflow import TypeAnnotation PRIMITIVE_TYPES = [int, float, bool, str] COLLECTION_TYPES = [List[int], Dict[str, int], Set[int], Tuple[int], Mapping[str, int], Iterable[int], Collection[int]] From f506b5b1e4670e0a7f54262bfc86ae376f1a5e10 Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 11:13:19 -0400 Subject: [PATCH 4/9] test: Test PEP 604 types --- tests/resources/test_workflow.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index e0b25761..5928ed93 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -14,15 +14,18 @@ from latch.resources.workflow import _unpack_optional_type from latch.resources.workflow import TypeAnnotation -PRIMITIVE_TYPES = [int, float, bool, str] -COLLECTION_TYPES = [List[int], Dict[str, int], Set[int], Tuple[int], Mapping[str, int], Iterable[int], Collection[int]] +PRIMITIVE_TYPES: List[type] = [int, float, bool, str] +COLLECTION_TYPES: List[TypeAnnotation] = [List[int], Dict[str, int], Set[int], Tuple[int], Mapping[str, int], Iterable[int], Collection[int]] if sys.version_info >= (3, 10): COLLECTION_TYPES += [list[int], dict[str, int], set[int], tuple[int]] -OPTIONAL_TYPES = [Optional[T] for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] +OPTIONAL_TYPES: List[TypeAnnotation] = [Optional[T] for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] OPTIONAL_TYPES += [Union[T, None] for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] +if sys.version_info >= (3, 10): + OPTIONAL_TYPES += [T | None for T in (PRIMITIVE_TYPES + COLLECTION_TYPES)] + @dataclass class FakeDataclass: From 03c44f52661e7acc8f403bbe61bf6e55e8b2925e Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 12:33:53 -0400 Subject: [PATCH 5/9] test: add PEP 585 and 604 samplesheet types --- tests/resources/test_workflow.py | 24 +++++++++++++++++------- 1 file changed, 17 insertions(+), 7 deletions(-) diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index 5928ed93..c58da4ad 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -34,14 +34,24 @@ class FakeDataclass: bar: int -@pytest.mark.parametrize( - "dtype", - [ - List[FakeDataclass], - Optional[List[FakeDataclass]], - Union[List[FakeDataclass], None], +# Enumerate the possible ways to declare a list or optional list of dataclasses +SAMPLESHEET_TYPES: List[TypeAnnotation] = [ + List[FakeDataclass], + Optional[List[FakeDataclass]], + Union[List[FakeDataclass], None], +] + +if sys.version_info >= (3, 10): + SAMPLESHEET_TYPES += [ + list[FakeDataclass], + Optional[list[FakeDataclass]], + Union[list[FakeDataclass], None], + list[FakeDataclass] | None, + List[FakeDataclass] | None, ] -) + + +@pytest.mark.parametrize("dtype", SAMPLESHEET_TYPES) def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: """ `_is_valid_samplesheet_parameter_type` should accept a type that is a list of dataclasses, or an From ede1b0ba9c8100f6b320f3f57c43bae0705b9de2 Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 12:36:08 -0400 Subject: [PATCH 6/9] test: cover non-samplesheet types --- tests/resources/test_workflow.py | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index c58da4ad..ba1393cd 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -61,6 +61,15 @@ def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: assert _is_valid_samplesheet_parameter_type(parameter) is True +@pytest.mark.parametrize("dtype", PRIMITIVE_TYPES + COLLECTION_TYPES + OPTIONAL_TYPES) +def test_is_valid_samplesheet_parameter_type_rejects_invalid_types(dtype: TypeAnnotation) -> None: + """ + `_is_valid_samplesheet_parameter_type` should reject any other type. + """ + parameter = inspect.Parameter("foo", kind=inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=dtype) + assert _is_valid_samplesheet_parameter_type(parameter) is False + + def test_is_list_of_dataclasses_type() -> None: """ `_is_list_of_dataclasses_type` should accept a type that is a list of dataclasses. From 40e01e468f340d08495d1c0c4eb150c9a4b3e759 Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 13:26:19 -0400 Subject: [PATCH 7/9] fix: PR requests --- latch/resources/workflow.py | 23 ++++++++--------------- 1 file changed, 8 insertions(+), 15 deletions(-) diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index 37f83adc..26aad6b5 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -4,6 +4,8 @@ from dataclasses import is_dataclass from textwrap import dedent from typing import Any, Callable, Dict, Union, get_args, get_origin +from typing_extensions import TypeAlias +from typing_extensions import TypeGuard import click import os @@ -15,13 +17,8 @@ if sys.version_info >= (3, 10): - from typing import TypeAlias - from typing import TypeGuard from types import UnionType else: - from typing_extensions import TypeAlias - from typing_extensions import TypeGuard - # NB: `types.UnionType`, available since Python 3.10, is **not** a `type`, but is a class. # We declare an empty class here to use in the instance checks below. class UnionType: @@ -118,7 +115,7 @@ def decorator(f: Callable): if meta_param.samplesheet is not True: continue - if not _is_valid_samplesheet_parameter_type(wf_param[name]): + if not _is_valid_samplesheet_parameter_type(wf_params[name].annotation): click.secho( f"parameter marked as samplesheet is not valid: {name} " f"in workflow {f.__name__} must be a list of dataclasses", @@ -138,7 +135,7 @@ def decorator(f: Callable): return decorator -def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: +def _is_valid_samplesheet_parameter_type(annotation: Any) -> TypeGuard[TypeAnnotation]: """Check if a workflow parameter is hinted with a valid type for a samplesheet LatchParameter. Currently, a samplesheet LatchParameter must be defined as a list of dataclasses, or as an @@ -152,8 +149,6 @@ def _is_valid_samplesheet_parameter_type(parameter: inspect.Parameter) -> bool: dataclasses. False otherwise. """ - annotation = parameter.annotation - # If the parameter did not have a type annotation, short-circuit and return False if not _is_type_annotation(annotation): return False @@ -184,8 +179,7 @@ def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: args = get_args(dtype) return ( - not _is_optional_type(dtype) - and origin is not None + origin is not None and issubclass(origin, list) and len(args) == 1 and is_dataclass(args[0]) @@ -217,7 +211,8 @@ def _is_optional_type(dtype: TypeAnnotation) -> bool: # Optional[T] has `typing.Union` as its origin, but PEP604 syntax (e.g. `int | None`) has # `types.UnionType` as its origin. return ( - (origin is Union or origin is UnionType) + origin is not None + and (origin is Union or origin is UnionType) and len(args) == 2 and type(None) in args ) @@ -242,13 +237,11 @@ def _unpack_optional_type(dtype: TypeAnnotation) -> type: if not _is_optional_type(dtype): raise ValueError(f"Expected `Optional[T]`, got {type(dtype)}: {dtype}") - args = get_args(dtype) - # Types declared as `Optional[T]` or `T | None` should have the non-None type as the first # argument. However, it is technically correct for someone to write `None | T`, so we shouldn't # make assumptions about the argument ordering. (And I'm not certain the ordering is guaranteed # anywhere by Python spec.) - base_type = [arg for arg in args if arg is not type(None)][0] + base_type = [arg for arg in get_args(dtype) if arg is not type(None)][0] return base_type From 4f4ae28092c0044dd75c5cd4b2305f87f778c12e Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Fri, 19 Jul 2024 13:34:56 -0400 Subject: [PATCH 8/9] fix: PR updates --- latch/resources/workflow.py | 1 + tests/resources/test_workflow.py | 6 ++---- 2 files changed, 3 insertions(+), 4 deletions(-) diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index 26aad6b5..f9b7ba03 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -180,6 +180,7 @@ def _is_list_of_dataclasses_type(dtype: TypeAnnotation) -> bool: return ( origin is not None + and inspect.isclass(origin) and issubclass(origin, list) and len(args) == 1 and is_dataclass(args[0]) diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index ba1393cd..9242b021 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -57,8 +57,7 @@ def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: `_is_valid_samplesheet_parameter_type` should accept a type that is a list of dataclasses, or an `Optional` list of dataclasses. """ - parameter = inspect.Parameter("foo", kind=inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=dtype) - assert _is_valid_samplesheet_parameter_type(parameter) is True + assert _is_valid_samplesheet_parameter_type(dtype) is True @pytest.mark.parametrize("dtype", PRIMITIVE_TYPES + COLLECTION_TYPES + OPTIONAL_TYPES) @@ -66,8 +65,7 @@ def test_is_valid_samplesheet_parameter_type_rejects_invalid_types(dtype: TypeAn """ `_is_valid_samplesheet_parameter_type` should reject any other type. """ - parameter = inspect.Parameter("foo", kind=inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=dtype) - assert _is_valid_samplesheet_parameter_type(parameter) is False + assert _is_valid_samplesheet_parameter_type(dtype) is False def test_is_list_of_dataclasses_type() -> None: From 8c50966050f75aa1bb1c58d8f2d74746f0c53150 Mon Sep 17 00:00:00 2001 From: Matt Stone Date: Mon, 22 Jul 2024 11:03:46 -0400 Subject: [PATCH 9/9] refactor: import _GenericAlias from typing --- latch/resources/workflow.py | 15 +++++++++------ tests/resources/test_workflow.py | 13 ++++++++++++- 2 files changed, 21 insertions(+), 7 deletions(-) diff --git a/latch/resources/workflow.py b/latch/resources/workflow.py index f9b7ba03..e742e019 100644 --- a/latch/resources/workflow.py +++ b/latch/resources/workflow.py @@ -1,9 +1,14 @@ import inspect import sys -import typing from dataclasses import is_dataclass from textwrap import dedent -from typing import Any, Callable, Dict, Union, get_args, get_origin +from typing import Any +from typing import Callable +from typing import Dict +from typing import Union +from typing import _GenericAlias # type: ignore[attr-defined] # NB: mypy can't see private attrs +from typing import get_args +from typing import get_origin from typing_extensions import TypeAlias from typing_extensions import TypeGuard @@ -25,8 +30,7 @@ class UnionType: pass -# NB: since `_GenericAlias` is a private attribute of the `typing` module, mypy doesn't find it -TypeAnnotation: TypeAlias = Union[type, typing._GenericAlias, UnionType] # type: ignore[name-defined] +TypeAnnotation: TypeAlias = Union[type, _GenericAlias, UnionType] """ A function parameter's type annotation may be any of the following: 1) `type`, when declaring any of the built-in Python types @@ -42,8 +46,7 @@ class UnionType: # TODO When dropping support for Python 3.9, deprecate this in favor of performing instance checks # directly on the `TypeAnnotation` union type. -# NB: since `_GenericAlias` is a private attribute of the `typing` module, mypy doesn't find it -TYPE_ANNOTATION_TYPES = (type, typing._GenericAlias, UnionType) # type: ignore[attr-defined] +TYPE_ANNOTATION_TYPES = (type, _GenericAlias, UnionType) # type: ignore[attr-defined] def _generate_metadata(f: Callable) -> LatchMetadata: diff --git a/tests/resources/test_workflow.py b/tests/resources/test_workflow.py index 9242b021..da6d0fd3 100644 --- a/tests/resources/test_workflow.py +++ b/tests/resources/test_workflow.py @@ -50,6 +50,17 @@ class FakeDataclass: List[FakeDataclass] | None, ] +BAD_SAMPLESHEET_TYPES: List[TypeAnnotation] = PRIMITIVE_TYPES + COLLECTION_TYPES + OPTIONAL_TYPES +BAD_SAMPLESHEET_TYPES += [ + Union[List[FakeDataclass], int], + Union[Optional[List[FakeDataclass]], int], + Optional[Union[List[FakeDataclass], int]], + Union[List[FakeDataclass], Optional[int]], + Union[Optional[int], List[FakeDataclass]], + List[Union[FakeDataclass, int]], + List[Optional[FakeDataclass]], +] + @pytest.mark.parametrize("dtype", SAMPLESHEET_TYPES) def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: @@ -60,7 +71,7 @@ def test_is_valid_samplesheet_parameter_type(dtype: TypeAnnotation) -> None: assert _is_valid_samplesheet_parameter_type(dtype) is True -@pytest.mark.parametrize("dtype", PRIMITIVE_TYPES + COLLECTION_TYPES + OPTIONAL_TYPES) +@pytest.mark.parametrize("dtype", BAD_SAMPLESHEET_TYPES) def test_is_valid_samplesheet_parameter_type_rejects_invalid_types(dtype: TypeAnnotation) -> None: """ `_is_valid_samplesheet_parameter_type` should reject any other type.