diff options
author | S. Solomon Darnell | 2025-03-28 21:52:21 -0500 |
---|---|---|
committer | S. Solomon Darnell | 2025-03-28 21:52:21 -0500 |
commit | 4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch) | |
tree | ee3dc5af3b6313e921cd920906356f5d4febc4ed /.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set | |
parent | cc961e04ba734dd72309fb548a2f97d67d578813 (diff) | |
download | gn-ai-master.tar.gz |
Diffstat (limited to '.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set')
14 files changed, 371 insertions, 0 deletions
diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/__init__.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/__init__.py new file mode 100644 index 00000000..69c1cdbd --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/__init__.py @@ -0,0 +1,25 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +__path__ = __import__("pkgutil").extend_path(__path__, __name__) + +from .delay_metadata_schema import DelayMetadataSchema +from .feature_schema import FeatureSchema +from .feature_set_schema import FeatureSetSchema +from .featureset_spec_metadata_schema import FeaturesetSpecMetadataSchema +from .feature_set_specification_schema import FeatureSetSpecificationSchema +from .materialization_settings_schema import MaterializationSettingsSchema +from .source_metadata_schema import SourceMetadataSchema +from .timestamp_column_metadata_schema import TimestampColumnMetadataSchema + +__all__ = [ + "DelayMetadataSchema", + "FeatureSchema", + "FeatureSetSchema", + "FeaturesetSpecMetadataSchema", + "FeatureSetSpecificationSchema", + "MaterializationSettingsSchema", + "SourceMetadataSchema", + "TimestampColumnMetadataSchema", +] diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/delay_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/delay_metadata_schema.py new file mode 100644 index 00000000..5ad78a7a --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/delay_metadata_schema.py @@ -0,0 +1,21 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class DelayMetadataSchema(metaclass=PatchedSchemaMeta): + days = fields.Int(required=False) + hours = fields.Int(required=False) + minutes = fields.Int(required=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.delay_metadata import DelayMetadata + + return DelayMetadata(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_schema.py new file mode 100644 index 00000000..6d248270 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_schema.py @@ -0,0 +1,29 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class FeatureSchema(metaclass=PatchedSchemaMeta): + name = fields.Str( + required=True, + allow_none=False, + ) + data_type = fields.Str( + required=True, + allow_none=False, + data_key="type", + ) + description = fields.Str(required=False) + tags = fields.Dict(keys=fields.Str(), values=fields.Str(), required=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.feature import Feature + + return Feature(description=data.pop("description", None), **data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_backfill_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_backfill_schema.py new file mode 100644 index 00000000..0ee5af8e --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_backfill_schema.py @@ -0,0 +1,22 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +from marshmallow import fields + +from azure.ai.ml._schema._feature_set.feature_window_schema import FeatureWindowSchema +from azure.ai.ml._schema._feature_set.materialization_settings_schema import MaterializationComputeResourceSchema +from azure.ai.ml._schema.core.fields import NestedField +from azure.ai.ml._schema.core.schema import YamlFileSchema + + +class FeatureSetBackfillSchema(YamlFileSchema): + name = fields.Str(required=True) + version = fields.Str(required=True) + feature_window = NestedField(FeatureWindowSchema) + description = fields.Str() + tags = fields.Dict() + resource = NestedField(MaterializationComputeResourceSchema) + spark_configuration = fields.Dict() + data_status = fields.List(fields.Str()) + job_id = fields.Str() diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_schema.py new file mode 100644 index 00000000..08722402 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_schema.py @@ -0,0 +1,27 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +from marshmallow import fields, post_dump, validate + +from azure.ai.ml._schema import NestedField +from azure.ai.ml._schema.core.schema import YamlFileSchema + +from .feature_set_specification_schema import FeatureSetSpecificationSchema +from .materialization_settings_schema import MaterializationSettingsSchema + + +class FeatureSetSchema(YamlFileSchema): + name = fields.Str(required=True, allow_none=False) + version = fields.Str(required=True, allow_none=False) + latest_version = fields.Str(dump_only=True) + specification = NestedField(FeatureSetSpecificationSchema, required=True, allow_none=False) + entities = fields.List(fields.Str, required=True, allow_none=False) + stage = fields.Str(validate=validate.OneOf(["Development", "Production", "Archived"]), dump_default="Development") + description = fields.Str() + tags = fields.Dict(keys=fields.Str(), values=fields.Str()) + materialization_settings = NestedField(MaterializationSettingsSchema) + + @post_dump + def remove_empty_values(self, data, **kwargs): # pylint: disable=unused-argument + return {key: value for key, value in data.items() if value} diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_specification_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_specification_schema.py new file mode 100644 index 00000000..64b399fb --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_set_specification_schema.py @@ -0,0 +1,19 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class FeatureSetSpecificationSchema(metaclass=PatchedSchemaMeta): + path = fields.Str(required=True, allow_none=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.feature_set_specification import FeatureSetSpecification + + return FeatureSetSpecification(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_transformation_code_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_transformation_code_metadata_schema.py new file mode 100644 index 00000000..8b173865 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_transformation_code_metadata_schema.py @@ -0,0 +1,22 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class FeatureTransformationCodeMetadataSchema(metaclass=PatchedSchemaMeta): + path = fields.Str(required=False) + transformer_class = fields.Str(required=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.feature_transformation_code_metadata import ( + FeatureTransformationCodeMetadata, + ) + + return FeatureTransformationCodeMetadata(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_window_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_window_schema.py new file mode 100644 index 00000000..d114c731 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/feature_window_schema.py @@ -0,0 +1,11 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +from marshmallow import fields +from azure.ai.ml._schema.core.schema import YamlFileSchema + + +class FeatureWindowSchema(YamlFileSchema): + feature_window_end = fields.Str() + feature_window_start = fields.Str() diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_metadata_schema.py new file mode 100644 index 00000000..251ccd6e --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_metadata_schema.py @@ -0,0 +1,33 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from typing import Dict + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.fields import NestedField +from azure.ai.ml._schema.core.schema import YamlFileSchema +from azure.ai.ml._schema._feature_store_entity.data_column_schema import DataColumnSchema + +from .source_metadata_schema import SourceMetadataSchema +from .delay_metadata_schema import DelayMetadataSchema +from .feature_schema import FeatureSchema +from .feature_transformation_code_metadata_schema import FeatureTransformationCodeMetadataSchema + + +class FeaturesetSpecMetadataSchema(YamlFileSchema): + source = fields.Nested(SourceMetadataSchema, required=True) + feature_transformation_code = fields.Nested(FeatureTransformationCodeMetadataSchema, required=False) + features = fields.List(NestedField(FeatureSchema), required=True, allow_none=False) + index_columns = fields.List(NestedField(DataColumnSchema), required=False) + source_lookback = fields.Nested(DelayMetadataSchema, required=False) + temporal_join_lookback = fields.Nested(DelayMetadataSchema, required=False) + + @post_load + def make(self, data: Dict, **kwargs): + from azure.ai.ml.entities._feature_set.featureset_spec_metadata import FeaturesetSpecMetadata + + return FeaturesetSpecMetadata(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_properties_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_properties_schema.py new file mode 100644 index 00000000..e3a56542 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/featureset_spec_properties_schema.py @@ -0,0 +1,55 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +from marshmallow import fields + +from azure.ai.ml._schema.core.fields import NestedField +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta, YamlFileSchema + +from .source_process_code_metadata_schema import SourceProcessCodeSchema +from .timestamp_column_metadata_schema import TimestampColumnMetadataSchema + + +# pylint: disable-next=name-too-long +class FeatureTransformationCodePropertiesSchema(metaclass=PatchedSchemaMeta): + path = fields.Str(data_key="Path") + transformer_class = fields.Str(data_key="TransformerClass") + + +class DelayMetadataPropertiesSchema(metaclass=PatchedSchemaMeta): + days = fields.Int(data_key="Days") + hours = fields.Int(data_key="Hours") + minutes = fields.Int(data_key="Minutes") + + +class FeaturePropertiesSchema(metaclass=PatchedSchemaMeta): + name = fields.Str(data_key="FeatureName") + data_type = fields.Str(data_key="DataType") + description = fields.Str(data_key="Description") + tags = fields.Dict(keys=fields.Str(), values=fields.Str(), data_key="Tags") + + +class ColumnPropertiesSchema(metaclass=PatchedSchemaMeta): + name = fields.Str(data_key="ColumnName") + type = fields.Str(data_key="DataType") + + +class SourcePropertiesSchema(metaclass=PatchedSchemaMeta): + type = fields.Str(required=True) + path = fields.Str(required=False) + timestamp_column = fields.Nested(TimestampColumnMetadataSchema, data_key="timestampColumn") + source_delay = fields.Nested(DelayMetadataPropertiesSchema, data_key="sourceDelay") + source_process_code = fields.Nested(SourceProcessCodeSchema) + dict = fields.Dict(keys=fields.Str(), values=fields.Str(), data_key="kwargs") + + +class FeaturesetSpecPropertiesSchema(YamlFileSchema): + source = fields.Nested(SourcePropertiesSchema, data_key="source") + feature_transformation_code = fields.Nested( + FeatureTransformationCodePropertiesSchema, data_key="featureTransformationCode" + ) + features = fields.List(NestedField(FeaturePropertiesSchema), data_key="features") + index_columns = fields.List(NestedField(ColumnPropertiesSchema), data_key="indexColumns") + source_lookback = fields.Nested(DelayMetadataPropertiesSchema, data_key="sourceLookback") + temporal_join_lookback = fields.Nested(DelayMetadataPropertiesSchema, data_key="temporalJoinLookback") diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/materialization_settings_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/materialization_settings_schema.py new file mode 100644 index 00000000..8cf68b67 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/materialization_settings_schema.py @@ -0,0 +1,37 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema import NestedField +from azure.ai.ml._schema._notification.notification_schema import NotificationSchema +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta +from azure.ai.ml._schema.schedule.trigger import RecurrenceTriggerSchema + + +class MaterializationComputeResourceSchema(metaclass=PatchedSchemaMeta): + instance_type = fields.Str() + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.materialization_compute_resource import MaterializationComputeResource + + return MaterializationComputeResource(instance_type=data.pop("instance_type"), **data) + + +class MaterializationSettingsSchema(metaclass=PatchedSchemaMeta): + schedule = NestedField(RecurrenceTriggerSchema) + notification = NestedField(NotificationSchema) + resource = NestedField(MaterializationComputeResourceSchema) + spark_configuration = fields.Dict() + offline_enabled = fields.Boolean() + online_enabled = fields.Boolean() + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.materialization_settings import MaterializationSettings + + return MaterializationSettings(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_metadata_schema.py new file mode 100644 index 00000000..345c9084 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_metadata_schema.py @@ -0,0 +1,30 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from typing import Dict + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + +from .delay_metadata_schema import DelayMetadataSchema +from .source_process_code_metadata_schema import SourceProcessCodeSchema +from .timestamp_column_metadata_schema import TimestampColumnMetadataSchema + + +class SourceMetadataSchema(metaclass=PatchedSchemaMeta): + type = fields.Str(required=True) + path = fields.Str(required=False) + timestamp_column = fields.Nested(TimestampColumnMetadataSchema, required=False) + source_delay = fields.Nested(DelayMetadataSchema, required=False) + source_process_code = fields.Nested(SourceProcessCodeSchema, load_only=True, required=False) + dict = fields.Dict(keys=fields.Str(), values=fields.Str(), data_key="kwargs", load_only=True, required=False) + + @post_load + def make(self, data: Dict, **kwargs): + from azure.ai.ml.entities._feature_set.source_metadata import SourceMetadata + + return SourceMetadata(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_process_code_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_process_code_metadata_schema.py new file mode 100644 index 00000000..b8b93739 --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/source_process_code_metadata_schema.py @@ -0,0 +1,20 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class SourceProcessCodeSchema(metaclass=PatchedSchemaMeta): + path = fields.Str(required=True, allow_none=False) + process_class = fields.Str(required=True, allow_none=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.source_process_code_metadata import SourceProcessCodeMetadata + + return SourceProcessCodeMetadata(**data) diff --git a/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/timestamp_column_metadata_schema.py b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/timestamp_column_metadata_schema.py new file mode 100644 index 00000000..6d7982be --- /dev/null +++ b/.venv/lib/python3.12/site-packages/azure/ai/ml/_schema/_feature_set/timestamp_column_metadata_schema.py @@ -0,0 +1,20 @@ +# --------------------------------------------------------- +# Copyright (c) Microsoft Corporation. All rights reserved. +# --------------------------------------------------------- + +# pylint: disable=unused-argument + +from marshmallow import fields, post_load + +from azure.ai.ml._schema.core.schema import PatchedSchemaMeta + + +class TimestampColumnMetadataSchema(metaclass=PatchedSchemaMeta): + name = fields.Str(required=True) + format = fields.Str(required=False) + + @post_load + def make(self, data, **kwargs): + from azure.ai.ml.entities._feature_set.timestamp_column_metadata import TimestampColumnMetadata + + return TimestampColumnMetadata(**data) |