`tests.system.providers.amazon.aws.example_sagemaker`¶

Module Contents¶

Functions¶

`set_up`(env_id, role_arn)
`delete_ecr_repository`(repository_name)
`delete_logs`(env_id)
`delete_model_group`(group_name, model_version_arn)
`delete_pipeline`(pipeline_name)
`delete_docker_image`(image_name)

Attributes¶

`DAG_ID`
`ROLE_ARN_KEY`
`sys_test_context_task`
`KNN_IMAGES_BY_REGION`
`DATASET`
`SAMPLE_SIZE`
`PREPROCESS_SCRIPT_TEMPLATE`
`test_context`
`test_run`

tests.system.providers.amazon.aws.example_sagemaker.DAG_ID = 'example_sagemaker'[source]¶

tests.system.providers.amazon.aws.example_sagemaker.ROLE_ARN_KEY = 'ROLE_ARN'[source]¶

tests.system.providers.amazon.aws.example_sagemaker.sys_test_context_task[source]¶

tests.system.providers.amazon.aws.example_sagemaker.KNN_IMAGES_BY_REGION[source]¶

tests.system.providers.amazon.aws.example_sagemaker.DATASET = Multiline-String[source]¶

Show Value (comma-separated rows: four numeric measurements followed by an Iris species label)

        5.1,3.5,1.4,0.2,Iris-setosa
        4.9,3.0,1.4,0.2,Iris-setosa
        7.0,3.2,4.7,1.4,Iris-versicolor
        6.4,3.2,4.5,1.5,Iris-versicolor
        4.9,2.5,4.5,1.7,Iris-virginica
        7.3,2.9,6.3,1.8,Iris-virginica

tests.system.providers.amazon.aws.example_sagemaker.SAMPLE_SIZE[source]¶

tests.system.providers.amazon.aws.example_sagemaker.PREPROCESS_SCRIPT_TEMPLATE = Multiline-String[source]¶

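Show Value (this appears to be a format-string template: `{input_path}` and `{output_path}` are placeholders to be filled in, and the doubled braces `{{ }}` stand for literal braces in the rendered script)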

import boto3
import numpy as np
import pandas as pd

def main():
    # Load the Iris dataset from {input_path}/input.csv, split it into train/test
    # subsets, and write them to {output_path}/ for the Processing Operator.

    columns = ['sepal_length', 'sepal_width', 'petal_length', 'petal_width', 'species']
    iris = pd.read_csv('{input_path}/input.csv', names=columns)

    # Process data
    iris['species'] = iris['species'].replace({{'Iris-virginica': 0, 'Iris-versicolor': 1, 'Iris-setosa': 2}})
    iris = iris[['species', 'sepal_length', 'sepal_width', 'petal_length', 'petal_width']]

    # Split into test and train data
    iris_train, iris_test = np.split(
        iris.sample(frac=1, random_state=np.random.RandomState()), [int(0.7 * len(iris))]
    )

    # Remove the "answers" from the test set
    iris_test.drop(['species'], axis=1, inplace=True)

    # Write the splits to disk
    iris_train.to_csv('{output_path}/train.csv', index=False, header=False)
    iris_test.to_csv('{output_path}/test.csv', index=False, header=False)

    print('Preprocessing Done.')

if __name__ == "__main__":
    main()

tests.system.providers.amazon.aws.example_sagemaker.set_up(env_id, role_arn)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.delete_ecr_repository(repository_name)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.delete_logs(env_id)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.delete_model_group(group_name, model_version_arn)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.delete_pipeline(pipeline_name)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.delete_docker_image(image_name)[source]¶

tests.system.providers.amazon.aws.example_sagemaker.test_context[source]¶

tests.system.providers.amazon.aws.example_sagemaker.test_run[source]¶

tests.system.providers.amazon.aws.example_sagemaker¶

Module Contents¶

Functions¶

Attributes¶

`tests.system.providers.amazon.aws.example_sagemaker`¶