"""Tests for the mocked SageMaker endpoint and endpoint-config APIs."""
import datetime
import re
import uuid

import boto3
import pytest
from botocore.exceptions import ClientError

from moto import mock_sagemaker
from moto.core import DEFAULT_ACCOUNT_ID as ACCOUNT_ID

TEST_REGION_NAME = "us-east-1"
TEST_ROLE_ARN = f"arn:aws:iam::{ACCOUNT_ID}:role/FakeRole"
GENERIC_TAGS_PARAM = [
    {"Key": "newkey1", "Value": "newval1"},
    {"Key": "newkey2", "Value": "newval2"},
]
TEST_MODEL_NAME = "MyModel"
TEST_ENDPOINT_NAME = "MyEndpoint"
TEST_ENDPOINT_CONFIG_NAME = "MyEndpointConfig"
TEST_VARIANT_NAME = "MyProductionVariant"
TEST_INSTANCE_TYPE = "ml.t2.medium"
TEST_MEMORY_SIZE = 1024
TEST_CONCURRENCY = 10
# NOTE: the two variant lists below are shared by several tests and must be
# treated as read-only; tests that need a modified variant build a copy.
TEST_PRODUCTION_VARIANTS = [
    {
        "VariantName": TEST_VARIANT_NAME,
        "ModelName": TEST_MODEL_NAME,
        "InitialInstanceCount": 1,
        "InstanceType": TEST_INSTANCE_TYPE,
    },
]
TEST_SERVERLESS_PRODUCTION_VARIANTS = [
    {
        "VariantName": TEST_VARIANT_NAME,
        "ModelName": TEST_MODEL_NAME,
        "ServerlessConfig": {
            "MemorySizeInMB": TEST_MEMORY_SIZE,
            "MaxConcurrency": TEST_CONCURRENCY,
        },
    },
]


@pytest.fixture(name="sagemaker_client")
def fixture_sagemaker_client():
    """Yield a SageMaker client that is only valid inside the moto mock."""
    with mock_sagemaker():
        yield boto3.client("sagemaker", region_name=TEST_REGION_NAME)


def create_endpoint_config_helper(sagemaker_client, production_variants):
    """Create the test model and endpoint config, then verify the description.

    Asserts that both the create and describe responses carry the expected
    ARN and that describe echoes back ``production_variants`` unchanged.
    """
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    resp = sagemaker_client.create_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        ProductionVariants=production_variants,
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$",
        resp["EndpointConfigArn"],
    )

    resp = sagemaker_client.describe_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$",
        resp["EndpointConfigArn"],
    )
    assert resp["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert resp["ProductionVariants"] == production_variants


def test_create_endpoint_config(sagemaker_client):
    """Creating a config fails without a model, then succeeds once it exists."""
    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=TEST_PRODUCTION_VARIANTS,
        )
    assert e.value.response["Error"]["Message"].startswith("Could not find model")

    # Testing instance-based endpoint configuration
    create_endpoint_config_helper(sagemaker_client, TEST_PRODUCTION_VARIANTS)


def test_create_endpoint_config_serverless(sagemaker_client):
    """Same as the instance-based test, using a serverless variant."""
    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=TEST_SERVERLESS_PRODUCTION_VARIANTS,
        )
    assert e.value.response["Error"]["Message"].startswith("Could not find model")

    # Testing serverless endpoint configuration
    create_endpoint_config_helper(sagemaker_client, TEST_SERVERLESS_PRODUCTION_VARIANTS)


def test_delete_endpoint_config(sagemaker_client):
    """A deleted config can be neither described nor deleted again."""
    _create_model(sagemaker_client, TEST_MODEL_NAME)
    resp = sagemaker_client.create_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        ProductionVariants=TEST_PRODUCTION_VARIANTS,
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$",
        resp["EndpointConfigArn"],
    )

    resp = sagemaker_client.describe_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$",
        resp["EndpointConfigArn"],
    )

    sagemaker_client.delete_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )

    with pytest.raises(ClientError) as e:
        sagemaker_client.describe_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
        )
    assert e.value.response["Error"]["Message"].startswith(
        "Could not find endpoint configuration"
    )

    with pytest.raises(ClientError) as e:
        sagemaker_client.delete_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
        )
    assert e.value.response["Error"]["Message"].startswith(
        "Could not find endpoint configuration"
    )


def test_create_endpoint_invalid_instance_type(sagemaker_client):
    """An unknown instance type is rejected with a ValidationException."""
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    instance_type = "InvalidInstanceType"
    # Build a fresh variant rather than editing TEST_PRODUCTION_VARIANTS in
    # place: the constant is shared, and mutating it would leak the invalid
    # value into whichever tests run afterwards.
    production_variants = [
        {**TEST_PRODUCTION_VARIANTS[0], "InstanceType": instance_type}
    ]

    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=production_variants,
        )
    assert e.value.response["Error"]["Code"] == "ValidationException"
    expected_message = (
        f"Value '{instance_type}' at 'instanceType' failed to satisfy "
        "constraint: Member must satisfy enum value set: ["
    )
    assert expected_message in e.value.response["Error"]["Message"]


def test_create_endpoint_invalid_memory_size(sagemaker_client):
    """An unsupported serverless memory size is rejected with a ValidationException."""
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    memory_size = 1111
    # Copy both the variant and its nested ServerlessConfig so the shared
    # TEST_SERVERLESS_PRODUCTION_VARIANTS constant is left untouched.
    base_variant = TEST_SERVERLESS_PRODUCTION_VARIANTS[0]
    production_variants = [
        {
            **base_variant,
            "ServerlessConfig": {
                **base_variant["ServerlessConfig"],
                "MemorySizeInMB": memory_size,
            },
        }
    ]

    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=production_variants,
        )
    assert e.value.response["Error"]["Code"] == "ValidationException"
    expected_message = (
        f"Value '{memory_size}' at 'MemorySizeInMB' failed to satisfy "
        "constraint: Member must satisfy enum value set: ["
    )
    assert expected_message in e.value.response["Error"]["Message"]


def test_create_endpoint(sagemaker_client):
    """Creating an endpoint needs an existing config; tags are stored on create."""
    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint(
            EndpointName=TEST_ENDPOINT_NAME,
            EndpointConfigName="NonexistentEndpointConfig",
        )
    assert e.value.response["Error"]["Message"].startswith(
        "Could not find endpoint configuration"
    )

    _create_model(sagemaker_client, TEST_MODEL_NAME)
    _create_endpoint_config(
        sagemaker_client, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    resp = sagemaker_client.create_endpoint(
        EndpointName=TEST_ENDPOINT_NAME,
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        Tags=GENERIC_TAGS_PARAM,
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$", resp["EndpointArn"]
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$", resp["EndpointArn"]
    )
    assert resp["EndpointName"] == TEST_ENDPOINT_NAME
    assert resp["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert resp["EndpointStatus"] == "InService"
    assert isinstance(resp["CreationTime"], datetime.datetime)
    assert isinstance(resp["LastModifiedTime"], datetime.datetime)
    assert resp["ProductionVariants"][0]["VariantName"] == TEST_VARIANT_NAME

    resp = sagemaker_client.list_tags(ResourceArn=resp["EndpointArn"])
    assert resp["Tags"] == GENERIC_TAGS_PARAM


def test_delete_endpoint(sagemaker_client):
    """A deleted endpoint can be neither described nor deleted again."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    sagemaker_client.delete_endpoint(EndpointName=TEST_ENDPOINT_NAME)

    with pytest.raises(ClientError) as e:
        sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert e.value.response["Error"]["Message"].startswith("Could not find endpoint")

    with pytest.raises(ClientError) as e:
        sagemaker_client.delete_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert e.value.response["Error"]["Message"].startswith("Could not find endpoint")


def test_add_tags_endpoint(sagemaker_client):
    """Tags added to an endpoint are returned by list_tags."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    resource_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )
    response = sagemaker_client.add_tags(
        ResourceArn=resource_arn, Tags=GENERIC_TAGS_PARAM
    )
    assert response["ResponseMetadata"]["HTTPStatusCode"] == 200

    response = sagemaker_client.list_tags(ResourceArn=resource_arn)
    assert response["Tags"] == GENERIC_TAGS_PARAM


def test_delete_tags_endpoint(sagemaker_client):
    """Deleting every tag key leaves the endpoint with an empty tag list."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    resource_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )
    response = sagemaker_client.add_tags(
        ResourceArn=resource_arn, Tags=GENERIC_TAGS_PARAM
    )
    assert response["ResponseMetadata"]["HTTPStatusCode"] == 200

    tag_keys = [tag["Key"] for tag in GENERIC_TAGS_PARAM]
    response = sagemaker_client.delete_tags(ResourceArn=resource_arn, TagKeys=tag_keys)
    assert response["ResponseMetadata"]["HTTPStatusCode"] == 200

    response = sagemaker_client.list_tags(ResourceArn=resource_arn)
    assert response["Tags"] == []


def test_list_tags_endpoint(sagemaker_client):
    """list_tags returns 80 tags as a page of 50 followed by a page of 30."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    tags = [{"Key": str(uuid.uuid4()), "Value": "myValue"} for _ in range(80)]

    resource_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )
    response = sagemaker_client.add_tags(ResourceArn=resource_arn, Tags=tags)
    assert response["ResponseMetadata"]["HTTPStatusCode"] == 200

    response = sagemaker_client.list_tags(ResourceArn=resource_arn)
    assert len(response["Tags"]) == 50
    assert response["Tags"] == tags[:50]

    response = sagemaker_client.list_tags(
        ResourceArn=resource_arn, NextToken=response["NextToken"]
    )
    assert len(response["Tags"]) == 30
    assert response["Tags"] == tags[50:]


def test_update_endpoint_weights_and_capacities_one_variant(sagemaker_client):
    """Updating one variant is reflected in both desired and current values."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    new_desired_weight = 1.5
    new_desired_instance_count = 123

    response = sagemaker_client.update_endpoint_weights_and_capacities(
        EndpointName=TEST_ENDPOINT_NAME,
        DesiredWeightsAndCapacities=[
            {
                "VariantName": TEST_VARIANT_NAME,
                "DesiredWeight": new_desired_weight,
                "DesiredInstanceCount": new_desired_instance_count,
            },
        ],
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$",
        response["EndpointArn"],
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$", resp["EndpointArn"]
    )
    assert resp["EndpointName"] == TEST_ENDPOINT_NAME
    assert resp["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert resp["EndpointStatus"] == "InService"
    assert isinstance(resp["CreationTime"], datetime.datetime)
    assert isinstance(resp["LastModifiedTime"], datetime.datetime)
    assert resp["ProductionVariants"][0]["VariantName"] == TEST_VARIANT_NAME
    assert (
        resp["ProductionVariants"][0]["DesiredInstanceCount"]
        == new_desired_instance_count
    )
    assert (
        resp["ProductionVariants"][0]["CurrentInstanceCount"]
        == new_desired_instance_count
    )
    assert resp["ProductionVariants"][0]["DesiredWeight"] == new_desired_weight
    assert resp["ProductionVariants"][0]["CurrentWeight"] == new_desired_weight


def test_update_endpoint_weights_and_capacities_two_variants(sagemaker_client):
    """Updating two variants in one request is reflected on both of them."""
    production_variants = [
        {
            "VariantName": "MyProductionVariant1",
            "ModelName": TEST_MODEL_NAME,
            "InitialInstanceCount": 1,
            "InstanceType": TEST_INSTANCE_TYPE,
        },
        {
            "VariantName": "MyProductionVariant2",
            "ModelName": TEST_MODEL_NAME,
            "InitialInstanceCount": 1,
            "InstanceType": TEST_INSTANCE_TYPE,
        },
    ]

    _set_up_sagemaker_resources(
        sagemaker_client,
        TEST_ENDPOINT_NAME,
        TEST_ENDPOINT_CONFIG_NAME,
        TEST_MODEL_NAME,
        production_variants,
    )

    # Define the expected values once so the request and the assertions
    # below cannot drift apart.
    new_desired_weight = 1.5
    new_desired_instance_count = 123

    desired_weights_and_capacities = [
        {
            "VariantName": "MyProductionVariant1",
            "DesiredWeight": new_desired_weight,
            "DesiredInstanceCount": new_desired_instance_count,
        },
        {
            "VariantName": "MyProductionVariant2",
            "DesiredWeight": new_desired_weight,
            "DesiredInstanceCount": new_desired_instance_count,
        },
    ]

    response = sagemaker_client.update_endpoint_weights_and_capacities(
        EndpointName=TEST_ENDPOINT_NAME,
        DesiredWeightsAndCapacities=desired_weights_and_capacities,
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$",
        response["EndpointArn"],
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$", resp["EndpointArn"]
    )
    assert resp["EndpointName"] == TEST_ENDPOINT_NAME
    assert resp["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert resp["EndpointStatus"] == "InService"
    assert isinstance(resp["CreationTime"], datetime.datetime)
    assert isinstance(resp["LastModifiedTime"], datetime.datetime)

    assert resp["ProductionVariants"][0]["VariantName"] == "MyProductionVariant1"
    assert (
        resp["ProductionVariants"][0]["DesiredInstanceCount"]
        == new_desired_instance_count
    )
    assert (
        resp["ProductionVariants"][0]["CurrentInstanceCount"]
        == new_desired_instance_count
    )
    assert resp["ProductionVariants"][0]["DesiredWeight"] == new_desired_weight
    assert resp["ProductionVariants"][0]["CurrentWeight"] == new_desired_weight

    assert resp["ProductionVariants"][1]["VariantName"] == "MyProductionVariant2"
    assert (
        resp["ProductionVariants"][1]["DesiredInstanceCount"]
        == new_desired_instance_count
    )
    assert (
        resp["ProductionVariants"][1]["CurrentInstanceCount"]
        == new_desired_instance_count
    )
    assert resp["ProductionVariants"][1]["DesiredWeight"] == new_desired_weight
    assert resp["ProductionVariants"][1]["CurrentWeight"] == new_desired_weight


def test_update_endpoint_weights_and_capacities_should_throw_clienterror_no_variant(
    sagemaker_client,
):
    """An unknown variant name raises and leaves the endpoint unchanged."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    # ResponseMetadata is dropped from both snapshots before they are
    # compared; only the endpoint description itself is checked.
    old_resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del old_resp["ResponseMetadata"]

    variant_name = "SillyNotCorrectName"
    new_desired_weight = 1.5
    new_desired_instance_count = 123

    with pytest.raises(ClientError) as exc:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=TEST_ENDPOINT_NAME,
            DesiredWeightsAndCapacities=[
                {
                    "VariantName": variant_name,
                    "DesiredWeight": new_desired_weight,
                    "DesiredInstanceCount": new_desired_instance_count,
                },
            ],
        )

    err = exc.value.response["Error"]
    assert err["Message"] == (
        f'The variant name(s) "{variant_name}" is/are not present within '
        f'endpoint configuration "{TEST_ENDPOINT_CONFIG_NAME}".'
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del resp["ResponseMetadata"]
    assert resp == old_resp


def test_update_endpoint_weights_and_capacities_should_throw_clienterror_no_endpoint(
    sagemaker_client,
):
    """An unknown endpoint name raises and leaves the real endpoint unchanged."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    old_resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del old_resp["ResponseMetadata"]

    endpoint_name = "SillyEndpointName"
    variant_name = "SillyNotCorrectName"
    new_desired_weight = 1.5
    new_desired_instance_count = 123

    with pytest.raises(ClientError) as exc:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=endpoint_name,
            DesiredWeightsAndCapacities=[
                {
                    "VariantName": variant_name,
                    "DesiredWeight": new_desired_weight,
                    "DesiredInstanceCount": new_desired_instance_count,
                },
            ],
        )

    err = exc.value.response["Error"]
    assert err["Message"] == (
        f'Could not find endpoint "arn:aws:sagemaker:us-east-1:'
        f'{ACCOUNT_ID}:endpoint/{endpoint_name}".'
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del resp["ResponseMetadata"]
    assert resp == old_resp


def test_update_endpoint_weights_and_capacities_should_throw_clienterror_nonunique_variant(
    sagemaker_client,
):
    """Repeating a variant name in one request raises and changes nothing."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    old_resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del old_resp["ResponseMetadata"]

    desired_weights_and_capacities = [
        {
            "VariantName": TEST_VARIANT_NAME,
            "DesiredWeight": 1.5,
            "DesiredInstanceCount": 123,
        },
        {
            "VariantName": TEST_VARIANT_NAME,
            "DesiredWeight": 1.5,
            "DesiredInstanceCount": 123,
        },
    ]

    with pytest.raises(ClientError) as exc:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=TEST_ENDPOINT_NAME,
            DesiredWeightsAndCapacities=desired_weights_and_capacities,
        )

    err = exc.value.response["Error"]
    assert err["Message"] == (
        f'The variant name "{TEST_VARIANT_NAME}" was non-unique within the request.'
    )

    resp = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    del resp["ResponseMetadata"]
    assert resp == old_resp


def _set_up_sagemaker_resources(
    boto_client,
    endpoint_name,
    endpoint_config_name,
    model_name,
    production_variants=None,
):
    """Create a model, an endpoint config and an endpoint, in that order."""
    _create_model(boto_client, model_name)
    _create_endpoint_config(
        boto_client, endpoint_config_name, model_name, production_variants
    )
    _create_endpoint(boto_client, endpoint_name, endpoint_config_name)


def _create_model(boto_client, model_name):
    """Create a model named ``model_name`` and assert the call returned HTTP 200."""
    resp = boto_client.create_model(
        ModelName=model_name,
        PrimaryContainer={
            "Image": "382416733822.dkr.ecr.us-east-1.amazonaws.com/factorization-machines:1",
            "ModelDataUrl": "s3://MyBucket/model.tar.gz",
        },
        ExecutionRoleArn=TEST_ROLE_ARN,
    )
    assert resp["ResponseMetadata"]["HTTPStatusCode"] == 200


def _create_endpoint_config(
    boto_client, endpoint_config_name, model_name, production_variants=None
):
    """Create an endpoint config and assert the returned ARN.

    When ``production_variants`` is falsy, a single instance-based variant
    pointing at ``model_name`` is used.
    """
    if not production_variants:
        production_variants = [
            {
                "VariantName": TEST_VARIANT_NAME,
                "ModelName": model_name,
                "InitialInstanceCount": 1,
                "InstanceType": TEST_INSTANCE_TYPE,
            },
        ]
    resp = boto_client.create_endpoint_config(
        EndpointConfigName=endpoint_config_name, ProductionVariants=production_variants
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{endpoint_config_name}$",
        resp["EndpointConfigArn"],
    )


def _create_endpoint(boto_client, endpoint_name, endpoint_config_name):
    """Create an endpoint from an existing config and assert the returned ARN."""
    resp = boto_client.create_endpoint(
        EndpointName=endpoint_name, EndpointConfigName=endpoint_config_name
    )
    assert re.match(
        rf"^arn:aws:sagemaker:.*:.*:endpoint/{endpoint_name}$", resp["EndpointArn"]
    )