moto/tests/test_sagemaker/test_sagemaker_endpoint.py

597 lines
20 KiB
Python
Raw Normal View History

import datetime
import re
import uuid
import boto3
import pytest
from botocore.exceptions import ClientError
2024-01-07 12:03:33 +00:00
from moto import mock_aws
2022-08-13 09:49:43 +00:00
from moto.core import DEFAULT_ACCOUNT_ID as ACCOUNT_ID
# Region used for the mocked SageMaker client and for hand-built ARNs.
TEST_REGION_NAME = "us-east-1"
# Role ARN passed as ExecutionRoleArn when the test model is created.
TEST_ROLE_ARN = f"arn:aws:iam::{ACCOUNT_ID}:role/FakeRole"
# Tag list passed as the Tags argument in the tagging tests.
GENERIC_TAGS_PARAM = [
{"Key": "newkey1", "Value": "newval1"},
{"Key": "newkey2", "Value": "newval2"},
]
# Resource names shared by the tests in this module.
TEST_MODEL_NAME = "MyModel"
TEST_ENDPOINT_NAME = "MyEndpoint"
TEST_ENDPOINT_CONFIG_NAME = "MyEndpointConfig"
TEST_VARIANT_NAME = "MyProductionVariant"
TEST_INSTANCE_TYPE = "ml.t2.medium"
# Values used for the ServerlessConfig of the serverless variant below.
TEST_MEMORY_SIZE = 1024
TEST_CONCURRENCY = 10
# Instance-based variant list passed as ProductionVariants to
# create_endpoint_config.
# NOTE(review): this list is shared module state; tests should copy it
# rather than modify it in place.
TEST_PRODUCTION_VARIANTS = [
{
"VariantName": TEST_VARIANT_NAME,
"ModelName": TEST_MODEL_NAME,
"InitialInstanceCount": 1,
"InstanceType": TEST_INSTANCE_TYPE,
},
]
# Serverless variant list passed as ProductionVariants to
# create_endpoint_config; it carries a ServerlessConfig instead of an
# instance type and count.
TEST_SERVERLESS_PRODUCTION_VARIANTS = [
{
"VariantName": TEST_VARIANT_NAME,
"ModelName": TEST_MODEL_NAME,
"ServerlessConfig": {
"MemorySizeInMB": TEST_MEMORY_SIZE,
"MaxConcurrency": TEST_CONCURRENCY,
},
},
]
@pytest.fixture(name="sagemaker_client")
def fixture_sagemaker_client():
    """Yield a SageMaker boto3 client created inside a ``mock_aws`` context.

    The client targets ``TEST_REGION_NAME``; the mock context stays open for
    as long as the consuming test runs and is exited afterwards.
    """
    with mock_aws():
        client = boto3.client("sagemaker", region_name=TEST_REGION_NAME)
        yield client
def create_endpoint_config_helper(sagemaker_client, production_variants):
    """Create the test model and endpoint config, then verify the config.

    Args:
        sagemaker_client: SageMaker client used for every call.
        production_variants: Variant list sent as ``ProductionVariants``; the
            described config is expected to return it unchanged.
    """
    arn_pattern = (
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$"
    )

    # The endpoint config refers to the model by name, so create it first.
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    created = sagemaker_client.create_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        ProductionVariants=production_variants,
    )
    assert re.match(arn_pattern, created["EndpointConfigArn"])

    described = sagemaker_client.describe_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )
    assert re.match(arn_pattern, described["EndpointConfigArn"])
    assert described["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert described["ProductionVariants"] == production_variants
def test_create_endpoint_config(sagemaker_client):
    """Instance-based config: rejected before the model exists, accepted after."""
    # Nothing has been created in this test yet, so the model lookup must fail.
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=TEST_PRODUCTION_VARIANTS,
        )
    error_message = exc_info.value.response["Error"]["Message"]
    assert error_message.startswith("Could not find model")

    # Testing instance-based endpoint configuration
    create_endpoint_config_helper(sagemaker_client, TEST_PRODUCTION_VARIANTS)
def test_create_endpoint_config_serverless(sagemaker_client):
    """Serverless config: rejected before the model exists, accepted after."""
    # Nothing has been created in this test yet, so the model lookup must fail.
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=TEST_SERVERLESS_PRODUCTION_VARIANTS,
        )
    error_message = exc_info.value.response["Error"]["Message"]
    assert error_message.startswith("Could not find model")

    # Testing serverless endpoint configuration
    create_endpoint_config_helper(
        sagemaker_client, TEST_SERVERLESS_PRODUCTION_VARIANTS
    )
def test_delete_endpoint_config(sagemaker_client):
    """Deleting an endpoint config removes it; further lookups and deletes fail."""
    arn_pattern = (
        rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{TEST_ENDPOINT_CONFIG_NAME}$"
    )
    not_found_prefix = "Could not find endpoint configuration"

    _create_model(sagemaker_client, TEST_MODEL_NAME)
    created = sagemaker_client.create_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        ProductionVariants=TEST_PRODUCTION_VARIANTS,
    )
    assert re.match(arn_pattern, created["EndpointConfigArn"])

    described = sagemaker_client.describe_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )
    assert re.match(arn_pattern, described["EndpointConfigArn"])

    sagemaker_client.delete_endpoint_config(
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME
    )

    # After deletion, describing and then deleting again must both report
    # the config as missing.
    for call_on_missing in (
        sagemaker_client.describe_endpoint_config,
        sagemaker_client.delete_endpoint_config,
    ):
        with pytest.raises(ClientError) as exc_info:
            call_on_missing(EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME)
        error_message = exc_info.value.response["Error"]["Message"]
        assert error_message.startswith(not_found_prefix)
def test_create_endpoint_invalid_instance_type(sagemaker_client):
    """An unknown ``InstanceType`` is rejected with a ``ValidationException``."""
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    instance_type = "InvalidInstanceType"
    # Copy each variant before editing it. Assigning through an alias of
    # TEST_PRODUCTION_VARIANTS would leave the invalid instance type in the
    # shared module-level constant for every test that runs afterwards.
    production_variants = [dict(variant) for variant in TEST_PRODUCTION_VARIANTS]
    production_variants[0]["InstanceType"] = instance_type

    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=production_variants,
        )

    assert e.value.response["Error"]["Code"] == "ValidationException"
    expected_message = (
        f"Value '{instance_type}' at 'instanceType' failed to satisfy "
        "constraint: Member must satisfy enum value set: ["
    )
    assert expected_message in e.value.response["Error"]["Message"]
def test_create_endpoint_invalid_memory_size(sagemaker_client):
    """An unsupported serverless ``MemorySizeInMB`` is rejected with a ``ValidationException``."""
    _create_model(sagemaker_client, TEST_MODEL_NAME)

    memory_size = 1111
    # Copy each variant together with its nested ServerlessConfig before
    # editing. Writing through an alias of TEST_SERVERLESS_PRODUCTION_VARIANTS
    # would leave the invalid memory size in the shared module-level constant
    # for every test that runs afterwards.
    production_variants = [
        {**variant, "ServerlessConfig": dict(variant["ServerlessConfig"])}
        for variant in TEST_SERVERLESS_PRODUCTION_VARIANTS
    ]
    production_variants[0]["ServerlessConfig"]["MemorySizeInMB"] = memory_size

    with pytest.raises(ClientError) as e:
        sagemaker_client.create_endpoint_config(
            EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
            ProductionVariants=production_variants,
        )

    assert e.value.response["Error"]["Code"] == "ValidationException"
    expected_message = (
        f"Value '{memory_size}' at 'MemorySizeInMB' failed to satisfy "
        "constraint: Member must satisfy enum value set: ["
    )
    assert expected_message in e.value.response["Error"]["Message"]
def test_create_endpoint(sagemaker_client):
    """Creating an endpoint needs an existing config and yields a described, tagged endpoint."""
    endpoint_arn_pattern = rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$"

    # An endpoint cannot be created from a config that does not exist.
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.create_endpoint(
            EndpointName=TEST_ENDPOINT_NAME,
            EndpointConfigName="NonexistentEndpointConfig",
        )
    error_message = exc_info.value.response["Error"]["Message"]
    assert error_message.startswith("Could not find endpoint configuration")

    _create_model(sagemaker_client, TEST_MODEL_NAME)
    _create_endpoint_config(
        sagemaker_client, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )

    created = sagemaker_client.create_endpoint(
        EndpointName=TEST_ENDPOINT_NAME,
        EndpointConfigName=TEST_ENDPOINT_CONFIG_NAME,
        Tags=GENERIC_TAGS_PARAM,
    )
    assert re.match(endpoint_arn_pattern, created["EndpointArn"])

    described = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(endpoint_arn_pattern, described["EndpointArn"])
    assert described["EndpointName"] == TEST_ENDPOINT_NAME
    assert described["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert described["EndpointStatus"] == "InService"
    assert isinstance(described["CreationTime"], datetime.datetime)
    assert isinstance(described["LastModifiedTime"], datetime.datetime)
    assert described["ProductionVariants"][0]["VariantName"] == TEST_VARIANT_NAME

    # Tags supplied at creation time must be listed for the endpoint ARN.
    listed = sagemaker_client.list_tags(ResourceArn=described["EndpointArn"])
    assert listed["Tags"] == GENERIC_TAGS_PARAM
def test_delete_endpoint(sagemaker_client):
    """A deleted endpoint can no longer be described or deleted again."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    sagemaker_client.delete_endpoint(EndpointName=TEST_ENDPOINT_NAME)

    # Describe first, then delete: both must report the endpoint as missing.
    for call_on_missing in (
        sagemaker_client.describe_endpoint,
        sagemaker_client.delete_endpoint,
    ):
        with pytest.raises(ClientError) as exc_info:
            call_on_missing(EndpointName=TEST_ENDPOINT_NAME)
        error_message = exc_info.value.response["Error"]["Message"]
        assert error_message.startswith("Could not find endpoint")
def test_add_tags_endpoint(sagemaker_client):
    """Tags added to an endpoint ARN are returned by ``list_tags``."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    endpoint_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )

    add_result = sagemaker_client.add_tags(
        ResourceArn=endpoint_arn, Tags=GENERIC_TAGS_PARAM
    )
    assert add_result["ResponseMetadata"]["HTTPStatusCode"] == 200

    listed = sagemaker_client.list_tags(ResourceArn=endpoint_arn)
    assert listed["Tags"] == GENERIC_TAGS_PARAM
def test_delete_tags_endpoint(sagemaker_client):
    """Deleting every tag key from an endpoint leaves an empty tag list."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    endpoint_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )

    add_result = sagemaker_client.add_tags(
        ResourceArn=endpoint_arn, Tags=GENERIC_TAGS_PARAM
    )
    assert add_result["ResponseMetadata"]["HTTPStatusCode"] == 200

    keys_to_remove = [entry["Key"] for entry in GENERIC_TAGS_PARAM]
    delete_result = sagemaker_client.delete_tags(
        ResourceArn=endpoint_arn, TagKeys=keys_to_remove
    )
    assert delete_result["ResponseMetadata"]["HTTPStatusCode"] == 200

    listed = sagemaker_client.list_tags(ResourceArn=endpoint_arn)
    assert listed["Tags"] == []
def test_list_tags_endpoint(sagemaker_client):
    """``list_tags`` pages 80 tags as 50 followed by 30 via ``NextToken``."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    # 80 tags with unique keys: more than the 50 expected on the first page.
    tags = [{"Key": str(uuid.uuid4()), "Value": "myValue"} for _ in range(80)]
    endpoint_arn = (
        f"arn:aws:sagemaker:{TEST_REGION_NAME}:{ACCOUNT_ID}"
        f":endpoint/{TEST_ENDPOINT_NAME}"
    )

    add_result = sagemaker_client.add_tags(ResourceArn=endpoint_arn, Tags=tags)
    assert add_result["ResponseMetadata"]["HTTPStatusCode"] == 200

    first_page = sagemaker_client.list_tags(ResourceArn=endpoint_arn)
    assert len(first_page["Tags"]) == 50
    assert first_page["Tags"] == tags[:50]

    second_page = sagemaker_client.list_tags(
        ResourceArn=endpoint_arn, NextToken=first_page["NextToken"]
    )
    assert len(second_page["Tags"]) == 30
    assert second_page["Tags"] == tags[50:]
def test_update_endpoint_weights_and_capacities_one_variant(sagemaker_client):
    """Updating the single variant's weight and count shows up in ``describe_endpoint``."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    endpoint_arn_pattern = rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$"
    new_desired_weight = 1.5
    new_desired_instance_count = 123

    requested_change = {
        "VariantName": TEST_VARIANT_NAME,
        "DesiredWeight": new_desired_weight,
        "DesiredInstanceCount": new_desired_instance_count,
    }
    update_result = sagemaker_client.update_endpoint_weights_and_capacities(
        EndpointName=TEST_ENDPOINT_NAME,
        DesiredWeightsAndCapacities=[requested_change],
    )
    assert re.match(endpoint_arn_pattern, update_result["EndpointArn"])

    described = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(endpoint_arn_pattern, described["EndpointArn"])
    assert described["EndpointName"] == TEST_ENDPOINT_NAME
    assert described["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert described["EndpointStatus"] == "InService"
    assert isinstance(described["CreationTime"], datetime.datetime)
    assert isinstance(described["LastModifiedTime"], datetime.datetime)

    # Both the desired and the current values are expected to match the request.
    variant = described["ProductionVariants"][0]
    assert variant["VariantName"] == TEST_VARIANT_NAME
    assert variant["DesiredInstanceCount"] == new_desired_instance_count
    assert variant["CurrentInstanceCount"] == new_desired_instance_count
    assert variant["DesiredWeight"] == new_desired_weight
    assert variant["CurrentWeight"] == new_desired_weight
def test_update_endpoint_weights_and_capacities_two_variants(sagemaker_client):
    """Updating two variants in one request changes both in ``describe_endpoint``."""
    variant_names = ("MyProductionVariant1", "MyProductionVariant2")
    new_desired_weight = 1.5
    new_desired_instance_count = 123
    endpoint_arn_pattern = rf"^arn:aws:sagemaker:.*:.*:endpoint/{TEST_ENDPOINT_NAME}$"

    production_variants = [
        {
            "VariantName": name,
            "ModelName": TEST_MODEL_NAME,
            "InitialInstanceCount": 1,
            "InstanceType": TEST_INSTANCE_TYPE,
        }
        for name in variant_names
    ]
    _set_up_sagemaker_resources(
        sagemaker_client,
        TEST_ENDPOINT_NAME,
        TEST_ENDPOINT_CONFIG_NAME,
        TEST_MODEL_NAME,
        production_variants,
    )

    desired_weights_and_capacities = [
        {
            "VariantName": name,
            "DesiredWeight": new_desired_weight,
            "DesiredInstanceCount": new_desired_instance_count,
        }
        for name in variant_names
    ]
    update_result = sagemaker_client.update_endpoint_weights_and_capacities(
        EndpointName=TEST_ENDPOINT_NAME,
        DesiredWeightsAndCapacities=desired_weights_and_capacities,
    )
    assert re.match(endpoint_arn_pattern, update_result["EndpointArn"])

    described = sagemaker_client.describe_endpoint(EndpointName=TEST_ENDPOINT_NAME)
    assert re.match(endpoint_arn_pattern, described["EndpointArn"])
    assert described["EndpointName"] == TEST_ENDPOINT_NAME
    assert described["EndpointConfigName"] == TEST_ENDPOINT_CONFIG_NAME
    assert described["EndpointStatus"] == "InService"
    assert isinstance(described["CreationTime"], datetime.datetime)
    assert isinstance(described["LastModifiedTime"], datetime.datetime)

    # Index explicitly so a missing variant fails the test instead of being
    # silently skipped.
    for position, expected_name in enumerate(variant_names):
        variant = described["ProductionVariants"][position]
        assert variant["VariantName"] == expected_name
        assert variant["DesiredInstanceCount"] == new_desired_instance_count
        assert variant["CurrentInstanceCount"] == new_desired_instance_count
        assert variant["DesiredWeight"] == new_desired_weight
        assert variant["CurrentWeight"] == new_desired_weight
def test_update_endpoint_weights_and_capacities_should_throw_clienterror_no_variant(
    sagemaker_client,
):
    """An unknown variant name is rejected and the endpoint is left unchanged."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    # Snapshot the endpoint, minus per-call metadata, for the comparison below.
    snapshot_before = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_before.pop("ResponseMetadata")

    variant_name = "SillyNotCorrectName"
    requested_change = {
        "VariantName": variant_name,
        "DesiredWeight": 1.5,
        "DesiredInstanceCount": 123,
    }
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=TEST_ENDPOINT_NAME,
            DesiredWeightsAndCapacities=[requested_change],
        )

    expected_message = (
        f'The variant name(s) "{variant_name}" is/are not present within '
        f'endpoint configuration "{TEST_ENDPOINT_CONFIG_NAME}".'
    )
    assert exc_info.value.response["Error"]["Message"] == expected_message

    snapshot_after = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_after.pop("ResponseMetadata")
    assert snapshot_after == snapshot_before
def test_update_endpoint_weights_and_capacities_should_throw_clienterror_no_endpoint(
    sagemaker_client,
):
    """An unknown endpoint name is rejected and the real endpoint is left unchanged."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    # Snapshot the endpoint, minus per-call metadata, for the comparison below.
    snapshot_before = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_before.pop("ResponseMetadata")

    endpoint_name = "SillyEndpointName"
    requested_change = {
        "VariantName": "SillyNotCorrectName",
        "DesiredWeight": 1.5,
        "DesiredInstanceCount": 123,
    }
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=endpoint_name,
            DesiredWeightsAndCapacities=[requested_change],
        )

    expected_message = (
        f'Could not find endpoint "arn:aws:sagemaker:us-east-1:'
        f'{ACCOUNT_ID}:endpoint/{endpoint_name}".'
    )
    assert exc_info.value.response["Error"]["Message"] == expected_message

    snapshot_after = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_after.pop("ResponseMetadata")
    assert snapshot_after == snapshot_before
def test_update_endpoint_weights_and_capacities_should_throw_clienterror_nonunique_variant(
    sagemaker_client,
):
    """Naming the same variant twice is rejected and the endpoint is left unchanged."""
    _set_up_sagemaker_resources(
        sagemaker_client, TEST_ENDPOINT_NAME, TEST_ENDPOINT_CONFIG_NAME, TEST_MODEL_NAME
    )
    # Snapshot the endpoint, minus per-call metadata, for the comparison below.
    snapshot_before = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_before.pop("ResponseMetadata")

    # Two separate entries that both name the same variant.
    desired_weights_and_capacities = [
        {
            "VariantName": TEST_VARIANT_NAME,
            "DesiredWeight": 1.5,
            "DesiredInstanceCount": 123,
        }
        for _ in range(2)
    ]
    with pytest.raises(ClientError) as exc_info:
        sagemaker_client.update_endpoint_weights_and_capacities(
            EndpointName=TEST_ENDPOINT_NAME,
            DesiredWeightsAndCapacities=desired_weights_and_capacities,
        )

    expected_message = (
        f'The variant name "{TEST_VARIANT_NAME}" was non-unique within the request.'
    )
    assert exc_info.value.response["Error"]["Message"] == expected_message

    snapshot_after = sagemaker_client.describe_endpoint(
        EndpointName=TEST_ENDPOINT_NAME
    )
    snapshot_after.pop("ResponseMetadata")
    assert snapshot_after == snapshot_before
def _set_up_sagemaker_resources(
    boto_client,
    endpoint_name,
    endpoint_config_name,
    model_name,
    production_variants=None,
):
    """Create a model, an endpoint config and an endpoint, in that order.

    Args:
        boto_client: SageMaker client used for every call.
        endpoint_name: Name of the endpoint to create.
        endpoint_config_name: Name of the endpoint config to create and attach.
        model_name: Name of the model to create.
        production_variants: Optional variant list forwarded to
            ``_create_endpoint_config``.
    """
    _create_model(boto_client, model_name)
    _create_endpoint_config(
        boto_client,
        endpoint_config_name,
        model_name,
        production_variants,
    )
    _create_endpoint(boto_client, endpoint_name, endpoint_config_name)
def _create_model(boto_client, model_name):
    """Create a model named ``model_name`` and assert the call returned HTTP 200."""
    primary_container = {
        "Image": "382416733822.dkr.ecr.us-east-1.amazonaws.com/factorization-machines:1",
        "ModelDataUrl": "s3://MyBucket/model.tar.gz",
    }
    response = boto_client.create_model(
        ModelName=model_name,
        PrimaryContainer=primary_container,
        ExecutionRoleArn=TEST_ROLE_ARN,
    )
    status_code = response["ResponseMetadata"]["HTTPStatusCode"]
    assert status_code == 200
def _create_endpoint_config(
    boto_client, endpoint_config_name, model_name, production_variants=None
):
    """Create an endpoint config and assert the returned ARN matches its name.

    Args:
        boto_client: SageMaker client used for the call.
        endpoint_config_name: Name of the endpoint config to create.
        model_name: Model name used in the default variant.
        production_variants: Variant list to send; when falsy, a single
            instance-based variant for ``model_name`` is used instead.
    """
    default_variants = [
        {
            "VariantName": TEST_VARIANT_NAME,
            "ModelName": model_name,
            "InitialInstanceCount": 1,
            "InstanceType": TEST_INSTANCE_TYPE,
        },
    ]
    variants_to_send = production_variants or default_variants

    response = boto_client.create_endpoint_config(
        EndpointConfigName=endpoint_config_name,
        ProductionVariants=variants_to_send,
    )
    expected_arn = rf"^arn:aws:sagemaker:.*:.*:endpoint-config/{endpoint_config_name}$"
    assert re.match(expected_arn, response["EndpointConfigArn"])
def _create_endpoint(boto_client, endpoint_name, endpoint_config_name):
    """Create an endpoint from an existing config and assert the returned ARN matches its name."""
    response = boto_client.create_endpoint(
        EndpointName=endpoint_name,
        EndpointConfigName=endpoint_config_name,
    )
    expected_arn = rf"^arn:aws:sagemaker:.*:.*:endpoint/{endpoint_name}$"
    assert re.match(expected_arn, response["EndpointArn"])