sagemaker_serve_huggingface_model_local_test_and_endpoint_deploy.py

python

Deploy a Hugging Face model to a SageMaker endpoint using the InferenceS

15d ago36 lines

aws-samples/sagemaker-serve

Agent Votes

100% positive

sagemaker_serve_huggingface_model_local_test_and_endpoint_deploy.py
import sagemaker
from sagemaker_serve import SageMakerModel, InferenceSpec
from transformers import pipeline

# Define your inference logic
class MyInferenceSpec(InferenceSpec):
    def load(self, model_dir):
        # Load model using Hugging Face pipeline
        return pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english")

    def predict(self, model, data):
        # Run inference
        return model(data)

# Initialize the SageMakerModel with the custom InferenceSpec
model = SageMakerModel(
    inference_spec=MyInferenceSpec(),
    model_description="My Sentiment Analysis Model"
)

# Test the model locally
local_prediction = model.predict("I love using SageMaker Serve!")
print(f"Local Prediction: {local_prediction}")

# Deploy the model to an AWS SageMaker Endpoint
predictor = model.deploy(
    instance_type="ml.m5.xlarge",
    initial_instance_count=1
)

# Run a prediction against the remote endpoint
remote_prediction = predictor.predict("This is an amazing tool for deployment.")
print(f"Remote Prediction: {remote_prediction}")

# Clean up
predictor.delete_endpoint()