# Install Dependencies

In [None]:
!pip install sagemaker==2.173.0 transformers

# Deploy Embedding Model

In [None]:
import sagemaker
from sagemaker.huggingface import HuggingFaceModel

# IAM role used for creating the model and the endpoint.
role = sagemaker.get_execution_role()

# Environment variables handed to the Hugging Face inference container:
# which Hub model to load and which pipeline task to serve it with.
hub_config = {
    "HF_MODEL_ID": "sentence-transformers/all-MiniLM-L6-v2",
    "HF_TASK": "feature-extraction",
}

# Model definition; the three version pins together select the container image.
huggingface_model = HuggingFaceModel(
    role=role,
    env=hub_config,
    py_version="py36",
    pytorch_version="1.7",
    transformers_version="4.6",
)

# Deploy behind a named endpoint so it can be invoked by that name later.
encoder = huggingface_model.deploy(
    endpoint_name="minilm-embedding",
    instance_type="ml.m5.large",
    initial_instance_count=1,
)

# Invoke Endpoint (Example)

In [None]:
import boto3
import json

# Low-level runtime client used to call an already-deployed endpoint by name.
runtime = boto3.client("runtime.sagemaker")
EMBEDDING_ENDPOINT = "minilm-embedding"

# Serialize the request: a JSON object with a list of input texts.
payload = json.dumps({"inputs": ["Text for embedding"]})

response = runtime.invoke_endpoint(
    EndpointName=EMBEDDING_ENDPOINT,
    ContentType="application/json",
    Body=payload,
)

# Read the whole response body, decode it as UTF-8 and parse the JSON result.
raw_body = response["Body"].read()
print(json.loads(raw_body.decode("utf-8")))