In [None]:
import sagemaker
from sagemaker.huggingface.model import HuggingFaceModel
import boto3

# Look up the ARN of the IAM role that is handed to SageMaker for this model.
iam_client = boto3.client('iam')
role = iam_client.get_role(RoleName='sagemaker_access_iam_role')['Role']['Arn']

# Build one explicit session and pass it to the model below, so the session
# created here is actually used instead of being silently discarded.
sess = sagemaker.Session()

# Describe the model: the packaged artifact in S3 plus the framework versions
# that select the serving container.
# NOTE(review): confirm that this transformers / pytorch / python combination
# is published as a Hugging Face inference container before relying on it.
huggingface_model = HuggingFaceModel(
    model_data="s3://sagemaker-whisper-model/whisper.tar.gz",  # model archive in S3
    role=role,                       # IAM role resolved above
    transformers_version="4.47.0",   # Transformers version of the container
    pytorch_version="2.5.1",         # PyTorch version of the container
    py_version='py311',              # Python version of the container
    sagemaker_session=sess,          # reuse the session created above
)

# Deploy the model behind a single-instance real-time endpoint.
# NOTE(review): ml.t2.medium is a small instance type; presumably tight for a
# model of this kind - verify that the container starts and loads the model.
# NOTE: the endpoint stays up after this script finishes; remove it with
# predictor.delete_endpoint() once it is no longer needed.
predictor = huggingface_model.deploy(
    initial_instance_count=1,
    instance_type="ml.t2.medium",
)

# Example request: the payload must always carry an "inputs" key.
# NOTE(review): the artifact name suggests a Whisper (speech) model, while this
# payload is plain text - confirm the endpoint's inference code expects text.
data = {
    "inputs": "نعتمد في فطورنا",
}

# Send the request; in a notebook the returned value is shown as cell output.
predictor.predict(data)