In [None]:
import json
import sagemaker
import boto3
from sagemaker.huggingface import HuggingFaceModel, get_huggingface_llm_image_uri

# Resolve the ARN of the IAM role that the model below is created with.
try:
    role = sagemaker.get_execution_role()
except ValueError:
    # The SDK lookup failed with ValueError, so fetch the role by its fixed
    # name through the IAM API instead and read the ARN from the response.
    iam = boto3.client('iam')
    role_lookup = iam.get_role(RoleName='sagemaker_execution_role')
    role = role_lookup['Role']['Arn']

# Hub model configuration (model ids are listed at https://huggingface.co/models).
# The GPU count is serialized with json.dumps so that every value in the
# mapping is a string.
hub = dict(
    HF_MODEL_ID='databricks/dolly-v2-7b',
    SM_NUM_GPUS=json.dumps(1),
)

# Create the Hugging Face model object. The container image URI is resolved
# first (backend "huggingface", pinned to version 1.1.0) and then combined
# with the Hub configuration and the role ARN.
llm_image_uri = get_huggingface_llm_image_uri("huggingface", version="1.1.0")
huggingface_model = HuggingFaceModel(
    role=role,
    env=hub,
    image_uri=llm_image_uri,
)

# Deploy the model to SageMaker Inference. The deployment settings are
# collected in one mapping and passed through as keyword arguments.
deploy_options = {
    "initial_instance_count": 1,
    "instance_type": "ml.g4dn.2xlarge",
    # NOTE(review): presumably a duration in seconds — confirm against the SDK docs.
    "container_startup_health_check_timeout": 3000,
}
predictor = huggingface_model.deploy(**deploy_options)

# Send a sample request to the deployed predictor. The call is the final
# expression of the cell, so its return value becomes the cell output.
sample_payload = {"inputs": "My name is Julien and I like to"}
predictor.predict(sample_payload)

In [None]:
import json
import requests

# HTTP endpoint that the request cells post to.
# NOTE(review): presumably an API Gateway stage in front of the endpoint
# deployed above — confirm.
url = 'https://gf0w714oo7.execute-api.us-west-2.amazonaws.com/prod'

# Request body: a JSON document with the prompt under the 'inputs' key.
input_data = json.dumps(
    {
        'inputs': 'what is the time?'
    }
)

# Always bound the wait. Without `timeout`, requests blocks indefinitely when
# the service never answers, which hangs the notebook kernel. On expiry a
# requests.exceptions.Timeout is raised instead.
response = requests.post(url, data=input_data, timeout=60)
print(response.text)

In [None]:
# Reference passage that the prompt cells interpolate as `{context}`.
# It is written as one literal per line with explicit "\n" so that the
# trailing space before each line break is visible. The "[1]" citation marker
# is part of the text.
context = (
    "Transformers is a media franchise produced by \n"
    "American toy company Hasbro and Japanese toy company Takara Tomy. \n"
    "It primarily follows the heroic Autobots and the villainous Decepticons, \n"
    "two alien robot factions at war that can transform into other forms, \n"
    "such as vehicles and animals. The franchise encompasses toys, animation, \n"
    "comic books, video games and films. As of 2011, it generated more than ¥2 \n"
    "trillion ($25 billion) in revenue,[1] making it one of the highest-grossing \n"
    "media franchises of all time."
)

In [None]:
# Ask an open-ended question about the passage; the passage is appended to
# the prompt after the "context:" label.
prompt = f"what is the context talking about? context: {context}"

# Request body: a JSON document with the prompt under the 'inputs' key.
input_data = json.dumps(
    {
        'inputs': prompt
    }
)

# Always bound the wait. Without `timeout`, requests blocks indefinitely when
# the service never answers, which hangs the notebook kernel. On expiry a
# requests.exceptions.Timeout is raised instead.
response = requests.post(url, data=input_data, timeout=60)
print(response.text)

In [None]:
# Structured prompt: an instruction, the question, and the passage, each
# separated from the next by one blank line.
prompt_sections = [
    "Answer the question below based on the context.",
    "Question: what was the revenue generated by the transformers movie?",
    f"Context: {context}",
]
prompt = "\n\n".join(prompt_sections)


In [None]:
# Request body: a JSON document with the current prompt under the 'inputs' key.
input_data = json.dumps(
    {
        'inputs': prompt
    }
)

# Always bound the wait. Without `timeout`, requests blocks indefinitely when
# the service never answers, which hangs the notebook kernel. On expiry a
# requests.exceptions.Timeout is raised instead.
response = requests.post(url, data=input_data, timeout=60)
print(response.text)