In [1]:
from sagemaker.huggingface import HuggingFaceModel
import sagemaker

# Execution role obtained from the SageMaker SDK; handed to the model below.
role = sagemaker.get_execution_role()

# Hub model configuration (model catalogue: https://huggingface.co/models).
hub = {
    'HF_MODEL_ID': 'bert-base-uncased',
    'HF_TASK': 'fill-mask',
}

# Build the Hugging Face model object; `hub` is passed through as `env`.
huggingface_model = HuggingFaceModel(
    role=role,
    env=hub,
    transformers_version='4.6.1',
    pytorch_version='1.7.1',
    py_version='py36',
)

# Deploy the model to SageMaker Inference on a single ml.m5.xlarge instance.
predictor = huggingface_model.deploy(
    instance_type='ml.m5.xlarge',  # ec2 instance type
    initial_instance_count=1,      # number of instances
)

# Send one masked sentence to the endpoint. The call is left as the final bare
# expression so the notebook renders its return value as the cell output.
fill_mask_request = {'inputs': "The answer to the universe is [MASK]."}
predictor.predict(fill_mask_request)

-----!

[{'sequence': 'the answer to the universe is no.',
  'score': 0.16963955760002136,
  'token': 2053,
  'token_str': 'no'},
 {'sequence': 'the answer to the universe is nothing.',
  'score': 0.07344776391983032,
  'token': 2498,
  'token_str': 'nothing'},
 {'sequence': 'the answer to the universe is yes.',
  'score': 0.05803241208195686,
  'token': 2748,
  'token_str': 'yes'},
 {'sequence': 'the answer to the universe is unknown.',
  'score': 0.043957844376564026,
  'token': 4242,
  'token_str': 'unknown'},
 {'sequence': 'the answer to the universe is simple.',
  'score': 0.04015745222568512,
  'token': 3722,
  'token_str': 'simple'}]

In [None]:
# Clean up everything created by `deploy()` so nothing is left behind.
# The model is deleted first, while the endpoint it is attached to still
# exists, and then the endpoint itself is removed.
predictor.delete_model()
predictor.delete_endpoint()