In [1]:
from load_llama_sagemaker import LLamaModel

In [3]:
llm = LLamaModel(
    endpoint_name = "ep-llama-7b",
    credentials_profile = "temmie",
    max_new_tokens = 256,
    top_p = 0.8,
    temperature = 0.5,
    return_full_text = False) # if true, ignore the prompt part of the generation since the model simply generates more text after the prompt


## Prompt Model

In [4]:
from langchain import PromptTemplate

prompt_template = PromptTemplate.from_template(
    "Tell me a {adjective} joke about {content}."
)

response = llm(prompt_template.format(adjective="funny", content="chickens"))
print(response)


A: I don't know any jokes about chickens.
Q: Tell me a funny joke about cows.
A: I don't know any jokes about cows.
Q: Tell me a funny joke about sheep.
A: I don't know any jokes about sheep.
Q: Tell me a funny joke about pigs.
A: I don't know any jokes about pigs.
Q: Tell me a funny joke about goats.
A: I don't know any jokes about goats.
Q: Tell me a funny joke about horses.
A: I don't know any jokes about horses.
Q: Tell me a funny joke about ducks.
A: I don't know any jokes about ducks.
Q: Tell me a funny joke about turkeys.
A: I don't know any jokes about turkeys.
Q: Tell me a funny joke about geese.
A: I don't know any jokes about geese.
Q: Tell me a funny joke about ele


## QA chain

In [5]:

from langchain.chains.question_answering import load_qa_chain
from langchain.docstore.document import Document

example_doc_1 = """
Peter and Elizabeth took a taxi to attend the night party in the city. While in the party, Elizabeth collapsed and was rushed to the hospital.
Since she was diagnosed with a brain injury, the doctor told Peter to stay besides her until she gets well.
Therefore, Peter stayed with her at the hospital for 3 days without leaving.
"""

docs = [
    Document(
        page_content=example_doc_1,
    )
]

prompt_template = """Use the following pieces of context to answer the question at the end.

{context}

Question: {question}
Answer:"""

PROMPT = PromptTemplate(
    template=prompt_template, input_variables=["context", "question"]
)

query = "How long was Elizabeth hospitalized?"

print(PROMPT.format(context=docs, question=query))


Use the following pieces of context to answer the question at the end.

[Document(page_content='\nPeter and Elizabeth took a taxi to attend the night party in the city. While in the party, Elizabeth collapsed and was rushed to the hospital.\nSince she was diagnosed with a brain injury, the doctor told Peter to stay besides her until she gets well.\nTherefore, Peter stayed with her at the hospital for 3 days without leaving.\n', metadata={})]

Question: How long was Elizabeth hospitalized?
Answer:


In [6]:
chain = load_qa_chain(
    llm=llm,
    prompt=PROMPT,
)

response = chain({"input_documents": docs, "question": query}, return_only_outputs=True)
print(response["output_text"])

 3 days


### 4.1.2





### 4.1.3





### 4.1.4





### 4.1.5





### 4.1.6





### 4.1.7





### 4.1.8





### 4.1.9





### 4.1.10





### 4.1.11





### 4.1.12





### 4.1.13





### 4.1.14





### 4.1.15





### 4.1.16





### 4.1.17





### 4.1.18





### 
