# Ollama - Llama 2 7B

## Setup

In [1]:
from llama_index.llms.ollama import Ollama

In [2]:
llm = Ollama(model="llama2")

#### Call `complete` with a prompt

In [6]:
resp = llm.stream_complete("Who is Paul Graham?")

In [7]:
print(resp)

<generator object llm_completion_callback.<locals>.wrap.<locals>.wrapped_llm_predict.<locals>.wrapped_gen at 0x1436b19e0>


#### Call `chat` with a list of messages

In [None]:
from llama_index.llms import ChatMessage

messages = [
    ChatMessage(role="system", content="You are a pirate with a colorful personality"),
    ChatMessage(role="user", content="What is your name"),
]
resp = llm.chat(messages)

In [None]:
print(resp)

### Streaming

Using `stream_complete` endpoint 

In [8]:
response = llm.stream_complete("Who is Paul Graham?")

In [9]:
for r in response:
    print(r.delta, end="")

{"model":"llama2","created_at":"2023-09-08T04:25:18.678077Z","response":" Paul","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.696443Z","response":" Graham","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.713829Z","response":" is","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.73154Z","response":" a","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.749669Z","response":" well","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.767559Z","response":"-","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.784887Z","response":"known","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.802392Z","response":" entrepr","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.819969Z","response":"ene","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.837426Z","response":"ur","done":false}{"model":"llama2","created_at":"2023-09-08T04:25:18.854878Z","response":",","don

Using `stream_chat` endpoint

In [None]:
from llama_index.llms import ChatMessage

messages = [
    ChatMessage(role="system", content="You are a pirate with a colorful personality"),
    ChatMessage(role="user", content="What is your name"),
]
resp = llm.stream_chat(messages)

In [None]:
for r in resp:
    print(r.delta, end="")

## Configure Model

In [None]:
from llama_index.llms import Replicate

llm = Replicate(
    model="a16z-infra/llama13b-v2-chat:df7690f1994d94e96ad9d568eac121aecf50684a0b0963b25a41cc40061269e5",
    temperature=0.9,
    context_window=32,
)

In [None]:
resp = llm.complete("Who is Paul Graham?")

In [None]:
print(resp)