In [7]:
from dotenv import load_dotenv
from langchain_core.prompts import PromptTemplate
from langchain_core.output_parsers import StrOutputParser
from langchain_community.llms import GPT4All, Ollama
import os
import requests

# Pull settings from a local `.env` file (if one exists) into the environment.
load_dotenv()

# Base URL of the Ollama server, used for both the REST call and the LLM client.
# Fall back to Ollama's default local address when the variable is unset or
# empty; otherwise the f-string below would silently build "None/api/tags".
# The trailing slash is stripped so that f"{OLLAMA_URL}/api/..." never yields
# a double slash.
OLLAMA_URL = (os.getenv("OLLAMA_URL") or "http://localhost:11434").rstrip("/")

In [None]:
# Optional local backend: run a quantised Mistral model through GPT4All.
# The `llm` name bound here is rebound by the Ollama cell further down, so
# only run this cell when the local model is the one you want to use.
# NOTE(review): the path starts with `.models/` (a hidden directory) —
# confirm that `./models/` was not intended.
gpt4all_settings = {
    "model": ".models/mistral-7b-openorca.gguf2.Q4_0.gguf",
    "device": "gpu",
    "n_threads": 4,
}
llm = GPT4All(**gpt4all_settings)

In [8]:
# Ask the Ollama server which models it has available (GET /api/tags).
# A timeout keeps the cell from hanging forever if the server is unreachable,
# and raise_for_status() surfaces HTTP errors directly instead of failing
# later with an opaque KeyError/JSON error.
response = requests.get(f"{OLLAMA_URL}/api/tags", timeout=10)
response.raise_for_status()
payload = response.json()

# One model tag per line; str.join adds no trailing newline, so no stripping
# is needed afterwards.
model_names = "\n".join(model["name"] for model in payload["models"])
print(model_names)

gemma:7b
llama2:13b
mistral:7b
mixtral:8x7b


In [12]:
# Settings for the Ollama-served model used by the chain below.
OLLAMA_MODEL = "gemma:7b"  # one of the tags printed by the listing cell above
SAMPLING_TEMPERATURE = 0.7

# Client that talks to the Ollama server configured via OLLAMA_URL.
llm = Ollama(
    base_url=OLLAMA_URL,
    model=OLLAMA_MODEL,
    temperature=SAMPLING_TEMPERATURE,
)

In [13]:
# Prompt text with two placeholders: the user's question and the language the
# answer must be written in. Built from adjacent literals; the resulting
# string is the question, a blank line, then the formatting instructions.
template = (
    "{question}\n"
    "\n"
    "Make sure to answer this in list format and keep it brief. "
    "Answer strictly in {language} only."
)

# Parser that hands the model's reply back as a plain string.
output_parser = StrOutputParser()

# Template object that fills {question} and {language} at invoke time.
prompt = PromptTemplate.from_template(template)

In [14]:
# Compose the pipeline: fill the prompt -> query the model -> parse to str.
chain = prompt | llm | output_parser

# Values for the two placeholders declared in the prompt template.
chain_inputs = {
    "question": "Which humans have entered space till date?",
    "language": "Hindi",
}

# Run the chain once and show the model's reply.
output = chain.invoke(chain_inputs)
print(output)

* Neil Armstrong
* Edwin Aldrin
* Charles Duke
* Eugene Cernan
* John Young
