# Using the model

We will be using a Llama 3.2 1B model served by Ollama, accessed through the `langchain_ollama` package (`ChatOllama` for chat and `OllamaEmbeddings` for embeddings).

In [1]:
from os import chdir
from os.path import isdir

# Move to the parent directory so the `app` package can be imported
# (presumably the project root — the notebook appears to live one level below it).
# The guard keeps this cell idempotent: without it, every re-run would climb
# one more directory and the import below would stop working.
if not isdir("app"):
    chdir("..")

from app.core.config import settings

In [2]:
# Display the loaded settings as a plain dict to confirm which Ollama
# base URL and model names the rest of the notebook will use.
dict(settings)

{'OLLAMA_BASE_URL': 'http://localhost:11434',
 'OLLAMA_CHAT_MODEL': 'llama3.2:1b',
 'OLLAMA_EMBEDDINGS_MODEL': 'nomic-embed-text:v1.5'}

In [4]:
from langchain_ollama.chat_models import ChatOllama
from langchain_ollama.embeddings import OllamaEmbeddings

# Both clients point at the same Ollama server taken from the project settings;
# only the model name differs between them.

# Chat client: temperature is pinned to 0. Other options that could be passed
# here (e.g. seed, num_ctx) are intentionally left unset.
chat_model = ChatOllama(
    model=settings.OLLAMA_CHAT_MODEL,
    base_url=settings.OLLAMA_BASE_URL,
    temperature=0,
)

# Embeddings client for the configured embeddings model.
embeddings = OllamaEmbeddings(
    model=settings.OLLAMA_EMBEDDINGS_MODEL,
    base_url=settings.OLLAMA_BASE_URL,
)

In [7]:
# Smoke test: send a one-word prompt to the chat model and display only the
# text content of its reply.
chat_model.invoke("Hi").content

'Hello. Is there something I can help you with or would you like to chat?'

In [5]:
# Smoke test: embed the same short text and display the resulting vector
# (a long list of floats) to confirm the embeddings model responds.
embeddings.embed_query("Hi")

[0.016887862,
 0.019088851,
 -0.18419065,
 -0.0024268853,
 0.02140486,
 0.04968468,
 0.026290359,
 -0.001271837,
 -0.0043434734,
 -0.04628604,
 -0.033755906,
 0.05956408,
 0.05130368,
 0.021707745,
 0.054271504,
 -0.05489216,
 0.015553318,
 -0.029409276,
 -0.00044955208,
 0.04402231,
 -0.010041787,
 -0.048644483,
 -0.007184181,
 -0.0050699515,
 0.17365333,
 0.0061469106,
 0.044951472,
 0.056092214,
 0.008709584,
 -0.01743973,
 0.01963067,
 -0.043726824,
 0.024087066,
 -0.0034915323,
 0.021775989,
 0.0003854982,
 0.033556964,
 0.018540718,
 0.03190329,
 0.049050834,
 -0.013493951,
 -0.00068559486,
 -0.00705767,
 -0.01168491,
 0.022750506,
 0.020039497,
 -0.01712272,
 0.014474819,
 0.03943749,
 -0.03964942,
 0.003029184,
 -0.010558184,
 -0.033091,
 0.051144995,
 0.05773237,
 0.044090617,
 0.039234094,
 0.020687792,
 0.034188665,
 0.03427767,
 0.04429034,
 0.050567843,
 0.02949041,
 0.072905876,
 0.01211663,
 -0.044011537,
 -0.019905621,
 0.021228302,
 -0.0068726316,
 -0.023828484,
 0.065