# Install Dependencies

In [2]:
!pip install datasets transformers langchain einops sentence-transformers



# Configure the embedding model

`HuggingFaceEmbeddings` is a LangChain class that uses pre-trained models from Hugging Face to generate embeddings.

In [3]:
from langchain.embeddings import HuggingFaceEmbeddings

# Identifier of the pre-trained embedding model to load.
embedding_model_name = 'nomic-ai/nomic-embed-text-v1.5'

# Additional arguments handed to the model through model_kwargs.
# 'trust_remote_code' is True, so remote code associated with the model is trusted
# and executed -- only keep this enabled for model sources you trust.
embedding_model_kwargs = {'trust_remote_code': True}

# Build the embedding object used by the rest of the notebook.
emb = HuggingFaceEmbeddings(
    model_name=embedding_model_name,
    model_kwargs=embedding_model_kwargs,
)

  from .autonotebook import tqdm as notebook_tqdm
<All keys matched successfully>


# Define the text input

In [4]:
# Sample input to embed. This can be any text!
# NOTE(review): the model card for 'nomic-ai/nomic-embed-text-v1.5' reportedly expects a
# task prefix (e.g. "search_document: ") on the input -- confirm whether one should be added here.
text = "This is a test document."

# Generate the embedding

In [5]:
# embed_query embeds the single string `text`. As the printed output further down shows,
# the result is one flat list of floats (a single high-dimensional embedding vector that
# represents the text), not a list of several embeddings.
res = emb.embed_query(text)

In [6]:
# Print the length of the embedding vector.
# This is the number of dimensions of the single embedding (768 in the output below),
# not a count of how many embeddings were generated.
print(len(res))

768


In [7]:
# Print the embedding itself.
# `res` is a single vector, so this prints one flat list of floats (all 768 values).
# NOTE(review): consider printing only a slice (e.g. res[:10]) to keep the output short.
print(res)

[0.7055405378341675, 0.4733888804912567, -3.6945576667785645, -1.0959097146987915, 0.6916875839233398, -0.7252398729324341, 0.40410763025283813, -0.06588228046894073, 0.23866510391235352, -0.7481763362884521, 0.2985946536064148, 0.7290288805961609, 0.3696836531162262, -0.4106758236885071, -0.3627206087112427, -0.9940328598022461, 0.7113051414489746, -1.6113718748092651, 0.09331997483968735, 0.04567493498325348, 0.10984012484550476, 0.10997241735458374, -2.0760669708251953, -0.2516232132911682, 2.585610866546631, 0.6344131827354431, -1.7511849403381348, 0.18512144684791565, -1.579018473625183, -1.0607389211654663, 0.690180778503418, -0.14475826919078827, 0.9499956369400024, -0.42626500129699707, -0.5214138031005859, -2.2995524406433105, 0.34503909945487976, 0.9812821745872498, -0.13331809639930725, 0.6769289970397949, -0.2583778500556946, 0.6046335101127625, -1.1301310062408447, -0.6406277418136597, 0.7976546287536621, 0.7306954860687256, -0.03462890163064003, 1.131739616394043, -0.0276

# Discussion Questions

- What did you learn?
- Try this idea out yourself, then discuss it with a friend.