In [1]:
import os
from dotenv import load_dotenv

load_dotenv()

True

In [2]:
from langchain_core.documents import Document

texts = [
    "안녕, 만나서 반가워.",
    "LangChain simplifies the process of building applications with large language models",
    "랭체인 한국어 튜토리얼은 LangChain의 공식 문서, cookbook 및 다양한 실용 예제를 바탕으로 하여 사용자가 LangChain을 더 쉽고 효과적으로 활용할 수 있도록 구성되어 있습니다. ",
    "LangChain은 초거대 언어모델로 애플리케이션을 구축하는 과정을 단순화합니다.",
    "Retrieval-Augmented Generation (RAG) is an effective technique for improving AI responses.",
]

### 구글

In [3]:
from langchain_google_genai import GoogleGenerativeAIEmbeddings

google_embeddings = GoogleGenerativeAIEmbeddings(model="models/gemini-embedding-exp-03-07")

In [4]:
embedded_documents = google_embeddings.embed_documents(texts)
embedded_documents

[[-0.02867422252893448,
  0.012470046058297157,
  -0.0018582296324893832,
  -0.0896618440747261,
  -0.007612487766891718,
  -0.00011338542390149087,
  -0.009838642552495003,
  -0.018059002235531807,
  0.001211587805300951,
  0.007167136762291193,
  -0.0008226422942243516,
  -0.01603224314749241,
  -0.0016729526687413454,
  0.006944333203136921,
  0.16366255283355713,
  -0.020049894228577614,
  0.016397571191191673,
  -0.0010212707566097379,
  -0.0012129347305744886,
  -0.03213430196046829,
  -0.0036619629245251417,
  0.007234617602080107,
  0.002082657301798463,
  0.004666237160563469,
  -0.024821359664201736,
  0.011383009143173695,
  0.007977013476192951,
  -0.0022123067174106836,
  0.01029234379529953,
  0.0011341830249875784,
  0.011574743315577507,
  0.01505206897854805,
  0.0074724662117660046,
  0.015942512080073357,
  0.00463251955807209,
  0.004384673200547695,
  0.021426690742373466,
  0.0010252807987853885,
  -0.02618018165230751,
  -0.0024632613640278578,
  0.00599870039150

In [5]:
embedded_query = google_embeddings.embed_query("LangChain 에 대해서 알려주세요.")
embedded_query

[0.047535259276628494,
 -0.007320969365537167,
 -0.01979604922235012,
 -0.01156556885689497,
 0.03500209376215935,
 -0.0022982934024184942,
 0.019403301179409027,
 -0.014846716076135635,
 0.05063337832689285,
 0.01358968298882246,
 0.0024244303349405527,
 -0.0029055767226964235,
 -0.0035915113985538483,
 -0.07664375007152557,
 -0.002075160387903452,
 -0.04456327483057976,
 0.026316599920392036,
 -0.018741970881819725,
 0.0075382208451628685,
 -0.005002249963581562,
 -0.0008795993053354323,
 0.020541541278362274,
 -0.0004263149749021977,
 0.0033323182724416256,
 -0.03401729092001915,
 -0.032001446932554245,
 0.008120776154100895,
 -0.02856406755745411,
 -0.06301163882017136,
 0.04512149840593338,
 -0.018086763098835945,
 0.0014650990488007665,
 -0.06647098064422607,
 0.006042827852070332,
 0.01350508164614439,
 -0.0042027817107737064,
 0.018926264718174934,
 0.02394809201359749,
 0.008567214012145996,
 -0.0271740835160017,
 0.023504110053181648,
 -0.06275533884763718,
 -0.04541422054171

### 허깅페이스

In [6]:
from langchain_huggingface.embeddings import HuggingFaceEndpointEmbeddings

model_name = "intfloat/multilingual-e5-large-instruct"

hf_embeddings = HuggingFaceEndpointEmbeddings(
    model=model_name,
    task="feature-extraction",
    huggingfacehub_api_token=os.environ["HUGGINGFACEHUB_API_TOKEN"],
)

  from .autonotebook import tqdm as notebook_tqdm


In [7]:
embedded_documents = hf_embeddings.embed_documents(texts)
embedded_documents

[[0.0511920228600502,
  0.011308946646749973,
  0.012826327234506607,
  -0.03129677101969719,
  0.024386851117014885,
  -0.031839631497859955,
  -0.0413723848760128,
  0.007222234271466732,
  0.0444776751101017,
  -0.023085832595825195,
  0.028797687962651253,
  0.010783929377794266,
  -0.013323882594704628,
  -0.028462374582886696,
  -0.04694923013448715,
  -0.021683266386389732,
  -0.025736218318343163,
  0.001958938781172037,
  0.0007779121515341103,
  -0.011368482373654842,
  0.026559341698884964,
  0.002380043501034379,
  -0.006590391043573618,
  -0.050234053283929825,
  -0.030206533148884773,
  -0.0036191269755363464,
  -0.0500679649412632,
  -0.015691475942730904,
  -0.0187184177339077,
  -0.02677012048661709,
  0.027322877198457718,
  0.007506826426833868,
  -0.03852768614888191,
  -0.040268901735544205,
  -0.012338859960436821,
  0.023780303075909615,
  0.023508718237280846,
  0.029794201254844666,
  -0.01239995751529932,
  0.06362667679786682,
  -0.015463155694305897,
  0.035