In [None]:
! pip install llama-index python-dotenv openai

In [3]:
import os
from dotenv import load_dotenv
import openai

# Pull variables from a local .env file (if one exists) into the process environment.
load_dotenv()

# Fail fast with a readable message instead of passing None downstream, where a
# missing value would only show up later as an opaque connection/auth error.
# NOTE(review): OPENAI_API_KEY is treated as required because the query step
# appears to use the default (OpenAI) LLM — relax if a different LLM is configured.
missing_vars = [
    var_name
    for var_name in ("OPENAI_API_KEY", "ZILLIZ_URI", "ZILLIZ_TOKEN")
    if not os.getenv(var_name)
]
if missing_vars:
    raise RuntimeError(
        "Missing required environment variables: " + ", ".join(missing_vars)
    )

# Credentials for the OpenAI client.
openai.api_key = os.environ["OPENAI_API_KEY"]

# Connection details for the Zilliz (managed Milvus) instance.
zilliz_uri = os.environ["ZILLIZ_URI"]
zilliz_token = os.environ["ZILLIZ_TOKEN"]

In [1]:
from llama_index.vector_stores import MilvusVectorStore
from llama_index import VectorStoreIndex, StorageContext, ServiceContext

In [9]:
from langchain.embeddings.huggingface import HuggingFaceEmbeddings
from llama_index import LangchainEmbedding

# Embeddings come from a HuggingFace sentence-transformers checkpoint, wrapped so
# llama-index can call it.
# NOTE(review): this presumably has to be the same model that was used to embed
# the documents already stored in the collection — verify before changing it.
hf_embeddings = HuggingFaceEmbeddings(
    model_name="sentence-transformers/all-MiniLM-L12-v2",
)
embed_model = LangchainEmbedding(hf_embeddings)

# Service context with only the embedding model overridden; everything else
# is left at the library defaults.
service_context = ServiceContext.from_defaults(embed_model=embed_model)

In [13]:
# Handle to the Milvus/Zilliz collection, using the URI and token loaded from the
# environment earlier in the notebook.
# NOTE(review): `similarity_metric` and `text_key` presumably need to match how the
# "tds_articles" collection was created (index metric / text field name) — confirm.
vdb = MilvusVectorStore(
    uri=zilliz_uri,
    token=zilliz_token,
    collection_name="tds_articles",
    similarity_metric="L2",
    text_key="paragraph",
)

In [14]:
# Storage context whose vector store is the Milvus handle created above.
# NOTE(review): `store` is not referenced by the cells visible in this section;
# check whether a later cell uses it before removing.
store = StorageContext.from_defaults(
    vector_store=vdb,
)

In [15]:
# Build the index directly on top of the existing vector store, passing the
# service context so the custom embedding model is the one in effect.
vector_index = VectorStoreIndex.from_vector_store(
    vector_store=vdb,
    service_context=service_context,
)

In [16]:
# Create a query engine from the index; no arguments are passed, so whatever
# defaults the library applies are used.
query_engine = vector_index.as_query_engine()

In [17]:
# Ask a sample question; the bare last expression displays the full Response
# object (answer text plus the source nodes that were retrieved).
question = "What is a large language model?"
query_engine.query(question)

Response(response='A large language model refers to a type of language model that has been developed to handle and process a significant amount of data and information. It is designed to have a larger capacity and capability compared to traditional language models, allowing it to generate more accurate and contextually relevant responses or predictions.', source_nodes=[NodeWithScore(node=TextNode(id_='764f220f-37b7-4f2c-bf3c-07df14330be3', embedding=None, metadata={}, excluded_embed_metadata_keys=[], excluded_llm_metadata_keys=[], relationships={}, hash='7e3207d34fa042975d8321bf9c2b8ab275ff63968ed46f977eba9cac20cd721b', text='The following papers introduce some milestones on the journey toward large language models.', start_char_idx=None, end_char_idx=None, text_template='{metadata_str}\n\n{content}', metadata_template='{key}: {value}', metadata_seperator='\n'), score=0.5377379655838013), NodeWithScore(node=TextNode(id_='9972ec1b-5f42-4338-9b83-c792648afbd3', embedding=None, metadata={