## Storage

In [None]:
from llama_index.core import VectorStoreIndex
from llama_index.readers.file import FlatReader
from llama_index.embeddings.huggingface import HuggingFaceEmbedding
from llama_index.core.node_parser import SentenceSplitter
from pathlib import Path

# Build a vector index over a single markdown file (nothing is persisted in
# this cell) and run one retrieval against it as a smoke test.
EMBED_MODEL_NAME = "intfloat/multilingual-e5-large"
SOURCE_PATH = Path("./MockupData/finops.md")
QUESTION = "FinOps คืออะไร?"  # Thai: "What is FinOps?"
TOP_K = 5

# Splitter used to cut the loaded document into nodes.
sentence_spilit = SentenceSplitter(chunk_size=1024)

# Embedding model, explicitly placed on the CPU.
# NOTE(review): the E5 model card recommends "query: " / "passage: " input
# prefixes; none are configured here — confirm whether that is intended.
embed_model = HuggingFaceEmbedding(
    model_name=EMBED_MODEL_NAME,
    device="cpu",
)

# Load the file, then split it into nodes.
md_docs = FlatReader().load_data(SOURCE_PATH)
md_nodes = sentence_spilit.get_nodes_from_documents(md_docs)

# Report how many nodes the splitter produced.
node_count = len(md_nodes)
print(node_count)

# Embed the nodes and build the index.
index = VectorStoreIndex(
    md_nodes,
    embed_model=embed_model,
)

# Despite its name, `query_engine` is a retriever: it returns the matching
# nodes rather than a synthesized answer.
query_engine = index.as_retriever(similarity_top_k=TOP_K)
response = query_engine.retrieve(QUESTION)

print("-------------RAG-------------")
hit_count = len(response)
print(hit_count)

In [None]:
from llama_index.core.vector_stores import SimpleVectorStore
from llama_index.core.storage.docstore import SimpleDocumentStore
from llama_index.core.storage.index_store import SimpleIndexStore
from llama_index.core import VectorStoreIndex,StorageContext
from llama_index.readers.file import FlatReader
from llama_index.embeddings.huggingface import HuggingFaceEmbedding
from llama_index.core.node_parser import SentenceSplitter
from pathlib import Path

# Build a vector index over a single markdown file, tag it with an index id,
# persist it to a local directory, then run one retrieval as a smoke test.
EMBED_MODEL_NAME = "intfloat/multilingual-e5-large"
SOURCE_PATH = Path("./MockupData/finops.md")
PERSIST_DIR = "./localstore/"
INDEX_ID = "FinOps"
QUESTION = "FinOps คืออะไร?"  # Thai: "What is FinOps?"
TOP_K = 5

# Splitter used to cut the loaded document into nodes.
sentence_spilit = SentenceSplitter(chunk_size=1024)

# Fresh, empty stores for vectors, documents and index metadata.
vector_store = SimpleVectorStore()
document_store = SimpleDocumentStore()
index_metadata_store = SimpleIndexStore()
storage_context = StorageContext.from_defaults(
    vector_store=vector_store,
    docstore=document_store,
    index_store=index_metadata_store,
)

# Embedding model, explicitly placed on the CPU.
# NOTE(review): the E5 model card recommends "query: " / "passage: " input
# prefixes; none are configured here — confirm whether that is intended.
embed_model = HuggingFaceEmbedding(
    model_name=EMBED_MODEL_NAME,
    device="cpu",
)

# Load the file, then split it into nodes.
md_docs = FlatReader().load_data(SOURCE_PATH)
md_nodes = sentence_spilit.get_nodes_from_documents(md_docs)

# Report how many nodes the splitter produced.
node_count = len(md_nodes)
print(node_count)

# Build the index on top of the explicit storage context.
index = VectorStoreIndex(
    md_nodes,
    embed_model=embed_model,
    storage_context=storage_context,
)

# Give the index a fixed id, then write its storage context to disk.
index.set_index_id(INDEX_ID)
index.storage_context.persist(persist_dir=PERSIST_DIR)

# Despite its name, `query_engine` is a retriever: it returns the matching
# nodes rather than a synthesized answer.
query_engine = index.as_retriever(similarity_top_k=TOP_K)
response = query_engine.retrieve(QUESTION)

print("-------------RAG-------------")
hit_count = len(response)
print(hit_count)

In [2]:
from llama_index.core import StorageContext, load_index_from_storage
from llama_index.embeddings.huggingface import HuggingFaceEmbedding

# Reload the index previously persisted under ./localstore/ and run one
# retrieval against it, without re-reading or re-embedding the source file.

# Same embedding model name as the cell that built the index; it is needed
# here to embed the query text.
embed_model = HuggingFaceEmbedding(
    model_name="intfloat/multilingual-e5-large",
    device="cpu",
)

# The persisting cell tags the index with set_index_id("FinOps"). Request that
# id explicitly instead of relying on the store containing exactly one index,
# so the load keeps working if another index is later persisted alongside it.
load_index = load_index_from_storage(
    StorageContext.from_defaults(persist_dir="./localstore/"),
    index_id="FinOps",
    embed_model=embed_model,
)

# Despite its name, `query_engine` is a retriever: it returns the matching
# nodes rather than a synthesized answer.
query_engine = load_index.as_retriever(similarity_top_k=5)
response = query_engine.retrieve("FinOps คืออะไร?")  # Thai: "What is FinOps?"
print('-------------RAG-------------')
print(len(response))

-------------RAG-------------
5
