In [1]:
import logging
import sys
import pickle

from llama_index import VectorStoreIndex, SimpleDirectoryReader, ServiceContext
from llama_index.core.query_engine.query_bundle import QueryBundle
from llama_index.core.query_engine.base_query_engine import BaseQueryEngine


logging.basicConfig(stream=sys.stdout, level=logging.INFO)
logging.getLogger().addHandler(logging.StreamHandler(stream=sys.stdout))

from llama_index.llms import LlamaCPP
from llama_index.llms.llama_utils import messages_to_prompt, completion_to_prompt
import torch
from langchain.embeddings.huggingface import HuggingFaceEmbeddings
from llama_index.embeddings import LangchainEmbedding

custom_cache_folder = "C:/Users/Digital/.cache/huggingface/hub/models--thenlper--gte-large/snapshots/8cb729e8b44d9ec9d85c1cec4167ed28b43b04c2/1_Pooling/"

# Load documents
documents = SimpleDirectoryReader("Data").load_data()

# Create LlamaCPP instance
llm = LlamaCPP(
    model_url='https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf',
    model_path=None,
    temperature=0.1,
    max_new_tokens=256,
    context_window=3900,
    generate_kwargs={},
    model_kwargs={"n_gpu_layers": -1},
    messages_to_prompt=messages_to_prompt,
    completion_to_prompt=completion_to_prompt,
    verbose=True,
)

# Create LangchainEmbedding instance
embed_model = LangchainEmbedding(HuggingFaceEmbeddings(model_name="thenlper/gte-large", cache_folder=custom_cache_folder))

# Create ServiceContext
service_context = ServiceContext.from_defaults(chunk_size=256, llm=llm, embed_model=embed_model)

# Create VectorStoreIndex
index = VectorStoreIndex.from_documents(documents, service_context=service_context)


# Create query engine from loaded index
query_engine = index.as_query_engine()

# Query the loaded index
response = query_engine.query("What is 67?")
print(response)


ModuleNotFoundError: No module named 'llama_index.core.query_engine'

In [2]:
import logging
import sys
import pickle

from llama_index import VectorStoreIndex, SimpleDirectoryReader, ServiceContext
from llama_index.query_engine.query_bundle import QueryBundle
from llama_index.query_engine.base_query_engine import BaseQueryEngine

logging.basicConfig(stream=sys.stdout, level=logging.INFO)
logging.getLogger().addHandler(logging.StreamHandler(stream=sys.stdout))

from llama_index.llms import LlamaCPP
from llama_index.llms.llama_utils import messages_to_prompt, completion_to_prompt
import torch
from langchain.embeddings.huggingface import HuggingFaceEmbeddings
from llama_index.embeddings import LangchainEmbedding

custom_cache_folder = "C:/Users/Digital/.cache/huggingface/hub/models--thenlper--gte-large/snapshots/8cb729e8b44d9ec9d85c1cec4167ed28b43b04c2/1_Pooling/"

# Load documents
documents = SimpleDirectoryReader("Data").load_data()

# Create LlamaCPP instance
llm = LlamaCPP(
    model_url='https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.1-GGUF/resolve/main/mistral-7b-instruct-v0.1.Q4_K_M.gguf',
    model_path=None,
    temperature=0.1,
    max_new_tokens=256,
    context_window=3900,
    generate_kwargs={},
    model_kwargs={"n_gpu_layers": -1},
    messages_to_prompt=messages_to_prompt,
    completion_to_prompt=completion_to_prompt,
    verbose=True,
)

# Create LangchainEmbedding instance
embed_model = LangchainEmbedding(HuggingFaceEmbeddings(model_name="thenlper/gte-large", cache_folder=custom_cache_folder))

# Create ServiceContext
service_context = ServiceContext.from_defaults(chunk_size=256, llm=llm, embed_model=embed_model)

# Create VectorStoreIndex
index = VectorStoreIndex.from_documents(documents, service_context=service_context)

# Save the query engine and vector index
with open('query_engine.pkl', 'wb') as file:
    pickle.dump(index.as_query_engine(), file)

with open('vector_index.pkl', 'wb') as file:
    pickle.dump(index, file)

# Load index from the saved file
with open('vector_index.pkl', 'rb') as file:
    loaded_index = pickle.load(file)

# Create query engine from loaded index
loaded_query_engine = loaded_index.as_query_engine()

# Query the loaded index
response = loaded_query_engine.query("What is 67?")
print(response)


ModuleNotFoundError: No module named 'llama_index.query_engine.query_bundle'

In [5]:
pip install llama_index.query_engine


Defaulting to user installation because normal site-packages is not writeable
Note: you may need to restart the kernel to use updated packages.


ERROR: Could not find a version that satisfies the requirement llama_index.query_engine (from versions: none)
ERROR: No matching distribution found for llama_index.query_engine
