In [None]:
import os
import faiss
import openai
import langchain  # You need to install the langchain library first
from langchain.document_loaders import TextLoader
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.text_splitter import CharacterTextSplitter
from langchain.vectorstores import FAISS

# Load the document, split it into chunks, embed each chunk and load it into the vector store.
# This section only performs the one-time setup: OpenAI credentials and a raw FAISS index.

# Initialize the OpenAI API. The key is read from the OPENAI_API_KEY environment
# variable so a real secret never has to be written into this file; the
# placeholder is kept as a fallback so the original behavior is unchanged when
# the variable is not set.
openai.api_key = os.getenv("OPENAI_API_KEY", "YOUR_OPENAI_API_KEY")

# NOTE: the former `lc = langchain.LangChain(config_path="config_path")` line was
# removed. The langchain package has no top-level `LangChain` class, so that call
# raised AttributeError and stopped the script before anything else could run.
# The langchain components used in this file are imported individually above.

# Initialize Faiss index
# OpenAI's text-embedding-ada-002 model returns 1536-dimensional vectors (not 768),
# and a FAISS index rejects vectors whose length differs from its dimension.
d = 1536
# Exact (brute-force) L2-distance index. It is not referenced elsewhere in the
# visible code; it is kept so any later cell that uses `index` keeps working.
index = faiss.IndexFlatL2(d)

# Function to read log data from the folder
def read_log_data(folder_path):
    """Build a FAISS vector store from every ``.log`` file in *folder_path*.

    Each matching file is loaded with ``TextLoader`` and split with a
    ``CharacterTextSplitter`` (target chunk size 1000, no overlap). The chunks
    of all files are collected and embedded with ``OpenAIEmbeddings`` into a
    single store.

    Args:
        folder_path: Directory whose direct children are scanned for files
            whose name ends with ``.log`` (subdirectories are not descended).

    Returns:
        The ``FAISS`` vector store built from the chunks of all log files.

    Raises:
        ValueError: If no chunks were collected (no ``.log`` files, or the
            files yielded no text), since there would be nothing to embed.
        OSError: Propagated from ``os.listdir`` if *folder_path* cannot be read.
    """
    # The splitter settings are the same for every file, so build it once
    # instead of once per loop iteration.
    text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)

    db_documents = []
    # Sorted so the order of chunks in the store does not depend on the
    # arbitrary order in which the OS lists directory entries.
    for filename in sorted(os.listdir(folder_path)):
        if not filename.endswith(".log"):
            continue
        file_path_name = os.path.join(folder_path, filename)
        raw_documents = TextLoader(file_path_name).load()
        # Accumulate the chunks; previously they were dropped on every
        # iteration, so the store was always built from an empty list.
        db_documents.extend(text_splitter.split_documents(raw_documents))

    if not db_documents:
        raise ValueError(f"No .log content found in folder: {folder_path!r}")

    return FAISS.from_documents(db_documents, OpenAIEmbeddings())



# Demo: index the log folder and print the chunk most similar to a query.
folder_path = "path_to_log_folder"
# The helper defined in this file is `read_log_data`. The previous call used
# `read_and_process_data`, a name that is not defined in the visible code, so it
# raised NameError.
db = read_log_data(folder_path)
query = "What did the president say about Ketanji Brown Jackson"
# Retrieve the stored chunks closest to the query and show the first one.
docs = db.similarity_search(query)
print(docs[0].page_content)

# Model identifiers. EMBEDDING_MODEL is defined here but not referenced by the
# code visible in this section; GPT_MODEL selects the chat model used below.
EMBEDDING_MODEL = "text-embedding-ada-002"
GPT_MODEL = "gpt-3.5-turbo"

# Demo: send a single question straight to the chat model (no retrieved context
# is attached to the prompt here).
query = 'Which athletes won the gold medal in curling at the 2022 Winter Olympics?'

# Conversation sent to the model: a system instruction followed by the user's question.
system_message = {'role': 'system', 'content': 'You answer questions about the 2022 Winter Olympics.'}
user_message = {'role': 'user', 'content': query}

response = openai.ChatCompletion.create(
    model=GPT_MODEL,
    messages=[system_message, user_message],
    temperature=0,
)

# Print the text of the first returned choice.
first_choice = response['choices'][0]
print(first_choice['message']['content'])



In [None]:
# Reference links:
# https://python.langchain.com/docs/modules/data_connection/vectorstores/integrations/faiss
# https://github.com/openai/openai-cookbook/blob/main/examples/Question_answering_using_embeddings.ipynb