In [3]:
import pinecone
import openai
import numpy as np
import os
from dotenv import load_dotenv

# Langchain
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.text_splitter import CharacterTextSplitter
from langchain.vectorstores import Pinecone
from langchain.document_loaders import TextLoader

# Load variables from the .env file
load_dotenv('./Sn33k/.env')

# Access the variables
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
PINECONE_API_KEY = os.getenv("PINECONE_API_KEY")
INDEX_NAME = os.getenv("PINECONE_INDEX_NAME")
PINECONE_ENVIRONMENT= os.getenv("PINECONE_ENVIRONMENT")

openai.api_key = OPENAI_API_KEY
os.environ["OPENAI_API_KEY"] = OPENAI_API_KEY

In [4]:
# initialize pinecone
pinecone.init(
    api_key=PINECONE_API_KEY,  # find at app.pinecone.io
    environment=PINECONE_ENVIRONMENT,  # next to api key in console
)

index_name = "mindfulhack"

embeddings = OpenAIEmbeddings(model='text-embedding-ada-002')
# if you already have an index, you can load it like this
docsearch = Pinecone.from_existing_index(index_name, embeddings)

# List all indexes information
index_description = pinecone.describe_index(index_name)
print('index_description: ', index_description)

index = pinecone.Index(index_name) 
index_stats_response = index.describe_index_stats()
print('index_stats_response: ', index_stats_response)

index_description:  IndexDescription(name='mindfulhack', metric='cosine', replicas=1, dimension=1536.0, shards=1, pods=1, pod_type='starter', status={'ready': True, 'state': 'Ready'}, metadata_config=None, source_collection='')
index_stats_response:  {'dimension': 1536,
 'index_fullness': 0.0,
 'namespaces': {},
 'total_vector_count': 0}


## Test QAChain

In [4]:
from llm.chains import QAretrivalChain
from pineconeManager.Retrival import PineconeRetrival
PINECONE_API_KEY = "1b1d5b95-2f20-476d-baa8-458cf5779640"
PINECONE_INDEX_NAME = "mindfulhack"
PINECONE_ENVIRONMENT="gcp-starter"

pineconeRetrival = PineconeRetrival(PINECONE_API_KEY=PINECONE_API_KEY, INDEX_NAME=PINECONE_INDEX_NAME, PINECONE_ENVIRONMENT=PINECONE_ENVIRONMENT)



index_stats_response:  {'dimension': 1536,
 'index_fullness': 0.00187,
 'namespaces': {'': {'vector_count': 187}},
 'total_vector_count': 187}
index_description:  IndexDescription(name='mindfulhack', metric='cosine', replicas=1, dimension=1536.0, shards=1, pods=1, pod_type='starter', status={'ready': True, 'state': 'Ready'}, metadata_config=None, source_collection='')


In [5]:
pineconeRetrival

<pineconeManager.Retrival.PineconeRetrival at 0x1bf9926eb00>

In [6]:
pineconeRetrival.getPineconeRelevantDocuments("What problems do I face?")

TypeError: 'str' object is not callable

# Insert shit into Pinecone testing

In [2]:
from pineconeManager.Upsert import PineconeUpsert

pineconeUpsert = PineconeUpsert(PINECONE_API_KEY=PINECONE_API_KEY, INDEX_NAME=PINECONE_INDEX_NAME, PINECONE_ENVIRONMENT=PINECONE_ENVIRONMENT)

# Read breakup.txt 
with open('breakup.txt', 'r') as file:
    breakup_text = file.read().replace('\n', '')


pineconeUpsert.upsert(text = breakup_text)

Inserting: Iâ€™m here to help. Whatâ€™s g...
