In [7]:
! pip install langchain
import os

# Connection settings. Each value is taken from the environment when the
# variable is set to a non-empty string; otherwise the literal on the right
# of `or` is used.
OPENAI_API_KEY = os.environ.get('OPENAI_API_KEY') or ''
OPENAI_API_BASE = os.environ.get('OPENAI_API_BASE') or 'https://fintechx-oai-eus.openai.azure.com/'
WEAVIATE_URL = os.environ.get('WEAVIATE_URL') or 'http://localhost:8080'

## Import data from file

# Load data from file and split file into right-sized chunks 
# for embeddings processing

from langchain.text_splitter import CharacterTextSplitter
from langchain.document_loaders import TextLoader

# Splitter configuration: chunks of up to 1000 characters with no overlap
# between consecutive chunks.
text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)

# Read the source text file into LangChain documents.
loader = TextLoader("../data/state_of_the_union.txt")
documents = loader.load()

# `docs` holds the chunked documents used by the rest of the notebook.
docs = text_splitter.split_documents(documents)


## create Embeddings reference to OpenAI Embeddings API 

from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.text_splitter import CharacterTextSplitter
from langchain.vectorstores import Weaviate

model_name = 'text-embedding-ada-002'

# Credentials and endpoint come from the configuration constants defined at
# the top of the notebook (read from the environment), never from literals
# in the notebook itself.
# NOTE(review): an API key used to be hard-coded in this cell; treat that key
# as leaked and rotate it.
if not OPENAI_API_KEY:
    raise ValueError(
        "OPENAI_API_KEY is not set; export it in the environment before "
        "running this cell."
    )

# Azure OpenAI embeddings client: `deployment` is the Azure deployment name,
# `model` the underlying embedding model.
embeddings = OpenAIEmbeddings(
    deployment="embeddings",
    model=model_name,
    openai_api_base=OPENAI_API_BASE,
    openai_api_type="azure",
    openai_api_key=OPENAI_API_KEY,
)

## create weaviate vector store

import weaviate

# print(len(docs))
# # print(docs[0])
# print(f'connecting to {WEAVIATE_URL}')

# Low-level Weaviate client pointed at the configured instance.
client = weaviate.Client(url=WEAVIATE_URL)

# LangChain vector-store wrapper over class 'MyOwnClass', with 'text' as the
# text property. It is bound to its own name so that the imported `weaviate`
# module is not shadowed; otherwise any later `weaviate.Client(...)` call
# would fail until the module was imported again.
vectorstore = Weaviate(client, 'MyOwnClass', 'text', embeddings)

# Payload for a single object built from the first chunk. This raises
# IndexError if `docs` is empty.
properties = {
    "text": docs[0].page_content,
    "source": docs[0].metadata['source']
}

print(properties)

# Add the object to the client's batch, flush the batch to the server, then
# read the stored object back by the UUID returned from the batch call.
new_record_uuid = client.batch.add_data_object(properties, "MyOwnClass")
client.batch.flush()
client.data_object.get(new_record_uuid)


{'text': 'Madam Speaker, Madam Vice President, our First Lady and Second Gentleman. Members of Congress and the Cabinet. Justices of the Supreme Court. My fellow Americans.  \n\nLast year COVID-19 kept us apart. This year we are finally together again. \n\nTonight, we meet as Democrats Republicans and Independents. But most importantly as Americans. \n\nWith a duty to one another to the American people to the Constitution. \n\nAnd with an unwavering resolve that freedom will always triumph over tyranny. \n\nSix days ago, Russia’s Vladimir Putin sought to shake the foundations of the free world thinking he could make it bend to his menacing ways. But he badly miscalculated. \n\nHe thought he could roll into Ukraine and the world would roll over. Instead he met a wall of strength he never imagined. \n\nHe met the Ukrainian people. \n\nFrom President Zelenskyy to every Ukrainian, their fearlessness, their courage, their determination, inspires the world.', 'source': '../data/state_of_the_



{'class': 'MyOwnClass',
 'creationTimeUnix': 1687435939620,
 'id': 'e4903726-17cc-4211-ab1b-35d124701953',
 'lastUpdateTimeUnix': 1687435939620,
 'properties': {'source': '../data/state_of_the_union.txt',
  'text': 'Madam Speaker, Madam Vice President, our First Lady and Second Gentleman. Members of Congress and the Cabinet. Justices of the Supreme Court. My fellow Americans.  \n\nLast year COVID-19 kept us apart. This year we are finally together again. \n\nTonight, we meet as Democrats Republicans and Independents. But most importantly as Americans. \n\nWith a duty to one another to the American people to the Constitution. \n\nAnd with an unwavering resolve that freedom will always triumph over tyranny. \n\nSix days ago, Russia’s Vladimir Putin sought to shake the foundations of the free world thinking he could make it bend to his menacing ways. But he badly miscalculated. \n\nHe thought he could roll into Ukraine and the world would roll over. Instead he met a wall of strength he ne

In [6]:
## Clear database

import weaviate, os

# Weaviate endpoint: environment value when set and non-empty, local default
# otherwise.
WEAVIATE_URL = os.environ.get('WEAVIATE_URL') or 'http://localhost:8080'

# Client for the instance above. The OpenAI header is sent with an empty
# value. To authenticate against a secured instance, pass
#   auth_client_secret=weaviate.AuthApiKey(api_key="YOUR-WEAVIATE-API-KEY")
# with your Weaviate instance API key.
client = weaviate.Client(
    url=WEAVIATE_URL,
    additional_headers={"X-OpenAI-Api-Key": ""},
)

# ⚠️ Destructive and active: running this cell deletes the whole schema and
# ALL data in the instance, so that the notebook can start from scratch.
client.schema.delete_all()









{'class': 'MyOwnClass',
 'creationTimeUnix': 1687435812008,
 'id': '0b657cda-7703-4d30-a034-9f993f1fa4d7',
 'lastUpdateTimeUnix': 1687435812008,
 'properties': {'source': '../data/state_of_the_union.txt',
  'text': 'Madam Speaker, Madam Vice President, our First Lady and Second Gentleman. Members of Congress and the Cabinet. Justices of the Supreme Court. My fellow Americans.  \n\nLast year COVID-19 kept us apart. This year we are finally together again. \n\nTonight, we meet as Democrats Republicans and Independents. But most importantly as Americans. \n\nWith a duty to one another to the American people to the Constitution. \n\nAnd with an unwavering resolve that freedom will always triumph over tyranny. \n\nSix days ago, Russia’s Vladimir Putin sought to shake the foundations of the free world thinking he could make it bend to his menacing ways. But he badly miscalculated. \n\nHe thought he could roll into Ukraine and the world would roll over. Instead he met a wall of strength he ne