In [1]:
from openai import OpenAI
# Shared API client used by the embedding and chat calls later in this notebook.
# No api_key argument is passed here, so credentials are presumably picked up
# from the environment (e.g. OPENAI_API_KEY) — confirm before running.
client = OpenAI()

# Function to get the vector embedding for a given text
def get_vector_embeddings(text, model="text-embedding-ada-002"):
    """Return the embedding vector for a single piece of text.

    Args:
        text: The text to embed. Only the first embedding in the response
            is returned, so pass one string per call.
        model: Name of the embedding model sent to the embeddings endpoint.
            Vectors produced by different models should not be mixed in
            the same index, so use the same value for indexing and querying.

    Returns:
        The ``embedding`` attribute of the first item in ``response.data``.
    """
    response = client.embeddings.create(input=text, model=model)
    # Only the first result is used; there is no need to collect every
    # embedding into a temporary list first.
    return response.data[0].embedding

# Smoke test: embed a sample string. As the last expression of the cell, the
# returned vector is displayed as the cell output.
get_vector_embeddings("Your text string goes here")

[-0.007021795958280563,
 -0.0052579473704099655,
 0.011873218230903149,
 -0.024888738989830017,
 -0.024579644203186035,
 0.03972522169351578,
 -0.010065694339573383,
 -0.00940719060599804,
 -0.013257419690489769,
 -0.01002537738531828,
 -0.011732110753655434,
 0.007747493218630552,
 -0.01416454091668129,
 0.007760932203382254,
 0.010280715301632881,
 -0.005053005181252956,
 0.022940106689929962,
 -0.0015496666310355067,
 0.015024627558887005,
 -0.010388226248323917,
 0.004844703245908022,
 0.01245780847966671,
 0.004844703245908022,
 0.01089218258857727,
 -0.006692544091492891,
 -0.0003231621813029051,
 0.005570400506258011,
 -0.012578757479786873,
 0.016381951048970222,
 0.0044885738752782345,
 0.006605191621929407,
 -0.00718306191265583,
 -0.015091821551322937,
 -0.006581673864275217,
 -0.018505288287997246,
 0.0041694012470543385,
 0.003178286598995328,
 -0.018975647166371346,
 0.030291153118014336,
 -0.007465277798473835,
 0.008117061108350754,
 0.009521421045064926,
 -0.0011330625

In [3]:
from langchain.text_splitter import RecursiveCharacterTextSplitter

# Token-based splitter: both sizes below are counted in tokens
# (per the tiktoken encoder), not in characters.
text_splitter = RecursiveCharacterTextSplitter.from_tiktoken_encoder(
    chunk_overlap=20,  # tokens repeated between consecutive chunks
    chunk_size=100,  # tokens per chunk
)

# Sample document used for the chunking, embedding and search examples below.
# NOTE(review): the line starting "Certainly, here are five middle paragraphs"
# looks like leftover generator chatter; it ends up as its own chunk in the
# printed output — confirm whether it is meant to be part of the handbook.
text = """
Welcome to the "Unicorn Enterprises: Where Magic Happens" Employee Handbook! We're thrilled to have you join our team of dreamers, doers, and unicorn enthusiasts. At Unicorn Enterprises, we believe that work should be as enchanting as it is productive. This handbook is your ticket to the magical world of our company, where we'll outline the principles, policies, and practices that guide us on this extraordinary journey. So, fasten your seatbelts and get ready to embark on an adventure like no other!
Certainly, here are five middle paragraphs for your fake employee handbook:

**1: Our Magical Culture**

At Unicorn Enterprises, we take pride in our unique and enchanting company culture. We believe that creativity and innovation flourish best when people are happy and inspired. From our weekly "Wear Your Favorite Mythical Creature Costume" day on Fridays to our in-house unicorn petting zoo, we aim to infuse magic into every corner of our workplace. So, don't be surprised if you find a fairy tale book in the breakroom or a gnome guiding you to the restroom. Our culture is designed to spark your imagination and encourage collaboration among our magical team.

**2: Unicorn Code of Conduct**

While we embrace creativity, we also value professionalism. Our Unicorn Code of Conduct ensures that we maintain a harmonious and respectful environment. Treating all team members, regardless of their unicorn species, with kindness and respect is essential. We also encourage open communication and constructive feedback because, in our world, every opinion matters, just like every horn on a unicorn's head!

**3: Magical Work-Life Balance**

At Unicorn Enterprises, we understand the importance of maintaining a balanced life. We offer flexible work hours, magical mental health days, and even an on-site wizard to provide stress-relief spells when needed. We believe that a happy and well-rested employee is a creative and productive employee. So, don't hesitate to use our relaxation chambers or join a group meditation session under the office rainbow.

**4: Enchanted Benefits**

Our commitment to your well-being extends to our magical benefits package. You'll enjoy a treasure chest of perks, including unlimited unicorn rides, a bottomless cauldron of coffee and potions, and access to our company library filled with spellbinding books. We also offer competitive health and dental plans, ensuring your physical well-being is as robust as your magical spirit.

**5: Continuous Learning and Growth**

At Unicorn Enterprises, we believe in continuous learning and growth. We provide access to a plethora of online courses, enchanted workshops, and wizard-led training sessions. Whether you're aspiring to master new spells or conquer new challenges, we're here to support your personal and professional development.

As we conclude this handbook, remember that at Unicorn Enterprises, the pursuit of excellence is a never-ending quest. Our company's success depends on your passion, creativity, and commitment to making the impossible possible. We encourage you to always embrace the magic within and outside of work, and to share your ideas and innovations to keep our enchanted journey going. Thank you for being a part of our mystical family, and together, we'll continue to create a world where magic and business thrive hand in hand!
"""

# Break the handbook text into chunks, then preview the first three.
chunks = text_splitter.split_text(text)
print(chunks[:3])

['Welcome to the "Unicorn Enterprises: Where Magic Happens" Employee Handbook! We\'re thrilled to have you join our team of dreamers, doers, and unicorn enthusiasts. At Unicorn Enterprises, we believe that work should be as enchanting as it is productive. This handbook is your ticket to the magical world of our company, where we\'ll outline the principles, policies, and practices that guide us on this extraordinary journey. So, fasten your seatbelts and get ready', 'practices that guide us on this extraordinary journey. So, fasten your seatbelts and get ready to embark on an adventure like no other!', 'Certainly, here are five middle paragraphs for your fake employee handbook:']


In [4]:
import numpy as np
import faiss

# Get vector embeddings for the chunks from last example
# (one embeddings request is issued per chunk).
emb = [get_vector_embeddings(chunk) for chunk in chunks]
# FAISS works on float32 matrices; np.array() over Python floats would
# otherwise default to float64, so cast explicitly.
vectors = np.array(emb, dtype="float32")

# Create a FAISS index
# The index dimensionality is taken from the embedding length
# (second axis of the chunk matrix).
index = faiss.IndexFlatL2(vectors.shape[1])
index.add(vectors)

# Function to perform a vector search
def vector_search(query_text, k=1):
    """Look up the chunks whose embeddings are nearest to the query.

    Args:
        query_text: Text to embed and search for.
        k: Maximum number of neighbours to request from the index.

    Returns:
        A list of ``(chunk_text, distance)`` tuples in the order returned
        by ``index.search``. It may hold fewer than ``k`` items when the
        index contains fewer than ``k`` vectors.
    """
    query_vector = get_vector_embeddings(query_text)
    # FAISS expects a 2-D float32 array with one row per query.
    query_matrix = np.array([query_vector], dtype="float32")
    distances, indices = index.search(query_matrix, k)
    # FAISS pads missing neighbours with index -1; without this filter
    # chunks[-1] would silently return the last chunk with a bogus distance.
    return [
        (chunks[i], float(dist))
        for dist, i in zip(distances[0], indices[0])
        if i >= 0
    ]

# Example search
# k is left at its default of 1, so only the single nearest chunk is returned.
# NOTE(review): in the recorded output the top hit is the "culture" chunk, not
# the benefits paragraph that mentions "unlimited unicorn rides" — a larger k
# may be needed to surface it.
user_query = "do we get free unicorn rides?"
search_results = vector_search(user_query)
print(f"Search results for {user_query}:", search_results)

Search results for do we get free unicorn rides?: [('At Unicorn Enterprises, we take pride in our unique and enchanting company culture. We believe that creativity and innovation flourish best when people are happy and inspired. From our weekly "Wear Your Favorite Mythical Creature Costume" day on Fridays to our in-house unicorn petting zoo, we aim to infuse magic into every corner of our workplace. So, don\'t be surprised if you find a fairy tale book in the breakroom or a gnome guiding you to the restroom. Our culture', 0.351819783449173)]


In [5]:
# Function to perform a vector search and then ask
# GPT-3.5-turbo a question:
def search_and_chat(user_query, k=1, model="gpt-3.5-turbo"):
    """Answer a question using only the chunks retrieved for it.

    Runs ``vector_search`` for the query, sends the retrieved chunk texts
    to the chat model as context, and prints both the raw search results
    and the model's reply.

    Args:
        user_query: The question to answer.
        k: Number of chunks to request from ``vector_search``.
        model: Chat model name passed to the chat completions call.

    Returns:
        None. The search results and the reply are printed.
    """
    # Perform the vector search
    search_results = vector_search(user_query, k)
    print(f"Search results: {search_results}\n\n")

    # Send only the chunk texts as context: the distance scores and the
    # Python list/tuple repr are noise for the model. Explicit newlines
    # keep the context separate from the instruction.
    context = "\n\n".join(chunk for chunk, _ in search_results)
    prompt_with_context = (
        f"Context:\n{context}\n\n"
        f"Answer the question: {user_query}"
    )

    # The indentation of the continuation lines is part of the string and
    # is kept exactly as before so the system prompt itself is unchanged.
    system_prompt = """Please answer the
      questions provided by the user. Use only the context
      provided to you to respond to the user, if you don't
      know the answer say \"I don't know\"."""

    # Create a list of messages for the chat
    messages = [
        {"role": "system", "content": system_prompt},
        {"role": "user", "content": prompt_with_context},
    ]

    # Get the model's response
    response = client.chat.completions.create(
        model=model, messages=messages)

    # Print the assistant's reply
    print(f"Response: \n  {response.choices[0].message.content}")

# Example search and chat
# k is left at its default of 1, so only the top-ranked chunk is supplied to
# the model as context.
search_and_chat("How often can I wear a costume to work?")

Search results: [('At Unicorn Enterprises, we take pride in our unique and enchanting company culture. We believe that creativity and innovation flourish best when people are happy and inspired. From our weekly "Wear Your Favorite Mythical Creature Costume" day on Fridays to our in-house unicorn petting zoo, we aim to infuse magic into every corner of our workplace. So, don\'t be surprised if you find a fairy tale book in the breakroom or a gnome guiding you to the restroom. Our culture', 0.4365059733390808)]


Response: 
  You can wear a costume to work every Friday as part of our weekly "Wear Your Favorite Mythical Creature Costume" day.


In [8]:
# Save the index to a file
# Only the FAISS index is written; the `chunks` list that vector_search uses
# to map hits back to text is not persisted by this cell.
faiss.write_index(index, "my_index_file.index")

In [6]:
# Load the index from a file
# Rebinds the module-level `index` that vector_search reads. The file must
# already exist (it is produced by the faiss.write_index call), and `chunks`
# must still be available separately for search results to map back to text.
index = faiss.read_index("my_index_file.index")