In [None]:
import os
from cerebras.cloud.sdk import Cerebras
from langchain.memory import ConversationBufferMemory
from langchain.chains import ConversationChain

# Read the Cerebras API key from the environment and fail fast when it is
# missing or empty, before any client object is built.
api_key = os.getenv("CEREBRAS_API_KEY")
if not api_key:
    raise ValueError("CEREBRAS_API_KEY environment variable is not set.")

# SDK client used by get_cerebras_response for every request
client = Cerebras(api_key=api_key)

# LangChain buffer that accumulates the user and AI turns of the conversation
memory = ConversationBufferMemory()

# Function to interact with Cerebras API
def get_cerebras_response(prompt):
    """Send ``prompt`` to the Cerebras chat model and return the reply text.

    The prompt is sent as a single user-role message to the ``llama3.1-8b``
    model through the module-level ``client``.

    Args:
        prompt: Text to send as the user message.

    Returns:
        The ``content`` of the first choice's message in the completion.
    """
    response = client.chat.completions.create(
        messages=[{"role": "user", "content": prompt}],
        model="llama3.1-8b",
    )
    # The SDK returns the message as an object (ChoiceMessage), not a dict, so
    # the text must be read as an attribute; subscripting it with ["content"]
    # fails at runtime.
    return response.choices[0].message.content

# Create a conversation chain
def chat():
    """Run an interactive console chat backed by the Cerebras API.

    Reads lines from standard input until the user types ``/exit`` (or input
    ends). Each line is sent to ``get_cerebras_response`` together with the
    conversation so far, the reply is printed, and both turns are recorded in
    the module-level ``memory``.
    """
    # The banner must name the same command the loop actually checks for.
    print("Welcome to the Cerebras Chat! Type '/exit' to end the conversation.")
    while True:
        try:
            user_input = input("You: ")
        except (EOFError, KeyboardInterrupt):
            # Closed stdin or an interrupted prompt: end the session cleanly
            # instead of surfacing a traceback.
            print("Goodbye!")
            break

        command = user_input.strip()
        if command.lower() == "/exit":
            print("Goodbye!")
            break
        if not command:
            # Nothing to send; ask again rather than calling the API.
            continue

        # Read the history BEFORE recording this turn. Loading it afterwards
        # would put the current input into the prompt twice: once inside the
        # history and once on the explicit "User:" line below.
        history = memory.load_memory_variables({})["history"]
        memory.chat_memory.add_user_message(user_input)

        # Build the prompt from prior turns (if any) plus the current turn.
        current_turn = f"User: {user_input}\nAI:"
        prompt = f"{history}\n{current_turn}" if history else current_turn

        ai_response = get_cerebras_response(prompt)

        # Record the reply so the next turn sees it in the history.
        memory.chat_memory.add_ai_message(ai_response)

        print(f"AI: {ai_response}")

# Start the interactive chat loop when this code runs as the main module;
# the guard keeps chat() from being called if the code is imported instead.
if __name__ == "__main__":
    chat()

In [3]:
import os
from cerebras.cloud.sdk import Cerebras
from langchain.memory import ConversationBufferMemory

# Look up the API key in the environment; a missing or empty value is treated
# as a configuration error and stops the cell here.
api_key = os.getenv("CEREBRAS_API_KEY")
if api_key in (None, ""):
    raise ValueError("CEREBRAS_API_KEY environment variable is not set.")

# Client object through which get_cerebras_response issues its requests
client = Cerebras(api_key=api_key)

# Conversation buffer that chat() appends user and AI messages to
memory = ConversationBufferMemory()

# Function to interact with Cerebras API
def get_cerebras_response(prompt):
    """Ask the Cerebras chat model for a reply to ``prompt``.

    The prompt is sent as one user-role message to the ``llama3.1-8b`` model
    through the module-level ``client``. The raw completion object is printed
    for inspection before the reply text is returned.

    Args:
        prompt: Text to send as the user message.

    Returns:
        The ``content`` of the first choice's message in the completion.
    """
    user_turn = {"role": "user", "content": prompt}
    completion = client.chat.completions.create(
        model="llama3.1-8b",
        messages=[user_turn],
    )

    # Debugging aid: dump the whole completion so its structure can be inspected
    print("Response Object:", completion)

    # The reply text lives on the first choice's message object
    first_choice = completion.choices[0]
    return first_choice.message.content

# Create a conversation chain
def chat():
    """Run an interactive console chat backed by the Cerebras API.

    Reads lines from standard input until the user types ``/exit`` (or input
    ends). Each line is sent to ``get_cerebras_response`` together with the
    conversation so far, the reply is printed, and both turns are recorded in
    the module-level ``memory``.
    """
    print("Welcome to the Cerebras Chat! Type '/exit' to end the conversation.")
    while True:
        try:
            user_input = input("You: ")
        except (EOFError, KeyboardInterrupt):
            # Closed stdin or an interrupted prompt: end the session cleanly
            # instead of surfacing a traceback.
            print("Goodbye!")
            break

        command = user_input.strip()
        if command.lower() == "/exit":
            print("Goodbye!")
            break
        if not command:
            # Nothing to send; ask again rather than calling the API.
            continue

        # Read the history BEFORE recording this turn. Loading it afterwards
        # would put the current input into the prompt twice: once inside the
        # history and once on the explicit "User:" line below.
        history = memory.load_memory_variables({})["history"]
        memory.chat_memory.add_user_message(user_input)

        # Build the prompt from prior turns (if any) plus the current turn.
        current_turn = f"User: {user_input}\nAI:"
        prompt = f"{history}\n{current_turn}" if history else current_turn

        ai_response = get_cerebras_response(prompt)

        # Record the reply so the next turn sees it in the history.
        memory.chat_memory.add_ai_message(ai_response)

        print(f"AI: {ai_response}")

# Start the interactive chat loop when this code runs as the main module;
# the guard keeps chat() from being called if the code is imported instead.
if __name__ == "__main__":
    chat()

Welcome to the Cerebras Chat! Type '/exit' to end the conversation.
Response Object: ChatCompletion(id='chatcmpl-6bf7b910-796e-4a38-ade9-5a83b8aa7050', choices=[Choice(finish_reason='stop', index=0, message=ChoiceMessage(role='assistant', content='Hello, how can I assist you today?', tool_calls=None), logprobs=None)], created=1737920853, model='llama3.1-8b', object='chat.completion', system_fingerprint='fp_6381a6c109', time_info=TimeInfo(completion_time=0.004537883, prompt_time=0.002304832, queue_time=9.4071e-05, total_time=0.008230447769165039, created=1737920853), usage=Usage(completion_tokens=10, prompt_tokens=45, total_tokens=55), service_tier=None)
AI: Hello, how can I assist you today?
Response Object: ChatCompletion(id='chatcmpl-f8e36301-7b3f-48af-81f7-743f1072cfcf', choices=[Choice(finish_reason='stop', index=0, message=ChoiceMessage(role='assistant', content="I'm functioning within normal parameters, thank you for asking. I'm a large language model, so I don't have emotions or

In [None]:
import os
from cerebras.cloud.sdk import Cerebras
from langchain.memory import ConversationBufferMemory
import Prompts  # Import the system prompt

# Initialize Cerebras client. The API key comes from the environment; a
# missing or empty value is a configuration error, so fail before any request.
api_key = os.environ.get("CEREBRAS_API_KEY")
if not api_key:
    raise ValueError("CEREBRAS_API_KEY environment variable is not set.")

client = Cerebras(api_key=api_key)

# Initialize LangChain memory
memory = ConversationBufferMemory()

# The system prompt is deliberately NOT written into memory.
# get_cerebras_response already sends Prompts.SYSTEM_PROMPT in the system role
# on every request; storing it here as an AI message would replay it inside the
# history of every prompt, attributed to the assistant, duplicating the
# instructions under the wrong role.

# Function to interact with Cerebras API
def get_cerebras_response(prompt):
    """Ask the Cerebras chat model for a reply to ``prompt``.

    The request carries two messages: ``Prompts.SYSTEM_PROMPT`` in the system
    role, followed by ``prompt`` in the user role. It is sent to the
    ``llama3.1-8b`` model through the module-level ``client``. The raw
    completion object is printed for inspection before the reply is returned.

    Args:
        prompt: Text to send as the user message.

    Returns:
        The ``content`` of the first choice's message in the completion.
    """
    conversation = [
        {"role": "system", "content": Prompts.SYSTEM_PROMPT},  # imported system prompt
        {"role": "user", "content": prompt},
    ]
    completion = client.chat.completions.create(
        model="llama3.1-8b",
        messages=conversation,
    )

    # Debugging aid: dump the whole completion so its structure can be inspected
    print("Response Object:", completion)

    # The reply text lives on the first choice's message object
    first_choice = completion.choices[0]
    return first_choice.message.content

# Create a conversation chain
def chat():
    """Run an interactive console chat backed by the Cerebras API.

    Reads lines from standard input until the user types ``/exit`` (or input
    ends). Each line is sent to ``get_cerebras_response`` together with the
    conversation so far, the reply is printed, and both turns are recorded in
    the module-level ``memory``.
    """
    print("Welcome to the Cerebras Chat! Type '/exit' to end the conversation.")
    while True:
        try:
            user_input = input("You: ")
        except (EOFError, KeyboardInterrupt):
            # Closed stdin or an interrupted prompt: end the session cleanly
            # instead of surfacing a traceback.
            print("Goodbye!")
            break

        command = user_input.strip()
        if command.lower() == "/exit":
            print("Goodbye!")
            break
        if not command:
            # Nothing to send; ask again rather than calling the API.
            continue

        # Read the history BEFORE recording this turn. Loading it afterwards
        # would put the current input into the prompt twice: once inside the
        # history and once on the explicit "User:" line below.
        history = memory.load_memory_variables({})["history"]
        memory.chat_memory.add_user_message(user_input)

        # Build the prompt from prior turns (if any) plus the current turn.
        current_turn = f"User: {user_input}\nAI:"
        prompt = f"{history}\n{current_turn}" if history else current_turn

        ai_response = get_cerebras_response(prompt)

        # Record the reply so the next turn sees it in the history.
        memory.chat_memory.add_ai_message(ai_response)

        print(f"AI: {ai_response}")

# Start the interactive chat loop when this code runs as the main module;
# the guard keeps chat() from being called if the code is imported instead.
if __name__ == "__main__":
    chat()

In [5]:
from sentence_transformers import SentenceTransformer

# Load the pre-trained all-MiniLM-L6-v2 sentence-embedding model
model = SentenceTransformer("all-MiniLM-L6-v2")

# Example sentences to embed
sentences = [
    "Why is fast inference important?",
    "Another example sentence.",
]

# Encode all sentences in a single call
embeddings = model.encode(sentences)

# Show each embedding, numbering the sentences from 1
for number, embedding in enumerate(embeddings, start=1):
    print(f"Sentence {number} embedding: {embedding}")





modules.json:   0%|          | 0.00/349 [00:00<?, ?B/s]

config_sentence_transformers.json:   0%|          | 0.00/116 [00:00<?, ?B/s]

README.md:   0%|          | 0.00/10.7k [00:00<?, ?B/s]

sentence_bert_config.json:   0%|          | 0.00/53.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/612 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/90.9M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/350 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/112 [00:00<?, ?B/s]

1_Pooling/config.json:   0%|          | 0.00/190 [00:00<?, ?B/s]

Sentence 1 embedding: [ 8.06947052e-03 -2.71037910e-02  1.46680363e-02  2.53898632e-02
  8.83517340e-02  8.36232826e-02 -9.71423090e-03 -2.15860885e-02
  1.32945910e-01  7.30283419e-03  5.35557568e-02  4.74516749e-02
 -7.58148283e-02  1.85709894e-02  2.10473891e-02 -7.62794316e-02
  4.90425862e-02  2.82031316e-02 -1.04074053e-01 -1.06027097e-01
 -7.64405206e-02 -7.09755868e-02  3.54747591e-03 -5.77596501e-02
  1.23879053e-02 -2.61637568e-02 -7.29246736e-02  5.60407620e-03
  4.58459519e-02 -7.74129927e-02  3.91115667e-03  8.99396017e-02
  5.18182442e-02 -2.04544906e-02 -7.04014301e-02  4.11856100e-02
  1.38570555e-02  4.05999869e-02  5.35294414e-02  7.36391246e-02
 -1.86293647e-02 -8.58724350e-04 -6.17122278e-03  1.55163156e-02
  4.34640869e-02 -1.53533416e-02  5.85178770e-02  6.05299473e-02
 -2.31038909e-02 -8.63915868e-03 -8.17053542e-02  5.16521484e-02
 -3.93878669e-02 -3.19278315e-02  2.04254128e-02  5.16047403e-02
  2.42191944e-02  4.90597971e-02 -1.19914291e-02 -2.75306050e-02
 -4