# In [None]:
# CSV to embeddings: embed a CSV text column and save the vectors to a new CSV file
import pandas as pd
from langchain_huggingface.embeddings import HuggingFaceEmbeddings

# Load the CSV file
file_path = 'articles.csv'
try:
    df = pd.read_csv(file_path)
except FileNotFoundError:
    # Name the missing path for the user, then let the original error propagate
    print(f"File not found: {file_path}")
    raise

# Fail early if the text column is missing, before any embedding work starts
text_column = 'articles'  # Update this based on the actual column name
if text_column not in df.columns:
    # list(...) reports plain column names instead of the pandas Index repr
    raise KeyError(
        f"Column '{text_column}' not found in the DataFrame. "
        f"Available columns: {list(df.columns)}"
    )

# Initialize the HuggingFaceEmbeddings model once at module level;
# generate_embeddings() below reads this shared `embeddings` instance.
embedding_model_name = "sentence-transformers/all-MiniLM-L6-v2"
embeddings = HuggingFaceEmbeddings(model_name=embedding_model_name)

# Generate embeddings
def generate_embeddings(texts, model=None):
    """Embed a collection of texts with a single batched model call.

    Args:
        texts: Iterable of strings (e.g. a pandas Series or a list).
        model: Optional object exposing ``embed_documents(list_of_str)``.
            Defaults to the module-level ``embeddings`` model.

    Returns:
        A list with one embedding per input text, in input order. An empty
        input yields an empty list without calling the model.

    Raises:
        TypeError: If any entry is not a string (for example a NaN coming
            from an empty CSV cell); the message names the first offending
            position.
    """
    documents = list(texts)
    if not documents:
        return []

    # Validate up front so a bad cell fails with a clear message rather than
    # an obscure error from deep inside the embedding backend.
    for position, document in enumerate(documents):
        if not isinstance(document, str):
            raise TypeError(
                f"Expected a string at position {position}, "
                f"got {type(document).__name__}: {document!r}"
            )

    if model is None:
        model = embeddings
    # embed_documents handles the whole batch in one call instead of issuing
    # one embed_query call per text.
    return model.embed_documents(documents)

# Embed every row of the text column and attach the vectors as a new column
article_vectors = generate_embeddings(df[text_column])
df['embeddings'] = article_vectors

# Write each text next to its embedding, leaving out the DataFrame index
output_file = 'embeddings.csv'
export_columns = [text_column, 'embeddings']
export_frame = df[export_columns]
export_frame.to_csv(output_file, index=False)
print(f"Embeddings saved to {output_file}")
