In [None]:
import pandas as pd
from sentence_transformers import SentenceTransformer, util

# Score the semantic similarity of row-aligned sentence pairs taken from two
# sheets of 'Book1.xlsx' and write Sheet1 plus a 'Similarity_Score' column to
# 'output_file.xlsx'. Row i of Sheet1 is compared with row i of Sheet2.

# Column in each sheet that holds the sentence to compare. Adjust these to
# match the actual header names in the workbook.
SHEET1_COLUMN = 'Sen'
SHEET2_COLUMN = 'HJ'

# Read both sheets in one pass over the workbook: passing a list of sheet
# names makes read_excel return a {sheet_name: DataFrame} dict.
sheets = pd.read_excel('Book1.xlsx', sheet_name=['Sheet1', 'Sheet2'])
sheet1_df = sheets['Sheet1']
sheet2_df = sheets['Sheet2']

# Validate the inputs before doing any expensive work (model load, encoding)
# so that a bad workbook fails immediately with an actionable message.
for sheet_name, frame, column in (
    ('Sheet1', sheet1_df, SHEET1_COLUMN),
    ('Sheet2', sheet2_df, SHEET2_COLUMN),
):
    if column not in frame.columns:
        raise KeyError(
            f"Column {column!r} not found in {sheet_name}; "
            f"available columns: {list(frame.columns)}"
        )

# Rows are paired by position, so differing lengths would leave some rows
# without a partner and the scores could not be attached to Sheet1.
if len(sheet1_df) != len(sheet2_df):
    raise ValueError(
        f"Sheet1 has {len(sheet1_df)} rows but Sheet2 has {len(sheet2_df)}; "
        "both sheets must have the same number of rows to be compared pairwise."
    )

# Load pre-trained Sentence-BERT model
model = SentenceTransformer('paraphrase-MiniLM-L6-v2')

# Pair sentences strictly by position, independent of the DataFrame index.
left_sentences = sheet1_df[SHEET1_COLUMN].reset_index(drop=True)
right_sentences = sheet2_df[SHEET2_COLUMN].reset_index(drop=True)

# Empty Excel cells are read as NaN, which cannot be embedded. Such rows keep
# a NaN score instead of aborting the whole run.
has_both = (left_sentences.notna() & right_sentences.notna()).to_numpy()

# Calculate similarity scores
similarity_scores = [float('nan')] * len(sheet1_df)

if has_both.any():
    # Encode each column as one batch rather than one model call per row;
    # astype(str) guards against numeric cells, which the tokenizer rejects.
    left_embeddings = model.encode(
        left_sentences[has_both].astype(str).tolist(), convert_to_tensor=True
    )
    right_embeddings = model.encode(
        right_sentences[has_both].astype(str).tolist(), convert_to_tensor=True
    )

    # pairwise_cos_sim returns cos_sim(a[i], b[i]) for each i, avoiding the
    # full N x N matrix that cos_sim / pytorch_cos_sim would build.
    pair_scores = util.pairwise_cos_sim(left_embeddings, right_embeddings).tolist()

    for position, score in zip(has_both.nonzero()[0].tolist(), pair_scores):
        similarity_scores[position] = score

# Add similarity scores to a new column in Sheet1 (lengths were checked above)
sheet1_df['Similarity_Score'] = similarity_scores

# Save the results back to Excel
sheet1_df.to_excel('output_file.xlsx', index=False)
