# In [1]:
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity

def calculate_cosine_similarity(text1, text2):
    """
    Calculates the TF-IDF cosine similarity between two strings.

    Both strings are vectorized together with a default TfidfVectorizer
    (fitted on just these two texts), and the cosine of the angle between
    the two resulting TF-IDF vectors is returned.

    Parameters:
    text1 (str): The first string.
    text2 (str): The second string.

    Returns:
    float: The cosine similarity score. 0.0 is returned when neither
    string produces any token (e.g. both are empty), since there is no
    vocabulary to compare on.
    """
    vectorizer = TfidfVectorizer()

    # fit_transform raises ValueError ("empty vocabulary") when no document
    # yields a token. Check with the vectorizer's own analyzer so the guard
    # uses exactly the same tokenization rules as the fit below.
    analyzer = vectorizer.build_analyzer()
    if not any(analyzer(text) for text in (text1, text2)):
        return 0.0

    # Row 0 is text1, row 1 is text2.
    tfidf_matrix = vectorizer.fit_transform([text1, text2])

    # Slicing with 0:1 / 1:2 keeps each row two-dimensional, as
    # cosine_similarity expects; the result is a 1x1 matrix.
    similarity = cosine_similarity(tfidf_matrix[0:1], tfidf_matrix[1:2])

    # Convert the NumPy scalar to a plain Python float, as documented.
    return float(similarity[0][0])

# Demo: score two sample sentences that share the phrase
# "Natural Language Processing" and print the result to four decimals.
string1, string2 = (
    "Natural Language Processing is amazing.",
    "I love working on Natural Language Processing projects.",
)
similarity_score = calculate_cosine_similarity(string1, string2)

print(f"Cosine Similarity: {similarity_score:.4f}")


# Output:
# Cosine Similarity: 0.3446
