### Jaccard and Cosine Similarity

In [6]:
import numpy as np
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity

def jaccard_similarity(text1, text2):
    """Return the Jaccard similarity of the two texts' word sets.

    Each text is lower-cased and split on whitespace; the score is
    ``len(intersection) / len(union)`` of the resulting sets.

    Args:
        text1: First text.
        text2: Second text.

    Returns:
        A float between 0.0 and 1.0. When neither text contains a word the
        union is empty and 0.0 is returned instead of dividing by zero.
    """
    words_text1 = set(text1.lower().split())
    words_text2 = set(text2.lower().split())
    union = words_text1 | words_text2
    if not union:
        # Both inputs were empty or whitespace-only: nothing to compare.
        return 0.0
    return len(words_text1 & words_text2) / len(union)

def cosine_similarity_tfidf(text1, text2):
    """Return the cosine similarity between the TF-IDF vectors of two texts.

    A new ``TfidfVectorizer`` is fitted on just these two texts, so the
    vocabulary and weights come from the pair alone.
    """
    doc_vectors = TfidfVectorizer().fit_transform([text1, text2])
    first_vec, second_vec = doc_vectors[0], doc_vectors[1]
    # The result is indexed as a 2-D structure; its single entry is the score.
    score_matrix = cosine_similarity(first_vec, second_vec)
    return score_matrix[0][0]

def detect_plagiarism(text1, text2, jaccard_threshold=0.5, cosine_threshold=0.7):
    """Score two texts with Jaccard and TF-IDF cosine similarity and classify them.

    Both scores are printed to two decimal places. The pair is reported as
    plagiarised when either score is strictly greater than its threshold.

    Args:
        text1: First text.
        text2: Second text.
        jaccard_threshold: Cut-off for the Jaccard score.
        cosine_threshold: Cut-off for the cosine score.

    Returns:
        "Plagiarism Detected" or "No Plagiarism Detected".
    """
    jaccard_sim = jaccard_similarity(text1, text2)
    cosine_sim = cosine_similarity_tfidf(text1, text2)

    print(f"\n\nJaccard Similarity: {jaccard_sim:.2f}")
    print(f"Cosine Similarity: {cosine_sim:.2f}")

    # A single metric over its threshold is enough to flag the pair.
    over_threshold = jaccard_sim > jaccard_threshold or cosine_sim > cosine_threshold
    return "Plagiarism Detected" if over_threshold else "No Plagiarism Detected"

# Read the two passages to compare; the prompts are issued left to right.
text1, text2 = input("Enter text: "), input("\nEnter text: ")

# Score the pair and show the verdict.
result = detect_plagiarism(text1, text2)
print(result)

Enter text: The Industrial Revolution was a transformative period that reshaped economies and societies worldwide. Beginning in the late 18th century, it marked a shift from agrarian economies to industrialized ones, characterized by mechanized production, urbanization, and technological innovation. Factories emerged as centers of mass production, leading to increased productivity but also challenging traditional labor structures. The rise of industries spurred economic growth, but it also brought social challenges, such as poor working conditions and income inequality. Ultimately, the Industrial Revolution laid the foundation for modern economic systems and technological advancements.

Enter text: The Industrial Revolution was a significant turning point that transformed economies and societies. Starting in the late 1700s, it initiated a transition from agriculture-based economies to industrialized ones, introducing mechanized production and urban expansion. Factories became key hubs 

### Levenshtein and Cosine Similarity

In [10]:
import difflib
import numpy as np
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.metrics.pairwise import cosine_similarity

def levenshtein_similarity(text1, text2):
    """Return a character-level similarity ratio between two strings.

    Despite the name, the score is ``difflib.SequenceMatcher.ratio()`` (twice
    the number of matched characters divided by the combined length), not a
    normalised Levenshtein edit distance.

    ``autojunk`` is turned off: with the default heuristic, once the second
    string is 200+ characters long, characters that occur frequently in it are
    ignored when searching for matches, which can collapse the score for
    ordinary paragraphs of prose.

    Args:
        text1: First string.
        text2: Second string.

    Returns:
        A float between 0.0 (nothing in common) and 1.0 (identical).
    """
    matcher = difflib.SequenceMatcher(None, text1, text2, autojunk=False)
    return matcher.ratio()

def cosine_similarity_count(text1, text2):
    """Return the cosine similarity between the term-count vectors of two texts.

    A new ``CountVectorizer`` is fitted on just these two texts.
    """
    count_matrix = CountVectorizer().fit_transform([text1, text2])
    # Two documents were fitted, so the dense array unpacks into two rows.
    first_counts, second_counts = count_matrix.toarray()
    score_matrix = cosine_similarity([first_counts], [second_counts])
    return score_matrix[0][0]

def detect_plagiarism(text1, text2, levenshtein_threshold=0.6, cosine_threshold=0.7):
    """Score two texts with the sequence ratio and count-based cosine similarity.

    Both scores are printed to two decimal places. The pair is reported as
    plagiarised when either score is strictly greater than its threshold.

    Args:
        text1: First text.
        text2: Second text.
        levenshtein_threshold: Cut-off for the ``levenshtein_similarity`` score.
        cosine_threshold: Cut-off for the cosine score.

    Returns:
        The verdict string, prefixed with two newlines.
    """
    lev_sim = levenshtein_similarity(text1, text2)
    cosine_sim = cosine_similarity_count(text1, text2)

    print(f"\n\nLevenshtein Similarity: {lev_sim:.2f}")
    print(f"Cosine Similarity: {cosine_sim:.2f}")

    # A single metric over its threshold is enough to flag the pair.
    over_threshold = lev_sim > levenshtein_threshold or cosine_sim > cosine_threshold
    return "\n\nPlagiarism Detected" if over_threshold else "\n\nNo Plagiarism Detected"

# Read the two passages to compare; the prompts are issued left to right.
text1, text2 = input("Enter text: "), input("\n\nEnter text: ")

# Score the pair and show the verdict.
result = detect_plagiarism(text1, text2)
print(result)

Enter text: Enter text: The Industrial Revolution was a significant turning point that transformed economies and societies. Starting in the late 1700s, it initiated a transition from agriculture-based economies to industrialized ones, introducing mechanized production and urban expansion. Factories became key hubs of mass production, boosting efficiency but also altering traditional labor patterns. While industrial growth stimulated economies, it also created social issues, including harsh working environments and wealth disparities. In the end, the Industrial Revolution played a crucial role in shaping contemporary economic models and technological progress.


Enter text: Enter text: The Industrial Revolution was a significant turning point that transformed economies and societies. Starting in the late 1700s, it initiated a transition from agriculture-based economies to industrialized ones, introducing mechanized production and urban expansion. Factories became key hubs of mass produc

### Plagiarism and AI Generated Text Detector

In [19]:
import difflib
import numpy as np
from sklearn.feature_extraction.text import CountVectorizer, TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity
import openai

def levenshtein_similarity(text1, text2):
    """Return a character-level similarity ratio between two strings.

    Despite the name, the score is ``difflib.SequenceMatcher.ratio()`` (twice
    the number of matched characters divided by the combined length), not a
    normalised Levenshtein edit distance.

    ``autojunk`` is turned off: with the default heuristic, once the second
    string is 200+ characters long, characters that occur frequently in it are
    ignored when searching for matches, which can collapse the score for
    ordinary paragraphs of prose.

    Args:
        text1: First string.
        text2: Second string.

    Returns:
        A float between 0.0 (nothing in common) and 1.0 (identical).
    """
    matcher = difflib.SequenceMatcher(None, text1, text2, autojunk=False)
    return matcher.ratio()

def cosine_similarity_tfidf(text1, text2):
    """Return the cosine similarity between the TF-IDF vectors of two texts.

    A new ``TfidfVectorizer`` is fitted on just these two texts, so the
    vocabulary and weights come from the pair alone.
    """
    doc_vectors = TfidfVectorizer().fit_transform([text1, text2])
    first_vec, second_vec = doc_vectors[0], doc_vectors[1]
    # The result is indexed as a 2-D structure; its single entry is the score.
    score_matrix = cosine_similarity(first_vec, second_vec)
    return score_matrix[0][0]

def detect_ai_generated_text(text, ai_threshold=0.6, ai_samples=None):
    """Flag ``text`` as AI-generated when it closely matches a reference sample.

    The text is compared to every reference sample with
    ``cosine_similarity_tfidf``; the highest score is printed and then tested
    against ``ai_threshold``.

    NOTE(review): this only measures word overlap with the reference samples,
    so it recognises near-copies of those samples rather than AI authorship in
    general.

    Args:
        text: Text to classify.
        ai_threshold: The text is flagged when the best score is strictly
            greater than this value.
        ai_samples: Optional iterable of reference texts. When ``None`` the
            three built-in samples are used.

    Returns:
        "AI-Generated Text Detected" or "Human-Written Text".
    """
    if ai_samples is None:
        ai_samples = [
            "Bu məqalə süni intellekt tərəfindən yazılmışdır.",
            "Bu, bir AI tərəfindən yaradılmış mətn nümunəsidir.",
            "Süni intellekt əsaslı məzmun yaradılması.",
        ]

    # default=0.0 keeps an empty sample collection from raising inside max().
    max_similarity = max(
        (cosine_similarity_tfidf(text, sample) for sample in ai_samples),
        default=0.0,
    )

    print(f"\nMax AI Similarity: {max_similarity:.2f}")

    if max_similarity > ai_threshold:
        return "AI-Generated Text Detected"
    return "Human-Written Text"

def detect_plagiarism(text1, text2, levenshtein_threshold=0.6, cosine_threshold=0.7):
    """Score two texts with the sequence ratio and TF-IDF cosine similarity.

    Both scores are printed to two decimal places. The pair is reported as
    plagiarised when either score is strictly greater than its threshold.

    Args:
        text1: First text.
        text2: Second text.
        levenshtein_threshold: Cut-off for the ``levenshtein_similarity`` score.
        cosine_threshold: Cut-off for the cosine score.

    Returns:
        "Plagiarism Detected" or "No Plagiarism Detected".
    """
    lev_sim = levenshtein_similarity(text1, text2)
    cosine_sim = cosine_similarity_tfidf(text1, text2)

    print(f"\n\nLevenshtein Similarity: {lev_sim:.2f}")
    print(f"Cosine Similarity: {cosine_sim:.2f}")

    # A single metric over its threshold is enough to flag the pair.
    over_threshold = lev_sim > levenshtein_threshold or cosine_sim > cosine_threshold
    return "Plagiarism Detected" if over_threshold else "No Plagiarism Detected"

# Read the passage under test and the passage to compare it with;
# the prompts are issued left to right.
text1, text2 = input("Enter text: "), input("\nEnter text: ")

# Authorship check runs on the first passage only.
authorship_result = detect_ai_generated_text(text1)
print(authorship_result)

# Plagiarism check compares the two passages.
plagiarism_result = detect_plagiarism(text1, text2)
print(plagiarism_result)

Enter text: "Bu məqalə süni intellekt tərəfindən yazılmışdır."

Enter text: "Bu məqalə süni intellekt tərəfindən yazılmışdır."

Max AI Similarity: 1.00
AI-Generated Text Detected


Levenshtein Similarity: 1.00
Cosine Similarity: 1.00
Plagiarism Detected
