In [1]:
pip install gensim



In [3]:
pip install nltk



In [8]:
import nltk
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize, sent_tokenize
import heapq

# Download the necessary NLTK data
nltk.download('punkt')
nltk.download('stopwords')

def summarize_text(text, summary_length=2):
    sentences = sent_tokenize(text)
    stop_words = set(stopwords.words('english'))
    word_frequencies = {}
    for word in word_tokenize(text):
        if word.lower() not in stop_words:
            if word not in word_frequencies:
                word_frequencies[word] = 1
            else:
                word_frequencies[word] += 1

    max_frequency = max(word_frequencies.values())
    for word in word_frequencies:
        word_frequencies[word] = word_frequencies[word] / max_frequency
    sentence_scores = {}
    for sent in sentences:
        for word in word_tokenize(sent.lower()):
            if word in word_frequencies:
                if len(sent.split(' ')) < 30:
                    if sent not in sentence_scores:
                        sentence_scores[sent] = word_frequencies[word]
                    else:
                        sentence_scores[sent] += word_frequencies[word]

    summary_sentences = heapq.nlargest(summary_length, sentence_scores, key=sentence_scores.get)
    summary = ' '.join(summary_sentences)
    return summary

text = """
Artificial Intelligence (AI) is a rapidly advancing field of computer science concerned with building smart machines capable of performing tasks that typically require human intelligence. AI is an interdisciplinary field, drawing on insights from mathematics, computer science, psychology, neuroscience, cognitive science, linguistics, operations research, economics, and many other disciplines. Research in AI has produced numerous advances in areas such as reasoning, knowledge representation, natural language processing, perception, and the ability to move and manipulate objects. AI can be categorized into narrow AI, which is designed for a specific task, and general AI, which has the ability to perform any intellectual task that a human can do. While narrow AI is already prevalent in various applications, general AI remains a long-term goal. AI has the potential to revolutionize industries, but it also raises ethical concerns regarding privacy, employment, and the impact on society.
"""
def print_summary_in_lines(summary):
    sentences = summary.split('. ')
    for sentence in sentences:
        print(sentence.strip() + '.')
summary = summarize_text(text, summary_length=2)
print("Original Text Length:", len(text.split()))
print("Summary Text Length:", len(summary.split()))
#print("\nSummary:\n", summary)
print("Summary in new line\n")
print_summary_in_lines(summary)

Original Text Length: 142
Summary Text Length: 50
Summary in new line

AI is an interdisciplinary field, drawing on insights from mathematics, computer science, psychology, neuroscience, cognitive science, linguistics, operations research, economics, and many other disciplines.
Research in AI has produced numerous advances in areas such as reasoning, knowledge representation, natural language processing, perception, and the ability to move and manipulate objects..


[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


In [5]:
pip install transformers



In [9]:
from transformers import pipeline
summarizer = pipeline("summarization", model="facebook/bart-large-cnn")

def bert_summarize(text, max_length=130, min_length=30):

    summary = summarizer(text, max_length=max_length, min_length=min_length, do_sample=False)
    return summary[0]['summary_text']

text = """
Artificial Intelligence (AI) is a rapidly advancing field of computer science concerned with building smart machines capable of performing tasks that typically require human intelligence. AI is an interdisciplinary field, drawing on insights from mathematics, computer science, psychology, neuroscience, cognitive science, linguistics, operations research, economics, and many other disciplines. Research in AI has produced numerous advances in areas such as reasoning, knowledge representation, natural language processing, perception, and the ability to move and manipulate objects. AI can be categorized into narrow AI, which is designed for a specific task, and general AI, which has the ability to perform any intellectual task that a human can do. While narrow AI is already prevalent in various applications, general AI remains a long-term goal. AI has the potential to revolutionize industries, but it also raises ethical concerns regarding privacy, employment, and the impact on society.
"""
def print_summary_in_lines(summary):
    sentences = summary.split('. ')
    for sentence in sentences:
        print(sentence.strip() + '.')
summary = bert_summarize(text, max_length=50, min_length=25)
print("Original Text Length:", len(text.split()))
print("Summary Text Length:", len(summary.split()))
print("\nSummary:\n", summary)
print_summary_in_lines(summary)


Original Text Length: 142
Summary Text Length: 40

Summary:
 Artificial Intelligence (AI) is a rapidly advancing field of computer science. It is concerned with building smart machines capable of performing tasks that typically require human intelligence. AI has the potential to revolutionize industries, but it also raises ethical concerns
Artificial Intelligence (AI) is a rapidly advancing field of computer science.
It is concerned with building smart machines capable of performing tasks that typically require human intelligence.
AI has the potential to revolutionize industries, but it also raises ethical concerns.
