# Apply Named Entity Recognition (NER) to identify entities such as names, organizations, and locations in a given text. Perform sentence segmentation on a paragraph and explain its importance in NLP tasks.

In [16]:
import spacy
import pandas as pd
from collections import Counter

In [17]:
# Name of the pretrained spaCy pipeline used by this notebook; the package must
# already be installed in the kernel's environment for the load to succeed.
SPACY_MODEL = "en_core_web_sm"
nlp = spacy.load(SPACY_MODEL)

In [18]:
# Sample paragraph fed to the spaCy pipeline. Adjacent string literals are
# joined by Python at compile time, so this is still one single-line string.
text = (
    "Artificial Intelligence has rapidly transformed the modern world, "
    "influencing industries, governments, and individuals alike. "
    "The concept of machines mimicking human intelligence dates back to the 1950s, "
    "when British mathematician Alan Turing introduced the idea of intelligent machines. "
    "His work at the University of Manchester laid the foundation for what would later "
    "become one of the most influential fields in computer science. "
    "Today, AI is no longer a theoretical idea but a practical technology "
    "deployed across the globe."
)

In [19]:
# Whitespace-delimited word count of the sample paragraph.
words = text.split()
print("Total Words:", len(words))

Total Words: 77


In [20]:
# Run the loaded pipeline over the paragraph; the result's `.ents` attribute is
# what the entity-extraction cell below iterates over.
doc = nlp(text)

In [21]:
# Gather one [text, label] row per named entity that spaCy found in `doc`.
# NOTE(review): labels are model predictions, not ground truth — the recorded
# output below tags "AI" as GPE, so inspect results before relying on them.
entities = [[span.text, span.label_] for span in doc.ents]

# Tabulate the rows, then tally how often each label occurs
# (Counter keeps labels in first-seen order).
df_ner = pd.DataFrame(entities, columns=["Entity", "Label"])
entity_counts = Counter(df_ner["Label"])

print("\nEntity Type Counts:")
for label in entity_counts:
    print(f"{label}: {entity_counts[label]}")

print("\nSample Named Entities:")
print(df_ner.head(25))


Entity Type Counts:
ORG: 2
DATE: 2
NORP: 1
PERSON: 1
GPE: 1

Sample Named Entities:
                         Entity   Label
0       Artificial Intelligence     ORG
1                     the 1950s    DATE
2                       British    NORP
3                   Alan Turing  PERSON
4  the University of Manchester     ORG
5                         Today    DATE
6                            AI     GPE
