# Implement Named Entity Recognition.


In [8]:
# Step 1: Install spaCy (if not already installed)
!pip install -U spacy

# Step 2: Download the English model
!python -m spacy download en_core_web_sm

# Step 3: Import spaCy
import spacy

# Step 4: Load English model
nlp = spacy.load("en_core_web_sm")




Collecting en-core-web-sm==3.8.0
  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.8.0/en_core_web_sm-3.8.0-py3-none-any.whl (12.8 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m12.8/12.8 MB[0m [31m83.8 MB/s[0m eta [36m0:00:00[0m
[?25h[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')
[38;5;3m⚠ Restart to reload dependencies[0m
If you are in a Jupyter or Colab notebook, you may need to restart Python in
order to load all the package's dependencies. You can do this by selecting the
'Restart kernel' or 'Restart runtime' option.
Named Entities:

Annasaheb Dange College of Engineering and Technology (ORG)
Sangli (GPE)
Maharashtra (NORP)
Artificial Intelligence and Data Science Engineering (ORG)


In [9]:
# Step 5: Custom text
text = """
Prathamesh Jadhav is studying at Annasaheb Dange College of Engineering and Technology in Sangli.
He lives in Maharashtra and is pursuing a degree in Artificial Intelligence and Data Science Engineering.
"""

# Step 6: Process the text
doc = nlp(text)

# Step 7: Display named entities
print("Named Entities:\n")
for ent in doc.ents:
    print(f"{ent.text} ({ent.label_})")

Named Entities:

Annasaheb Dange College of Engineering and Technology (ORG)
Sangli (GPE)
Maharashtra (NORP)
Artificial Intelligence and Data Science Engineering (ORG)


# Named Entity Recognition (NER)

In [10]:
# Step 1: Install and load spaCy
!pip install -U spacy
!python -m spacy download en_core_web_sm

# Step 2: Import required libraries
import spacy
from collections import Counter

# Step 3: Load English NLP model
nlp = spacy.load("en_core_web_sm")

# Step 4: Input a paragraph from a newspaper or academic article
text = """
In a groundbreaking development, researchers at the Massachusetts Institute of Technology (MIT) have created a new AI model capable of detecting early-stage Alzheimer's disease.
The study, published in the journal Nature Medicine, involved over 5,000 participants from the United States, Canada, and Germany.
Dr. Emily Chen, a leading neuroscientist, said the model could change the landscape of preventive healthcare.
Funding for the project was provided by the National Institutes of Health (NIH) and Google Health.
"""

# Step 5: Process the text with spaCy
doc = nlp(text)

# Step 6: Extract and count named entities by type
entity_counts = Counter(ent.label_ for ent in doc.ents)

# Step 7: Display named entities and their types
print("Named Entities Found:\n")
for ent in doc.ents:
    print(f"{ent.text} ({ent.label_})")

# Step 8: Display counts by entity type
print("\n\nEntity Counts by Type:\n")
for label, count in entity_counts.items():
    print(f"{label} ({spacy.explain(label)}): {count}")


Collecting en-core-web-sm==3.8.0
  Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.8.0/en_core_web_sm-3.8.0-py3-none-any.whl (12.8 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m12.8/12.8 MB[0m [31m100.9 MB/s[0m eta [36m0:00:00[0m
[?25h[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')
[38;5;3m⚠ Restart to reload dependencies[0m
If you are in a Jupyter or Colab notebook, you may need to restart Python in
order to load all the package's dependencies. You can do this by selecting the
'Restart kernel' or 'Restart runtime' option.
Named Entities Found:

the Massachusetts Institute of Technology (ORG)
MIT (ORG)
AI (GPE)
Nature Medicine (PRODUCT)
5,000 (CARDINAL)
the United States (GPE)
Canada (GPE)
Germany (GPE)
Emily Chen (PERSON)
the National Institutes of Health (ORG)
NIH (ORG)
Google Health (ORG)


Entity Counts by Type:

ORG (Companies, agencies, instituti