In [None]:
!pip install spacy

import spacy
import pandas as pd

# Load the spaCy pipeline once; the same `nlp` object is called on every
# sentence further down.
# NOTE(review): the `pip install spacy` line above installs only the library,
# not the "en_core_web_sm" model package. This call presumably relies on the
# model already being present in the environment (e.g. installed via
# `python -m spacy download en_core_web_sm`) — confirm for the target runtime.
nlp = spacy.load("en_core_web_sm")

# Sample sentences fed to the entity recognizer in the rest of the script.
corpus = [
    "Google hired John Doe as a software engineer in California.",
    "Dr. Smith published a paper at MIT on Artificial Intelligence.",
    "Facebook partnered with Jane Miller to lead the new research team.",
    "Amazon announced that Michael Johnson will join as VP of Cloud Computing."
]

# Echo the raw input as a dash-prefixed list, one sentence per line.
print("Original Text Dataset:\n")
for sentence in corpus:
    print(f"- {sentence}")
# Per-sentence report: the sentence itself, one indented line per detected
# entity (text plus label), then a blank separator line.
print("\n--- Named Entity Recognition Results ---\n")
for sentence in corpus:
    parsed = nlp(sentence)
    report = [f"Text: {sentence}"]
    report.extend(f" - {entity.text} ({entity.label_})" for entity in parsed.ents)
    # The trailing empty item becomes the blank line that separates sentences.
    report.append("")
    print("\n".join(report))

# Build two parallel columns: every sentence contributes one row for each
# (PERSON, ORG) combination found among its entities.
persons = []
organizations = []

for sentence in corpus:
    parsed = nlp(sentence)
    people = [entity.text for entity in parsed.ents if entity.label_ == "PERSON"]
    companies = [entity.text for entity in parsed.ents if entity.label_ == "ORG"]

    # Person-major ordering; a sentence missing either label yields no rows.
    matches = [(who, where) for who in people for where in companies]
    persons.extend(who for who, _ in matches)
    organizations.extend(where for _, where in matches)

df = pd.DataFrame({"Person": persons, "Organization": organizations})

print("\n--- Extracted Structured Information ---\n")
print(df)

# Write the table to disk without the positional index column.
df.to_csv("ner_results.csv", index=False)
print("\nResults saved as ner_results.csv")


Original Text Dataset:

- Google hired John Doe as a software engineer in California.
- Dr. Smith published a paper at MIT on Artificial Intelligence.
- Facebook partnered with Jane Miller to lead the new research team.
- Amazon announced that Michael Johnson will join as VP of Cloud Computing.

--- Named Entity Recognition Results ---

Text: Google hired John Doe as a software engineer in California.
 - Google (ORG)
 - John Doe (PERSON)
 - California (GPE)

Text: Dr. Smith published a paper at MIT on Artificial Intelligence.
 - Smith (PERSON)
 - MIT (ORG)
 - Artificial Intelligence (ORG)

Text: Facebook partnered with Jane Miller to lead the new research team.
 - Jane Miller (PERSON)

Text: Amazon announced that Michael Johnson will join as VP of Cloud Computing.
 - Amazon (ORG)
 - Michael Johnson (PERSON)
 - Cloud Computing (PERSON)


--- Extracted Structured Information ---

            Person             Organization
0         John Doe                   Google
1            Smith   