In [1]:
import spacy

In [2]:
# Load the small English pipeline. The model package is downloaded only when
# it is not installed yet, so re-running this cell does not reinstall it.
MODEL_NAME = "en_core_web_sm"

try:
    nlp = spacy.load(MODEL_NAME)
except OSError:
    # spacy.load raises OSError when the model package cannot be found.
    # spacy.cli.download is the Python entry point of `python -m spacy download`
    # and runs inside this kernel, whereas `!python` may resolve to a different
    # interpreter than the one the notebook is using.
    from spacy.cli import download as download_model

    download_model(MODEL_NAME)
    # If this load still fails right after installation, restart the kernel
    # and run the cell again so the new package is picked up.
    nlp = spacy.load(MODEL_NAME)

Collecting en-core-web-sm==3.8.0
  Using cached https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.8.0/en_core_web_sm-3.8.0-py3-none-any.whl (12.8 MB)
[38;5;2m✔ Download and installation successful[0m
You can now load the package via spacy.load('en_core_web_sm')
[38;5;3m⚠ Restart to reload dependencies[0m
If you are in a Jupyter or Colab notebook, you may need to restart Python in
order to load all the package's dependencies. You can do this by selecting the
'Restart kernel' or 'Restart runtime' option.


In [3]:
# Sample sentence for the part-of-speech tagging demo.
text: str = 'Google is buying a startup for $1 billion.'

In [4]:
# Process the sample sentence with the loaded spaCy pipeline.
doc = nlp(text)

In [6]:
# Tabulate every token: its text, coarse part-of-speech (POS), fine-grained
# tag (TAG) and spaCy's human-readable explanation of that tag.
header = f"{'WORD':<12}{'POS':<6}{'TAG':<6}EXPLANATION"
separator = "." * 40
print(header)
print(separator)

for tok in doc:
    explanation = spacy.explain(tok.tag_)
    print(f"{tok.text:<12}{tok.pos_:<6}{tok.tag_:<6}{explanation}")


WORD        POS   TAG   EXPLANATION
........................................
Google      PROPN NNP   noun, proper singular
is          AUX   VBZ   verb, 3rd person singular present
buying      VERB  VBG   verb, gerund or present participle
a           DET   DT    determiner
startup     NOUN  NN    noun, singular or mass
for         ADP   IN    conjunction, subordinating or preposition
$           SYM   $     symbol, currency
1           NUM   CD    cardinal number
billion     NUM   CD    cardinal number
.           PUNCT .     punctuation mark, sentence closer


In [7]:
from spacy import displacy
# Reuse the pipeline already loaded as `nlp` instead of loading
# en_core_web_sm a second time; the name NER is kept as an alias so any
# code that refers to it keeps working.
NER = nlp

In [10]:
# First sample passage for named-entity recognition. Adjacent string literals
# are concatenated by Python, so the value is one single-line string.
raw_text = (
    "The Indian Space Research Organisation or is the latest term for the "
    "national space agency of India, headquartered in Bengaluru. "
    "It operates under Department of Space which is directly overseen by the "
    "Prime Minister of India while Chairman of ISRO acts as executive of DOS "
    "as well."
)


In [12]:
# Run the pipeline on the first passage and list each detected entity
# together with its label, one entity per line.
doc = nlp(raw_text)

for entity in doc.ents:
    print(f"{entity.text} {entity.label_}")


The Indian Space Research Organisation ORG
India GPE
Bengaluru GPE
Department of Space ORG
India GPE
ISRO ORG
DOS ORG


In [13]:
# Render the entities of the current `doc` as highlighted text in the notebook.
displacy.render(doc, style="ent", jupyter=True)

In [14]:
# Second sample passage for named-entity recognition. Adjacent string literals
# are concatenated by Python, so the value is one single-line string.
raw_text1 = (
    "The Mars Orbiter Mission (MOM), also known as Mangalyaan, was launched by "
    "the Indian Space Research Organisation in 2013 to demonstrate India’s "
    "capability in interplanetary exploration. "
    "The mission successfully entered Mars orbit on its first attempt, making "
    "India the first nation to achieve this feat. "
    "MOM focused on studying Martian surface features, atmosphere, and mineral "
    "composition, while also showcasing cost-effective spacecraft design and "
    "mission execution."
)

In [15]:
# Run the pipeline on the second passage and list each detected entity
# together with its label, one entity per line.
doc = nlp(raw_text1)

for span in doc.ents:
    entity_text, entity_label = span.text, span.label_
    print(entity_text, entity_label)

The Mars Orbiter Mission ORG
Mangalyaan PERSON
the Indian Space Research Organisation ORG
2013 DATE
India GPE
Mars LOC
first ORDINAL
India GPE
first ORDINAL
Martian NORP


In [16]:
# Render the entities of the current `doc` as highlighted text in the notebook.
displacy.render(doc, style="ent", jupyter=True)