In [2]:
import spacy

In [3]:
nlp = spacy.load("en_core_web_sm")

In [4]:
doc = nlp("Sachin isn't out. Sachin has scored 100 O.D.I. centuries and 100 Test Centuries.Got $1 Billon in Cash Prize")
for token in doc:
    print(token)

Sachin
is
n't
out
.
Sachin
has
scored
100
O.D.I.
centuries
and
100
Test
Centuries
.
Got
$
1
Billon
in
Cash
Prize


In [5]:
doc

Sachin isn't out. Sachin has scored 100 O.D.I. centuries and 100 Test Centuries.Got $1 Billon in Cash Prize

In [6]:
for token in doc:
    print(f"{token.text:{20}}{token.lemma_:{15}} {token.pos_:{15}} {token.is_stop}" )

Sachin              Sachin          PROPN           False
is                  be              AUX             True
n't                 n't             PART            True
out                 out             ADV             True
.                   .               PUNCT           False
Sachin              Sachin          PROPN           False
has                 have            AUX             True
scored              score           VERB            False
100                 100             NUM             False
O.D.I.              O.D.I.          PROPN           False
centuries           century         NOUN            False
and                 and             CCONJ           True
100                 100             NUM             False
Test                Test            PROPN           False
Centuries           Centuries       PROPN           False
.                   .               PUNCT           False
Got                 got             VERB            False
$                  

# Dependency Parsing

In [7]:
for chunk in doc.noun_chunks:
    print(f'{chunk.text:{35}} {chunk.root.text:{15}} {chunk.root.dep_}')

Sachin                              Sachin          nsubj
Sachin                              Sachin          nsubj
100 O.D.I. centuries                centuries       dobj
100 Test Centuries                  Centuries       conj
$1 Billon                           Billon          dobj
Cash Prize                          Prize           pobj


In [8]:
doc = nlp("Apple is Very Big Company with $1 Billion in Revenue ")
for ent in doc.ents:
    print(ent.text,ent.label_)

Apple ORG
$1 Billion MONEY
Revenue GPE


In [9]:
doc = nlp("Orange is Fruit i like.In COuntries Like India")
for ent in doc.ents:
    print(ent.text,ent.label_)

Fruit ORG
India GPE


# Sentence Segmentation

In [10]:
# doc.sents
for sent in doc.sents:
    print(sent)

Orange is Fruit i like.
In COuntries Like India


In [11]:
for token in doc:
    print(token.text, token.pos_, token.dep_)

Orange PROPN nsubj
is AUX ROOT
Fruit PROPN attr
i PRON nsubj
like VERB relcl
. PUNCT punct
In ADP ROOT
COuntries PROPN pobj
Like ADP prep
India PROPN pobj


In [None]:
import spacy
from spacy import displacy

nlp = spacy.load("en_core_web_sm")
doc = nlp("This is a sentence.")
displacy.serve(doc, style="dep")




Using the 'dep' visualizer
Serving on http://0.0.0.0:5000 ...



In [None]:
doc = nlp("Orange is Fruit i like.In COuntries Like India")
displacy.serve(doc, style="dep")