In [17]:
import spacy
from spacy import displacy
import warnings
# Silence every Python warning for the rest of the session (no category or
# module filter is given, so nothing is exempt).
# NOTE(review): presumably done to keep cell output uncluttered; this also
# hides deprecation warnings — consider narrowing the filter.
warnings.filterwarnings("ignore")

## Tokenisation

In [12]:
# Load the small English pipeline once; later cells reuse `nlp`.
nlp = spacy.load("en_core_web_sm")

# Run the pipeline on a sample sentence and show how it is split into tokens.
doc = nlp("Apple is looking at buying U.K. startup for $1 billion")

# One token per output line, in document order.
for token_text in (tok.text for tok in doc):
    print(token_text)

Apple
is
looking
at
buying
U.K.
startup
for
$
1
billion


## POS Tagging

### Printing tags and dependencies

In [13]:
# Re-parse the sample sentence and list the per-token annotations.
doc = nlp("Apple is looking at buying U.K. startup for $1 billion")

for tok in doc:
    # Column order: text, lemma, coarse POS, fine-grained tag, dependency
    # label, word shape, is-alphabetic flag, is-stop-word flag.
    row = (
        tok.text,
        tok.lemma_,
        tok.pos_,
        tok.tag_,
        tok.dep_,
        tok.shape_,
        tok.is_alpha,
        tok.is_stop,
    )
    # The extra "\n" argument leaves a blank line after each token's row.
    print(*row, "\n")

Apple Apple PROPN NNP nsubj Xxxxx True False 

is be AUX VBZ aux xx True True 

looking look VERB VBG ROOT xxxx True False 

at at ADP IN prep xx True True 

buying buy VERB VBG pcomp xxxx True False 

U.K. U.K. PROPN NNP dobj X.X. False False 

startup startup NOUN NN advcl xxxx True False 

for for ADP IN prep xxx True True 

$ $ SYM $ quantmod $ False False 

1 1 NUM CD compound d False False 

billion billion NUM CD pobj xxxx True False 



### Visualisation

In [22]:
# Render the dependency parse of the sample sentence with custom styling.
doc = nlp("Apple is looking at buying U.K. startup for $1 billion")

# Styling settings passed to the dependency visualiser.
options = dict(
    compact=True,
    bg="#09a3d5",
    color="white",
    font="Source Sans Pro",
)

displacy.render(doc, style="dep", options=options)

### Visualisation by individual sentence

In [21]:
# Load the pipeline so this cell can be run on its own.
nlp = spacy.load("en_core_web_sm")

# Multi-sentence passage; adjacent string pieces are concatenated into the
# same single-line text.
text = (
    "In ancient Rome, some neighbors live in three adjacent houses. "
    "In the center is the house of Senex, who lives there with wife Domina, "
    "son Hero, and several slaves, including head slave Hysterium and the "
    "musical's main character Pseudolus. "
    "A slave belonging to Hero, Pseudolus wishes to buy, win, or steal his freedom. "
    "One of the neighboring houses is owned by Marcus Lycus, who is a buyer and "
    "seller of beautiful women; the other belongs to the ancient Erronius, who is "
    "abroad searching for his long-lost children (stolen in infancy by pirates). "
    "One day, Senex and Domina go on a trip and leave Pseudolus in charge of Hero. "
    "Hero confides in Pseudolus that he is in love with the lovely Philia, one of "
    "the courtesans in the House of Lycus (albeit still a virgin)."
)
doc = nlp(text)

# Materialise the sentence spans and pass the list to the dependency renderer
# instead of the whole document.
sentence_spans = [sentence for sentence in doc.sents]
displacy.render(sentence_spans, style="dep")

## Named Entities

### Printing Entities

In [25]:
# Parse the sample sentence and list the named entities the pipeline found.
doc = nlp("Apple is looking at buying U.K. startup for $1 billion")

# Per entity: text, start/end character offsets in the sentence, and label.
for entity in doc.ents:
    entity_row = (
        entity.text,
        entity.start_char,
        entity.end_char,
        entity.label_,
    )
    print(*entity_row)

Apple 0 5 ORG
U.K. 27 31 GPE
$1 billion 44 54 MONEY


### Visualisation

In [26]:
# Render the current `doc` with the entity visualiser; no options are passed,
# so the visualiser's defaults apply.
displacy.render(doc, style="ent")

In [31]:
# Entity visualisation on a passage that mentions several companies and products.
text = "But Google is starting from behind. The company made a late push into hardware, and Apple's Siri, available on iPhones, and Amazon's Alexa software, which runs on its Echo and Dot devices, have clear leads in consumer adoption."

doc = nlp(text)

# The original cell ended in a bare `options=`, which is a SyntaxError.
# An empty dict keeps the visualiser's defaults, i.e. every entity type is
# highlighted. To restrict the display to specific labels, use the "ents" key:
#   options = {"ents": ["LOC"]}
#   options = {"ents": ["ORG"]}
options = {}
displacy.render(doc, style="ent", options=options)