In [1]:
import spacy
import en_core_web_sm
# Load the en_core_web_sm pipeline once; the later cells call `nlp(text)` to
# parse their sample strings.
nlp = en_core_web_sm.load()

In [3]:
# Sample sentence for the tokenisation demo. The surrounding double quotes are
# part of the text itself. Note that, despite the name, this is still a plain
# str at this point -- it has not been passed through `nlp` yet.
doc_object = "\"Mr. O'Neill thinks that the boys' stories about Chile's capital aren't amusing\""

In [4]:
# Show the raw text exactly as it will be handed to the pipeline.
print(doc_object)

"Mr. O'Neill thinks that the boys' stories about Chile's capital aren't amusing"


In [5]:
# Run the pipeline on the text and keep the parsed result for the next cell.
nlp_sentence = nlp(doc_object)
# Trailing bare expression: the notebook displays the parsed result.
nlp_sentence

"Mr. O'Neill thinks that the boys' stories about Chile's capital aren't amusing"

In [7]:
# Write every token as "<text> <coarse POS tag> | " on a single line,
# with no trailing newline.
print("".join(f"{token.text} {token.pos_} | " for token in nlp_sentence), end="")

" PUNCT | Mr. PROPN | O'Neill PROPN | thinks VERB | that ADP | the DET | boys NOUN | ' PART | stories NOUN | about ADP | Chile PROPN | 's PART | capital NOUN | are VERB | n't ADV | amusing ADJ | " PUNCT | 

In [11]:
# Sample text containing abbreviations with internal periods and a web
# address, used to check how the tokenizer splits them.
sentence = (
    "Access our website between 9 a.m. and 1 p.m. "
    "every weekend at www.lyit.ie."
)

In [12]:
# Tokenise the sample sentence and list the tokens one per line.
# (A bare `nlp_sentence` expression used to sit here; it was not the last
# expression of the cell, so it displayed nothing and has been dropped.)
nlp_sentence = nlp(sentence)

for token in nlp_sentence:
    print(token.text)

Access
our
website
between
9
a.m.
and
1
p.m.
every
weekend
at
www.lyit.ie
.


In [14]:
# Two short sentences containing a number fused to a unit ("20km") and a
# currency amount, used to check how the tokenizer splits them.
sentence = " ".join([
    "I live about 20km from here.",
    "A taxi will cost around £50.",
])

In [15]:
# Tokenise the sample sentence and list the tokens one per line.
# (A bare `nlp_sentence` expression used to sit here; it was not the last
# expression of the cell, so it displayed nothing and has been dropped.)
nlp_sentence = nlp(sentence)

for token in nlp_sentence:
    print(token.text)

I
live
about
20
km
from
here
.
A
taxi
will
cost
around
£
50
.


In [16]:
# Parse a short sentence and print its tokens one per line.
# The Python 2 style `u` string prefix is redundant in Python 3 and was removed.
doc_object = nlp("I really like to work with words!")

for token in doc_object:
    print(token)

I
really
like
to
work
with
words
!


In [17]:
# Integer indexing on the parsed text returns a single token (the first one).
doc_object[0]

I

In [18]:
# Slicing works on token positions: tokens 3, 4 and 5.
doc_object[3:6]

to work with

In [19]:
# Negative indices count from the end: the last two tokens.
doc_object[-2:]

words!

In [42]:
# Parse a sentence that mentions a company, a country and a sum of money,
# then show the detected entities: first as one collection, then one per line.
# The Python 2 style `u` string prefix is redundant in Python 3 and was removed.
doc_object = nlp("Samsung in Ireland are pleased with their new folding screen that they released after a $9 million investment.")

print(doc_object.ents)
for entity in doc_object.ents:
    print(entity)

(Samsung, Ireland, $9 million)
Samsung
Ireland
$9 million


In [27]:
# Same entity listing on a sentence with nothing to recognise: the entity
# collection prints as empty and the loop body never runs.
# The Python 2 style `u` string prefix is redundant in Python 3 and was removed.
doc_object = nlp("I like my car")

print(doc_object.ents)
for entity in doc_object.ents:
    print(entity)

()


In [90]:
def show_entity_info(doc_object):
    """Print one aligned row per named entity in ``doc_object``.

    Each row contains the entity text and its label, both padded to 30
    characters, followed by ``spacy.explain``'s description of the label.
    When there is nothing to list, a short notice is printed instead.

    Args:
        doc_object: A parsed document exposing an ``ents`` collection whose
            items have ``text`` and ``label_`` attributes. A falsy value
            (``None`` or an empty document) is treated as "no entities".
    """
    # Test the entity collection, not just the document: a document that has
    # tokens is truthy even when no entities were recognised, which used to
    # make the "No entities found" branch unreachable for ordinary text.
    if doc_object and doc_object.ents:
        for entity in doc_object.ents:
            print(f"{entity.text:{30}} {entity.label_:{30}} {spacy.explain(entity.label_)}")
    else:
        print("No entities found in text.")

In [44]:
# Print the entity table for the current document.
# NOTE(review): the saved output below uses narrower columns than the
# 30-character padding in the current show_entity_info definition -- it looks
# like it predates the last edit of that function; re-run to refresh.
show_entity_info(doc_object)

Samsung ORG        Companies, agencies, institutions, etc.
Ireland GPE        Countries, cities, states
$9 million MONEY      Monetary values, including unit


In [47]:
# Sentence used for the noun-chunk and dependency-visualisation cells below.
# The Python 2 style `u` string prefix is redundant in Python 3 and was removed.
doc_object = nlp("Autonomous cars shift insurance liability toward manufacturers")

In [60]:
# One row per noun chunk: chunk text, its root token, the root's dependency
# relation in words, and the head token the root attaches to.
for chunk in doc_object.noun_chunks:
    root = chunk.root
    # spacy.explain returns None for a label it has no description for, and
    # formatting None with a width raises TypeError -- fall back to the raw
    # dependency label so the row still prints.
    relation = spacy.explain(root.dep_) or root.dep_
    print(f"{chunk.text:{20}} {root.text:{20}} {relation:{25}} {root.head}")

Autonomous cars      cars                 nominal subject           shift
insurance liability  liability            direct object             shift
manufacturers        manufacturers        object of preposition     toward


In [62]:
from spacy import displacy

In [75]:
# Draw the dependency parse of the current document inline in the notebook.
displacy.render(
    doc_object,
    style="dep",
    jupyter=True,
    options={
        "distance": 100,
        "color": "Blue",
        "arrow_stroke": 4,
        "arrow_spacing": 20,
        "word_spacing": 50,
    },
)

In [76]:
# Read the whole sample article into memory. The context manager closes the
# file as soon as the read finishes, instead of leaving the handle open for
# the lifetime of the kernel.
with open("noun-chunks.txt") as text_file:
    noun_chunks = text_file.read()

In [78]:
# Show the raw article text that was read from the file.
print(noun_chunks)

When Sebastian Thrun started working on self-driving cars at Google in 2007, few people outside of the company took him seriously. 
"I can tell you very senior CEOs of major American car companies would shake my hand and turn away because I wasn't worth talking to," said Thrun, now the co-founder and CEO of online higher education startup Udacity, in an interview with Recode earlier this week. 
A little less than a decade later, dozens of self-driving startups have cropped up while automakers around the world clamor, wallet in hand, to secure their place in the fast-moving world of fully automated transportation.


In [83]:
# Parse the whole article; this rebinds doc_object, replacing the previous
# single-sentence document.
doc_object = nlp(noun_chunks)

In [91]:
# Print the entity table for the article.
# NOTE(review): the saved output contains rows with blank text labelled GPE --
# presumably the line breaks kept in the raw file text; confirm, and consider
# stripping or normalising whitespace before parsing.
show_entity_info(doc_object)

Sebastian Thrun                PERSON                         People, including fictional
Google                         ORG                            Companies, agencies, institutions, etc.
2007                           DATE                           Absolute or relative dates or periods

                              GPE                            Countries, cities, states
American                       NORP                           Nationalities or religious or political groups
Thrun                          PERSON                         People, including fictional
Recode                         ORG                            Companies, agencies, institutions, etc.
earlier this week              DATE                           Absolute or relative dates or periods

                              GPE                            Countries, cities, states
less than a decade later       DATE                           Absolute or relative dates or periods
dozens                         

In [99]:
# Draw the dependency parse of the current document inline in the notebook,
# using a wider arc distance than the earlier single-sentence rendering.
displacy.render(
    doc_object,
    style="dep",
    jupyter=True,
    options={
        "distance": 200,
        "color": "Blue",
        "arrow_stroke": 4,
        "arrow_spacing": 10,
        "word_spacing": 30,
    },
)