In [1]:
from spacy.lang.en import English

In [2]:
# Instantiate the English class imported from spacy.lang.en. Every cell up to
# the later spacy.load() call uses this object as `nlp`.
nlp = English()

In [3]:
# Calling nlp on a string yields the object that the next cells iterate over
# token by token and slice.
doc = nlp("Hello world!")

In [4]:
# Collect the token strings first, then print them one per line.
token_texts = [token.text for token in doc]
for token_text in token_texts:
    print(token_text)

Hello
world
!


In [5]:
# Slice 1:3 of the Doc; in the recorded run this covers the tokens "world" and "!".
span = doc[1:3]
# Printing the slice shows its text ("world!" in the recorded output).
print(span)

world!


In [6]:
# Rebinds `doc` to a new text; the "Hello world!" Doc is no longer reachable
# under this name.
doc = nlp("it cost $5")

In [7]:
# Print one labelled row per lexical attribute, each row holding that
# attribute's value for every token in `doc`.
# Labels are reproduced exactly as they appear in the recorded output.
for label, attr_name in (
    ("index:", "i"),
    (" Text:", "text"),
    ("is_alpha", "is_alpha"),
    ("is_punct", "is_punct"),
    ("like_num", "like_num"),
):
    print(label, [getattr(token, attr_name) for token in doc])

index: [0, 1, 2, 3]
 Text: ['it', 'cost', '$', '5']
is_alpha [True, True, False, False]
is_punct [False, False, False, False]
like_num [False, False, False, True]


In [10]:
import spacy

In [11]:
# Rebinds `nlp`, replacing the English() object created earlier with whatever
# spacy.load returns for 'en_core_web_md'. The cells below read token.pos_,
# token.dep_ and doc.ents from Docs produced by this pipeline.
# NOTE(review): presumably the en_core_web_md package must already be installed
# in the kernel's environment — confirm; no install step is visible here.
nlp = spacy.load('en_core_web_md')

In [12]:
# Sample headline for the part-of-speech / dependency cell below.
# The apostrophe in "It’s" is the typographic ’ character, not ASCII ';
# in the recorded output the resulting "’s" token is tagged VERB.
text = "It’s official: Apple is the first U.S. public company to reach a $1 trillion market value"

In [13]:
# Process the headline with the loaded pipeline (rebinds `doc` again).
doc = nlp(text)

In [14]:
# One line per token: its text, its pos_ value and its dep_ value.
for token in doc:
    print(token.text, token.pos_, token.dep_)

It PRON nsubj
’s VERB ccomp
official ADJ acomp
: PUNCT punct
Apple PROPN nsubj
is AUX ROOT
the DET det
first ADJ amod
U.S. PROPN nmod
public ADJ amod
company NOUN attr
to PART aux
reach VERB relcl
a DET det
$ SYM quantmod
1 NUM compound
trillion NUM nummod
market NOUN compound
value NOUN dobj


In [15]:
# Second sample headline, used for the named-entity cell below (rebinds `text`).
text = "Upcoming iPhone X release date leaked as Apple reveals pre-orders"

In [16]:
# Re-run the pipeline on the new headline; `doc.ents` is read from this Doc next.
doc = nlp(text)

In [18]:
# List every entity span found in the Doc together with its label.
for entity in doc.ents:
    entity_text, entity_label = entity.text, entity.label_
    print(entity_text, entity_label)

iPhone X LAW
Apple ORG


In [19]:
# Look up the description of the LAW label that was printed for "iPhone X" above.
spacy.explain('LAW')

'Named documents made into laws.'

In [20]:
from spacy.matcher import Matcher

In [21]:
# Build a Matcher on the vocabulary of the currently loaded pipeline.
matcher = Matcher(nlp.vocab)

In [28]:
# Two-token pattern: the exact text "iPhone" followed by the exact text "X".
# The attribute key is written in its documented upper-case form, "TEXT",
# the same spelling the iOS pattern later in this notebook uses; the
# mixed-case "Text" spelling is not the documented attribute name.
pattern = [{"TEXT": "iPhone"}, {"TEXT": "X"}]

In [29]:
# Register the pattern under the key "Iphone_pattern".
# Patterns are passed as a list in the second argument: this is the
# Matcher.add signature accepted by spaCy >= 2.2.2 and the one spaCy v3
# requires. The older positional form add(key, None, pattern) is rejected by v3.
matcher.add("Iphone_pattern", [pattern])

In [30]:
# Shorter variant of the earlier headline; the matcher is applied to this Doc next.
doc = nlp("Upcoming iPhone X release date leaked")

In [32]:
# Calling the matcher on a Doc returns the matches, which the next cell unpacks
# as (match_id, start, end) triples.
matches = matcher(doc)

In [34]:
# Each match is a (match_id, start, end) triple; start/end are used as token
# offsets to slice the matched span out of `doc`.
for _match_id, span_start, span_end in matches:
    print(doc[span_start:span_end].text)

iPhone X


In [35]:
# Sample paragraph for the version-matching pattern below. It mentions "iOS"
# four times: once on its own ("the iOS update") and three times followed by a
# number (7, 11, 10).
doc = nlp(
    "After making the iOS update you won't notice a radical system-wide "
    "redesign: nothing like the aesthetic upheaval we got with iOS 7. Most of "
    "iOS 11's furniture remains the same as in iOS 10. But you will discover "
    "some tweaks once you delve a little deeper."
)

In [38]:
# Two-token pattern: a token whose text is exactly "iOS", then a token with
# IS_DIGIT set. In the recorded run this matches "iOS 7", "iOS 11" and "iOS 10"
# but not the bare "iOS" in "the iOS update".
pattern = [{"TEXT":"iOS"},{"IS_DIGIT":True}]

In [39]:
# Start from a new Matcher instead of reusing the one that already holds the
# iPhone rule.
matcher = Matcher(nlp.vocab)

In [40]:
# Register the iOS-version rule, then run the matcher over the paragraph.
# Patterns are passed as a list in the second argument: this is the
# Matcher.add signature accepted by spaCy >= 2.2.2 and the one spaCy v3
# requires. The older positional form add(key, None, pattern) is rejected by v3.
matcher.add("ios version detect", [pattern])
matches = matcher(doc)

In [41]:
# Report how many results the matcher returned.
match_count = len(matches)
print("Total matches found:", match_count)

Total matches found: 3


In [44]:
# Slice each matched token range out of `doc` and show its text.
for _match_id, span_start, span_end in matches:
    matched_span = doc[span_start:span_end]
    print("match found:", matched_span.text)

match found: iOS 7
match found: iOS 11
match found: iOS 10


In [45]:
# New Matcher for the next example, so the iOS rule registered earlier is not
# applied here.
matcher = Matcher(nlp.vocab)

# Sample forum-style text containing three forms of "download", each followed
# by a product name: "downloaded Fortnite", "downloading Minecraft",
# "download Winzip".
doc = nlp(
    "i downloaded Fortnite on my laptop and can't open the game at all. Help? "
    "so when I was downloading Minecraft, I got the Windows version where it "
    "is the '.zip' folder and I used the default program to unpack it... do "
    "I also need to download Winzip?"
)

In [46]:
# A token whose LEMMA is "download" followed by a token whose POS is "PROPN".
# Matching on the lemma rather than the text is what lets "downloaded" and
# "downloading" match in the recorded output.
pattern = [{"LEMMA":"download"}, {"POS": "PROPN"}]

In [47]:
# Register the download rule, then run the matcher over the forum text.
# Patterns are passed as a list in the second argument: this is the
# Matcher.add signature accepted by spaCy >= 2.2.2 and the one spaCy v3
# requires. The older positional form add(key, None, pattern) is rejected by v3.
matcher.add("Download_things_pattern", [pattern])
matches = matcher(doc)

In [48]:
# Report how many results the matcher returned for the download rule.
total_matches = len(matches)
print("Total matches found:", total_matches)

Total matches found: 3


In [49]:
# Show the text of every matched span; only the start/end offsets of each
# (match_id, start, end) triple are needed.
for match in matches:
    span_start, span_end = match[1], match[2]
    print("match found:", doc[span_start:span_end].text)

match found: downloaded Fortnite
match found: downloading Minecraft
match found: download Winzip
