In [24]:
import spacy
import pandas as pd
import numpy as np
from datetime import datetime, timedelta
# Load the large English pipeline once; the cells below all parse text through this `nlp` object.
nlp = spacy.load("en_core_web_lg")

In [9]:
# Parse a short example sentence; the next cells inspect this Doc.
doc = nlp("Weston sits next to me at work.")

In [10]:
# Surface text of every token in the parsed sentence.
[tok.text for tok in doc]

['Weston', 'sits', 'next', 'to', 'me', 'at', 'work', '.']

In [11]:
# Slicing a Doc by token index gives a Span; [2:4] covers tokens 2 and 3.
span = doc[2:4]
span.text

'next to'

In [25]:
from spacy.tokens import Span

doc = nlp("I live in New York")
# Span for "New York" (tokens 3 and 4) with label GPE (geopolitical entity).
# The label is passed as its integer hash from the vocab's StringStore:
# passing the plain string "GPE" raised "TypeError: an integer is required"
# on this spaCy version. StringStore.add returns the hash for the string.
span = Span(doc, 3, 5, label=doc.vocab.strings.add("GPE"))
span.text

'New York'

In [13]:
# Coarse-grained part-of-speech tag for each token of the example sentence.
doc = nlp("Weston sits next to me at work.")
[tok.pos_ for tok in doc]

['PROPN', 'VERB', 'ADV', 'ADP', 'PRON', 'ADP', 'NOUN', 'PUNCT']

In [14]:
# Fine-grained part-of-speech tag for each token of the same sentence.
[tok.tag_ for tok in doc]

['NNP', 'VBZ', 'RB', 'IN', 'PRP', 'IN', 'NN', '.']

In [31]:
# Dependency relation label of every token in the three-sentence review text.
doc = nlp("Freeosk is awesome. It is a very friendly, people oriented, and nimble company. They care, genuinely, for their employees and work very hard to make it an awesome place to work.")
[tok.dep_ for tok in doc]

['nsubj',
 'ROOT',
 'acomp',
 'punct',
 'nsubj',
 'ROOT',
 'det',
 'advmod',
 'attr',
 'punct',
 'nsubj',
 'conj',
 'punct',
 'cc',
 'amod',
 'conj',
 'punct',
 'nsubj',
 'ROOT',
 'punct',
 'advmod',
 'punct',
 'prep',
 'poss',
 'pobj',
 'cc',
 'conj',
 'advmod',
 'advmod',
 'aux',
 'advcl',
 'nsubj',
 'det',
 'amod',
 'ccomp',
 'aux',
 'relcl',
 'punct']

In [16]:
# Syntactic head (the governing token) of each token in the parse tree.
# The sentence is parsed in this cell so the result does not depend on
# whichever `doc` an earlier cell happened to leave in the kernel.
doc = nlp("Weston sits next to me at work.")
[token.head.text for token in doc]

['sits', 'sits', 'sits', 'next', 'to', 'sits', 'at', 'sits']

In [29]:
doc = nlp("Freeosk is awesome. It is a very friendly, people oriented, and nimble company. They care, genuinely, for their employees and work very hard to make it an awesome place to work.")
# Named entities found in the text, each paired with its entity-type label.
[(entity.text, entity.label_) for entity in doc.ents]

[('Freeosk', 'ORG')]

In [18]:
# Two-sentence example; the text matches the expected result noted below.
doc = nlp("This is a sentence. This is another one.")
# doc.sents is a generator that yields sentence spans
[sent.text for sent in doc.sents]
# ['This is a sentence.', 'This is another one.']

['This is a sentence.', 'This is another one.']

In [21]:
doc = nlp("I have a red car")
# Iterating doc.noun_chunks produces spans, one per noun chunk.
[phrase.text for phrase in doc.noun_chunks]

['I', 'a red car']

In [22]:
# spacy.explain maps a tag or label code to a short human-readable description.
# Both lookups are gathered into one dict so each result is displayed;
# a bare call on its own line is only echoed when it is the cell's last expression.
{code: spacy.explain(code) for code in ("RB", "GPE")}

{'RB': 'adverb', 'GPE': 'Countries, cities, states'}

In [26]:
from spacy import displacy
# Parse the sample review text; the dependency visualisation is built from this Doc.
doc = nlp("Freeosk is awesome. It is a very friendly, people oriented, and nimble company. They care, genuinely, for their employees and work very hard to make it an awesome place to work.")
# Called without jupyter=True, render() hands back the SVG markup as a string here,
# which is why the cell output is raw '<svg ...>' text rather than a drawing.
displacy.render(doc, style="dep")

'<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" id="0" class="displacy" width="5475" height="574.5" style="max-width: none; height: 574.5px; color: #000000; background: #ffffff; font-family: Arial">\n<text class="displacy-token" fill="currentColor" text-anchor="middle" y="484.5">\n    <tspan class="displacy-word" fill="currentColor" x="50">Freeosk</tspan>\n    <tspan class="displacy-tag" dy="2em" fill="currentColor" x="50">PROPN</tspan>\n</text>\n\n<text class="displacy-token" fill="currentColor" text-anchor="middle" y="484.5">\n    <tspan class="displacy-word" fill="currentColor" x="225">is</tspan>\n    <tspan class="displacy-tag" dy="2em" fill="currentColor" x="225">VERB</tspan>\n</text>\n\n<text class="displacy-token" fill="currentColor" text-anchor="middle" y="484.5">\n    <tspan class="displacy-word" fill="currentColor" x="400">awesome.</tspan>\n    <tspan class="displacy-tag" dy="2em" fill="currentColor" x="400">ADJ</tspan>\n</text>\n\n<text cl

In [28]:
# jupyter=True asks displaCy to draw the dependency parse inline in the notebook
# instead of returning the markup string.
displacy.render(doc, style="dep", jupyter=True)