In [1]:
import spacy
import en_core_web_sm

In [2]:
# Instantiate the pipeline shipped in the en_core_web_sm package once;
# the resulting `nlp` object is reused by later cells.
nlp = en_core_web_sm.load()

In [3]:
# Exploratory: print the built-in help for the loaded pipeline object.
# NOTE(review): the listing is long; consider clearing this output before sharing.
help(nlp)

Help on English in module spacy.lang.en object:

class English(spacy.language.Language)
 |  English(vocab=True, make_doc=True, max_length=1000000, meta={}, **kwargs)
 |  
 |  A text-processing pipeline. Usually you'll load this once per process,
 |  and pass the instance around your application.
 |  
 |  Defaults (class): Settings, data and factory methods for creating the `nlp`
 |      object and processing pipeline.
 |  lang (unicode): Two-letter language ID, i.e. ISO code.
 |  
 |  DOCS: https://spacy.io/api/language
 |  
 |  Method resolution order:
 |      English
 |      spacy.language.Language
 |      builtins.object
 |  
 |  Data and other attributes defined here:
 |  
 |  Defaults = <class 'spacy.lang.en.EnglishDefaults'>
 |  
 |  
 |  lang = 'en'
 |  
 |  ----------------------------------------------------------------------
 |  Methods inherited from spacy.language.Language:
 |  
 |  __call__(self, text, disable=[], component_cfg=None)
 |      Apply the pipeline to some text

In [4]:
# Sample sentence that the following cells tokenize, tag and visualize.
text = 'Apple is looking for buying a U.K. startup for $1 billion'

In [5]:
# Apply the pipeline to the sample text; `doc` is what the cells below iterate over.
doc = nlp(text)

In [6]:
# Tokenization check: emit the raw text of every token, one per line.
for tok in doc:
    print(tok.text)

Apple
is
looking
for
buying
a
U.K.
startup
for
$
1
billion


In [7]:
# Bare expression: the notebook echoes `doc`, which displays as the original sentence.
doc

Apple is looking for buying a U.K. startup for $1 billion

# PART-OF-SPEECH TAGGING

In [12]:
# Two-column listing: token text left-aligned and padded to 15 characters,
# followed by its coarse part-of-speech tag (`pos_`).
# A literal width goes directly in the format spec (no nested `{15}` field),
# and a field with no format spec needs no trailing colon.
for token in doc:
    print(f'{token.text:15} {token.pos_}')

Apple           PROPN
is              AUX
looking         VERB
for             ADP
buying          VERB
a               DET
U.K.            PROPN
startup         NOUN
for             ADP
$               SYM
1               NUM
billion         NUM


# VISUALIZATION

In [13]:
from spacy import displacy

In [14]:
# Draw the dependency parse of `doc` inline, using the compact layout
# with a word distance of 100.
displacy.render(
    doc,
    style='dep',
    options={'distance': 100, 'compact': True},
)

# Named Entity Recognition

In [16]:
# List every entity span found in `doc` together with its label.
for entity in doc.ents:
    print(entity.text, entity.label_)

Apple ORG
U.K. GPE
$1 billion MONEY


In [17]:
# Highlight the recognized entities inline in the sentence.
# 'distance' and 'compact' are dependency-visualizer settings and have no
# effect on the 'ent' style, so they are not passed here.
displacy.render(doc, style='ent')