# **Language Processing Pipeline**

In [1]:
import spacy
from spacy import displacy

In [2]:
# Start from a blank English pipeline and run a sample sentence through it.
nlp = spacy.blank("en")

doc = nlp("Captain america ate 100$ of samosa. Then he said I can do this all day")

# Iterating over the Doc yields its tokens; print each one on its own line.
for tok in doc:
    print(tok)

Captain
america
ate
100
$
of
samosa
.
Then
he
said
I
can
do
this
all
day


In [3]:
 nlp.pipe_names

[]

## **Loading Pre-trained Pipeline**

In [6]:
# Load the pre-trained `en_core_web_sm` pipeline, rebinding `nlp`.
nlp = spacy.load("en_core_web_sm")

In [7]:
# Show which components the loaded pipeline contains.
nlp.pipe_names

['tok2vec', 'tagger', 'parser', 'attribute_ruler', 'lemmatizer', 'ner']

In [8]:
# Process the sample sentence with the pipeline currently bound to `nlp`.
doc = nlp("Captain america ate 100$ of samosa. Then he said I can do this all day")

# One row per token: the token, its part-of-speech tag, and its lemma.
for tok in doc:
    print(f"{tok} | {tok.pos_} | {tok.lemma_}")

Captain | PROPN | Captain
america | PROPN | america
ate | VERB | eat
100 | NUM | 100
$ | NUM | $
of | ADP | of
samosa | PROPN | samosa
. | PUNCT | .
Then | ADV | then
he | PRON | he
said | VERB | say
I | PRON | I
can | AUX | can
do | VERB | do
this | PRON | this
all | DET | all
day | NOUN | day


In [11]:
doc = nlp("Tesla Inc is going to acquire twitter for $45 billion")

# One row per named entity: its text, its label, and spaCy's explanation of that label.
for entity in doc.ents:
    label = entity.label_
    print(entity.text, "|", label, "|", spacy.explain(label))

Tesla Inc | ORG | Companies, agencies, institutions, etc.
$45 billion | MONEY | Monetary values, including unit


In [12]:
# Visualise the entities of `doc` with displaCy's "ent" style.
# `displacy` is imported in the notebook's import cell at the top.
displacy.render(doc, style="ent")

In [13]:
# Rebind `nlp` to a fresh blank English pipeline; components are added to it below.
# (A `doc` built here was never read before being reassigned, and was created
# before any 'ner' component existed on this pipeline, so it has been dropped.)
nlp = spacy.blank("en")

In [14]:
# Keep a separately loaded `en_core_web_sm` pipeline to take components from.
source_nlp = spacy.load("en_core_web_sm")

In [15]:
# Add the "ner" component to `nlp`, sourcing it from `source_nlp`.
nlp.add_pipe("ner", source=source_nlp)

<spacy.pipeline.ner.EntityRecognizer at 0x7b1a8c6f6c70>

In [16]:
# Check which components `nlp` has now.
nlp.pipe_names

['ner']

In [21]:
# Process the sentence with the pipeline currently bound to `nlp`.
doc = nlp("Tesla Inc is going to acquire twitter for $45 billion")

In [22]:
# Report each entity found in `doc` as "text | label | label explanation".
for entity in doc.ents:
    print(f"{entity.text} | {entity.label_} | {spacy.explain(entity.label_)}")

Tesla Inc | ORG | Companies, agencies, institutions, etc.
$45 billion | MONEY | Monetary values, including unit


In [23]:
# Render the entities of `doc` with displaCy's "ent" style.
displacy.render(doc, style="ent")