### Uncomment and execute the cell below to install the required Python modules

After you've installed them once, you can delete the install cell.

In [5]:
# One-time setup: uncomment the lines below and run this cell to install spaCy
# and download the small English model that this notebook loads.
# !pip install spacy
# !python -m spacy download en_core_web_sm
# Optional: larger English model (not loaded by the cells in this notebook).
# # !python -m spacy download en_core_web_lg
# NOTE: this notebook also imports `tabulate`; if it is not installed yet,
# install it the same way, e.g. `!pip install tabulate`.

# Named Entity Recognition & Part-of-Speech Tagging
## Using [spaCy's pre-trained NER and POS tagger](https://spacy.io/api/annotation#named-entities)

In [2]:
# Third-party dependencies: spaCy provides the NLP pipeline and the displaCy
# visualizer; tabulate formats the entity list as a plain-text table.
import spacy
from spacy import displacy
from tabulate import tabulate

# Load the small English pipeline. The model package must already be installed
# (`python -m spacy download en_core_web_sm`), otherwise spacy.load raises.
nlp = spacy.load("en_core_web_sm")


# Sample passage to analyze; the adjacent string literals are concatenated
# into a single string.
text = (
    "A live 1957 recording of John Coltrane and Thelonious Monk sat in the Library of Congress’s "
    "archives unnoticed for 48 years, before the library’s Magnetic Recording Laboratory supervisor "
    "Larry Appelbaum found it. For 60 years , Verve stored a live recording of Ella Fitzgerald "
    "performing at Zardi’s Jazzland in Hollywood, before releasing it in 2017 just after what would "
    "have been her 100th birthday."
)

# Run the loaded pipeline over the passage
doc = nlp(text)

# Syntax overview: text of each noun chunk, then the lemma of every token
# whose coarse part-of-speech tag is VERB
noun_phrases = [chunk.text for chunk in doc.noun_chunks]
verb_lemmas = [token.lemma_ for token in doc if token.pos_ == "VERB"]
print("Noun phrases:\n", noun_phrases)
print("\nVerbs:\n", verb_lemmas)
print()

# Named entities as [text, label] rows, rendered as a two-column table
ent_list = [[entity.text, entity.label_] for entity in doc.ents]

print(tabulate(ent_list, headers=['Entity', 'Entity Type']))



Noun phrases:
 ['A live 1957 recording', 'John Coltrane', 'Thelonious Monk', 'the Library', 'Congress', '’s archives', '48 years', 'the library', '’s Magnetic Recording Laboratory supervisor Larry Appelbaum', 'it', '60 years', 'Verve', 'a live recording', 'Ella Fitzgerald', 'Zardi’s Jazzland', 'Hollywood', 'it', 'what', 'her 100th birthday']

Verbs:
 ['sit', 'find', 'store', 'perform', 'release', 'would', 'have', 'be']

Entity                            Entity Type
--------------------------------  -------------
1957                              DATE
John Coltrane                     PERSON
Thelonious Monk                   ORG
the Library of Congress           ORG
48 years                          DATE
’s Magnetic Recording Laboratory  ORG
Larry Appelbaum                   PERSON
60 years                          DATE
Verve                             ORG
Ella Fitzgerald                   PERSON
Zardi’s Jazzland                  FAC
Hollywood                         GPE
2017          

# spaCy Visuals

In [3]:
# Materialize the document's sentence spans once; the dependency-render cell
# below reuses this list.
sentence_spans = [sentence for sentence in doc.sents]

# Highlight the named entities sentence by sentence with displaCy
displacy.render(sentence_spans, style="ent")

In [4]:
# Draw the dependency parse of each sentence; the word_spacing option is
# passed through to displaCy's dependency visualizer.
dep_render_options = {"word_spacing": 15}
displacy.render(sentence_spans, style="dep", options=dep_render_options)