**Demonstration of part-of-speech (POS) tagging**

In [None]:
# POS tagging with NLTK: import the tagger and fetch the data it depends on
import nltk
from nltk import pos_tag

# Older NLTK releases read 'punkt' and 'averaged_perceptron_tagger'; newer
# releases look for 'punkt_tab' and 'averaged_perceptron_tagger_eng' instead and
# raise LookupError when only the legacy names are installed. Fetching both
# sets keeps the tokenizing and tagging cells below working on either version.
for resource in (
    'averaged_perceptron_tagger',
    'averaged_perceptron_tagger_eng',
    'punkt',
    'punkt_tab',
):
    nltk.download(resource)

In [None]:
# Word tokenization: split the sentence into a list of word tokens.
# `tokens` is reused by the tagging cell that follows.
text = 'This website uses cookies of google'
tokens = nltk.word_tokenize(text)
print(tokens)

['This', 'website', 'uses', 'cookies', 'of', 'google']


In [None]:
# Get the POS tags for the statement: pos_tag pairs every token with its tag,
# and the result is printed as a list of (token, tag) tuples.
postag = pos_tag(tokens)
print(postag)

[('This', 'DT'), ('website', 'JJ'), ('uses', 'VBZ'), ('cookies', 'NNS'), ('of', 'IN'), ('google', 'NN')]


In [None]:
# Get the list of POS tags, each with its description and example words.
# The tags printed by pos_tag above (DT, VBZ, NNS, ...) are Penn Treebank tags,
# so list the Penn Treebank tagset; the Brown tagset uses a different inventory
# and would not explain them.
# 'tagsets' holds the help data for older NLTK releases, 'tagsets_json' the
# data newer releases read.
for resource in ('tagsets', 'tagsets_json'):
    nltk.download(resource)
nltk.help.upenn_tagset()

In [None]:
# Get more information on one specific tag: prints the description of 'NNS'
# from the Penn Treebank tagset together with example words.
nltk.help.upenn_tagset('NNS')

NNS: noun, common, plural
    undergraduates scotches bric-a-brac products bodyguards facets coasts
    divestitures storehouses designs clubs fragrances averages
    subjectivists apprehensions muses factory-jobs ...


In [None]:
# Context matters: in this sentence the tagger labels "left" as a verb (VBD).
text = 'I left the room'
tokens = nltk.word_tokenize(text)
postag = pos_tag(tokens)

# Show the tokens first, then the (token, tag) pairs, one per line.
print(tokens, postag, sep='\n')

['I', 'left', 'the', 'room']
[('I', 'PRP'), ('left', 'VBD'), ('the', 'DT'), ('room', 'NN')]


In [None]:
# Same word, different context: here the tagger labels "left" as a noun (NN).
text = 'left of the room'
tokens = nltk.word_tokenize(text)
postag = pos_tag(tokens)

# Show the tokens first, then the (token, tag) pairs, one per line.
print(tokens, postag, sep='\n')

['left', 'of', 'the', 'room']
[('left', 'NN'), ('of', 'IN'), ('the', 'DT'), ('room', 'NN')]


In [None]:
# spaCy is an open-source library for Natural Language Processing (NLP), written in Python.
# The library features models for NER, POS tagging, dependency parsing.
!pip install spacy
import spacy
from spacy import displacy

In [None]:
import spacy
from spacy import displacy

# Load the small English pipeline
nlp = spacy.load("en_core_web_sm")

sentence = 'Deemed universities charge huge fees'

# Running the pipeline on the sentence gives a document whose tokens expose
# their text, dependency label and syntactic head
doc = nlp(sentence)

# Table header
print("{:<15} | {:<8} | {:<15} ".format('Token', 'Relation', 'Head'))

# One row per token: the token, its dependency relation, and its head
for token in doc:
    print("{:<15} | {:<8} | {:<15}".format(token.text, token.dep_, token.head.text))

# Use displaCy to visualize the dependency tree inside the notebook
displacy.render(doc, style='dep', jupyter=True, options={'distance': 120})


Token           | Relation | Head            
Deemed          | amod     | universities   
universities    | nsubj    | charge         
charge          | ROOT     | charge         
huge            | amod     | fees           
fees            | dobj     | charge         


In [None]:
# to get meaning of relationship
print(spacy.explain("amod"))

adjectival modifier


**Named Entity Recognition (NER)**

In [None]:
# Example 1

In [None]:
# Named Entity Recognition (NER) on a single sentence

import spacy
from spacy import displacy

# Load the English pipeline, then run it over the sentence
nlp = spacy.load("en_core_web_sm")

text = "Sebastian Thrun started working on self-driving cars at Google in 2007."
doc = nlp(text)

# Attach a title to the document, then render its entities inline
doc.user_data["title"] = "Entity Recognizer"
displacy.render(doc, style="ent", jupyter=True)

In [4]:
# Example 2

In [3]:
import spacy
from spacy import displacy

# Load the English pipeline first; the passage to analyse follows
nlp = spacy.load("en_core_web_sm")

# Longer passage; the bracketed citation markers are part of the input as given
text = """Python was conceived in the late 1980s[43] by Guido van Rossum at Centrum Wiskunde & Informatica (CWI) in the Netherlands as a successor to the ABC programming language, which was inspired by SETL,[44] capable of exception handling and interfacing with the Amoeba operating system.[13] Its implementation began in December 1989.[45] Van Rossum shouldered sole responsibility for the project, as the lead developer, until 12 July 2018, when he announced his "permanent vacation" from his responsibilities as Python's "benevolent dictator for life", a title the Python community bestowed upon him to reflect his long-term commitment as the project's chief decision-maker.[46] In January 2019, active Python core developers elected a five-member Steering Council to lead the project.[47][48]"""
doc = nlp(text)

# Attach a title to the document, then render its entities inline
doc.user_data["title"] = "Entity Recognizer"
displacy.render(doc, style="ent", jupyter=True)