In [20]:
import spacy
from prettytable import PrettyTable

## **Downloading the models**

In [4]:
# Download the English and Portuguese spaCy models (uncomment the lines below to run once)

#!python -m spacy download en_core_web_sm
#!python -m spacy download pt_core_news_md

Loading the English model

In [2]:
# Load the `en_core_web_sm` English pipeline; the package must already be
# installed (see the commented-out download command above).
nlp_en = spacy.load("en_core_web_sm")



Mapping of each part-of-speech tag to its description, taken from spaCy's documentation.

In [8]:
# Human-readable description for each coarse-grained part-of-speech tag,
# keyed by the tag string (the value read from `token.pos_`).
pos_desc = {
    "ADJ": "adjective",
    "ADP": "adposition",
    "ADV": "adverb",
    "AUX": "auxiliary",
    "CONJ": "conjunction",
    "CCONJ": "coordinating conjunction",
    "DET": "determiner",
    "INTJ": "interjection",
    "NOUN": "noun",
    "NUM": "numeral",
    "PART": "particle",
    "PRON": "pronoun",
    "PROPN": "proper noun",
    "PUNCT": "punctuation",
    "SCONJ": "subordinating conjunction",
    "SYM": "symbol",
    "VERB": "verb",
    "X": "other",
    "SPACE": "space",
}


| POS   | Description               | Examples                                      |
|:-----:|:-------------------------:|:---------------------------------------------:|
| ADJ   | adjective                 | big, old, green, incomprehensible, first      |
| ADP   | adposition                | in, to, during                                |
| ADV   | adverb                    | very, tomorrow, down, where, there            |
| AUX   | auxiliary                 | is, has (done), will (do), should (do)        |
| CONJ  | conjunction               | and, or, but                                  |
| CCONJ | coordinating conjunction  | and, or, but                                  |
| DET   | determiner                | a, an, the                                    |
| INTJ  | interjection              | psst, ouch, bravo, hello                      |
| NOUN  | noun                      | girl, cat, tree, air, beauty                  |
| NUM   | numeral                   | 1, 2017, one, seventy-seven, IV, MMXIV        |
| PART  | particle                  | ’s, not                                       |
| PRON  | pronoun                   | I, you, he, she, myself, themselves, somebody |
| PROPN | proper noun               | Mary, John, London, NATO, HBO                 |
| PUNCT | punctuation               | ., (, ), ?                                    |
| SCONJ | subordinating conjunction | if, while, that                               |
| SYM   | symbol                    | $, %, §, ©, +, −, ×, ÷, =, :), 😝             |
| VERB  | verb                      | run, runs, running, eat, ate, eating          |
| X     | other                     | sfpksdpsxmsa                                  |
| SPACE | space                     |                                               |


We'll only keep a few of the parts of speech to make the comparison easier.

In [24]:
# Coarse POS tags that are kept when building the output tables;
# tokens with any other tag are left out.
only_keeping_pos = [
    "ADJ",
    "NOUN",
    "PROPN",
    "VERB",
    "ADV",
]

In [25]:
def pos_tagger(doc):
    """Print a table of the lemma and POS tag of selected tokens in ``doc``.

    Only tokens whose ``pos_`` value appears in the module-level
    ``only_keeping_pos`` list are included. Each row holds the token's
    lemma (shown under the "Word" column, so inflected forms appear in
    their base form), its POS tag, and the matching description looked up
    in the module-level ``pos_desc`` mapping.

    Args:
        doc: An iterable of tokens exposing ``pos_`` and ``lemma_``
            attributes (here, the result of calling a spaCy pipeline).

    Returns:
        None. The table is written to standard output.
    """
    summary = PrettyTable(["Word", "POS", "POS Description"])

    # Filter lazily so only the tokens of interest reach the table.
    kept_tokens = (tok for tok in doc if tok.pos_ in only_keeping_pos)
    for tok in kept_tokens:
        tag = tok.pos_
        summary.add_row([tok.lemma_, tag, pos_desc[tag]])

    print(summary)

## **English**

In [26]:
# English sample text, processed with the English pipeline.
text_en = "Luciano's family Luciano is eight years old and has a family that he greatly admires."
doc_en = nlp_en(text_en)

# Print lemma / POS rows for the tags listed in only_keeping_pos.
pos_tagger(doc_en)

+---------+-------+-----------------+
|   Word  |  POS  | POS Description |
+---------+-------+-----------------+
| Luciano | PROPN |   proper noun   |
|  family |  NOUN |       noun      |
| Luciano | PROPN |   proper noun   |
|   year  |  NOUN |       noun      |
|   old   |  ADJ  |    adjective    |
|   have  |  VERB |       verb      |
|  family |  NOUN |       noun      |
| greatly |  ADV  |      adverb     |
|  admire |  VERB |       verb      |
+---------+-------+-----------------+


## **Portuguese**

In [27]:
# Load the `pt_core_news_md` Portuguese pipeline; the package must already be
# installed (see the commented-out download command near the top).
nlp_pt = spacy.load("pt_core_news_md")

In [28]:
# Portuguese sample text, processed with the Portuguese pipeline.
text_pt = "A família de Luciano Luciano tem oito anos e possui uma família que admira muito."
doc_pt = nlp_pt(text_pt)

# Print lemma / POS rows for the tags listed in only_keeping_pos.
pos_tagger(doc_pt)

+---------+-------+-----------------+
|   Word  |  POS  | POS Description |
+---------+-------+-----------------+
| família |  NOUN |       noun      |
| Luciano | PROPN |   proper noun   |
| Luciano | PROPN |   proper noun   |
|   ter   |  VERB |       verb      |
|   ano   |  NOUN |       noun      |
| possuir |  VERB |       verb      |
| família |  NOUN |       noun      |
| admirar |  VERB |       verb      |
+---------+-------+-----------------+
