In [1]:
from textblob import TextBlob

In [2]:
# Sample sentence reused by the tagging and noun-phrase cells below.
wiki = TextBlob(
    "Python is a high-level, general-purpose programming language"
)

In [3]:
# Part-of-speech tagging: `tags` gives one (token, tag) pair per word.
wiki.tags

[('Python', 'NNP'),
 ('is', 'VBZ'),
 ('a', 'DT'),
 ('high-level', 'JJ'),
 ('general-purpose', 'JJ'),
 ('programming', 'NN'),
 ('language', 'NN')]

In [4]:
# Noun-phrase extraction: the result is a WordList of phrases
# (returned lower-cased here: 'python').
wiki.noun_phrases

WordList(['python'])

#### Sentiment Analysis

In [5]:
# Short two-sentence review used as input for the sentiment cells.
testimonial = TextBlob(
    "Textblob is amazingly simple to use. What great fun!"
)

In [6]:
# Sentiment of the whole blob: a (polarity, subjectivity) pair of floats.
testimonial.sentiment

Sentiment(polarity=0.39166666666666666, subjectivity=0.4357142857142857)

In [7]:
# The individual fields are reachable by attribute; here only the polarity.
testimonial.sentiment.polarity

0.39166666666666666

#### Tokenization

In [8]:
# Three sentences built from adjacent string literals (joined into one text).
zen = TextBlob(
    "Beautiful is better than ugly. "
    "Explicit is better than implicit. "
    "Simple is better than complex."
)

In [9]:
# Word tokens as a WordList; the output shows sentence punctuation is dropped.
zen.words

WordList(['Beautiful', 'is', 'better', 'than', 'ugly', 'Explicit', 'is', 'better', 'than', 'implicit', 'Simple', 'is', 'better', 'than', 'complex'])

In [10]:
# Sentence tokens: a list of Sentence objects, one per sentence in the text.
zen.sentences

[Sentence("Beautiful is better than ugly."),
 Sentence("Explicit is better than implicit."),
 Sentence("Simple is better than complex.")]

In [11]:
# Each Sentence exposes its own sentiment, so score the sentences one by one.
for sentence in zen.sentences:
    print(sentence.sentiment)

Sentiment(polarity=0.2166666666666667, subjectivity=0.8333333333333334)
Sentiment(polarity=0.5, subjectivity=0.5)
Sentiment(polarity=0.06666666666666667, subjectivity=0.41904761904761906)


### Word Inflection and Lemmatization

In [13]:
# Input for the inflection examples; note this rebinds `sentence` to a TextBlob.
sentence = TextBlob(
    'Use 4 spaces per indentation level.'
)

In [14]:
# Tokenize into words; the numeral '4' is kept as a token.
sentence.words

WordList(['Use', '4', 'spaces', 'per', 'indentation', 'level'])

In [15]:
# Index 2 is 'spaces'; singularize() returns its singular form.
sentence.words[2].singularize()

'space'

In [16]:
# The last word is 'level'; pluralize() returns its plural form.
sentence.words[-1].pluralize()

'levels'

In [17]:
from textblob import Word
# lemmatize() with no argument maps the plural 'octopi' to its lemma.
w = Word('octopi')
w.lemmatize()

'octopus'

In [18]:
w=Word("Went")

In [19]:
w.lemmatize("v")

'Went'

#### WordNet Integration

In [20]:
from textblob import Word
from textblob.wordnet import VERB

In [21]:
# Word whose WordNet entries are inspected in the next cell.
word = Word("octopus")

In [22]:
# All WordNet synsets the word belongs to.
word.synsets

[Synset('octopus.n.01'), Synset('octopus.n.02')]

In [23]:
# Restrict the synset lookup to a single part of speech (verbs here).
Word("hack").get_synsets(pos=VERB)

[Synset('chop.v.05'),
 Synset('hack.v.02'),
 Synset('hack.v.03'),
 Synset('hack.v.04'),
 Synset('hack.v.05'),
 Synset('hack.v.06'),
 Synset('hack.v.07'),
 Synset('hack.v.08')]

In [24]:
# Definitions of the word, returned as a list of strings.
Word("octopus").definitions

['tentacles of octopus prepared as food',
 'bottom-living cephalopod having a soft oval body with eight long tentacles']

In [25]:
from textblob.wordnet import Synset
# Fetch two specific synsets by their WordNet identifiers ...
octopus = Synset('octopus.n.02')
shrimp = Synset('shrimp.n.03')
# ... and compare them; path_similarity() yields a float score.
octopus.path_similarity(shrimp)

0.1111111111111111

#### WordLists

In [26]:
# Three space-separated nouns used to demonstrate WordList behaviour.
animals = TextBlob("cat dog octopus")

In [27]:
# The blob's words come back as a WordList.
animals.words

WordList(['cat', 'dog', 'octopus'])

In [28]:
# Calling pluralize() on the WordList pluralizes every word at once.
animals.words.pluralize()

WordList(['cats', 'dogs', 'octopodes'])

#### Spelling Correction

In [29]:
# Deliberately misspelled input; correct() produces the fixed text, which is
# printed as plain text.
b = TextBlob("I havv goood speling")
print(b.correct())

I have good spelling


In [30]:
from textblob import Word
# spellcheck() on a single word lists (suggestion, score) pairs.
w = Word('falibility')
w.spellcheck()

[('fallibility', 1.0)]

#### Get Word and Noun Phrase Frequencies

In [31]:
# Two adjacent string literals are joined into a single two-sentence text.
monty = TextBlob(
    "We are no longer the Knights who say Ni. "
    "We are now the Knights who say Ekki ekki ekki PTANG."
)

In [32]:
# Frequency lookup by word. The text contains "Ekki ekki ekki" and the result
# is 3, so this lookup does not distinguish case.
monty.word_counts['ekki']

3

In [33]:
# The same frequency obtained through WordList.count(); it also reports 3 here.
monty.words.count('ekki')

3

#### Translation and Language Detection

In [34]:
# English source text for the translation cell that follows.
en_blob = TextBlob(u'Simple is better than complex.')

In [35]:
# Translate the blob to Spanish ('es'); the result is a new TextBlob.
# NOTE(review): translate() appears to depend on an online translation
# service and has been deprecated/removed in recent TextBlob releases —
# confirm this cell still runs against the installed version.
en_blob.translate(to='es')

TextBlob("Simple es mejor que complejo.")

### Parsing

In [36]:
# Sample sentence for the parser demo (rebinds `b` from the spelling cell).
b = TextBlob("And now for something completely different.")

In [37]:
# parse() output is printed as space-separated tokens, each carrying
# slash-separated annotations (e.g. "And/CC/O/O").
# NOTE(review): the fields look like word/POS/chunk/PNP tags — confirm
# against the parser documentation.
print(b.parse())

And/CC/O/O now/RB/B-ADVP/O for/IN/B-PP/B-PNP something/NN/B-NP/I-PNP completely/RB/B-ADJP/O different/JJ/I-ADJP/O ././O/O


In [38]:
# TextBlobs can be sliced like strings; the slice is itself a TextBlob.
zen[0:19]

TextBlob("Beautiful is better")

In [39]:
# String-style methods such as upper() also return a TextBlob.
zen.upper()

TextBlob("BEAUTIFUL IS BETTER THAN UGLY. EXPLICIT IS BETTER THAN IMPLICIT. SIMPLE IS BETTER THAN COMPLEX.")

In [40]:
# Character offset at which 'Simple' starts in the text (65 here).
zen.find('Simple')

65

#### n-grams

In [41]:
# Short sentence used for the n-gram example.
blob = TextBlob("Now is better than never.")

In [42]:
# Every run of n=3 consecutive words, each returned as a WordList.
blob.ngrams(n=3)

[WordList(['Now', 'is', 'better']),
 WordList(['is', 'better', 'than']),
 WordList(['better', 'than', 'never'])]

In [43]:
# Printing a Sentence shows its raw text, one sentence per line.
for s in zen.sentences:
    print(s)

Beautiful is better than ugly.
Explicit is better than implicit.
Simple is better than complex.
