In [None]:
import nltk
nltk.download('punkt')
nltk.download('wordnet')
nltk.download('averaged_perceptron_tagger')
nltk.download('maxent_ne_chunker')
nltk.download('words')
nltk.download('stopwords')


In [3]:
from nltk.tokenize import word_tokenize, sent_tokenize

text = "NLTK is a leading platform for building Python programs to work with human language data."
word_tokens = word_tokenize(text)
sent_tokens = sent_tokenize(text)

print(word_tokens)
print(sent_tokens)


['NLTK', 'is', 'a', 'leading', 'platform', 'for', 'building', 'Python', 'programs', 'to', 'work', 'with', 'human', 'language', 'data', '.']
['NLTK is a leading platform for building Python programs to work with human language data.']


In [4]:
from nltk.stem import PorterStemmer

stemmer = PorterStemmer()
words = ["running", "jumps", "easily", "fairly"]
stemmed_words = [stemmer.stem(word) for word in words]

print(stemmed_words)


['run', 'jump', 'easili', 'fairli']


In [5]:
from nltk.stem import WordNetLemmatizer

lemmatizer = WordNetLemmatizer()
words = ["running", "jumps", "easily", "fairly"]
lemmatized_words = [lemmatizer.lemmatize(word) for word in words]

print(lemmatized_words)


['running', 'jump', 'easily', 'fairly']


In [6]:
from nltk import pos_tag

words = word_tokenize("NLTK is a leading platform for building Python programs to work with human language data.")
pos_tags = pos_tag(words)

print(pos_tags)


[('NLTK', 'NNP'), ('is', 'VBZ'), ('a', 'DT'), ('leading', 'VBG'), ('platform', 'NN'), ('for', 'IN'), ('building', 'VBG'), ('Python', 'NNP'), ('programs', 'NNS'), ('to', 'TO'), ('work', 'VB'), ('with', 'IN'), ('human', 'JJ'), ('language', 'NN'), ('data', 'NNS'), ('.', '.')]


In [7]:
from nltk import ne_chunk

ne_tree = ne_chunk(pos_tags)
print(ne_tree)


(S
  (ORGANIZATION NLTK/NNP)
  is/VBZ
  a/DT
  leading/VBG
  platform/NN
  for/IN
  building/VBG
  (PERSON Python/NNP)
  programs/NNS
  to/TO
  work/VB
  with/IN
  human/JJ
  language/NN
  data/NNS
  ./.)


In [9]:
from nltk.sentiment.vader import SentimentIntensityAnalyzer

sid = SentimentIntensityAnalyzer()
text = "NLTK is a great tool for working with language data!"
sentiment_scores = sid.polarity_scores(text)

print(sentiment_scores)


LookupError: 
**********************************************************************
  Resource [93mvader_lexicon[0m not found.
  Please use the NLTK Downloader to obtain the resource:

  [31m>>> import nltk
  >>> nltk.download('vader_lexicon')
  [0m
  For more information see: https://www.nltk.org/data.html

  Attempted to load [93msentiment/vader_lexicon.zip/vader_lexicon/vader_lexicon.txt[0m

  Searched in:
    - '/teamspace/studios/this_studio/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/share/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/lib/nltk_data'
    - '/usr/share/nltk_data'
    - '/usr/local/share/nltk_data'
    - '/usr/lib/nltk_data'
    - '/usr/local/lib/nltk_data'
    - ''
**********************************************************************


In [8]:
from nltk.classify import NaiveBayesClassifier
from nltk.corpus import movie_reviews

# Load the dataset
documents = [(list(movie_reviews.words(fileid)), category)
             for category in movie_reviews.categories()
             for fileid in movie_reviews.fileids(category)]

# Feature extraction
def document_features(document):
    words = set(document)
    features = {}
    for word in movie_reviews.words():
        features[word] = (word in words)
    return features

# Training the classifier
featuresets = [(document_features(d), c) for (d, c) in documents]
train_set, test_set = featuresets[100:], featuresets[:100]
classifier = NaiveBayesClassifier.train(train_set)

# Testing the classifier
print(nltk.classify.accuracy(classifier, test_set))


LookupError: 
**********************************************************************
  Resource [93mmovie_reviews[0m not found.
  Please use the NLTK Downloader to obtain the resource:

  [31m>>> import nltk
  >>> nltk.download('movie_reviews')
  [0m
  For more information see: https://www.nltk.org/data.html

  Attempted to load [93mcorpora/movie_reviews[0m

  Searched in:
    - '/teamspace/studios/this_studio/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/share/nltk_data'
    - '/home/zeus/miniconda3/envs/cloudspace/lib/nltk_data'
    - '/usr/share/nltk_data'
    - '/usr/local/share/nltk_data'
    - '/usr/lib/nltk_data'
    - '/usr/local/lib/nltk_data'
**********************************************************************
