# Tutorial 1: NLP Base Types

In [1]:
# import des Flair Packages
from flair.data import Sentence 
from flair.models import SequenceTagger

## Creating a Sentence

In [2]:
# A Sentence object holds a sentence that we may want to embed or tag.
# Sentence is already imported in the first cell, so it is not imported again here.

# Make a sentence object by passing a whitespace-tokenized string
sentence = Sentence('The grass is green .')

# Print the object to see what's in there
print(sentence)

Sentence: "The grass is green ." - 5 Tokens


In [3]:
# look up a token by its token id (ids start at 1, so id 3 is "is")
print(sentence.get_token(3))
# index the sentence directly (0-based, so index 3 is the fourth token, "green")
print(sentence[3])

Token: 3 is
Token: 4 green


In [4]:
# iterating over a sentence yields its tokens in order
for token in sentence:
    print(token)

Token: 1 The
Token: 2 grass
Token: 3 is
Token: 4 green
Token: 5 .


## Tokenization

In [5]:
# Make a sentence object from an untokenized string; the 'use_tokenizer' flag has it split into tokens
sentence = Sentence('The grass is green.', use_tokenizer=True)

# Print the object to see what's in there (the trailing period is now a token of its own)
print(sentence)

Sentence: "The grass is green ." - 5 Tokens


## Adding Tags to Tokens

In [6]:
# add a tag of type 'ner' with value 'color' to the fourth token ("green")
sentence[3].add_tag('ner', 'color')

# print the sentence with its tags rendered inline after the tagged tokens
print(sentence.to_tagged_string())

The grass is green <color> .


In [7]:
# Label is used for the type annotation below
from flair.data import Label

# fetch the 'ner' tag of the fourth token; it carries the tag value and a confidence score
tag: Label = sentence[3].get_tag('ner')

print(f'"{sentence[3]}" is tagged as "{tag.value}" with confidence score "{tag.score}"')

"Token: 4 green" is tagged as "color" with confidence score "1.0"


## Adding Labels to Sentences

In [8]:
# create a sentence that class labels can be attached to
sentence = Sentence('France is the current world cup winner.')

# add a label to a sentence
sentence.add_label('sports')

# a sentence can also belong to multiple classes
sentence.add_labels(['sports', 'world cup'])

# you can also set the labels while initializing the sentence
sentence = Sentence('France is the current world cup winner.', labels=['sports', 'world cup'])

In [9]:
# create a sentence that carries two class labels
sentence = Sentence('France is the current world cup winner.', labels=['sports', 'world cup'])

# print the sentence, then each of its labels (shown together with its score)
print(sentence)
for label in sentence.labels:
    print(label)

Sentence: "France is the current world cup winner." - 7 Tokens
sports (1.0)
world cup (1.0)


# Tutorial 2: Tagging your text

In [10]:
# Load the 'ner' sequence tagging model.
# SequenceTagger is already imported in the first cell, so it is not imported again here.
tagger = SequenceTagger.load('ner')

In [14]:
# whitespace-tokenized English example sentence
sentence = Sentence('George Washington went to New York .')

# predict NER tags
tagger.predict(sentence)

# print sentence with predicted tags
print(sentence.to_tagged_string())

George <B-PER> Washington <E-PER> went to New <B-LOC> York <E-LOC> .


### Relevant für Ausgabe der erkannten Tokens für den späteren Austausch

In [12]:
# print every 'ner' span of the sentence (label, token ids and covered text)
# NOTE(review): the recorded output below lists "Washington" as the LOC span, which does not
# match the "New York" sentence tagged above; presumably stale from an earlier run, re-run to refresh.
for entity in sentence.get_spans('ner'):
    print(entity)

PER-span [1,2]: "George Washington"
LOC-span [5]: "Washington"


Jede Spanne hat ihren eigenen Text, der sich so ausgeben lässt:

In [13]:
# dump the sentence as a dict: text, labels and the 'ner' entities with positions and confidence
# NOTE(review): the recorded output below still shows "... went to Washington ."; presumably from an earlier run.
print(sentence.to_dict(tag_type='ner'))

{'text': 'George Washington went to Washington .', 'labels': [], 'entities': [{'text': 'George Washington', 'start_pos': 0, 'end_pos': 17, 'type': 'PER', 'confidence': 0.999882847070694}, {'text': 'Washington', 'start_pos': 26, 'end_pos': 36, 'type': 'LOC', 'confidence': 0.9993128776550293}]}


Dies gibt zusätzlich den Text, die gefundenen Entities, die Labels und einen Confidence Score aus, der aussagt, wie sicher sich der Tagger bei diesem Tag ist.

## Deutsche Sätze taggen

In [17]:
# load the German NER model
tagger = SequenceTagger.load('de-ner')

# make German sentence; this is the text that produced the recorded output below
# and it is the same sentence the PoS example uses
sentence = Sentence('George Washington ging nach Washington .')

# predict NER tags
tagger.predict(sentence)

# print sentence with predicted tags
print(sentence.to_tagged_string())

George <B-PER> Washington <E-PER> ging nach Washington <S-LOC> .


# Wichtig für uns - PoS Tagging!
Dafür laden wir das deutsche PoS Model: 'de-pos'

In [18]:
# load the German part-of-speech model
tagger = SequenceTagger.load('de-pos')

# make German sentence
sentence = Sentence('George Washington ging nach Washington .')

# predict PoS tags
tagger.predict(sentence)

# print sentence with predicted tags
print(sentence.to_tagged_string())

George <PROPN> Washington <PROPN> ging <VERB> nach <ADP> Washington <PROPN> . <PUNCT>



    ADJ: adjective
    ADP: adposition
    ADV: adverb
    AUX: auxiliary
    CCONJ: coordinating conjunction
    DET: determiner
    INTJ: interjection
    NOUN: noun
    NUM: numeral
    PART: particle
    PRON: pronoun
    PROPN: proper noun
    PUNCT: punctuation
    SCONJ: subordinating conjunction
    SYM: symbol
    VERB: verb
    X: other


## Eine Liste an Texten taggen
Dafür benutzen wir den sentence splitter von segtok

In [19]:
# your text of many sentences
text = "Das ist ein Satz. Das ist ein weiterer Satz. Ich liebe Leipzig."

# use segtok to split the text into sentences and wrap each one in a tokenized Sentence
from segtok.segmenter import split_single
sentences = [Sentence(sent, use_tokenizer=True) for sent in split_single(text)]

# predict tags for the whole list of sentences with the 'de-ner' model
tagger: SequenceTagger = SequenceTagger.load('de-ner')
tagger.predict(sentences)

[Sentence: "Das ist ein Satz ." - 5 Tokens,
 Sentence: "Das ist ein weiterer Satz ." - 6 Tokens,
 Sentence: "Ich liebe Leipzig ." - 4 Tokens]

## Tagging with Pre-Trained Text Classification Models

In [20]:
from flair.models import TextClassifier

# load the 'en-Sentiment' text classification model
classifier = TextClassifier.load('en-Sentiment')

In [21]:
# example review text to classify
sentence = Sentence('This film hurts. It is so bad that I am confused.')

# predict the sentence-level label with the text classifier
classifier.predict(sentence)

# print sentence with predicted labels
print(sentence.labels)

[NEGATIVE (1.0)]


# Tutorial 3: Word Embeddings

In [34]:
from flair.embeddings import WordEmbeddings

# init GloVe word embeddings (per the log below, the files are downloaded into the local flair cache if missing)
glove_embedding = WordEmbeddings('glove')

2019-01-11 15:32:45,044 https://s3.eu-central-1.amazonaws.com/alan-nlp/resources/embeddings/glove.gensim.vectors.npy not found in cache, downloading to /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpi0wcewdf



  0%|          | 0/160000128 [00:00<?, ?B/s][A
  0%|          | 53248/160000128 [00:00<06:23, 417146.78B/s][A
  0%|          | 105472/160000128 [00:00<06:00, 443613.32B/s][A
  0%|          | 157696/160000128 [00:00<05:52, 452856.11B/s][A
  0%|          | 209920/160000128 [00:00<05:38, 471563.22B/s][A
  0%|          | 262144/160000128 [00:00<05:38, 472521.39B/s][A
  0%|          | 314368/160000128 [00:00<05:29, 484284.87B/s][A
  0%|          | 366592/160000128 [00:00<05:26, 489126.79B/s][A
  0%|          | 418816/160000128 [00:00<05:24, 492211.88B/s][A
  0%|          | 471040/160000128 [00:00<05:27, 487520.50B/s][A
  0%|          | 523264/160000128 [00:01<05:31, 481082.83B/s][A
  0%|          | 592896/160000128 [00:01<05:24, 491676.59B/s][A
  0%|          | 645120/160000128 [00:01<05:21, 495113.98B/s][A
  0%|          | 697344/160000128 [00:01<05:23, 492279.85B/s][A
  0%|          | 749568/160000128 [00:01<05:20, 497273.72B/s][A
  1%|          | 801792/160000128 [00:01<0

  9%|▉         | 14271488/160000128 [00:28<04:49, 503587.79B/s][A
  9%|▉         | 14322688/160000128 [00:28<04:49, 502700.05B/s][A
  9%|▉         | 14373888/160000128 [00:28<04:54, 493864.68B/s][A
  9%|▉         | 14424064/160000128 [00:29<05:02, 481798.70B/s][A
  9%|▉         | 14473216/160000128 [00:29<05:01, 483108.26B/s][A
  9%|▉         | 14522368/160000128 [00:29<05:07, 473462.04B/s][A
  9%|▉         | 14574592/160000128 [00:29<04:58, 487102.78B/s][A
  9%|▉         | 14623744/160000128 [00:29<05:06, 474516.20B/s][A
  9%|▉         | 14686208/160000128 [00:29<04:44, 511367.50B/s][A
  9%|▉         | 14738432/160000128 [00:30<09:51, 245539.11B/s][A
  9%|▉         | 14954496/160000128 [00:30<07:14, 333555.24B/s][A
  9%|▉         | 15043584/160000128 [00:30<06:28, 372816.98B/s][A
  9%|▉         | 15121408/160000128 [00:30<05:56, 406624.63B/s][A
  9%|▉         | 15192064/160000128 [00:30<05:34, 433141.83B/s][A
 10%|▉         | 15256576/160000128 [00:30<05:28, 440388.54B/s

 18%|█▊        | 28062720/160000128 [00:59<04:37, 475381.10B/s][A
 18%|█▊        | 28115968/160000128 [00:59<04:28, 491128.25B/s][A
 18%|█▊        | 28167168/160000128 [00:59<04:33, 482794.85B/s][A
 18%|█▊        | 28219392/160000128 [01:00<09:29, 231380.47B/s][A
 18%|█▊        | 28319744/160000128 [01:00<07:17, 300815.18B/s][A
 18%|█▊        | 28526592/160000128 [01:00<05:25, 403674.73B/s][A
 18%|█▊        | 28626944/160000128 [01:00<05:08, 425472.37B/s][A
 18%|█▊        | 28711936/160000128 [01:00<04:59, 438940.06B/s][A
 18%|█▊        | 28785664/160000128 [01:00<04:44, 461038.98B/s][A
 18%|█▊        | 28853248/160000128 [01:01<04:40, 467693.70B/s][A
 18%|█▊        | 28914688/160000128 [01:01<04:24, 495877.14B/s][A
 18%|█▊        | 28975104/160000128 [01:01<04:33, 479832.27B/s][A
 18%|█▊        | 29031424/160000128 [01:01<04:22, 498490.66B/s][A
 18%|█▊        | 29087744/160000128 [01:01<04:24, 495127.89B/s][A
 18%|█▊        | 29142016/160000128 [01:01<04:46, 457236.32B/s

 27%|██▋       | 42459136/160000128 [01:28<03:57, 494256.62B/s][A
 27%|██▋       | 42511360/160000128 [01:28<04:00, 488928.44B/s][A
 27%|██▋       | 42563584/160000128 [01:28<03:55, 498020.38B/s][A
 27%|██▋       | 42615808/160000128 [01:29<04:00, 488894.06B/s][A
 27%|██▋       | 42685440/160000128 [01:29<03:56, 496571.90B/s][A
 27%|██▋       | 42737664/160000128 [01:29<04:02, 483132.06B/s][A
 27%|██▋       | 42807296/160000128 [01:29<03:54, 499312.31B/s][A
 27%|██▋       | 42859520/160000128 [01:29<03:58, 491598.96B/s][A
 27%|██▋       | 42911744/160000128 [01:29<04:00, 486429.64B/s][A
 27%|██▋       | 42969088/160000128 [01:29<03:49, 509604.82B/s][A
 27%|██▋       | 43021312/160000128 [01:29<03:54, 498213.51B/s][A
 27%|██▋       | 43071488/160000128 [01:29<03:55, 497371.78B/s][A
 27%|██▋       | 43121664/160000128 [01:30<04:00, 486510.08B/s][A
 27%|██▋       | 43172864/160000128 [01:30<03:56, 493837.94B/s][A
 27%|██▋       | 43225088/160000128 [01:30<03:59, 488222.04B/s

 35%|███▌      | 56698880/160000128 [01:57<03:45, 457342.04B/s][A
 35%|███▌      | 56751104/160000128 [01:57<03:37, 474372.43B/s][A
 36%|███▌      | 56803328/160000128 [01:57<03:37, 475560.40B/s][A
 36%|███▌      | 56855552/160000128 [01:57<03:31, 486558.16B/s][A
 36%|███▌      | 56907776/160000128 [01:58<03:32, 484655.69B/s][A
 36%|███▌      | 56960000/160000128 [01:58<03:28, 495141.96B/s][A
 36%|███▌      | 57012224/160000128 [01:58<03:30, 489474.17B/s][A
 36%|███▌      | 57064448/160000128 [01:58<03:32, 484171.67B/s][A
 36%|███▌      | 57120768/160000128 [01:58<03:23, 505335.03B/s][A
 36%|███▌      | 57171968/160000128 [01:58<03:28, 492810.51B/s][A
 36%|███▌      | 57223168/160000128 [01:58<03:26, 498404.33B/s][A
 36%|███▌      | 57273344/160000128 [01:58<03:31, 485563.29B/s][A
 36%|███▌      | 57329664/160000128 [01:58<03:22, 506471.58B/s][A
 36%|███▌      | 57380864/160000128 [01:59<03:29, 490724.75B/s][A
 36%|███▌      | 57447424/160000128 [01:59<03:30, 487717.46B/s

 44%|████▍     | 71130112/160000128 [02:27<03:15, 454122.43B/s][A
 45%|████▍     | 71234560/160000128 [02:27<03:03, 484821.45B/s][A
 45%|████▍     | 71339008/160000128 [02:27<02:43, 542795.04B/s][A
 45%|████▍     | 71397376/160000128 [02:28<05:33, 265862.94B/s][A
 45%|████▍     | 71634944/160000128 [02:28<04:05, 359305.54B/s][A
 45%|████▍     | 71726080/160000128 [02:28<03:44, 393061.91B/s][A
 45%|████▍     | 71804928/160000128 [02:28<03:31, 416994.41B/s][A
 45%|████▍     | 71874560/160000128 [02:29<03:24, 431836.95B/s][A
 45%|████▍     | 71938048/160000128 [02:29<03:20, 438230.48B/s][A
 45%|████▍     | 71999488/160000128 [02:29<03:07, 469390.31B/s][A
 45%|████▌     | 72056832/160000128 [02:29<03:10, 461483.70B/s][A
 45%|████▌     | 72111104/160000128 [02:29<03:07, 468470.51B/s][A
 45%|████▌     | 72169472/160000128 [02:29<02:56, 497952.21B/s][A
 45%|████▌     | 72223744/160000128 [02:29<02:56, 498095.31B/s][A
 45%|████▌     | 72276992/160000128 [02:29<02:58, 492563.56B/s

 53%|█████▎    | 84969472/160000128 [03:00<02:33, 488878.12B/s][A
 53%|█████▎    | 85021696/160000128 [03:00<02:31, 495035.96B/s][A
 53%|█████▎    | 85073920/160000128 [03:00<02:32, 491655.76B/s][A
 53%|█████▎    | 85126144/160000128 [03:00<02:33, 486483.80B/s][A
 53%|█████▎    | 85178368/160000128 [03:00<02:31, 495281.30B/s][A
 53%|█████▎    | 85230592/160000128 [03:00<02:32, 490539.11B/s][A
 53%|█████▎    | 85292032/160000128 [03:00<02:23, 522095.01B/s][A
 53%|█████▎    | 85345280/160000128 [03:00<02:26, 509756.52B/s][A
 53%|█████▎    | 85403648/160000128 [03:00<02:24, 516589.97B/s][A
 53%|█████▎    | 85455872/160000128 [03:01<02:24, 516125.40B/s][A
 53%|█████▎    | 85508096/160000128 [03:01<02:24, 515928.98B/s][A
 53%|█████▎    | 85560320/160000128 [03:01<02:27, 504665.34B/s][A
 54%|█████▎    | 85611520/160000128 [03:01<02:27, 504102.49B/s][A
 54%|█████▎    | 85662720/160000128 [03:01<02:28, 499389.04B/s][A
 54%|█████▎    | 85712896/160000128 [03:01<02:34, 482081.25B/s

 61%|██████    | 97815552/160000128 [03:33<01:57, 531320.40B/s][A
 61%|██████    | 97870848/160000128 [03:33<02:08, 481974.91B/s][A
 61%|██████    | 97921024/160000128 [03:33<02:11, 472244.78B/s][A
 61%|██████    | 97989632/160000128 [03:34<02:01, 511029.17B/s][A
 61%|██████▏   | 98042880/160000128 [03:34<02:10, 475587.45B/s][A
 61%|██████▏   | 98095104/160000128 [03:34<02:10, 475360.88B/s][A
 61%|██████▏   | 98147328/160000128 [03:34<02:10, 475612.55B/s][A
 61%|██████▏   | 98199552/160000128 [03:34<02:06, 488141.95B/s][A
 61%|██████▏   | 98251776/160000128 [03:34<02:07, 484460.88B/s][A
 61%|██████▏   | 98304000/160000128 [03:34<02:04, 494906.67B/s][A
 61%|██████▏   | 98356224/160000128 [03:34<02:06, 486356.95B/s][A
 62%|██████▏   | 98425856/160000128 [03:34<02:05, 491414.51B/s][A
 62%|██████▏   | 98482176/160000128 [03:35<02:00, 510944.15B/s][A
 62%|██████▏   | 98534400/160000128 [03:35<02:03, 497036.31B/s][A
 62%|██████▏   | 98598912/160000128 [03:35<01:57, 522940.57B/s

 70%|██████▉   | 111735808/160000128 [04:03<03:07, 257736.25B/s][A
 70%|██████▉   | 111767552/160000128 [04:03<03:12, 250659.15B/s][A
 70%|██████▉   | 111797248/160000128 [04:03<03:10, 253116.90B/s][A
 70%|██████▉   | 111847424/160000128 [04:04<03:06, 257547.53B/s][A
 70%|██████▉   | 111875072/160000128 [04:04<03:11, 251208.39B/s][A
 70%|██████▉   | 111901696/160000128 [04:04<03:33, 225635.69B/s][A
 70%|██████▉   | 111934464/160000128 [04:04<03:27, 231722.28B/s][A
 70%|██████▉   | 111969280/160000128 [04:04<03:33, 225005.65B/s][A
 70%|███████   | 112021504/160000128 [04:04<03:00, 265926.61B/s][A
 70%|███████   | 112073728/160000128 [04:04<02:38, 301766.07B/s][A
 70%|███████   | 112125952/160000128 [04:05<02:18, 344696.89B/s][A
 70%|███████   | 112178176/160000128 [04:05<02:04, 383644.41B/s][A
 70%|███████   | 112230400/160000128 [04:05<01:57, 407139.47B/s][A
 70%|███████   | 112282624/160000128 [04:05<01:49, 435621.44B/s][A
 70%|███████   | 112334848/160000128 [04:05<01:4

 78%|███████▊  | 125234176/160000128 [04:31<01:10, 492993.94B/s][A
 78%|███████▊  | 125286400/160000128 [04:32<01:09, 501180.94B/s][A
 78%|███████▊  | 125338624/160000128 [04:32<01:10, 492597.75B/s][A
 78%|███████▊  | 125390848/160000128 [04:32<01:09, 498309.52B/s][A
 78%|███████▊  | 125443072/160000128 [04:32<01:09, 493826.00B/s][A
 78%|███████▊  | 125495296/160000128 [04:32<01:10, 487814.30B/s][A
 78%|███████▊  | 125547520/160000128 [04:32<01:09, 497082.72B/s][A
 78%|███████▊  | 125599744/160000128 [04:32<01:10, 488330.07B/s][A
 79%|███████▊  | 125669376/160000128 [04:32<01:09, 493088.74B/s][A
 79%|███████▊  | 125722624/160000128 [04:32<01:07, 504260.26B/s][A
 79%|███████▊  | 125773824/160000128 [04:33<01:09, 491647.03B/s][A
 79%|███████▊  | 125826048/160000128 [04:33<01:08, 500191.71B/s][A
 79%|███████▊  | 125878272/160000128 [04:33<01:09, 492985.94B/s][A
 79%|███████▊  | 125930496/160000128 [04:33<01:08, 500939.96B/s][A
 79%|███████▊  | 125982720/160000128 [04:33<01:0

 87%|████████▋ | 138883072/160000128 [05:01<00:42, 498236.78B/s][A
 87%|████████▋ | 138934272/160000128 [05:01<00:43, 488051.51B/s][A
 87%|████████▋ | 138986496/160000128 [05:01<00:42, 497517.03B/s][A
 87%|████████▋ | 139038720/160000128 [05:01<00:42, 490704.05B/s][A
 87%|████████▋ | 139090944/160000128 [05:01<00:41, 499709.11B/s][A
 87%|████████▋ | 139143168/160000128 [05:01<00:42, 492158.58B/s][A
 87%|████████▋ | 139195392/160000128 [05:01<00:41, 500583.86B/s][A
 87%|████████▋ | 139247616/160000128 [05:01<00:42, 490234.15B/s][A
 87%|████████▋ | 139299840/160000128 [05:01<00:42, 487673.84B/s][A
 87%|████████▋ | 139356160/160000128 [05:02<00:40, 508096.40B/s][A
 87%|████████▋ | 139411456/160000128 [05:02<00:39, 520763.04B/s][A
 87%|████████▋ | 139464704/160000128 [05:02<00:40, 508954.29B/s][A
 87%|████████▋ | 139515904/160000128 [05:02<00:40, 509808.05B/s][A
 87%|████████▋ | 139567104/160000128 [05:02<00:41, 495823.62B/s][A
 87%|████████▋ | 139617280/160000128 [05:02<00:4

 96%|█████████▌| 152825856/160000128 [05:29<00:14, 489619.09B/s][A
 96%|█████████▌| 152885248/160000128 [05:29<00:13, 516820.43B/s][A
 96%|█████████▌| 152938496/160000128 [05:29<00:13, 505948.17B/s][A
 96%|█████████▌| 152989696/160000128 [05:29<00:14, 493123.41B/s][A
 96%|█████████▌| 153039872/160000128 [05:29<00:14, 493379.82B/s][A
 96%|█████████▌| 153090048/160000128 [05:29<00:14, 484252.47B/s][A
 96%|█████████▌| 153139200/160000128 [05:29<00:14, 486366.82B/s][A
 96%|█████████▌| 153191424/160000128 [05:30<00:14, 482782.83B/s][A
 96%|█████████▌| 153243648/160000128 [05:30<00:13, 493922.08B/s][A
 96%|█████████▌| 153295872/160000128 [05:30<00:13, 488112.81B/s][A
 96%|█████████▌| 153349120/160000128 [05:30<00:13, 500543.74B/s][A
 96%|█████████▌| 153400320/160000128 [05:30<00:13, 487595.47B/s][A
 96%|█████████▌| 153468928/160000128 [05:30<00:12, 523499.71B/s][A
 96%|█████████▌| 153522176/160000128 [05:30<00:13, 470688.28B/s][A
 96%|█████████▌| 153574400/160000128 [05:30<00:1

2019-01-11 15:38:31,999 copying /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpi0wcewdf to cache at /Users/Nils/.flair/embeddings/glove.gensim.vectors.npy
2019-01-11 15:38:32,441 removing temp file /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpi0wcewdf
2019-01-11 15:38:32,572 https://s3.eu-central-1.amazonaws.com/alan-nlp/resources/embeddings/glove.gensim not found in cache, downloading to /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpncl1ua9l



  0%|          | 0/21494764 [00:00<?, ?B/s][A
  0%|          | 52224/21494764 [00:00<00:51, 419194.41B/s][A
  0%|          | 87040/21494764 [00:00<00:54, 394895.41B/s][A
  1%|          | 140288/21494764 [00:00<00:49, 428019.06B/s][A
  1%|          | 191488/21494764 [00:00<00:48, 438501.70B/s][A
  1%|          | 260096/21494764 [00:00<00:44, 480866.94B/s][A
  1%|▏         | 312320/21494764 [00:00<00:43, 490597.04B/s][A
  2%|▏         | 365568/21494764 [00:00<00:46, 455361.96B/s][A
  2%|▏         | 417792/21494764 [00:00<00:44, 471470.58B/s][A
  2%|▏         | 470016/21494764 [00:00<00:44, 472439.45B/s][A
  2%|▏         | 530432/21494764 [00:01<00:41, 505495.02B/s][A
  3%|▎         | 581632/21494764 [00:01<00:42, 492702.59B/s][A
  3%|▎         | 631808/21494764 [00:01<00:42, 494622.24B/s][A
  3%|▎         | 681984/21494764 [00:01<00:43, 483915.10B/s][A
  3%|▎         | 731136/21494764 [00:01<00:42, 483192.35B/s][A
  4%|▎         | 783360/21494764 [00:01<00:42, 482912.51B/

 68%|██████▊   | 14570496/21494764 [00:30<00:16, 420037.32B/s][A
 68%|██████▊   | 14645248/21494764 [00:30<00:15, 448470.39B/s][A
 68%|██████▊   | 14713856/21494764 [00:30<00:15, 442505.75B/s][A
 69%|██████▊   | 14774272/21494764 [00:30<00:14, 469567.64B/s][A
 69%|██████▉   | 14833664/21494764 [00:30<00:14, 455342.12B/s][A
 69%|██████▉   | 14891008/21494764 [00:30<00:13, 485302.99B/s][A
 70%|██████▉   | 14946304/21494764 [00:30<00:13, 490386.59B/s][A
 70%|██████▉   | 15000576/21494764 [00:31<00:12, 504810.65B/s][A
 70%|███████   | 15054848/21494764 [00:31<00:12, 501922.19B/s][A
 70%|███████   | 15108096/21494764 [00:31<00:12, 509714.54B/s][A
 71%|███████   | 15161344/21494764 [00:31<00:13, 478055.66B/s][A
 71%|███████   | 15211520/21494764 [00:31<00:12, 484590.22B/s][A
 71%|███████   | 15261696/21494764 [00:31<00:13, 472780.96B/s][A
 71%|███████   | 15309824/21494764 [00:31<00:13, 461671.64B/s][A
 71%|███████▏  | 15356928/21494764 [00:31<00:13, 451887.24B/s][A
 72%|█████

2019-01-11 15:39:17,071 copying /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpncl1ua9l to cache at /Users/Nils/.flair/embeddings/glove.gensim
2019-01-11 15:39:17,127 removing temp file /var/folders/_1/sr6gl6wj7g9_111_kbc1d_fr0000gn/T/tmpncl1ua9l


In [35]:
# build the example sentence
sentence = Sentence('The grass is green .')

# let the GloVe embedding attach a vector to every token of the sentence
glove_embedding.embed(sentence)

# show each token, followed on the next line by its embedding vector
for token in sentence:
    print(token, token.embedding, sep='\n')

Token: 1 The
tensor([-0.0382, -0.2449,  0.7281, -0.3996,  0.0832,  0.0440, -0.3914,  0.3344,
        -0.5755,  0.0875,  0.2879, -0.0673,  0.3091, -0.2638, -0.1323, -0.2076,
         0.3340, -0.3385, -0.3174, -0.4834,  0.1464, -0.3730,  0.3458,  0.0520,
         0.4495, -0.4697,  0.0263, -0.5415, -0.1552, -0.1411, -0.0397,  0.2828,
         0.1439,  0.2346, -0.3102,  0.0862,  0.2040,  0.5262,  0.1716, -0.0824,
        -0.7179, -0.4153,  0.2033, -0.1276,  0.4137,  0.5519,  0.5791, -0.3348,
        -0.3656, -0.5486, -0.0629,  0.2658,  0.3020,  0.9977, -0.8048, -3.0243,
         0.0125, -0.3694,  2.2167,  0.7220, -0.2498,  0.9214,  0.0345,  0.4674,
         1.1079, -0.1936, -0.0746,  0.2335, -0.0521, -0.2204,  0.0572, -0.1581,
        -0.3080, -0.4162,  0.3797,  0.1501, -0.5321, -0.2055, -1.2526,  0.0716,
         0.7056,  0.4974, -0.4206,  0.2615, -1.5380, -0.3022, -0.0734, -0.2831,
         0.3710, -0.2522,  0.0162, -0.0171, -0.3898,  0.8742, -0.7257, -0.5106,
        -0.5203, -0.1459,  