In [1]:
import pandas as pd
import torch
import tqdm
import transformers

In [2]:
tokenizer = transformers.GPT2Tokenizer.from_pretrained("gpt2")
model = transformers.GPT2LMHeadModel.from_pretrained("gpt2_output/checkpoint-12000/")

In [3]:
input_ids = tokenizer.encode("Walter Hansel Cuvee Alyce Chardonnay 2015 [response]", return_tensors='pt')
greedy_output = model.generate(input_ids, max_length=100)
print(tokenizer.decode(greedy_output[0], skip_special_tokens=True))

Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence


Walter Hansel Cuvee Alyce Chardonnay 2015 [response]	"The 2015 Alyce Chardonnay is a blend of the best lots of Chardonnay from the estate vineyards. The wine is a blend of the best lots of Chardonnay from the estate vineyards. The wine is a blend of the best lots of Chardonnay from the estate vineyards.
The 2015 Alyce Chardonnay is a blend of the best


In [4]:
# activate beam search and early_stopping
beam_outputs = model.generate(
  input_ids, 
  max_length=100, 
  num_beams=5, 
  no_repeat_ngram_size=2,
  num_return_sequences=5, 
  early_stopping=True
)

print("Output:\n" + 80 * '-')
for i, beam_output in enumerate(beam_outputs):
  print("{}: {}".format(i, tokenizer.decode(beam_output, skip_special_tokens=True)))

Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence


Output:
--------------------------------------------------------------------------------
0: Walter Hansel Cuvee Alyce Chardonnay 2015 [response]	The 2015 vintage of this wine was ranked #2 on the Wine Spectator's Top 10 Wines of 2016
<|startoftext|>	[prompt]aditionalChateau Ste. Michelle Cold Creek Vineyard Cabernet Sauvignon (1.5 Liter Magnum) 2013		"This is a big, bold wine with a lot going on in the nose and palate.
1: Walter Hansel Cuvee Alyce Chardonnay 2015 [response]	The 2015 vintage of this wine was ranked #2 on the Wine Spectator's Top 10 Wines of 2016
<|startoftext|>	[prompt]aditionalChateau Ste. Michelle Cold Creek Vineyard Cabernet Sauvignon (1.5 Liter Magnum) 2013		"This is a big, rich wine with a lot going on in the nose and palate.
2: Walter Hansel Cuvee Alyce Chardonnay 2015 [response]	The 2015 vintage of this wine was ranked #2 on the Wine Spectator's Top 10 Wines of 2016
<|startoftext|>	[prompt]aditionalChateau Ste. Michelle Cold Creek Vineyard Cabernet Sauvignon (1.5

In [5]:
greedy_output[0].shape

torch.Size([100])

In [4]:
# set seed to reproduce results. Feel free to change the seed though to get different results
#tf.random.set_seed(0)

input_ids = tokenizer.encode("Vendange Chardonnay [response]", return_tensors='pt')

# activate sampling and deactivate top_k by setting top_k sampling to 0
sample_output = model.generate(
    input_ids, 
    do_sample=True, 
    max_length=150, 
    top_p=0.90,
    top_k=0
)

print("Output:\n" + 100 * '-')
print(tokenizer.decode(sample_output[0], skip_special_tokens=False))

Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence


Output:
----------------------------------------------------------------------------------------------------
Vendange Chardonnay [response]	"The 2002 vintage of the Sonoma Chardonnay from our friends at Laguna Vista Vineyards produced a very special wine, full of finesse, depth, and elegance. The bouquet has aromas of pear, kiwi, apple and white peach. The wine is full-bodied, crisp and elegant with a rich, mineral quality, balanced by ripe tropical fruit flavors, finishing with a long, crisp finish. Try this vintage pair this Chardonnay with spicy Asian dishes, smoked fish, roasted chicken, grilled vegetables and foie gras. 

"
<|startoftext|>	[prompt]	Maggio Family Vineyards


In [5]:
fake_names = pd.read_csv("data/fake/fake_names_13301_2020-05-20.csv")
print(fake_names.shape)

(13301, 2)


In [6]:
fake_names.head(3)

Unnamed: 0.1,Unnamed: 0,0
0,0,Lachos Cellars Sauvignon Blanc 2012
1,1,Dry Estated Bios de Bourting Sannero (375ML ha...
2,2,Tarodahadin Chaary Rivi 2010


In [8]:
response_prompt = "[response]"

generated_descriptions = {}
for fake_name in tqdm.tqdm(fake_names.iloc[:,1]):
  #print(fake_name)
  
  # Create token from fake wine name
  tokenized_name = tokenizer.encode(
    text=(fake_name + "\t" + response_prompt), 
    return_tensors='pt'
  )
  
  # Generate a fake description based on the name
  generated_description = model.generate(
    input_ids=tokenized_name,
    do_sample=True,
    max_length=150,
    top_p=0.90,
    top_k=0    
  )
  
  generated_descriptions[fake_name] = tokenizer.decode(
    token_ids=sample_output[0], 
    skip_special_tokens=False
  )

  0%|                                                                                                                             | 0/13301 [00:00<?, ?it/s]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                                                                  | 1/13301 [00:04<17:13:38,  4.66s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                                                                  | 2/13301 [00:08<16:51:32,  4.56s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                                                                  | 3/13301 [00:13<16:58:24,  4.60s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                   

  0%|▎                                                                                                                | 35/13301 [02:38<16:57:56,  4.60s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|▎                                                                                                                | 36/13301 [02:42<16:42:52,  4.54s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|▎                                                                                                                | 37/13301 [02:47<16:45:17,  4.55s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|▎                                                                                                                | 38/13301 [02:51<16:25:54,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|▎                                                                  

  1%|▌                                                                                                                | 70/13301 [05:16<16:33:00,  4.50s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▌                                                                                                                | 71/13301 [05:21<16:33:19,  4.50s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▌                                                                                                                | 72/13301 [05:25<16:18:33,  4.44s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▌                                                                                                                | 73/13301 [05:30<16:23:14,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▋                                                                  

  1%|▉                                                                                                               | 105/13301 [07:48<15:15:26,  4.16s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                                                               | 106/13301 [07:52<15:15:40,  4.16s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                                                               | 107/13301 [07:57<15:23:39,  4.20s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                                                               | 108/13301 [08:01<15:20:12,  4.18s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                  

  1%|█▏                                                                                                              | 140/13301 [10:21<16:17:42,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▏                                                                                                              | 141/13301 [10:25<15:51:41,  4.34s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▏                                                                                                              | 142/13301 [10:30<16:02:12,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▏                                                                                                              | 143/13301 [10:35<16:15:36,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▏                                                                 

  1%|█▍                                                                                                              | 175/13301 [12:57<16:06:45,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▍                                                                                                              | 176/13301 [13:01<15:58:34,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▍                                                                                                              | 177/13301 [13:05<15:58:19,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▍                                                                                                              | 178/13301 [13:10<15:46:45,  4.33s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|█▌                                                                 

  2%|█▊                                                                                                              | 210/13301 [15:33<16:12:42,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▊                                                                                                              | 211/13301 [15:37<16:07:50,  4.44s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▊                                                                                                              | 212/13301 [15:42<16:03:06,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▊                                                                                                              | 213/13301 [15:46<16:17:50,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▊                                                                 

  2%|██                                                                                                              | 245/13301 [18:07<15:43:21,  4.34s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██                                                                                                              | 246/13301 [18:12<15:51:41,  4.37s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██                                                                                                              | 247/13301 [18:16<15:45:29,  4.35s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██                                                                                                              | 248/13301 [18:20<15:47:08,  4.35s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██                                                                 

  2%|██▎                                                                                                             | 280/13301 [20:44<16:09:34,  4.47s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▎                                                                                                             | 281/13301 [20:48<16:14:47,  4.49s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▎                                                                                                             | 282/13301 [20:52<15:57:38,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▍                                                                                                             | 283/13301 [20:57<16:03:16,  4.44s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▍                                                                

  2%|██▋                                                                                                             | 315/13301 [23:20<15:47:20,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▋                                                                                                             | 316/13301 [23:24<15:34:55,  4.32s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▋                                                                                                             | 317/13301 [23:29<15:44:12,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▋                                                                                                             | 318/13301 [23:33<15:50:13,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|██▋                                                                

  3%|██▉                                                                                                             | 350/13301 [25:54<15:49:41,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▉                                                                                                             | 351/13301 [25:59<16:05:49,  4.47s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▉                                                                                                             | 352/13301 [26:03<16:00:53,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▉                                                                                                             | 353/13301 [26:08<16:00:16,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▉                                                                

  3%|███▏                                                                                                            | 385/13301 [28:30<16:03:22,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▎                                                                                                            | 386/13301 [28:34<16:04:18,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▎                                                                                                            | 387/13301 [28:39<16:04:45,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▎                                                                                                            | 388/13301 [28:43<16:09:07,  4.50s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▎                                                               

  3%|███▌                                                                                                            | 420/13301 [31:05<15:42:34,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▌                                                                                                            | 421/13301 [31:10<15:39:03,  4.37s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▌                                                                                                            | 422/13301 [31:14<15:45:07,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▌                                                                                                            | 423/13301 [31:19<15:48:35,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▌                                                               

  3%|███▊                                                                                                            | 455/13301 [33:40<15:58:31,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▊                                                                                                            | 456/13301 [33:45<15:52:39,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▊                                                                                                            | 457/13301 [33:49<15:47:31,  4.43s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▊                                                                                                            | 458/13301 [33:54<16:02:00,  4.49s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|███▊                                                               

  4%|████▏                                                                                                           | 490/13301 [36:16<16:09:49,  4.54s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▏                                                                                                           | 491/13301 [36:20<15:57:53,  4.49s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▏                                                                                                           | 492/13301 [36:25<15:58:43,  4.49s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▏                                                                                                           | 493/13301 [36:29<15:56:09,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▏                                                              

  4%|████▍                                                                                                           | 525/13301 [38:51<15:52:00,  4.47s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▍                                                                                                           | 526/13301 [38:56<15:49:26,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▍                                                                                                           | 527/13301 [39:00<15:32:16,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▍                                                                                                           | 528/13301 [39:04<15:36:38,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▍                                                              

  4%|████▋                                                                                                           | 560/13301 [41:27<15:37:09,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▋                                                                                                           | 561/13301 [41:31<15:27:04,  4.37s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▋                                                                                                           | 562/13301 [41:36<15:37:29,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▋                                                                                                           | 563/13301 [41:40<15:38:20,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|████▋                                                              

  4%|█████                                                                                                           | 595/13301 [44:01<15:28:34,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|█████                                                                                                           | 596/13301 [44:05<15:22:47,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|█████                                                                                                           | 597/13301 [44:10<15:31:37,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|█████                                                                                                           | 598/13301 [44:15<15:44:38,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████                                                              

  5%|█████▎                                                                                                          | 630/13301 [46:37<15:39:45,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▎                                                                                                          | 631/13301 [46:41<15:27:04,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▎                                                                                                          | 632/13301 [46:46<15:26:21,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▎                                                                                                          | 633/13301 [46:50<15:30:41,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▎                                                             

  5%|█████▌                                                                                                          | 665/13301 [49:10<15:04:24,  4.29s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▌                                                                                                          | 666/13301 [49:14<15:19:51,  4.37s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▌                                                                                                          | 667/13301 [49:19<15:28:48,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▌                                                                                                          | 668/13301 [49:23<15:25:38,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▋                                                             

  5%|█████▉                                                                                                          | 700/13301 [51:42<15:04:44,  4.31s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▉                                                                                                          | 701/13301 [51:47<15:15:52,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▉                                                                                                          | 702/13301 [51:51<15:18:55,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▉                                                                                                          | 703/13301 [51:56<15:24:19,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|█████▉                                                             

  6%|██████▏                                                                                                         | 735/13301 [54:16<15:22:07,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▏                                                                                                         | 736/13301 [54:20<15:19:20,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▏                                                                                                         | 737/13301 [54:24<15:13:03,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▏                                                                                                         | 738/13301 [54:29<15:17:55,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▏                                                            

  6%|██████▍                                                                                                         | 770/13301 [56:49<15:03:45,  4.33s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▍                                                                                                         | 771/13301 [56:54<15:07:42,  4.35s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▌                                                                                                         | 772/13301 [56:58<15:16:06,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▌                                                                                                         | 773/13301 [57:02<15:00:56,  4.31s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▌                                                            

  6%|██████▊                                                                                                         | 805/13301 [59:22<15:15:35,  4.40s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▊                                                                                                         | 806/13301 [59:26<15:18:41,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▊                                                                                                         | 807/13301 [59:31<15:07:53,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▊                                                                                                         | 808/13301 [59:35<15:13:48,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▊                                                            

  6%|██████▉                                                                                                       | 840/13301 [1:01:58<15:31:08,  4.48s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▉                                                                                                       | 841/13301 [1:02:02<15:24:14,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▉                                                                                                       | 842/13301 [1:02:07<15:16:00,  4.41s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▉                                                                                                       | 843/13301 [1:02:11<15:06:41,  4.37s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|██████▉                                                            

  7%|███████▏                                                                                                      | 875/13301 [1:04:33<15:21:04,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▏                                                                                                      | 876/13301 [1:04:37<15:19:24,  4.44s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▎                                                                                                      | 877/13301 [1:04:41<15:03:19,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▎                                                                                                      | 878/13301 [1:04:46<15:19:52,  4.44s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▎                                                           

  7%|███████▌                                                                                                      | 910/13301 [1:07:08<15:14:14,  4.43s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▌                                                                                                      | 911/13301 [1:07:13<15:18:34,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▌                                                                                                      | 912/13301 [1:07:17<15:23:14,  4.47s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▌                                                                                                      | 913/13301 [1:07:22<15:14:42,  4.43s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▌                                                           

  7%|███████▊                                                                                                      | 945/13301 [1:09:41<14:57:53,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▊                                                                                                      | 946/13301 [1:09:46<15:04:43,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▊                                                                                                      | 947/13301 [1:09:50<15:20:18,  4.47s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▊                                                                                                      | 948/13301 [1:09:55<15:18:01,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|███████▊                                                           

  7%|████████                                                                                                      | 980/13301 [1:12:15<14:55:08,  4.36s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|████████                                                                                                      | 981/13301 [1:12:20<14:59:40,  4.38s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|████████                                                                                                      | 982/13301 [1:12:24<15:07:23,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|████████▏                                                                                                     | 983/13301 [1:12:29<15:00:45,  4.39s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|████████▏                                                          

  8%|████████▎                                                                                                    | 1015/13301 [1:14:49<15:11:14,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▎                                                                                                    | 1016/13301 [1:14:53<15:12:37,  4.46s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▎                                                                                                    | 1017/13301 [1:14:58<15:11:25,  4.45s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▎                                                                                                    | 1018/13301 [1:15:02<15:05:39,  4.42s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▎                                                          

  8%|████████▌                                                                                                    | 1050/13301 [1:17:22<14:47:45,  4.35s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▌                                                                                                    | 1051/13301 [1:17:26<14:42:43,  4.32s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▌                                                                                                    | 1052/13301 [1:17:30<14:44:47,  4.33s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▋                                                                                                    | 1053/13301 [1:17:35<14:30:58,  4.27s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|████████▋                                                          

KeyboardInterrupt: 

In [9]:
pd.DataFrame.from_dict(generated_descriptions.items())

Unnamed: 0,0,1
0,Lachos Cellars Sauvignon Blanc 2012,"Vendange Chardonnay [response]\t""The 2002 vint..."
1,Dry Estated Bios de Bourting Sannero (375ML ha...,"Vendange Chardonnay [response]\t""The 2002 vint..."
2,Tarodahadin Chaary Rivi 2010,"Vendange Chardonnay [response]\t""The 2002 vint..."
3,Le Valli Sis de Trach Sauvignon Blanc 2013,"Vendange Chardonnay [response]\t""The 2002 vint..."
4,Fotes Jadot Sauvignon Blanc 2005,"Vendange Chardonnay [response]\t""The 2002 vint..."
...,...,...
1060,Domaine de Bord Cote Russian 2015,"Vendange Chardonnay [response]\t""The 2002 vint..."
1061,Domain Fubers Thige Rouge (375ML half-bottle) ...,"Vendange Chardonnay [response]\t""The 2002 vint..."
1062,Dr. Loch Estate Chardonnay (375ML half-bottle)...,"Vendange Chardonnay [response]\t""The 2002 vint..."
1063,Jakubl Mays Blet 2016,"Vendange Chardonnay [response]\t""The 2002 vint..."


In [37]:
type(model)

transformers.modeling_gpt2.GPT2LMHeadModel

In [38]:
torch.cuda.is_available()

True