In [1]:
import re

import pandas as pd
import torch
import tqdm
import transformers

## Load tokenizer and fine-tuned model

In [16]:
tokenizer = transformers.GPT2Tokenizer.from_pretrained("gpt2_distil_output/")
model = transformers.GPT2LMHeadModel.from_pretrained(
  "gpt2_distil_output/checkpoint-8000/",
  pad_token_id=tokenizer.eos_token_id
)

#model = model.to('cuda')

In [17]:
tokenizer.special_tokens_map

{'bos_token': '<|startoftext|>',
 'eos_token': '<|startoftext|>',
 'unk_token': '<|endoftext|>'}

## Greedy Output

In [21]:
input_prompt = "[prompt] Walter Hansel Cuvee Alyce Chardonnay 2015 [response] "
input_ids = tokenizer.encode(input_prompt, return_tensors='pt')

greedy_output = model.generate(input_ids)
print(tokenizer.decode(greedy_output[0]))

[prompt] Walter Hansel Cuvee Alyce Chardonnay 2015 [response]  The


## Beam Output

In [26]:
input_prompt = "[prompt] Walter Hansel Cuvee Alyce Chardonnay 2015 [response] "
input_ids = tokenizer.encode(input_prompt, return_tensors='pt')

# activate beam search and early_stopping
beam_outputs = model.generate(
  input_ids, 
  max_length=200, 
  num_beams=5, 
  no_repeat_ngram_size=2,
  num_return_sequences=3, 
  early_stopping=True
)

print("Output:\n" + 80 * '-')
for i, beam_output in enumerate(beam_outputs):
  print("="*20)
  print("{}: {}".format(i, tokenizer.decode(beam_output, skip_special_tokens=True)))
  print('\n')

Output:
--------------------------------------------------------------------------------
0: [prompt] Walter Hansel Cuvee Alyce Chardonnay 2015 [response] 
<|startoftext|>	[prompt]	Chateau de Beaucastel Chateauneuf-du-Pape (375ML half-bottle) 2017	"Aromas of white peach, apricot, lemon zest, green apple and a hint of vanilla. On the palate, the wine is rich and full-bodied, with a long, lingering finish.
Blend: 60% Grenache, 30% Syrah, 10% Mourvedre, 5% Cinsault, 1% Carignane"


This wine pairs well with fish, shellfish, white meats and cheeses. It can also be enjoyed on its own as an aperitif, or with light appetizers, such as fish and white meat dishes. 



   Blend: 70% Cabernet Sauvignon,


1: [prompt] Walter Hansel Cuvee Alyce Chardonnay 2015 [response] 
<|startoftext|>	[prompt]	Chateau de Beaucastel Chateauneuf-du-Pape (375ML half-bottle) 2017	"Aromas of white peach, apricot, lemon zest, green apple and a hint of vanilla. On the palate, the wine is rich and full-bodied, with a lon

## Random Sampling Output

In [7]:
tokenizer.all_special_ids

[50257, 50256]

In [8]:
tokenizer.all_special_tokens

['<|startoftext|>', '<|endoftext|>']

In [27]:
tokenizer.special_tokens_map

{'bos_token': '<|startoftext|>',
 'eos_token': '<|startoftext|>',
 'unk_token': '<|endoftext|>'}

In [28]:
# set seed to reproduce results. Feel free to change the seed though to get different results
#tf.random.set_seed(0)

input_prompt = "[prompt] " + "Chardonnay 2012 " + "[response] "
input_ids = tokenizer.encode(input_prompt, return_tensors='pt')

# activate sampling and deactivate top_k by setting top_k sampling to 0
sample_output = model.generate(
    input_ids, 
    do_sample=True, 
    max_length=250, 
    top_p=0.90,
    top_k=0,
    eos_token_id=50257,
    bos_token_id=50257,
    early_stopping=True
)

print("Output:\n" + 100 * '-')
print("="*20)
print(tokenizer.decode(sample_output[0], skip_special_tokens=False))
print('\n')

Output:
----------------------------------------------------------------------------------------------------
[prompt] Chardonnay 2012 [response] The nose is rich and aromatic, as well as enticing the palate.  The intense, rich flavors are supported by the vanilla, spice, coffee and citrus notes that characterize this wine.  A sophisticated, complex wine with powerful and ripe fruit aromas that lead to a mouth filling finish.
<|startoftext|>	[prompt]	Jean-Luc Colombo Barolo Reggiano 2012	[response]	
<|startoftext|>	[prompt]	Fratelli Bernabei Gialla Toscana 2000	[response]	A wine with exceptional density, fresh fruit and smooth tannins. It is an elegant, rich, elegant wine with a lengthy, lingering finish.Pair with grilled meats, slow cooked foods and mature cheeses.
<|startoftext|>	[prompt]	Jacob's Creek Syrah 2002	[response]	"The grapes grown at the Jacob's Creek estate vineyard in the northern hills of Sonoma County are hand-harvested into small, uniform bins of vinified, moderate, an

In [33]:
print(tokenizer.decode(sample_output[0], skip_special_tokens=True))

Chardonnay 2012	[response]	The '06 Sonoma County Pinot Gris presents aromas of Meyer lemon and citrus fruit. Subtle oak-infused notes of vanilla and toasty oak introduce this wine to the palate. It has an intensely tropical bouquet that brings to mind white peach and citrus. The flavors linger with a subtle minerality and zing that is so typical of Sonoma County Pinot Gris.
<|startoftext|>	[prompt]	Chateau Greysac (375ML half-bottle) 2004	[response]	Dark red color with a purplish rim. The nose is rich and complex with red fruit aromas and peppery notes. The


## Load fake wine names

In [40]:
fake_names = pd.read_csv("data/fake/fake_names_13301_2020-05-20.csv")
print(fake_names.shape)

(13301, 2)


In [41]:
fake_names.head(3)

Unnamed: 0.1,Unnamed: 0,0
0,0,Lachos Cellars Sauvignon Blanc 2012
1,1,Dry Estated Bios de Bourting Sannero (375ML ha...
2,2,Tarodahadin Chaary Rivi 2010


In [45]:
response_prompt = "[response]"

generated_descriptions = {}
for fake_name in tqdm.tqdm(fake_names.iloc[:,1]):
  #print(fake_name)
  
  # Create token from fake wine name
  tokenized_name = tokenizer.encode(
    text=(fake_name + "\t" + response_prompt), 
    return_tensors='pt'
  )
  
  # Generate a fake description based on the name
  model_output = model.generate(
    input_ids=tokenized_name,
    do_sample=True,
    max_length=150,
    top_p=0.90,
    top_k=0    
  )
  
  generated_descriptions[fake_name] = tokenizer.decode(
    token_ids=model_output[0], 
    skip_special_tokens=False
  )

  0%|                                                                                        | 0/13301 [00:00<?, ?it/s]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                             | 1/13301 [00:04<15:15:28,  4.13s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                             | 2/13301 [00:07<14:55:55,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                             | 3/13301 [00:12<15:17:59,  4.14s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                                                                             | 4/13301 [00:16<15:10:09,  4.11s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  0%|                    

  1%|▍                                                                           | 84/13301 [05:35<14:35:48,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▍                                                                           | 85/13301 [05:39<14:22:00,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▍                                                                           | 86/13301 [05:43<14:07:34,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▍                                                                           | 87/13301 [05:47<14:22:25,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▌                                                                           | 88/13301 [05:51<14:20:50,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▌                   

  1%|▉                                                                          | 168/13301 [11:07<14:31:11,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                          | 169/13301 [11:11<14:36:53,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                          | 170/13301 [11:15<14:36:51,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                          | 171/13301 [11:19<14:20:16,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                                                                          | 172/13301 [11:23<14:27:40,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  1%|▉                   

  2%|█▍                                                                         | 252/13301 [16:39<14:15:30,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▍                                                                         | 253/13301 [16:43<14:12:08,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▍                                                                         | 254/13301 [16:47<14:17:50,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▍                                                                         | 255/13301 [16:51<14:20:31,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▍                                                                         | 256/13301 [16:55<14:14:32,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  2%|█▍                  

  3%|█▉                                                                         | 336/13301 [22:12<14:18:27,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|█▉                                                                         | 337/13301 [22:16<14:24:49,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|█▉                                                                         | 338/13301 [22:19<14:13:34,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|█▉                                                                         | 339/13301 [22:23<14:15:08,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|█▉                                                                         | 340/13301 [22:27<14:22:41,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|█▉                  

  3%|██▎                                                                        | 420/13301 [27:44<13:54:06,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▎                                                                        | 421/13301 [27:48<13:56:20,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▍                                                                        | 422/13301 [27:52<14:00:43,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▍                                                                        | 423/13301 [27:56<14:00:48,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▍                                                                        | 424/13301 [28:00<14:01:13,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  3%|██▍                 

  4%|██▊                                                                        | 504/13301 [33:17<14:20:09,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|██▊                                                                        | 505/13301 [33:21<14:06:08,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|██▊                                                                        | 506/13301 [33:25<14:04:02,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|██▊                                                                        | 507/13301 [33:29<14:02:29,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|██▊                                                                        | 508/13301 [33:33<14:02:45,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|██▊                 

  4%|███▎                                                                       | 588/13301 [38:49<13:39:03,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|███▎                                                                       | 589/13301 [38:53<13:52:10,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|███▎                                                                       | 590/13301 [38:57<13:41:07,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|███▎                                                                       | 591/13301 [39:01<13:43:51,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|███▎                                                                       | 592/13301 [39:05<13:52:36,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  4%|███▎                

  5%|███▊                                                                       | 672/13301 [44:20<13:27:03,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|███▊                                                                       | 673/13301 [44:24<13:35:43,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|███▊                                                                       | 674/13301 [44:28<13:34:47,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|███▊                                                                       | 675/13301 [44:32<13:50:54,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|███▊                                                                       | 676/13301 [44:36<13:51:11,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  5%|███▊                

  6%|████▎                                                                      | 756/13301 [49:53<13:38:48,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▎                                                                      | 757/13301 [49:56<13:30:49,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▎                                                                      | 758/13301 [50:00<13:34:19,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▎                                                                      | 759/13301 [50:04<13:34:32,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▎                                                                      | 760/13301 [50:08<13:51:36,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▎               

  6%|████▋                                                                      | 840/13301 [55:24<14:08:44,  4.09s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▋                                                                      | 841/13301 [55:28<14:08:33,  4.09s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▋                                                                      | 842/13301 [55:32<14:00:49,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▊                                                                      | 843/13301 [55:36<13:50:46,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▊                                                                      | 844/13301 [55:40<13:49:15,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  6%|████▊               

  7%|█████                                                                    | 924/13301 [1:00:57<13:40:16,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|█████                                                                    | 925/13301 [1:01:01<13:36:24,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|█████                                                                    | 926/13301 [1:01:05<13:42:39,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|█████                                                                    | 927/13301 [1:01:09<13:31:39,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|█████                                                                    | 928/13301 [1:01:13<13:22:31,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  7%|█████               

  8%|█████▍                                                                  | 1008/13301 [1:06:28<13:12:53,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▍                                                                  | 1009/13301 [1:06:32<13:20:12,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▍                                                                  | 1010/13301 [1:06:36<13:23:11,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▍                                                                  | 1011/13301 [1:06:40<13:22:23,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▍                                                                  | 1012/13301 [1:06:44<13:39:38,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▍              

  8%|█████▉                                                                  | 1092/13301 [1:11:59<13:32:15,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▉                                                                  | 1093/13301 [1:12:03<13:17:04,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▉                                                                  | 1094/13301 [1:12:07<13:27:26,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▉                                                                  | 1095/13301 [1:12:11<13:21:39,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▉                                                                  | 1096/13301 [1:12:15<13:27:32,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  8%|█████▉              

  9%|██████▎                                                                 | 1176/13301 [1:17:31<13:17:33,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▎                                                                 | 1177/13301 [1:17:36<13:21:59,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▍                                                                 | 1178/13301 [1:17:39<13:19:19,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▍                                                                 | 1179/13301 [1:17:43<13:12:27,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▍                                                                 | 1180/13301 [1:17:47<13:14:44,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▍             

  9%|██████▊                                                                 | 1260/13301 [1:23:03<13:14:02,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▊                                                                 | 1261/13301 [1:23:06<12:58:04,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▊                                                                 | 1262/13301 [1:23:10<13:01:53,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
  9%|██████▊                                                                 | 1263/13301 [1:23:14<13:02:59,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|██████▊                                                                 | 1264/13301 [1:23:18<12:57:13,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|██████▊             

 10%|███████▎                                                                | 1344/13301 [1:28:34<13:29:06,  4.06s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|███████▎                                                                | 1345/13301 [1:28:38<13:15:42,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|███████▎                                                                | 1346/13301 [1:28:41<13:09:35,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|███████▎                                                                | 1347/13301 [1:28:45<13:11:34,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|███████▎                                                                | 1348/13301 [1:28:49<13:09:10,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 10%|███████▎            

 11%|███████▋                                                                | 1428/13301 [1:34:08<12:44:02,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|███████▋                                                                | 1429/13301 [1:34:12<12:45:20,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|███████▋                                                                | 1430/13301 [1:34:16<12:44:10,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|███████▋                                                                | 1431/13301 [1:34:19<12:45:27,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|███████▊                                                                | 1432/13301 [1:34:23<12:50:18,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|███████▊            

 11%|████████▏                                                               | 1512/13301 [1:39:40<13:00:35,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|████████▏                                                               | 1513/13301 [1:39:44<12:56:38,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|████████▏                                                               | 1514/13301 [1:39:48<13:02:21,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|████████▏                                                               | 1515/13301 [1:39:52<12:48:49,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|████████▏                                                               | 1516/13301 [1:39:56<12:55:00,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 11%|████████▏           

 12%|████████▋                                                               | 1596/13301 [1:45:13<12:54:29,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 12%|████████▋                                                               | 1597/13301 [1:45:17<12:56:17,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 12%|████████▋                                                               | 1598/13301 [1:45:21<12:59:24,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 12%|████████▋                                                               | 1599/13301 [1:45:25<13:02:23,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 12%|████████▋                                                               | 1600/13301 [1:45:29<13:00:38,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 12%|████████▋           

 13%|█████████                                                               | 1680/13301 [1:50:45<12:34:44,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████                                                               | 1681/13301 [1:50:49<12:38:13,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████                                                               | 1682/13301 [1:50:53<12:47:37,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████                                                               | 1683/13301 [1:50:58<12:55:27,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████                                                               | 1684/13301 [1:51:02<12:52:54,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████           

 13%|█████████▌                                                              | 1764/13301 [1:56:19<12:27:46,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████▌                                                              | 1765/13301 [1:56:23<12:32:47,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████▌                                                              | 1766/13301 [1:56:27<12:39:20,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████▌                                                              | 1767/13301 [1:56:31<12:33:34,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████▌                                                              | 1768/13301 [1:56:35<12:17:56,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 13%|█████████▌          

 14%|██████████                                                              | 1848/13301 [2:01:50<12:09:43,  3.82s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 14%|██████████                                                              | 1849/13301 [2:01:54<12:21:38,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 14%|██████████                                                              | 1850/13301 [2:01:58<12:23:01,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 14%|██████████                                                              | 1851/13301 [2:02:02<12:30:23,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 14%|██████████                                                              | 1852/13301 [2:02:06<12:28:42,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 14%|██████████          

 15%|██████████▍                                                             | 1932/13301 [2:07:20<12:36:15,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▍                                                             | 1933/13301 [2:07:23<12:31:07,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▍                                                             | 1934/13301 [2:07:27<12:33:52,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▍                                                             | 1935/13301 [2:07:31<12:24:38,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▍                                                             | 1936/13301 [2:07:35<12:26:24,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▍         

 15%|██████████▉                                                             | 2016/13301 [2:12:50<12:26:00,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▉                                                             | 2017/13301 [2:12:54<12:32:14,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▉                                                             | 2018/13301 [2:12:59<12:35:39,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▉                                                             | 2019/13301 [2:13:03<12:41:09,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▉                                                             | 2020/13301 [2:13:07<12:31:40,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 15%|██████████▉         

 16%|███████████▎                                                            | 2100/13301 [2:18:25<12:27:26,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▎                                                            | 2101/13301 [2:18:28<12:25:15,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▍                                                            | 2102/13301 [2:18:33<12:30:49,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▍                                                            | 2103/13301 [2:18:37<12:35:11,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▍                                                            | 2104/13301 [2:18:41<12:33:49,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▍        

 16%|███████████▊                                                            | 2184/13301 [2:23:56<12:13:26,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▊                                                            | 2185/13301 [2:23:59<12:04:40,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▊                                                            | 2186/13301 [2:24:03<12:10:25,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▊                                                            | 2187/13301 [2:24:07<12:07:38,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▊                                                            | 2188/13301 [2:24:11<12:01:40,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 16%|███████████▊        

 17%|████████████▎                                                           | 2268/13301 [2:29:26<12:03:23,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 17%|████████████▎                                                           | 2269/13301 [2:29:30<11:54:10,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 17%|████████████▎                                                           | 2270/13301 [2:29:34<11:46:22,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 17%|████████████▎                                                           | 2271/13301 [2:29:38<11:46:05,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 17%|████████████▎                                                           | 2272/13301 [2:29:42<11:42:46,  3.82s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 17%|████████████▎       

 18%|████████████▋                                                           | 2352/13301 [2:34:55<12:08:35,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|████████████▋                                                           | 2353/13301 [2:34:59<11:53:58,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|████████████▋                                                           | 2354/13301 [2:35:03<11:46:34,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|████████████▋                                                           | 2355/13301 [2:35:07<11:54:05,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|████████████▊                                                           | 2356/13301 [2:35:11<12:01:36,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|████████████▊       

 18%|█████████████▏                                                          | 2436/13301 [2:40:26<11:45:55,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|█████████████▏                                                          | 2437/13301 [2:40:30<11:49:33,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|█████████████▏                                                          | 2438/13301 [2:40:34<11:51:41,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|█████████████▏                                                          | 2439/13301 [2:40:38<12:09:42,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|█████████████▏                                                          | 2440/13301 [2:40:42<11:57:03,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 18%|█████████████▏      

 19%|█████████████▋                                                          | 2520/13301 [2:45:56<11:33:00,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 19%|█████████████▋                                                          | 2521/13301 [2:46:00<11:37:18,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 19%|█████████████▋                                                          | 2522/13301 [2:46:04<11:43:42,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 19%|█████████████▋                                                          | 2523/13301 [2:46:08<11:37:45,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 19%|█████████████▋                                                          | 2524/13301 [2:46:12<11:47:06,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 19%|█████████████▋      

 20%|██████████████                                                          | 2604/13301 [2:51:28<11:42:06,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████                                                          | 2605/13301 [2:51:32<11:47:03,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████                                                          | 2606/13301 [2:51:36<11:54:05,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████                                                          | 2607/13301 [2:51:40<11:53:32,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████                                                          | 2608/13301 [2:51:44<11:44:15,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████      

 20%|██████████████▌                                                         | 2688/13301 [2:57:00<11:45:54,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████▌                                                         | 2689/13301 [2:57:04<11:52:15,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████▌                                                         | 2690/13301 [2:57:08<11:57:10,  4.06s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████▌                                                         | 2691/13301 [2:57:12<11:55:08,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████▌                                                         | 2692/13301 [2:57:16<11:44:52,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 20%|██████████████▌     

 21%|███████████████                                                         | 2772/13301 [3:02:31<11:25:49,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████                                                         | 2773/13301 [3:02:35<11:30:32,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████                                                         | 2774/13301 [3:02:39<11:25:55,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████                                                         | 2775/13301 [3:02:43<11:36:37,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████                                                         | 2776/13301 [3:02:47<11:42:27,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████     

 21%|███████████████▍                                                        | 2856/13301 [3:08:05<11:40:58,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████▍                                                        | 2857/13301 [3:08:08<11:19:34,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████▍                                                        | 2858/13301 [3:08:12<11:31:27,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 21%|███████████████▍                                                        | 2859/13301 [3:08:16<11:33:14,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▍                                                        | 2860/13301 [3:08:20<11:44:03,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▍    

 22%|███████████████▉                                                        | 2940/13301 [3:13:42<11:46:58,  4.09s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▉                                                        | 2941/13301 [3:13:46<11:38:14,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▉                                                        | 2942/13301 [3:13:50<11:21:15,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▉                                                        | 2943/13301 [3:13:54<11:27:49,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▉                                                        | 2944/13301 [3:13:57<11:20:20,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 22%|███████████████▉    

 23%|████████████████▎                                                       | 3024/13301 [3:19:12<11:20:27,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▎                                                       | 3025/13301 [3:19:16<11:00:34,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▍                                                       | 3026/13301 [3:19:20<11:07:36,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▍                                                       | 3027/13301 [3:19:24<11:11:40,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▍                                                       | 3028/13301 [3:19:27<11:08:33,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▍   

 23%|████████████████▊                                                       | 3108/13301 [3:24:43<11:14:29,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▊                                                       | 3109/13301 [3:24:47<11:18:19,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▊                                                       | 3110/13301 [3:24:51<11:03:58,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▊                                                       | 3111/13301 [3:24:55<11:10:46,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▊                                                       | 3112/13301 [3:24:59<11:03:26,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 23%|████████████████▊   

 24%|█████████████████▎                                                      | 3192/13301 [3:30:13<10:46:00,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 24%|█████████████████▎                                                      | 3193/13301 [3:30:17<10:49:49,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 24%|█████████████████▎                                                      | 3194/13301 [3:30:21<11:01:49,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 24%|█████████████████▎                                                      | 3195/13301 [3:30:25<11:03:47,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 24%|█████████████████▎                                                      | 3196/13301 [3:30:29<10:55:29,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 24%|█████████████████▎  

 25%|█████████████████▋                                                      | 3276/13301 [3:35:45<10:48:12,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|█████████████████▋                                                      | 3277/13301 [3:35:49<10:46:06,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|█████████████████▋                                                      | 3278/13301 [3:35:53<11:01:57,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|█████████████████▋                                                      | 3279/13301 [3:35:57<10:56:27,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|█████████████████▊                                                      | 3280/13301 [3:36:01<10:56:22,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|█████████████████▊  

 25%|██████████████████▏                                                     | 3360/13301 [3:41:16<10:53:43,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|██████████████████▏                                                     | 3361/13301 [3:41:20<10:50:18,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|██████████████████▏                                                     | 3362/13301 [3:41:24<10:55:02,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|██████████████████▏                                                     | 3363/13301 [3:41:28<11:00:22,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|██████████████████▏                                                     | 3364/13301 [3:41:33<11:06:25,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 25%|██████████████████▏ 

 26%|██████████████████▋                                                     | 3444/13301 [3:46:49<10:42:58,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 26%|██████████████████▋                                                     | 3445/13301 [3:46:53<10:43:54,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 26%|██████████████████▋                                                     | 3446/13301 [3:46:57<10:43:09,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 26%|██████████████████▋                                                     | 3447/13301 [3:47:01<10:43:59,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 26%|██████████████████▋                                                     | 3448/13301 [3:47:05<10:45:43,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 26%|██████████████████▋ 

 27%|███████████████████                                                     | 3528/13301 [3:52:19<10:42:43,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████                                                     | 3529/13301 [3:52:23<10:47:12,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████                                                     | 3530/13301 [3:52:27<10:48:16,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████                                                     | 3531/13301 [3:52:31<10:51:52,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████                                                     | 3532/13301 [3:52:35<10:52:25,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████ 

 27%|███████████████████▌                                                    | 3612/13301 [3:57:51<10:47:51,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████▌                                                    | 3613/13301 [3:57:55<10:49:29,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████▌                                                    | 3614/13301 [3:57:59<10:42:43,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████▌                                                    | 3615/13301 [3:58:02<10:32:49,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████▌                                                    | 3616/13301 [3:58:06<10:33:05,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 27%|███████████████████▌

 28%|████████████████████                                                    | 3696/13301 [4:03:24<10:30:17,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████                                                    | 3697/13301 [4:03:28<10:37:28,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████                                                    | 3698/13301 [4:03:32<10:44:00,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████                                                    | 3699/13301 [4:03:36<10:44:48,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████                                                    | 3700/13301 [4:03:40<10:44:38,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████

 28%|████████████████████▍                                                   | 3780/13301 [4:08:54<10:20:00,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████▍                                                   | 3781/13301 [4:08:58<10:30:52,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████▍                                                   | 3782/13301 [4:09:02<10:31:54,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████▍                                                   | 3783/13301 [4:09:06<10:18:30,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████▍                                                   | 3784/13301 [4:09:10<10:23:06,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 28%|████████████████████

 29%|████████████████████▉                                                   | 3864/13301 [4:14:27<10:10:35,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 29%|████████████████████▉                                                   | 3865/13301 [4:14:31<10:11:53,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 29%|████████████████████▉                                                   | 3866/13301 [4:14:35<10:10:45,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 29%|████████████████████▉                                                   | 3867/13301 [4:14:39<10:10:55,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 29%|████████████████████▉                                                   | 3868/13301 [4:14:42<10:08:51,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 29%|████████████████████

 30%|█████████████████████▎                                                  | 3948/13301 [4:19:59<10:08:20,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▍                                                  | 3949/13301 [4:20:02<10:08:01,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▍                                                  | 3950/13301 [4:20:06<10:16:19,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▍                                                  | 3951/13301 [4:20:11<10:18:59,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▍                                                  | 3952/13301 [4:20:15<10:24:31,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|████████████████████

 30%|██████████████████████▏                                                  | 4032/13301 [4:25:29<9:56:13,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▊                                                  | 4033/13301 [4:25:33<10:01:53,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▊                                                  | 4034/13301 [4:25:37<10:10:08,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▊                                                  | 4035/13301 [4:25:40<10:03:53,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|█████████████████████▊                                                  | 4036/13301 [4:25:44<10:00:22,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 30%|████████████████████

 31%|██████████████████████▌                                                  | 4116/13301 [4:30:58<9:52:52,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 31%|██████████████████████▌                                                  | 4117/13301 [4:31:02<9:52:10,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 31%|██████████████████████▌                                                  | 4118/13301 [4:31:06<9:54:52,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 31%|██████████████████████▎                                                 | 4119/13301 [4:31:10<10:05:06,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 31%|██████████████████████▌                                                  | 4120/13301 [4:31:14<9:53:36,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 31%|████████████████████

 32%|███████████████████████                                                  | 4200/13301 [4:36:28<9:25:37,  3.73s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████                                                  | 4201/13301 [4:36:32<9:42:21,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████                                                  | 4202/13301 [4:36:36<9:48:18,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████                                                  | 4203/13301 [4:36:40<9:45:21,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████                                                  | 4204/13301 [4:36:44<9:51:08,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|████████████████████

 32%|███████████████████████▌                                                 | 4284/13301 [4:41:59<9:42:35,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████▌                                                 | 4285/13301 [4:42:03<9:50:53,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████▌                                                 | 4286/13301 [4:42:07<9:51:15,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████▌                                                 | 4287/13301 [4:42:10<9:35:43,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|███████████████████████▌                                                 | 4288/13301 [4:42:14<9:40:31,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 32%|████████████████████

 33%|███████████████████████▉                                                 | 4368/13301 [4:47:29<9:40:23,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|███████████████████████▉                                                 | 4369/13301 [4:47:33<9:44:36,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|███████████████████████▉                                                 | 4370/13301 [4:47:36<9:32:55,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|███████████████████████▉                                                 | 4371/13301 [4:47:40<9:30:43,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|███████████████████████▉                                                 | 4372/13301 [4:47:44<9:31:52,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|████████████████████

 33%|████████████████████████▍                                                | 4452/13301 [4:53:01<9:35:44,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|████████████████████████▍                                                | 4453/13301 [4:53:05<9:38:52,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|████████████████████████▍                                                | 4454/13301 [4:53:09<9:37:38,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 33%|████████████████████████▍                                                | 4455/13301 [4:53:13<9:36:18,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████████▍                                                | 4456/13301 [4:53:17<9:48:32,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████

 34%|████████████████████████▉                                                | 4536/13301 [4:58:31<9:39:13,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████████▉                                                | 4537/13301 [4:58:35<9:43:27,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████████▉                                                | 4538/13301 [4:58:39<9:39:46,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████████▉                                                | 4539/13301 [4:58:43<9:44:32,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████████▉                                                | 4540/13301 [4:58:47<9:30:20,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 34%|████████████████████

 35%|█████████████████████████▎                                               | 4620/13301 [5:04:04<9:35:38,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▎                                               | 4621/13301 [5:04:09<9:38:42,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▎                                               | 4622/13301 [5:04:12<9:26:15,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▎                                               | 4623/13301 [5:04:16<9:31:56,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▍                                               | 4624/13301 [5:04:20<9:36:53,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|████████████████████

 35%|█████████████████████████▊                                               | 4704/13301 [5:09:33<9:18:37,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▊                                               | 4705/13301 [5:09:37<9:20:27,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▊                                               | 4706/13301 [5:09:41<9:11:42,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▊                                               | 4707/13301 [5:09:45<9:20:52,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|█████████████████████████▊                                               | 4708/13301 [5:09:49<9:20:02,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 35%|████████████████████

 36%|██████████████████████████▎                                              | 4788/13301 [5:15:05<9:11:40,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 36%|██████████████████████████▎                                              | 4789/13301 [5:15:09<9:16:34,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 36%|██████████████████████████▎                                              | 4790/13301 [5:15:13<9:22:20,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 36%|██████████████████████████▎                                              | 4791/13301 [5:15:17<9:18:33,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 36%|██████████████████████████▎                                              | 4792/13301 [5:15:21<9:28:28,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 36%|████████████████████

 37%|██████████████████████████▋                                              | 4872/13301 [5:20:35<9:15:17,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|██████████████████████████▋                                              | 4873/13301 [5:20:39<9:20:32,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|██████████████████████████▊                                              | 4874/13301 [5:20:43<9:26:06,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|██████████████████████████▊                                              | 4875/13301 [5:20:47<9:22:07,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|██████████████████████████▊                                              | 4876/13301 [5:20:51<9:22:57,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|████████████████████

 37%|███████████████████████████▏                                             | 4956/13301 [5:26:07<9:13:28,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|███████████████████████████▏                                             | 4957/13301 [5:26:11<9:10:40,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|███████████████████████████▏                                             | 4958/13301 [5:26:15<9:10:41,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|███████████████████████████▏                                             | 4959/13301 [5:26:18<9:07:29,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|███████████████████████████▏                                             | 4960/13301 [5:26:22<9:11:33,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 37%|████████████████████

 38%|███████████████████████████▋                                             | 5040/13301 [5:31:39<9:02:54,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 38%|███████████████████████████▋                                             | 5041/13301 [5:31:43<9:01:38,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 38%|███████████████████████████▋                                             | 5042/13301 [5:31:47<9:07:00,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 38%|███████████████████████████▋                                             | 5043/13301 [5:31:51<9:03:16,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 38%|███████████████████████████▋                                             | 5044/13301 [5:31:55<9:11:27,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 38%|████████████████████

 39%|████████████████████████████                                             | 5124/13301 [5:37:11<9:00:39,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▏                                            | 5125/13301 [5:37:15<8:58:49,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▏                                            | 5126/13301 [5:37:19<8:47:28,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▏                                            | 5127/13301 [5:37:22<8:48:42,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▏                                            | 5128/13301 [5:37:26<8:50:50,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████

 39%|████████████████████████████▌                                            | 5208/13301 [5:42:42<8:52:22,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▌                                            | 5209/13301 [5:42:46<8:47:49,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▌                                            | 5210/13301 [5:42:50<8:52:32,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▌                                            | 5211/13301 [5:42:54<8:53:09,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████████████▌                                            | 5212/13301 [5:42:58<8:52:57,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 39%|████████████████████

 40%|█████████████████████████████                                            | 5292/13301 [5:48:10<8:46:10,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████                                            | 5293/13301 [5:48:14<8:50:13,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████                                            | 5294/13301 [5:48:18<8:52:22,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████                                            | 5295/13301 [5:48:22<8:52:51,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████                                            | 5296/13301 [5:48:26<8:49:34,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|████████████████████

 40%|█████████████████████████████▌                                           | 5376/13301 [5:53:43<8:36:38,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████▌                                           | 5377/13301 [5:53:47<8:33:13,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████▌                                           | 5378/13301 [5:53:51<8:39:18,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████▌                                           | 5379/13301 [5:53:55<8:38:56,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|█████████████████████████████▌                                           | 5380/13301 [5:53:59<8:40:31,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 40%|████████████████████

 41%|█████████████████████████████▉                                           | 5460/13301 [5:59:16<8:28:53,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 41%|█████████████████████████████▉                                           | 5461/13301 [5:59:20<8:32:51,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 41%|█████████████████████████████▉                                           | 5462/13301 [5:59:24<8:35:25,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 41%|█████████████████████████████▉                                           | 5463/13301 [5:59:28<8:26:41,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 41%|█████████████████████████████▉                                           | 5464/13301 [5:59:32<8:29:39,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 41%|████████████████████

 42%|██████████████████████████████▍                                          | 5544/13301 [6:04:45<8:21:48,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▍                                          | 5545/13301 [6:04:49<8:27:41,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▍                                          | 5546/13301 [6:04:53<8:26:31,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▍                                          | 5547/13301 [6:04:57<8:30:50,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▍                                          | 5548/13301 [6:05:01<8:36:56,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|████████████████████

 42%|██████████████████████████████▉                                          | 5628/13301 [6:10:16<8:00:14,  3.76s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▉                                          | 5629/13301 [6:10:19<8:02:32,  3.77s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▉                                          | 5630/13301 [6:10:23<8:14:11,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▉                                          | 5631/13301 [6:10:27<8:16:11,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|██████████████████████████████▉                                          | 5632/13301 [6:10:31<8:18:38,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 42%|████████████████████

 43%|███████████████████████████████▎                                         | 5712/13301 [6:15:48<8:26:06,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 43%|███████████████████████████████▎                                         | 5713/13301 [6:15:52<8:24:50,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 43%|███████████████████████████████▎                                         | 5714/13301 [6:15:56<8:25:39,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 43%|███████████████████████████████▎                                         | 5715/13301 [6:16:00<8:20:01,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 43%|███████████████████████████████▎                                         | 5716/13301 [6:16:04<8:23:17,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 43%|████████████████████

 44%|███████████████████████████████▊                                         | 5796/13301 [6:21:20<8:16:28,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|███████████████████████████████▊                                         | 5797/13301 [6:21:24<8:19:35,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|███████████████████████████████▊                                         | 5798/13301 [6:21:28<8:19:30,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|███████████████████████████████▊                                         | 5799/13301 [6:21:32<8:14:28,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|███████████████████████████████▊                                         | 5800/13301 [6:21:36<8:16:51,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████

 44%|████████████████████████████████▎                                        | 5880/13301 [6:26:51<8:00:28,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████████████████▎                                        | 5881/13301 [6:26:55<8:01:13,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████████████████▎                                        | 5882/13301 [6:26:59<7:53:24,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████████████████▎                                        | 5883/13301 [6:27:03<7:59:23,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████████████████▎                                        | 5884/13301 [6:27:07<7:54:33,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 44%|████████████████████

 45%|████████████████████████████████▋                                        | 5964/13301 [6:32:21<8:10:23,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|████████████████████████████████▋                                        | 5965/13301 [6:32:25<8:07:29,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|████████████████████████████████▋                                        | 5966/13301 [6:32:29<8:10:12,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|████████████████████████████████▋                                        | 5967/13301 [6:32:33<8:11:50,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|████████████████████████████████▊                                        | 5968/13301 [6:32:37<8:10:38,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|████████████████████

 45%|█████████████████████████████████▏                                       | 6048/13301 [6:37:53<7:45:23,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|█████████████████████████████████▏                                       | 6049/13301 [6:37:56<7:48:29,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|█████████████████████████████████▏                                       | 6050/13301 [6:38:00<7:46:58,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 45%|█████████████████████████████████▏                                       | 6051/13301 [6:38:04<7:54:42,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|█████████████████████████████████▏                                       | 6052/13301 [6:38:08<7:58:32,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|████████████████████

 46%|█████████████████████████████████▋                                       | 6132/13301 [6:43:26<7:54:47,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|█████████████████████████████████▋                                       | 6133/13301 [6:43:30<7:54:31,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|█████████████████████████████████▋                                       | 6134/13301 [6:43:34<7:49:52,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|█████████████████████████████████▋                                       | 6135/13301 [6:43:38<7:47:44,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|█████████████████████████████████▋                                       | 6136/13301 [6:43:41<7:42:08,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 46%|████████████████████

 47%|██████████████████████████████████                                       | 6216/13301 [6:48:56<7:34:44,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████                                       | 6217/13301 [6:48:59<7:29:06,  3.80s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▏                                      | 6218/13301 [6:49:03<7:34:53,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▏                                      | 6219/13301 [6:49:07<7:38:00,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▏                                      | 6220/13301 [6:49:11<7:43:14,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|████████████████████

 47%|██████████████████████████████████▌                                      | 6300/13301 [6:54:28<7:36:42,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▌                                      | 6301/13301 [6:54:32<7:42:14,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▌                                      | 6302/13301 [6:54:36<7:42:02,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▌                                      | 6303/13301 [6:54:40<7:39:52,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|██████████████████████████████████▌                                      | 6304/13301 [6:54:44<7:28:47,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 47%|████████████████████

 48%|███████████████████████████████████                                      | 6384/13301 [6:59:59<7:38:26,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 48%|███████████████████████████████████                                      | 6385/13301 [7:00:03<7:33:22,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 48%|███████████████████████████████████                                      | 6386/13301 [7:00:07<7:33:32,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 48%|███████████████████████████████████                                      | 6387/13301 [7:00:11<7:30:42,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 48%|███████████████████████████████████                                      | 6388/13301 [7:00:15<7:34:29,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 48%|████████████████████

 49%|███████████████████████████████████▍                                     | 6468/13301 [7:05:30<7:22:48,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▌                                     | 6469/13301 [7:05:34<7:29:23,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▌                                     | 6470/13301 [7:05:38<7:33:05,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▌                                     | 6471/13301 [7:05:42<7:36:43,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▌                                     | 6472/13301 [7:05:46<7:35:41,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|████████████████████

 49%|███████████████████████████████████▉                                     | 6552/13301 [7:11:01<7:19:20,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▉                                     | 6553/13301 [7:11:05<7:21:32,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▉                                     | 6554/13301 [7:11:09<7:19:17,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▉                                     | 6555/13301 [7:11:13<7:18:31,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|███████████████████████████████████▉                                     | 6556/13301 [7:11:17<7:26:06,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 49%|████████████████████

 50%|████████████████████████████████████▍                                    | 6636/13301 [7:16:31<7:08:50,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 50%|████████████████████████████████████▍                                    | 6637/13301 [7:16:35<7:03:41,  3.81s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 50%|████████████████████████████████████▍                                    | 6638/13301 [7:16:38<7:07:14,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 50%|████████████████████████████████████▍                                    | 6639/13301 [7:16:42<6:58:14,  3.77s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 50%|████████████████████████████████████▍                                    | 6640/13301 [7:16:46<7:04:16,  3.82s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 50%|████████████████████

 51%|████████████████████████████████████▉                                    | 6720/13301 [7:22:04<7:23:02,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████████████████████▉                                    | 6721/13301 [7:22:07<7:20:39,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████████████████████▉                                    | 6722/13301 [7:22:11<7:16:58,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████████████████████▉                                    | 6723/13301 [7:22:15<7:17:58,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████████████████████▉                                    | 6724/13301 [7:22:19<7:19:21,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████

 51%|█████████████████████████████████████▎                                   | 6804/13301 [7:27:35<7:03:08,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|█████████████████████████████████████▎                                   | 6805/13301 [7:27:39<7:04:18,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|█████████████████████████████████████▎                                   | 6806/13301 [7:27:43<7:04:14,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|█████████████████████████████████████▎                                   | 6807/13301 [7:27:47<7:04:12,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|█████████████████████████████████████▎                                   | 6808/13301 [7:27:51<7:08:40,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 51%|████████████████████

 52%|█████████████████████████████████████▊                                   | 6888/13301 [7:33:08<7:04:01,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|█████████████████████████████████████▊                                   | 6889/13301 [7:33:12<7:07:02,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|█████████████████████████████████████▊                                   | 6890/13301 [7:33:16<7:01:19,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|█████████████████████████████████████▊                                   | 6891/13301 [7:33:20<7:04:06,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|█████████████████████████████████████▊                                   | 6892/13301 [7:33:24<6:58:45,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|████████████████████

 52%|██████████████████████████████████████▎                                  | 6972/13301 [7:38:41<6:57:41,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|██████████████████████████████████████▎                                  | 6973/13301 [7:38:45<6:57:34,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|██████████████████████████████████████▎                                  | 6974/13301 [7:38:48<6:56:30,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|██████████████████████████████████████▎                                  | 6975/13301 [7:38:53<6:59:16,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|██████████████████████████████████████▎                                  | 6976/13301 [7:38:56<6:57:49,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 52%|████████████████████

 53%|██████████████████████████████████████▋                                  | 7056/13301 [7:44:13<6:50:00,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 53%|██████████████████████████████████████▋                                  | 7057/13301 [7:44:17<6:47:44,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 53%|██████████████████████████████████████▋                                  | 7058/13301 [7:44:21<6:52:45,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 53%|██████████████████████████████████████▋                                  | 7059/13301 [7:44:24<6:48:47,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 53%|██████████████████████████████████████▋                                  | 7060/13301 [7:44:29<6:53:44,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 53%|████████████████████

 54%|███████████████████████████████████████▏                                 | 7140/13301 [7:49:45<6:50:36,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▏                                 | 7141/13301 [7:49:49<6:53:44,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▏                                 | 7142/13301 [7:49:53<6:51:19,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▏                                 | 7143/13301 [7:49:57<6:39:35,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▏                                 | 7144/13301 [7:50:01<6:46:05,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|████████████████████

 54%|███████████████████████████████████████▋                                 | 7224/13301 [7:55:17<6:47:07,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▋                                 | 7225/13301 [7:55:21<6:52:55,  4.08s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▋                                 | 7226/13301 [7:55:25<6:58:25,  4.13s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▋                                 | 7227/13301 [7:55:29<6:59:58,  4.15s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|███████████████████████████████████████▋                                 | 7228/13301 [7:55:33<6:50:26,  4.06s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 54%|████████████████████

 55%|████████████████████████████████████████                                 | 7308/13301 [8:00:48<6:30:37,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 55%|████████████████████████████████████████                                 | 7309/13301 [8:00:52<6:30:48,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 55%|████████████████████████████████████████                                 | 7310/13301 [8:00:56<6:35:33,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 55%|████████████████████████████████████████▏                                | 7311/13301 [8:01:00<6:33:13,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 55%|████████████████████████████████████████▏                                | 7312/13301 [8:01:04<6:35:40,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 55%|████████████████████

 56%|████████████████████████████████████████▌                                | 7392/13301 [8:06:20<6:28:14,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████████████████████████▌                                | 7393/13301 [8:06:24<6:32:37,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████████████████████████▌                                | 7394/13301 [8:06:28<6:36:12,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████████████████████████▌                                | 7395/13301 [8:06:32<6:39:44,  4.06s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████████████████████████▌                                | 7396/13301 [8:06:36<6:34:44,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████

 56%|█████████████████████████████████████████                                | 7476/13301 [8:11:52<6:26:46,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|█████████████████████████████████████████                                | 7477/13301 [8:11:56<6:29:46,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|█████████████████████████████████████████                                | 7478/13301 [8:12:00<6:30:08,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|█████████████████████████████████████████                                | 7479/13301 [8:12:04<6:25:05,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|█████████████████████████████████████████                                | 7480/13301 [8:12:07<6:18:25,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 56%|████████████████████

 57%|█████████████████████████████████████████▍                               | 7560/13301 [8:17:24<6:08:08,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▍                               | 7561/13301 [8:17:28<6:09:26,  3.86s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▌                               | 7562/13301 [8:17:32<6:13:25,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▌                               | 7563/13301 [8:17:36<6:11:14,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▌                               | 7564/13301 [8:17:40<6:08:23,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|████████████████████

 57%|█████████████████████████████████████████▉                               | 7644/13301 [8:22:54<6:08:11,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▉                               | 7645/13301 [8:22:58<6:11:12,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▉                               | 7646/13301 [8:23:02<6:09:55,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▉                               | 7647/13301 [8:23:06<6:07:00,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 57%|█████████████████████████████████████████▉                               | 7648/13301 [8:23:10<6:01:21,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|████████████████████

 58%|██████████████████████████████████████████▍                              | 7728/13301 [8:28:24<6:01:12,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|██████████████████████████████████████████▍                              | 7729/13301 [8:28:28<5:51:20,  3.78s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|██████████████████████████████████████████▍                              | 7730/13301 [8:28:32<5:53:58,  3.81s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|██████████████████████████████████████████▍                              | 7731/13301 [8:28:35<5:54:22,  3.82s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|██████████████████████████████████████████▍                              | 7732/13301 [8:28:39<5:58:55,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 58%|████████████████████

 59%|██████████████████████████████████████████▊                              | 7812/13301 [8:33:56<5:55:05,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|██████████████████████████████████████████▉                              | 7813/13301 [8:33:59<5:55:38,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|██████████████████████████████████████████▉                              | 7814/13301 [8:34:03<5:57:01,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|██████████████████████████████████████████▉                              | 7815/13301 [8:34:07<5:54:26,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|██████████████████████████████████████████▉                              | 7816/13301 [8:34:11<6:00:20,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|████████████████████

 59%|███████████████████████████████████████████▎                             | 7896/13301 [8:39:27<5:57:49,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|███████████████████████████████████████████▎                             | 7897/13301 [8:39:31<5:59:20,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|███████████████████████████████████████████▎                             | 7898/13301 [8:39:35<6:01:39,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|███████████████████████████████████████████▎                             | 7899/13301 [8:39:39<5:57:29,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|███████████████████████████████████████████▎                             | 7900/13301 [8:39:43<5:59:36,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 59%|████████████████████

 60%|███████████████████████████████████████████▊                             | 7980/13301 [8:44:58<5:55:01,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 60%|███████████████████████████████████████████▊                             | 7981/13301 [8:45:02<5:51:37,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 60%|███████████████████████████████████████████▊                             | 7982/13301 [8:45:06<5:53:22,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 60%|███████████████████████████████████████████▊                             | 7983/13301 [8:45:10<5:51:45,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 60%|███████████████████████████████████████████▊                             | 7984/13301 [8:45:14<5:54:31,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 60%|████████████████████

 61%|████████████████████████████████████████████▎                            | 8064/13301 [8:50:31<5:48:05,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▎                            | 8065/13301 [8:50:35<5:35:07,  3.84s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▎                            | 8066/13301 [8:50:39<5:39:03,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▎                            | 8067/13301 [8:50:43<5:43:05,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▎                            | 8068/13301 [8:50:46<5:34:14,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████

 61%|████████████████████████████████████████████▋                            | 8148/13301 [8:56:03<5:36:29,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▋                            | 8149/13301 [8:56:07<5:41:29,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▋                            | 8150/13301 [8:56:11<5:43:58,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▋                            | 8151/13301 [8:56:15<5:45:18,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████████████████████████████▋                            | 8152/13301 [8:56:19<5:44:34,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 61%|████████████████████

 62%|█████████████████████████████████████████████▏                           | 8232/13301 [9:01:34<5:28:00,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 62%|█████████████████████████████████████████████▏                           | 8233/13301 [9:01:38<5:27:20,  3.88s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 62%|█████████████████████████████████████████████▏                           | 8234/13301 [9:01:42<5:31:52,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 62%|█████████████████████████████████████████████▏                           | 8235/13301 [9:01:46<5:30:34,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 62%|█████████████████████████████████████████████▏                           | 8236/13301 [9:01:50<5:23:31,  3.83s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 62%|████████████████████

 63%|█████████████████████████████████████████████▋                           | 8316/13301 [9:07:06<5:30:21,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|█████████████████████████████████████████████▋                           | 8317/13301 [9:07:10<5:32:18,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|█████████████████████████████████████████████▋                           | 8318/13301 [9:07:14<5:27:36,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|█████████████████████████████████████████████▋                           | 8319/13301 [9:07:18<5:20:57,  3.87s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|█████████████████████████████████████████████▋                           | 8320/13301 [9:07:22<5:25:41,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|████████████████████

 63%|██████████████████████████████████████████████                           | 8400/13301 [9:12:38<5:24:53,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|██████████████████████████████████████████████                           | 8401/13301 [9:12:42<5:26:40,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|██████████████████████████████████████████████                           | 8402/13301 [9:12:46<5:23:31,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|██████████████████████████████████████████████                           | 8403/13301 [9:12:49<5:21:46,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|██████████████████████████████████████████████                           | 8404/13301 [9:12:54<5:25:39,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 63%|████████████████████

 64%|██████████████████████████████████████████████▌                          | 8484/13301 [9:18:08<5:13:41,  3.91s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|██████████████████████████████████████████████▌                          | 8485/13301 [9:18:12<5:13:08,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|██████████████████████████████████████████████▌                          | 8486/13301 [9:18:16<5:12:59,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|██████████████████████████████████████████████▌                          | 8487/13301 [9:18:20<5:14:43,  3.92s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|██████████████████████████████████████████████▌                          | 8488/13301 [9:18:23<5:15:17,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|████████████████████

 64%|███████████████████████████████████████████████                          | 8568/13301 [9:23:37<5:06:50,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|███████████████████████████████████████████████                          | 8569/13301 [9:23:41<5:07:48,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|███████████████████████████████████████████████                          | 8570/13301 [9:23:45<5:13:27,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|███████████████████████████████████████████████                          | 8571/13301 [9:23:49<5:14:41,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|███████████████████████████████████████████████                          | 8572/13301 [9:23:53<5:16:59,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 64%|████████████████████

 65%|███████████████████████████████████████████████▍                         | 8652/13301 [9:29:09<5:08:18,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 65%|███████████████████████████████████████████████▍                         | 8653/13301 [9:29:13<5:09:35,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 65%|███████████████████████████████████████████████▍                         | 8654/13301 [9:29:17<5:08:14,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 65%|███████████████████████████████████████████████▌                         | 8655/13301 [9:29:21<5:11:07,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 65%|███████████████████████████████████████████████▌                         | 8656/13301 [9:29:25<5:05:51,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 65%|████████████████████

 66%|███████████████████████████████████████████████▉                         | 8736/13301 [9:34:44<5:07:56,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|███████████████████████████████████████████████▉                         | 8737/13301 [9:34:48<5:07:53,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|███████████████████████████████████████████████▉                         | 8738/13301 [9:34:52<5:06:56,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|███████████████████████████████████████████████▉                         | 8739/13301 [9:34:57<5:07:49,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|███████████████████████████████████████████████▉                         | 8740/13301 [9:35:01<5:07:41,  4.05s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████

 66%|████████████████████████████████████████████████▍                        | 8820/13301 [9:40:17<4:56:57,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████████████████████████████████▍                        | 8821/13301 [9:40:21<4:58:40,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████████████████████████████████▍                        | 8822/13301 [9:40:25<4:53:47,  3.94s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████████████████████████████████▍                        | 8823/13301 [9:40:29<4:55:22,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████████████████████████████████▍                        | 8824/13301 [9:40:32<4:51:10,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 66%|████████████████████

 67%|████████████████████████████████████████████████▊                        | 8904/13301 [9:45:53<4:56:03,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 67%|████████████████████████████████████████████████▊                        | 8905/13301 [9:45:57<4:52:52,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 67%|████████████████████████████████████████████████▉                        | 8906/13301 [9:46:01<4:54:02,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 67%|████████████████████████████████████████████████▉                        | 8907/13301 [9:46:05<4:53:04,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 67%|████████████████████████████████████████████████▉                        | 8908/13301 [9:46:09<4:55:08,  4.03s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 67%|████████████████████

 68%|█████████████████████████████████████████████████▎                       | 8988/13301 [9:51:27<4:46:29,  3.99s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▎                       | 8989/13301 [9:51:31<4:36:51,  3.85s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▎                       | 8990/13301 [9:51:35<4:42:14,  3.93s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▎                       | 8991/13301 [9:51:39<4:39:31,  3.89s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▎                       | 8992/13301 [9:51:43<4:40:21,  3.90s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|████████████████████

 68%|█████████████████████████████████████████████████▊                       | 9072/13301 [9:56:59<4:40:27,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▊                       | 9073/13301 [9:57:03<4:38:53,  3.96s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▊                       | 9074/13301 [9:57:07<4:38:00,  3.95s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▊                       | 9075/13301 [9:57:11<4:39:31,  3.97s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|█████████████████████████████████████████████████▊                       | 9076/13301 [9:57:15<4:41:40,  4.00s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 68%|████████████████████

 69%|█████████████████████████████████████████████████▌                      | 9156/13301 [10:02:31<4:38:52,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 69%|█████████████████████████████████████████████████▌                      | 9157/13301 [10:02:35<4:39:03,  4.04s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 69%|█████████████████████████████████████████████████▌                      | 9158/13301 [10:02:39<4:37:50,  4.02s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 69%|█████████████████████████████████████████████████▌                      | 9159/13301 [10:02:43<4:37:08,  4.01s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 69%|█████████████████████████████████████████████████▌                      | 9160/13301 [10:02:47<4:34:43,  3.98s/it]Setting `pad_token_id` to 50256 (first `eos_token_id`) to generate sequence
 69%|████████████████████

KeyboardInterrupt: 

In [62]:
len("Le Valli Sis de Trach Sauvignon Blanc 2013	[response]	Pale yellow in color with aromas of fresh grass, green apple, and quince. Well-balanced, fresh and rich on the palate, with subtle grassy notes; pleasingly crisp, crisp and bright.")

234

In [90]:
generated_descriptions_v2 = {}
for ix,name in enumerate(generated_descriptions.keys()):
  #print(name)
  #print("===== OLD =====")
  #print(generated_descriptions[name])

  #print("===== NEW =====")
  clean_desc = generated_descriptions[name].split("<|startoftext|>	[prompt]")[0]
  clean_desc = clean_desc.split("[response]\t")[1]
  clean_desc = clean_desc.lstrip().rstrip()
  clean_desc = re.sub(r'\n+', '\n', clean_desc).strip()
  clean_desc = re.sub('startoftext', '', clean_desc)
  clean_desc = re.sub('<|', '', clean_desc)
  clean_desc = re.sub('|>', '', clean_desc)
  clean_desc = re.sub(r'\n', ' ', clean_desc)
  #print(clean_desc)
  #print("== END ==")
  
  if len(clean_desc) >= 150:
    generated_descriptions_v2[name] = clean_desc

In [91]:
wine_df = pd.DataFrame.from_dict(generated_descriptions_v2.items())
wine_df.columns = ['name', 'description']
print(wine_df.shape)

wine_df.head()

(7027, 2)


Unnamed: 0,name,description
0,Lachos Cellars Sauvignon Blanc 2012,The wine has all the characteristics of the Ch...
1,Dry Estated Bios de Bourting Sannero (375ML ha...,This wine is the product of three separate lot...
2,Le Valli Sis de Trach Sauvignon Blanc 2013,Pale yellow in color with aromas of fresh gras...
3,Fotes Jadot Sauvignon Blanc 2005,"""All of the grapes from this spectacular estat..."
4,Alarag Caleforno Rosso 2018,"Deep ruby red in color, this wine reveals inte..."


In [94]:
wine_df.to_csv("data/fake/fake_names_descriptions.csv")