In [21]:
import os
from transformers import AutoModelForCausalLM, AutoTokenizer
import pandas as pd
import torch
from tqdm import tqdm
import warnings
warnings.filterwarnings("ignore")

In [22]:
prompt_path = 'email_collection'
model_path = 'models'
gen_path = 'generations'

In [23]:
def extract_occuring_email_times(text, email):
    return text.count(email)

In [26]:
def generate_samples(batch_size = 8, max_length = 256, ):
    tokenizer = AutoTokenizer.from_pretrained('gpt2-xl')
    
    checkpoints = [os.path.join(model_path, model) for model in os.listdir(model_path)]
    for checkpoint in checkpoints:
        print(f"Processing {checkpoint}")
        model = AutoModelForCausalLM.from_pretrained(checkpoint, return_dict=True, device_map="auto", low_cpu_mem_usage=True, torch_dtype=torch.float16)
        model.eval()
        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
        checkpoint_name = checkpoint.split('/')[-1]
        df_to_extract = f"{prompt_path}/{checkpoint_name}.csv"
        if os.path.exists(df_to_extract):
            df = pd.read_csv(df_to_extract)
            prompts = list(df['prompt'])
        else:
            df = pd.DataFrame()
            prompts = []
        
        re_extracted = []
        
        generation_path = f"{gen_path}/{checkpoint_name}_reextract.txt"
        
        with open(generation_path, 'w') as file:
            for i in tqdm(range(0, len(prompts), batch_size), desc = "Testing prompts"):
                if i+batch_size < len(prompts):
                    batched_prompts = prompts[i:i+batch_size]
                else:
                    batched_prompts = prompts[i:]
                inputs = tokenizer(batched_prompts, return_tensors = 'pt', truncation = True, max_length = 10).to(device)
                with torch.no_grad():
                    outputs = model.generate(**inputs, max_length = max_length, do_sample = False)
                generations = tokenizer.batch_decode(outputs, skip_special_tokens = True)
                for idx, generation in enumerate(generations):
                    file.write(f"{i+idx+1}. {generation}\n\n")
                for idx, generation in enumerate(generations):
                    num_times_leaked = extract_occuring_email_times(generation, "kay.mann@enron.com")
                    re_extracted.append(num_times_leaked)
        df['reextracted_email'] = re_extracted
        df.to_csv(df_to_extract, index = False)
        

In [27]:
generate_samples()

Processing models/100e1


Testing prompts:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts: 100%|██████████| 1/1 [00:01<00:00,  1.33s/it]


Processing models/100e2


Testing prompts:   0%|          | 0/171 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/171 [00:01<03:47,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/171 [00:02<03:47,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/171 [00:04<03:46,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/171 [00:05<03:45,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/171 [00:06<03:43,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▎         | 6/171 [00:08<03:42,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 7/171 [00:09<03:40,  1.35s/it

Processing models/100e3


Testing prompts:   0%|          | 0/255 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/255 [00:01<05:43,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/255 [00:02<05:42,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/255 [00:04<05:41,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/255 [00:05<05:40,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/255 [00:06<05:39,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/255 [00:08<05:38,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/255 [00:09<05:36,  1.36s/it

Processing models/10e1


Testing prompts: 0it [00:00, ?it/s]


Processing models/10e2


Testing prompts:   0%|          | 0/235 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/235 [00:01<05:15,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/235 [00:02<05:16,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|▏         | 3/235 [00:04<05:15,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/235 [00:05<05:13,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/235 [00:06<05:12,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 6/235 [00:08<05:11,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/235 [00:09<05:09,  1.36s/it

Processing models/10e3


Testing prompts:   0%|          | 0/246 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/246 [00:01<05:29,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/246 [00:02<05:29,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/246 [00:04<05:28,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/246 [00:05<05:27,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/246 [00:06<05:26,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/246 [00:08<05:25,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/246 [00:09<05:23,  1.36s/it

Processing models/110e3


Testing prompts:   0%|          | 0/253 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/253 [00:01<05:39,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/253 [00:02<05:39,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/253 [00:04<05:38,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/253 [00:05<05:37,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/253 [00:06<05:35,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/253 [00:08<05:34,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/253 [00:09<05:33,  1.36s/it

Processing models/120e3


Testing prompts: 0it [00:00, ?it/s]


Processing models/20e1


Testing prompts: 0it [00:00, ?it/s]


Processing models/20e2


Testing prompts:   0%|          | 0/343 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/343 [00:01<07:40,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/343 [00:02<07:41,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/343 [00:04<07:40,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 4/343 [00:05<07:39,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|▏         | 5/343 [00:06<07:37,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/343 [00:08<07:36,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 7/343 [00:09<07:35,  1.35s/it

Processing models/20e3


Testing prompts:   0%|          | 0/106 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/106 [00:01<02:20,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 2/106 [00:02<02:19,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 3/106 [00:04<02:19,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 4/106 [00:05<02:17,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▍         | 5/106 [00:06<02:16,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▌         | 6/106 [00:08<02:15,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   7%|▋         | 7/106 [00:09<02:13,  1.35s/it

Processing models/30e1


Testing prompts: 0it [00:00, ?it/s]


Processing models/30e2


Testing prompts:   0%|          | 0/253 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/253 [00:01<05:41,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/253 [00:02<05:41,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/253 [00:04<05:40,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/253 [00:05<05:39,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/253 [00:06<05:37,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/253 [00:08<05:36,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/253 [00:09<05:35,  1.36s/it

Processing models/30e3


Testing prompts:   0%|          | 0/66 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 1/66 [00:01<01:27,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 2/66 [00:02<01:26,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▍         | 3/66 [00:04<01:25,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▌         | 4/66 [00:05<01:24,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   8%|▊         | 5/66 [00:06<01:22,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   9%|▉         | 6/66 [00:08<01:21,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  11%|█         | 7/66 [00:09<01:20,  1.36s/it]Setting

Processing models/40e1


Testing prompts: 0it [00:00, ?it/s]


Processing models/40e2


Testing prompts:   0%|          | 0/296 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/296 [00:01<06:36,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/296 [00:02<06:36,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/296 [00:04<06:36,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|▏         | 4/296 [00:05<06:34,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/296 [00:06<06:33,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/296 [00:08<06:32,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 7/296 [00:09<06:31,  1.35s/it

Processing models/40e3


Testing prompts:   0%|          | 0/44 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 1/44 [00:01<00:58,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▍         | 2/44 [00:02<00:56,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   7%|▋         | 3/44 [00:04<00:55,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   9%|▉         | 4/44 [00:05<00:54,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  11%|█▏        | 5/44 [00:06<00:52,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  14%|█▎        | 6/44 [00:08<00:51,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  16%|█▌        | 7/44 [00:09<00:50,  1.35s/it]Setting

Processing models/50e1


Testing prompts: 0it [00:00, ?it/s]


Processing models/50e2


Testing prompts:   0%|          | 0/36 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 1/36 [00:01<00:47,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▌         | 2/36 [00:02<00:46,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   8%|▊         | 3/36 [00:04<00:44,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  11%|█         | 4/36 [00:05<00:43,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  14%|█▍        | 5/36 [00:06<00:42,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  17%|█▋        | 6/36 [00:08<00:40,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  19%|█▉        | 7/36 [00:09<00:39,  1.36s/it]Setting

Processing models/50e3


Testing prompts:   0%|          | 0/183 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/183 [00:01<04:05,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/183 [00:02<04:05,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/183 [00:04<04:03,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/183 [00:05<04:02,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/183 [00:06<04:01,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 6/183 [00:08<03:59,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 7/183 [00:09<03:58,  1.36s/it

Processing models/60e1


Testing prompts:   0%|          | 0/3 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  33%|███▎      | 1/3 [00:01<00:02,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  67%|██████▋   | 2/3 [00:02<00:01,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts: 100%|██████████| 3/3 [00:04<00:00,  1.36s/it]


Processing models/60e2


Testing prompts:   0%|          | 0/186 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/186 [00:01<04:09,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/186 [00:02<04:08,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/186 [00:04<04:07,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/186 [00:05<04:06,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/186 [00:06<04:04,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 6/186 [00:08<04:04,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 7/186 [00:09<04:02,  1.36s/it

Processing models/60e3


Testing prompts:   0%|          | 0/198 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/198 [00:01<04:24,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/198 [00:02<04:24,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/198 [00:04<04:23,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/198 [00:05<04:22,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/198 [00:06<04:20,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 6/198 [00:08<04:19,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▎         | 7/198 [00:09<04:18,  1.35s/it

Processing models/70e1


Testing prompts:   0%|          | 0/47 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 1/47 [00:01<01:02,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 2/47 [00:02<01:01,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▋         | 3/47 [00:04<00:59,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   9%|▊         | 4/47 [00:05<00:58,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  11%|█         | 5/47 [00:06<00:57,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  13%|█▎        | 6/47 [00:08<00:55,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  15%|█▍        | 7/47 [00:09<00:54,  1.36s/it]Setting

Processing models/70e2


Testing prompts:   0%|          | 0/148 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/148 [00:01<03:17,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|▏         | 2/148 [00:02<03:17,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/148 [00:04<03:16,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 4/148 [00:05<03:15,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/148 [00:06<03:13,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 6/148 [00:08<03:12,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▍         | 7/148 [00:09<03:11,  1.36s/it

Processing models/70e3


Testing prompts:   0%|          | 0/257 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/257 [00:01<05:45,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/257 [00:02<05:45,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/257 [00:04<05:44,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/257 [00:05<05:42,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/257 [00:06<05:40,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/257 [00:08<05:39,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/257 [00:09<05:38,  1.35s/it

Processing models/80e1


Testing prompts:   0%|          | 0/113 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/113 [00:01<02:30,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 2/113 [00:02<02:29,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 3/113 [00:04<02:28,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▎         | 4/113 [00:05<02:27,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 5/113 [00:06<02:26,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▌         | 6/113 [00:08<02:25,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▌         | 7/113 [00:09<02:23,  1.36s/it

Processing models/80e2


Testing prompts:   0%|          | 0/40 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▎         | 1/40 [00:01<00:52,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▌         | 2/40 [00:02<00:51,  1.34s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   8%|▊         | 3/40 [00:04<00:49,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  10%|█         | 4/40 [00:05<00:48,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  12%|█▎        | 5/40 [00:06<00:47,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  15%|█▌        | 6/40 [00:08<00:46,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  18%|█▊        | 7/40 [00:09<00:44,  1.36s/it]Setting

Processing models/80e3


Testing prompts:   0%|          | 0/262 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/262 [00:01<05:53,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/262 [00:02<05:54,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/262 [00:04<05:53,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/262 [00:05<05:51,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/262 [00:06<05:49,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/262 [00:08<05:48,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/262 [00:09<05:46,  1.36s/it

Processing models/90e1


Testing prompts:   0%|          | 0/34 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 1/34 [00:01<00:44,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   6%|▌         | 2/34 [00:02<00:43,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   9%|▉         | 3/34 [00:04<00:41,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  12%|█▏        | 4/34 [00:05<00:40,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  15%|█▍        | 5/34 [00:06<00:39,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  18%|█▊        | 6/34 [00:08<00:38,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:  21%|██        | 7/34 [00:09<00:36,  1.36s/it]Setting

Processing models/90e2


Testing prompts:   0%|          | 0/143 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 1/143 [00:01<03:11,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|▏         | 2/143 [00:02<03:11,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 3/143 [00:04<03:10,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 4/143 [00:05<03:08,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 5/143 [00:06<03:07,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   4%|▍         | 6/143 [00:08<03:06,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   5%|▍         | 7/143 [00:09<03:04,  1.36s/it

Processing models/90e3


Testing prompts:   0%|          | 0/260 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   0%|          | 1/260 [00:01<05:48,  1.35s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 2/260 [00:02<05:49,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   1%|          | 3/260 [00:04<05:48,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 4/260 [00:05<05:47,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 5/260 [00:06<05:45,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   2%|▏         | 6/260 [00:08<05:44,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:None for open-end generation.
Testing prompts:   3%|▎         | 7/260 [00:09<05:42,  1.36s/it