In [1]:
import transformers
import accelerate
import outlines
import json
import pandas as pd
import torch
import tqdm
import gc
import ast
from outlines import from_transformers, Generator, models
from pydantic import BaseModel, Field, ValidationError
from typing import List, Optional

  from .autonotebook import tqdm as notebook_tqdm


In [16]:
'''
This is a chunk for clearing model cache if it becomes necessary to switch to another model without having to reset
'''

# Delete the model object
del model
gc.collect()

# Clear PyTorch cache on GPU
torch.cuda.empty_cache()
torch.cuda.reset_peak_memory_stats()

# This is a comment to test git


In [2]:
model = from_transformers(
    transformers.AutoModelForCausalLM.from_pretrained("meta-llama/Llama-3.2-1B", device_map="auto", dtype=torch.bfloat16),
    transformers.AutoTokenizer.from_pretrained("meta-llama/Llama-3.2-1B")
)
#"meta-llama/Llama-3.2-1B"

In [2]:
'''
This is the DeepSeek 14b model, which at first glance seems to perform better than the Llama model. 
Definitely worth considering if this should be used instead.
'''

model = from_transformers(
    transformers.AutoModelForCausalLM.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-14B", device_map="auto", dtype=torch.bfloat16),
    transformers.AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-R1-Distill-Qwen-14B")
)

Fetching 4 files:   0%|          | 0/4 [00:00<?, ?it/s]Cancellation requested; stopping current tasks.
Fetching 4 files:   0%|          | 0/4 [00:25<?, ?it/s]


KeyboardInterrupt: 

In [3]:
# Defining the pydantic class which ensures the structured output from the llm
class BlameeDetection(BaseModel):
    text: str = Field(description="The exact original sentence being analyzed")
    previous: str = Field(description="The exact previous sentence used for context which follows 'Previous sentence:'")
    following: str = Field(description="The exact following sentence used for context which follows 'Following sentence:'")
    blamee: Optional[str] = Field(default = None, description="Who or what is being blamed")
    arguments: Optional[str] = Field(default = None, description="What the blamee is being blamed for - the specific negative outcome"
    )

In [4]:
text_data = pd.read_csv("/work/RuneEgeskovTrust#9638/Bachelor/Bachelor_project/annotation_data_translated_version_03_10.csv", encoding='utf-8')

In [5]:

paragraph_entry = {}
for i, text in enumerate(text_data["da_segmented_text"]): #check if i is sctually number


    da_segmented_sentences = ast.literal_eval(text_data.loc[i]["da_segmented_text"])

    sentence_entry = {}
    for p, sentence in enumerate(da_segmented_sentences):
        sentence_entry[p] = sentence
    
    paragraph_entry[i] = sentence_entry



In [6]:
with open('/work/RuneEgeskovTrust#9638/Bachelor/Bachelor_project/labelstudio_with_metadata.json', 'r') as file:
    orig_data = json.load(file)

In [32]:
orig_data[0]

{'paragraph': '2',
 'sentence_nr': '235',
 'text': 'Regeringen vil også fortsætte sin offensive  miljøpolitik.',
 'speaker': 'Poul Nyrup Rasmussen',
 'party': 'S',
 'preceding_sentence': 'sentence_nr 234 \nDer indføres en belønningsordning for virksomheder, der gør  en særlig ekstraindsats ud over det, loven stiller krav om,  for at forbedre arbejdsmiljøet.',
 'succeeding_sent': 'sentence_nr 236 \nDet er vores næste store felt.',
 'current_speaker_in_government': True,
 'parties_in_government': ['S', 'RV'],
 'date': '1997-10-07 00:00:00'}

In [None]:
spoken_sentences =

for i in range(len(data)):
    text = data[i]["text"]
    speaker = data[i]["speaker"]
    spoken_sentences.append(text)

In [7]:
generator = Generator(model, BlameeDetection)

In [30]:
orig_data[0]

{'paragraph': '2',
 'sentence_nr': '235',
 'text': 'Regeringen vil også fortsætte sin offensive  miljøpolitik.',
 'speaker': 'Poul Nyrup Rasmussen',
 'party': 'S',
 'preceding_sentence': 'Der indføres en belønningsordning for virksomheder, der gør  en særlig ekstraindsats ud over det, loven stiller krav om,  for at forbedre arbejdsmiljøet.',
 'succeeding_sent': 'Det er vores næste store felt.',
 'current_speaker_in_government': True,
 'parties_in_government': ['S', 'RV'],
 'date': '1997-10-07 00:00:00'}

In [9]:
for i in orig_data:
    print(i)
    try:
        i["preceding_sentence"] = i["preceding_sentence"].split("\n")[1]
        i["succeeding_sent"] = i["succeeding_sent"].split("\n")[1]
    except IndexError as e:
        print(f"{e} No sentence before")
        pass

# REMEMBER TO TRY CATCH FOR SENTENCES WHICH EITHER ARE THE START OR THE END OF A PARAGRAPH. 
# ALSO OVERVEJ IF THE SKIPPED LINES WHICH BREAK THE JSON SHOULD BE APPENDED TO A LIST FOR LATER PROCESSING WITH MORE AVAILABLE TOKENS FOR GENERATION.

{'paragraph': '2', 'sentence_nr': '235', 'text': 'Regeringen vil også fortsætte sin offensive  miljøpolitik.', 'speaker': 'Poul Nyrup Rasmussen', 'party': 'S', 'preceding_sentence': 'Der indføres en belønningsordning for virksomheder, der gør  en særlig ekstraindsats ud over det, loven stiller krav om,  for at forbedre arbejdsmiljøet.', 'succeeding_sent': 'Det er vores næste store felt.', 'current_speaker_in_government': True, 'parties_in_government': ['S', 'RV'], 'date': '1997-10-07 00:00:00'}
list index out of range No sentence before
{'paragraph': '4', 'sentence_nr': '85', 'text': 'i det synspunkt.  \xa0\xa0\xa0\xa0\xa0I skærende kontrast til det synspunkt står  landbrugsorganisationernes reaktion og Venstres og De  Konservatives finanslovudspil kemisk renset for afgifter som  styringsredskab, altså ligegyldighed over for vandmiljøet for  at tilfredsstille landbrugslobbyens høge.', 'speaker': 'Torben Lund', 'party': 'S', 'preceding_sentence': 'Jeg er 100 pct. enig', 'succeeding_sent

In [None]:
for sentence in tqdm.tqdm(orig_data, desc = "Blamee detection"):
    prev_sent = sentence["preceding_sentence"]
    sent = sentence["text"]
    suc_sent = sentence["succeeding_sent"]
    prompt = f"""You are an expert argumentative journalist with an expertise in how blame gets thrown around in political debates,  
    based on this role, identify who or what is being blamed in the following sentence based on the context of the previous and following sentence.
    The entity being blamed can be present in either of the three sentences.
    Sentence: {sent}
    Previous sentence: {prev_sent}
    Following sentence: {suc_sent}

    Rules:
    - Identify specifically who or what is being blamed for causing a negative outcome in the above sentence
    - The "text" field must be EXACTLY the sentence provided above - do not modify it
    - Identify a specific part of the above sentence which indicates what the blamee is being accused of
    - Never leave arguments as an empty string
    - Never use "sentence_nr [x]" for classifying blame

    - Roles:
    - Blamee: The patient receiving the blame (who or what is being blamed)
    - Argument: What is the blamee being blamed for (the negative outcome)"""
    with torch.no_grad():  # Disable gradient tracking
        result = generator(prompt, max_new_tokens=256, use_cache=False)
        #print(result)
    try:
        result_out = BlameeDetection.model_validate_json(result)
    except (ValidationError, json.JSONDecodeError):
        print("Skipping invalid entry.")
        continue

    with open("result_blamee_detection.json", "a") as f:
        json.dump(result_out.model_dump(), f, indent=2)




Blamee detection:   0%|          | 0/4325 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 1/4325 [01:07<81:39:00, 67.98s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 2/4325 [01:08<34:04:22, 28.37s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 3/4325 [01:08<18:37:24, 15.51s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 4/4325 [01:09<11:35:34,  9.66s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 5/4325 [01:10<7:51:15,  6.55s/it] Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 6/4325 [01:10<5:19:52,  4.44s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection: 

Skipping invalid entry.


Blamee detection:   0%|          | 11/4325 [01:20<3:12:55,  2.68s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   0%|          | 12/4325 [01:20<2:22:30,  1.98s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 13/4325 [01:22<2:15:02,  1.88s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 14/4325 [01:22<1:47:48,  1.50s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 15/4325 [01:25<2:18:59,  1.93s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 16/4325 [01:26<1:51:25,  1.55s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 17/4325 [01:26<1:27:25,  1.22s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   0%|          | 18/4325 [01:28<1:29:18,  1.24s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   1%|          | 23/4325 [01:38<2:26:36,  2.04s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 24/4325 [01:38<1:47:11,  1.50s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 25/4325 [01:39<1:30:41,  1.27s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 26/4325 [01:43<2:21:56,  1.98s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   1%|          | 27/4325 [01:46<2:59:23,  2.50s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   1%|          | 28/4325 [01:48<2:49:10,  2.36s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 29/4325 [01:49<2:09:41,  1.81s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 30/4325 [01:50<2:00:50,  1.69s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 31/4325 [01:51<1:32:14,  1.29s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 32/4325 [01:54<2:22:34,  1.99s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 33/4325 [01:57<2:33:59,  2.15s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 34/4325 [01:58<2:09:05,  1.80s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   1%|          | 38/4325 [02:05<2:01:07,  1.70s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 39/4325 [02:06<1:36:54,  1.36s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 40/4325 [02:10<2:28:04,  2.07s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   1%|          | 41/4325 [02:10<1:56:42,  1.63s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 42/4325 [02:11<1:30:05,  1.26s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 43/4325 [02:13<1:54:51,  1.61s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 44/4325 [02:15<1:51:51,  1.57s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 45/4325 [02:17<2:18:51,  1.95s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 46/4325 [02:18<1:47:27,  1.51s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   1%|          | 47/4325 [02:19<1:37:30,  1.37s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   2%|▏         | 68/4325 [02:49<1:41:59,  1.44s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 69/4325 [02:50<1:38:20,  1.39s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 70/4325 [02:51<1:17:30,  1.09s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 71/4325 [02:53<1:39:42,  1.41s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 72/4325 [02:54<1:39:11,  1.40s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 73/4325 [02:57<2:08:43,  1.82s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 74/4325 [03:00<2:41:57,  2.29s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   2%|▏         | 76/4325 [03:05<2:27:37,  2.08s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 77/4325 [03:08<2:51:51,  2.43s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 78/4325 [03:08<2:11:04,  1.85s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 79/4325 [03:09<1:50:26,  1.56s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 80/4325 [03:10<1:29:56,  1.27s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 81/4325 [03:11<1:36:45,  1.37s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 82/4325 [03:12<1:19:36,  1.13s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   2%|▏         | 87/4325 [03:20<1:50:01,  1.56s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 88/4325 [03:20<1:23:51,  1.19s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 89/4325 [03:21<1:05:11,  1.08it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 90/4325 [03:22<1:14:50,  1.06s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 91/4325 [03:23<1:06:01,  1.07it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 92/4325 [03:24<1:24:15,  1.19s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   2%|▏         | 93/4325 [03:27<1:52:47,  1.60s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee

Skipping invalid entry.


Blamee detection:   3%|▎         | 111/4325 [03:47<1:46:49,  1.52s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 112/4325 [03:48<1:23:58,  1.20s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 113/4325 [03:49<1:13:28,  1.05s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 114/4325 [03:50<1:15:12,  1.07s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 115/4325 [03:50<1:06:18,  1.06it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 116/4325 [03:51<58:18,  1.20it/s]  Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 117/4325 [03:52<1:10:26,  1.00s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.

Skipping invalid entry.


Blamee detection:   3%|▎         | 121/4325 [04:00<1:50:22,  1.58s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 122/4325 [04:03<2:34:55,  2.21s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 123/4325 [04:07<3:10:47,  2.72s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 124/4325 [04:08<2:22:46,  2.04s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 125/4325 [04:08<1:47:25,  1.53s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 126/4325 [04:09<1:27:28,  1.25s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 127/4325 [04:12<2:20:44,  2.01s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 128/4325 [04:14<2:20:20,  2.01s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 129/4325 [04:15<1:49:14,  1.56s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 130/4325 [04:15<1:25:13,  1.22s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 131/4325 [04:16<1:06:53,  1.04it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 132/4325 [04:18<1:26:15,  1.23s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 133/4325 [04:18<1:13:06,  1.05s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 134/4325 [04:19<1:10:30,  1.01s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.

Skipping invalid entry.


Blamee detection:   3%|▎         | 137/4325 [04:23<1:23:58,  1.20s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 138/4325 [04:23<1:04:47,  1.08it/s]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 139/4325 [04:27<1:59:06,  1.71s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 140/4325 [04:28<1:45:02,  1.51s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 141/4325 [04:31<2:24:29,  2.07s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 142/4325 [04:33<2:21:41,  2.03s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 143/4325 [04:37<2:50:15,  2.44s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 144/4325 [04:39<2:38:27,  2.27s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 145/4325 [04:41<2:44:27,  2.36s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 146/4325 [04:44<2:45:17,  2.37s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 147/4325 [04:47<3:07:15,  2.69s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 148/4325 [04:51<3:38:41,  3.14s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 149/4325 [04:55<3:58:10,  3.42s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   3%|▎         | 150/4325 [04:56<2:58:10,  2.56s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   3%|▎         | 151/4325 [04:57<2:39:14,  2.29s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 152/4325 [05:00<2:40:43,  2.31s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 153/4325 [05:01<2:22:58,  2.06s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 154/4325 [05:03<2:12:00,  1.90s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 155/4325 [05:05<2:12:44,  1.91s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 156/4325 [05:08<2:44:32,  2.37s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.

Skipping invalid entry.


Blamee detection:   4%|▎         | 157/4325 [05:09<2:04:04,  1.79s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 158/4325 [05:12<2:33:17,  2.21s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   4%|▎         | 159/4325 [05:12<1:58:11,  1.70s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 160/4325 [05:16<2:37:21,  2.27s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.


Skipping invalid entry.


Blamee detection:   4%|▎         | 161/4325 [05:17<2:04:04,  1.79s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▎         | 162/4325 [05:18<1:46:36,  1.54s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▍         | 163/4325 [05:18<1:20:42,  1.16s/it]Setting `pad_token_id` to `eos_token_id`:128001 for open-end generation.
Blamee detection:   4%|▍         | 163/4325 [05:18<2:15:29,  1.95s/it]


KeyboardInterrupt: 