In [None]:
# Attach Google Drive so the fine-tuned checkpoint and the CSV stored there
# are reachable under /content/drive.
from google.colab import drive

drive.mount(mountpoint='/content/drive')

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [None]:
import torch
from transformers import GPT2Tokenizer, GPT2LMHeadModel

# Run on the GPU when CUDA is available; otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = torch.device("cuda")
else:
    device = torch.device("cpu")

# Baseline: the "gpt2" checkpoint and its tokenizer, loaded by name.
model_name = "gpt2"
tokenizer = GPT2Tokenizer.from_pretrained(model_name)
pretrained_model = GPT2LMHeadModel.from_pretrained(model_name)
pretrained_model = pretrained_model.to(device)

# Fine-tuned variant: model weights and tokenizer are both read from the
# same directory on the mounted Drive.
fine_tuned_model_path = "/content/drive/MyDrive/Rohits final project/gptNYT-2016-2022"
fine_tuned_model = GPT2LMHeadModel.from_pretrained(fine_tuned_model_path)
fine_tuned_model = fine_tuned_model.to(device)
fine_tuned_tokenizer = GPT2Tokenizer.from_pretrained(fine_tuned_model_path)

def generate_text(model, tokenizer, prompt, max_length=50):
    """Generate a continuation of ``prompt`` and return it as decoded text.

    Args:
        model: Language model exposing ``generate`` and a ``device``
            attribute (e.g. a ``GPT2LMHeadModel``).
        tokenizer: Tokenizer providing ``encode``, ``decode`` and
            ``eos_token_id``; it should be the one matching ``model``.
        prompt: Text to condition the generation on.
        max_length: Forwarded to ``model.generate`` as ``max_length``. In
            Hugging Face ``generate`` this bounds the prompt plus the newly
            generated tokens, not the new tokens alone.

    Returns:
        The first sequence returned by ``model.generate``, decoded with
        special tokens skipped.
    """
    # Place the inputs on the device the model actually lives on, instead of
    # relying on a module-level `device` that may not match this model.
    target_device = model.device
    inputs = tokenizer.encode(prompt, return_tensors="pt").to(target_device)

    # The prompt is a single unpadded sequence, so every position is attended
    # to. ones_like keeps the integer dtype and the device of the input ids.
    attention_mask = torch.ones_like(inputs)

    outputs = model.generate(
        inputs,
        attention_mask=attention_mask,
        max_length=max_length,
        # GPT-2 has no dedicated pad token; reuse EOS so generate() can pad.
        pad_token_id=tokenizer.eos_token_id,
    )
    return tokenizer.decode(outputs[0], skip_special_tokens=True)

The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


In [None]:
# Baseline check: let the pre-trained model continue the prompt.
pretrained_prompt = "Judge Pratt’s decision"
pretrained_output = generate_text(
    model=pretrained_model,
    tokenizer=tokenizer,
    prompt=pretrained_prompt,
)
print("Pre-trained Model Output:", pretrained_output, sep="\n")

Pre-trained Model Output:
Judge Pratt’s decision to allow the use of the word "felony" in the name of a child is a clear violation of the First Amendment.

The court also ruled that the use of the word "felony"


In [None]:
# Same prompt, continued by the fine-tuned model with its own tokenizer.
finetuned_prompt = "Judge Pratt’s decision"
finetuned_output = generate_text(
    model=fine_tuned_model,
    tokenizer=fine_tuned_tokenizer,
    prompt=finetuned_prompt,
)
print("\nFine-tuned Model Output:", finetuned_output, sep="\n")


Fine-tuned Model Output:
Judge Pratt’s decision to allow the president to use executive authority to order a halt to the deportation of undocumented immigrants is a victory for the president. But it’s a victory for the people of the United States.’s decision


In [None]:
import pandas as pd
# Read the cleaned NYT abstracts CSV from the mounted Drive.
df = pd.read_csv(
    filepath_or_buffer='/content/drive/MyDrive/Rohits final project/NYT_2016_to_2022_cleaned.csv',
)

In [None]:
# Preview the first five rows of the loaded frame.
df.head(n=5)

Unnamed: 0,pub_date,abstract
0,2016-07-01,Judge Pratt’s decision is the first in a feder...
1,2016-07-01,A selected guide to concerts in the New York C...
2,2016-07-01,All eyes are on the Hershey Trust Company agai...
3,2016-07-01,Friends and family members went to the Church ...
4,2016-07-01,"The Battle of the Somme, a century ago, left i..."


In [None]:
# Show the abstract of the row labelled 0.
df.loc[0, 'abstract']

'Judge Pratt’s decision is the first in a federal court to indicate that a ban on abortion because of genetic anomalies would likely be unconstitutional.'

In [None]:
# Print the reference abstract and both generations, separated by blank lines.
print("Original abstract : ", df['abstract'][0], end="\n\n")
print("pretrained_output : ", pretrained_output, end="\n\n")
print("finetuned_output : ", finetuned_output)

Original abstract :  Judge Pratt’s decision is the first in a federal court to indicate that a ban on abortion because of genetic anomalies would likely be unconstitutional.

pretrained_output :  Judge Pratt’s decision to allow the use of the word "felony" in the name of a child is a clear violation of the First Amendment.

The court also ruled that the use of the word "felony"

finetuned_output :  Judge Pratt’s decision to allow the president to use executive authority to order a halt to the deportation of undocumented immigrants is a victory for the president. But it’s a victory for the people of the United States.’s decision
