In [None]:
# Import necessary libraries
from transformers import PegasusTokenizer, PegasusForConditionalGeneration
from datasets import load_dataset
from src.model.fine_tuning import fine_tune_model
from src.data_preprocessing.tokenization import load_tokenizer, preprocess_data
from src.model.evaluation import evaluate_model
import logging

In [None]:
# Set up logging
# basicConfig opens the log file as soon as it installs the file handler and
# raises FileNotFoundError when the parent directory is missing, so make sure
# 'logs/' exists before configuring (a fresh checkout may not have it).
import os

os.makedirs('logs', exist_ok=True)
logging.basicConfig(filename='logs/main.log', level=logging.INFO)

In [None]:
# Step 1: Load the dataset and tokenizer
tokenizer = load_tokenizer()
# "cnn_dailymail" publishes several configurations (1.0.0, 2.0.0, 3.0.0) and
# has no default, so the configuration name must be given explicitly or
# load_dataset raises "Config name is missing". 3.0.0 is the non-anonymized
# version commonly used for abstractive summarization.
# Only the first 10% of the training split is loaded.
train_data = load_dataset("cnn_dailymail", "3.0.0", split="train[:10%]")
# NOTE(review): preprocess_data is a project helper; presumably it tokenizes
# the articles/summaries with `tokenizer` — confirm against its definition.
train_data = preprocess_data(train_data, tokenizer)


In [None]:
# Step 2: Load Pretrained Model (PEGASUS)
# Start from the "google/pegasus-cnn_dailymail" checkpoint; the resulting
# object is bound to `model` for the cells that follow.
model = PegasusForConditionalGeneration.from_pretrained(
    pretrained_model_name_or_path="google/pegasus-cnn_dailymail",
)


In [None]:
# Step 3: Fine-tune the model
# The return value is discarded and later cells keep using the same `model`
# object.
# NOTE(review): this presumes fine_tune_model updates `model` in place rather
# than returning a new instance — confirm against src.model.fine_tuning.
fine_tune_model(model, train_data)


In [None]:
# Step 4: Evaluate the model
# Score the model on held-out data instead of the subset it was just
# fine-tuned on; metrics computed on training examples are optimistically
# biased. The validation slice goes through the same preprocessing, with the
# same tokenizer, as the training data.
eval_data = load_dataset("cnn_dailymail", "3.0.0", split="validation[:10%]")
eval_data = preprocess_data(eval_data, tokenizer)
# Kept as the last expression so the notebook still displays whatever
# evaluate_model returns.
evaluate_model(model, eval_data)


In [None]:

# Step 5: Save the fine-tuned model
# Write the current `model` out under models/fine_tuned/ via save_pretrained.
model.save_pretrained(
    save_directory="models/fine_tuned/pegasus_model",
)
