In [None]:
from transformers import pipeline, set_seed, GPT2Tokenizer

# Hugging Face Hub checkpoint names for the three models compared in this notebook.
bert_model, roberta_model, bart_model = (
    "bert-base-uncased",
    "roberta-base",
    "facebook/bart-base",
)

In [None]:
import os
import nltk

In [None]:
# Path of the text file to load, relative to the notebook's working directory.
file_path = "unit 1.txt"

# Bind `text` before attempting the read so the name always exists: if the
# file is missing, later cells see None instead of hitting a NameError.
text = None

try:
    with open(file_path, "r", encoding="utf-8") as f:
        text = f.read()
    print("File loaded successfully!")
except FileNotFoundError:
    # Best-effort load: report the problem and leave `text` as None.
    print(f"Error: '{file_path}' not found.")

File loaded successfully!


In [None]:
import warnings
import logging

# Suppress Python warnings and transformers log messages below ERROR so the
# cell output shows only what the models produce.
warnings.filterwarnings("ignore")
logging.getLogger("transformers").setLevel(logging.ERROR)

# Fix the random seed once, before any model in this cell is run.
set_seed(42)

# Prompt that safe_generate() below reads as a notebook-level variable.
prompt = "The future of Artificial Intelligence is"

def safe_generate(model_name, label, prompt_text=None, max_new_tokens=50):
    """Try to continue a prompt with ``model_name`` and print the result.

    Any exception is caught and printed instead of raised, so one model that
    cannot be used for text generation does not stop the comparison.

    Args:
        model_name: Checkpoint identifier handed to ``pipeline``.
        label: Short name used to prefix the printed output or error.
        prompt_text: Text to continue. When ``None`` (the default) the
            notebook-level ``prompt`` variable is used.
        max_new_tokens: Upper bound on the number of tokens generated after
            the prompt.

    Returns:
        None. The generated text, or the error message, is printed.
    """
    try:
        # Fall back to the notebook-level prompt so existing two-argument
        # calls keep working unchanged.
        text_to_continue = prompt if prompt_text is None else prompt_text
        generator = pipeline("text-generation", model=model_name)
        # Bound the continuation with `max_new_tokens` instead of `max_length`.
        # NOTE(review): the recorded outputs of this cell run far past 50
        # tokens, which suggests `max_length=50` was being overridden by a
        # pipeline default -- confirm against the installed transformers version.
        output = generator(
            text_to_continue,
            max_new_tokens=max_new_tokens,
            num_return_sequences=1,
            truncation=True,
        )
        print(f"{label} Output:\n{output[0]['generated_text']}\n")
    except Exception as e:
        # Deliberately broad: a failure here is itself an observation for the
        # comparison, so it is reported and the notebook carries on.
        print(f"{label} Error: {e}\n")

# Send the shared prompt through each checkpoint in turn:
# 1. BERT, 2. RoBERTa, 3. BART.
for checkpoint, label in (
    ("bert-base-uncased", "BERT"),
    ("roberta-base", "RoBERTa"),
    ("facebook/bart-base", "BART"),
):
    safe_generate(checkpoint, label)


BERT Output:
The future of Artificial Intelligence is................................................................................................................................................................................................................................................................

RoBERTa Output:
The future of Artificial Intelligence is

BART Output:
The future of Artificial Intelligence isOtherwise ShakOtherwise sure Shak Shak323208 df empir squat Shak chuckms healer df MarxismOtherwisePatrick Walkdy Shak slipsreleased df df32 slips debugger Walk slips Shak denim Shak df df df Walk Drawn Drawn Drawn 361 slipsino Person Princeton Shak chuckSpoilerSpoiler slips df df initially dismant Drawn Crkas Drawn Drawn spotsenc Shak Drawn Drawnino Drawn Drawn opposition Shak workload slips Shak slips df Drawn DrawnEngland Drawn32 Drawn DrawnSel Drawn workload Drawn Drawn Output Drawn Drawn communism Drawn Drawn debugger spots spots dfPost df df workload Drawn df Drawn 

In [None]:
from transformers import pipeline
import warnings, logging

# Keep the cell output limited to the predictions themselves.
warnings.filterwarnings("ignore")
logging.getLogger("transformers").setLevel(logging.ERROR)

# One probe sentence per checkpoint, each written with the mask token that
# checkpoint expects ([MASK] for BERT, <mask> for RoBERTa and BART).
sentences = {
    "bert-base-uncased": "The goal of Generative AI is to [MASK] new content.",
    "roberta-base": "The goal of Generative AI is to <mask> new content.",
    "facebook/bart-base": "The goal of Generative AI is to <mask> new content.",
}

# Checkpoints to try, in the insertion order of `sentences`.
models = list(sentences)

for model, masked_sentence in sentences.items():
    header = f"\nModel: {model}"
    try:
        fill_mask = pipeline("fill-mask", model=model)
        results = fill_mask(masked_sentence)

        print(header)
        print("Predictions:")
        for candidate in results:
            sequence, score = candidate["sequence"], candidate["score"]
            print(f"  - {sequence} (score: {score:.4f})")
    except Exception as e:
        # Report the failure for this checkpoint and move on to the next one.
        print(header, f"Error: {e}", sep="\n")


Model: bert-base-uncased
Predictions:
  - the goal of generative ai is to create new content. (score: 0.5397)
  - the goal of generative ai is to generate new content. (score: 0.1558)
  - the goal of generative ai is to produce new content. (score: 0.0541)
  - the goal of generative ai is to develop new content. (score: 0.0445)
  - the goal of generative ai is to add new content. (score: 0.0176)

Model: roberta-base
Predictions:
  - The goal of Generative AI is to generate new content. (score: 0.3711)
  - The goal of Generative AI is to create new content. (score: 0.3677)
  - The goal of Generative AI is to discover new content. (score: 0.0835)
  - The goal of Generative AI is to find new content. (score: 0.0213)
  - The goal of Generative AI is to provide new content. (score: 0.0165)

Model: facebook/bart-base
Predictions:
  - The goal of Generative AI is to create new content. (score: 0.0746)
  - The goal of Generative AI is to help new content. (score: 0.0657)
  - The goal of Gener

In [None]:
from transformers import pipeline
import warnings, logging

# Suppress warnings/logs so the cell output shows only the answers.
warnings.filterwarnings("ignore")
logging.getLogger("transformers").setLevel(logging.ERROR)

# Passage the models must answer from, and the question asked about it.
context = "Generative AI poses significant risks such as hallucinations, bias, and deepfakes."
question = "What are the risks?"

# Base checkpoints to compare on extractive question answering.
models = ["bert-base-uncased", "roberta-base", "facebook/bart-base"]

for model in models:
    try:
        # Re-seed before each model is built so the answer does not depend on
        # which cells ran earlier. `set_seed` comes from the notebook's first
        # cell. NOTE(review): the near-zero scores recorded for this cell
        # suggest the QA head of these base checkpoints is freshly
        # initialised, which would make unseeded runs differ -- confirm.
        set_seed(42)
        qa = pipeline("question-answering", model=model)
        print(f"\nModel: {model}")
        print(qa(question=question, context=context))
    except Exception as e:
        # Deliberately broad: report the failure and continue with the next model.
        print(f"\nModel: {model} FAILED")
        print(e)


Model: bert-base-uncased
{'score': 0.008281194604933262, 'start': 72, 'end': 81, 'answer': 'deepfakes'}

Model: roberta-base
{'score': 0.004184452351182699, 'start': 0, 'end': 81, 'answer': 'Generative AI poses significant risks such as hallucinations, bias, and deepfakes'}

Model: facebook/bart-base
{'score': 0.028195755556225777, 'start': 11, 'end': 71, 'answer': 'AI poses significant risks such as hallucinations, bias, and'}


# Observation Table

| Task       | Model   | Classification (Success/Failure) | Observation (What actually happened?)                                   | Why did this happen? (Architectural Reason)                  |
|------------|---------|----------------------------------|------------------------------------------------------------------------|---------------------------------------------------------------|
| Generation | BERT    | Failure                          | Output was just dots, no real text.                                    | BERT is only an encoder, not built to write sentences.        |
|            | RoBERTa | Failure                          | Output stopped after the prompt, no continuation.                      | RoBERTa is also only an encoder, not made for text generation.|
|            | BART    | Partial Success                  | Output was a messy string of random words.                             | BART is an encoder-decoder model; the base checkpoint is not fine-tuned for open-ended text continuation. |
| Fill-Mask  | BERT    | Success                          | Predicted clear words like 'create', 'generate', 'produce'.            | BERT is trained to guess missing words (MLM).                 |
|            | RoBERTa | Success                          | Predicted good words like 'generate', 'create', 'discover'.            | RoBERTa is trained for masked word prediction.                |
|            | BART    | Success                          | Predicted words like 'create', 'help', 'provide', but with lower confidence scores. | BART can do MLM but it is not its main training goal.         |
| QA         | BERT    | Failure                          | Answered only 'deepfakes' with very low score.                         | Base BERT is not trained for question answering.              |
|            | RoBERTa | Partial Success                  | Returned the whole context as the answer, which is not precise.        | RoBERTa base is not fine-tuned for QA tasks.                  |
|            | BART    | Failure                          | Answer was a broken sentence fragment.                                 | BART base is not trained for QA span extraction.              |