In [2]:
import torch
import torch.nn.functional as F
import torch.nn as nn
import numpy as np
from transformers import (AutoModelForCausalLM, AutoTokenizer, BertForSequenceClassification, BertTokenizer, BertModel,
 RobertaForSequenceClassification, RobertaTokenizer, RobertaModel, TrainingArguments, Trainer, RobertaConfig, pipeline, AutoConfig)
import adapters
import os
os.chdir("../")

# Freezing base

## Mistral samples

In [2]:
config = RobertaConfig.from_pretrained('FacebookAI/roberta-base')
model_path = "best_model_mistral.pt"
state_dict = torch.load(model_path)
model = RobertaForSequenceClassification(config)
model.load_state_dict(state_dict)

tokenizer = RobertaTokenizer.from_pretrained('FacebookAI/roberta-base')
pipeline_classif_mistral = pipeline('text-classification', model=model, tokenizer=tokenizer)

<All keys matched successfully>

In [5]:
sample_text_fake = "Voters in Japan will turn out for parliamentary elections Sunday in what poll after poll shows will be a historic shift in political power to oust the ruling party. Japanese Prime Minister Taro Aso has approval ratings in the teens. The Liberal Democratic Party has been in nearly continuous control of Japan's parliament for more than five decades. But the country's worst economic crisis since World War II has led a normally sedate electorate to the polls, disgruntled with how slowly the country"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.7413396239280701}]

In [6]:
sample_text_true = "Voters in Japan will turn out for parliamentary elections Sunday , with the ruling Liberal Democratic Party (LDP) and its junior partner Komeito poised to extend their 10-year grip on power.  The LDP is likely to retain a two-thirds majority in the lower house, which would allow it to change the constitution without the cooperation of the opposition.  But the party, which has dominated Japanese politics for most of the post-war era, has failed to persuade voters it can tackle the country’s probl"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.7499374151229858}]

In [9]:
sample_text_fake = "Two of Turkey's main political parties are pushing for a constitutional amendment to lift bans on headscarves at public universities, a move that has caused concern among Turkey's secular population.  The lifting of the ban on headscarves has caused concern among Turkey's secular population. Prime Minister Recep Tayyip Erdogan initiated the move, saying it would create equality in Turkey's higher education. The constitutional commission will discuss the proposal -- submitted by the AKP and MHP pa"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.8740516304969788}]

In [10]:
sample_text_fake = "Two of Turkey's main political parties are pushing for a constitutional amendment to lift bans on headscarves at public universities, a move that has caused concern among Turkey's secular population.  The lifting of the ban on headscarves has caused concern among Turkey's secular population.  Prime Minister Recep Tayyip Erdogan initiated the move, saying it would create equality in Turkey's higher education.  The constitutional commission will discuss the proposal -- submitted by the AKP and MHP pa"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.9280597567558289}]

In [12]:
sample_text_fake = "Two of Turkey's main political parties are pushing for a national referendum on the country's membership of the European Union. The ruling Justice and Development Party (AKP) and the opposition Republican People's Party (CHP) are both planning to submit the proposal to parliament. The AKP says the referendum should be held in 2013, while the CHP favors an earlier date. Turkey's EU accession talks have been stalled since 2007 over a series of disputes Turkish Prime Minister Recep Tayyip Erdo"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.7246546745300293}]

In [14]:
sample_text_fake = "Zimbabwean lawmakers on Monday narrowly voted for Lovemore Moyo as speaker of the parliament making him the first opposition lawmaker to hold the position in the country's history. Morgan Tsvangirai's MDC faction has a slim majority following parliamentary elections. \"This is historic as it ceases to be a rubber-stamping house,\" Moyo said after winning the position. \"It will ensure that progressive laws are passed. I promise to be professional.\" Moyo the national chairman of the main Movem"
pipeline_classif_mistral(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.7312844395637512}]

## GPT-2 samples

In [62]:
config = RobertaConfig.from_pretrained('FacebookAI/roberta-base')
model_path = "best_model_gpt2.pt"
state_dict = torch.load(model_path)
model = RobertaForSequenceClassification(config)
model.load_state_dict(state_dict)

tokenizer = RobertaTokenizer.from_pretrained('FacebookAI/roberta-base')
pipeline_classif_gpt2 = pipeline('text-classification', model=model, tokenizer=tokenizer)

In [12]:
sample_text_fake = "After weeks of controversy over Michael Mukasey's views on waterboarding, the Obama administration has decided to stop using torture. President Barack H.\"s decision will not change any new law that is passed,\" said Sen-elect Mike Lee in a statement released Wednesday evening by his campaign and Democratic presidential candidate Hillary Clinton supporters who are trying for president with an \"opportunity\" at this weekday rally outside New Hampshire.As far as"

pipeline_classif_gpt2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.9197396636009216}]

In [31]:
sample_text_fake = "\"Why do only rich kids get good schools?\" I was asked this question by a fellow who has been to many of the best public school systems in America. \"How does it feel for poor students? If you are lucky, then there is always going be one or two other children that don't know how they can succeed academically,\" he told me after we had spent some time together at his home and talked about what life on campus would look like if all those bright young people got their hands dirty with every opportunit"
pipeline_classif_gpt2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.9603350162506104}]

In [35]:
sample_text_fake = "\"Why do only rich kids get good schools?\" I was the founder and director of a part-time out-of-school college preparatory program. The questioner was a parent; herself a victim of a dulled urban education. The statement was more of an indictment than question, and I had no answer. \"Well, why can't this program be a school,\" she offered. The program sent 100 percent of our graduates to college. We served poor students who were the first generation in their families to attend college. We provided "
pipeline_classif_gpt2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.511606752872467}]

## Phi-2 samples

In [37]:
config = RobertaConfig.from_pretrained('FacebookAI/roberta-base')
model_path = "best_model_phi2.pt"
state_dict = torch.load(model_path)
model = RobertaForSequenceClassification(config)
model.load_state_dict(state_dict)

tokenizer = RobertaTokenizer.from_pretrained('FacebookAI/roberta-base')
pipeline_classif_phi2 = pipeline('text-classification', model=model, tokenizer=tokenizer)

In [40]:
sample_text_fake = "Brazil have returned to the top of the FIFA world rankings for the first time since the start of the pandemic. It is estimated that around 100,000 football players and coaches are currently self-isolating after testing positive for COVID-19. The government is trying to ensure that all of the country's footballers have been tested for the virus, and those that test positive are being quarantined in a number of specially-built isolation units. The government has been criticised for not doing enoug"
pipeline_classif_phi2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.6936783790588379}]

In [48]:
sample_text_true = "Brazil have returned to the top of the FIFA world rankings after a two-year absence, following their Confederations Cup final victory over the United States in South Africa on Sunday -- FIFA.com have reported. The Brazilian national side top the FIFA world rankings again after an absence of two years. Dunga's side came from behind to defeat the United States 3-2, a result which sees them replace Spain after the European champions were beaten in the semifinals to finish third in the Confederation."
pipeline_classif_phi2(sample_text_true)

[{'label': 'LABEL_0', 'score': 0.9688941240310669}]

In [54]:
sample_text_true = "He is iconic, there's no doubt. George Hamilton gets his life story on screen in \"My One and Only.\" With the elegant suit and tie, the impeccable grooming, the tan (Did I mention the tan?), George Hamilton is still a charmer, and he comes across like a born bon vivant. Sure, his acting may have taken a backseat to his bronzed visage years ago, but what did happen to him years ago? Well, there's a story there, one now coming to the big screen. Hamilton's formative years are loosely depicted in th"
pipeline_classif_phi2(sample_text_true)

[{'label': 'LABEL_0', 'score': 0.8942074775695801}]

In [58]:
sample_text_fake = "He is iconic, there's no doubt. George Hamilton gets his life story on screen in \"My One and Only.\", and has become synonymous with a certain kind of masculine manliness. But who is this man? What does it mean to be a George Hamilton? It's difficult to pinpoint exactly what makes a George Hamilton, but there are a few qualities that are common to all. 1. He is physically strong and fit. George Hamilton is a man who takes care of his body. He works out regularly, eats a healthy diet, and gets plenty of rest. He i"
pipeline_classif_phi2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.9198764562606812}]

## Cross model predictions

In [59]:
sample_text_fake = "\"Why do only rich kids get good schools?\" I was asked this question by a fellow who has been to many of the best public school systems in America. \"How does it feel for poor students? If you are lucky, then there is always going be one or two other children that don't know how they can succeed academically,\" he told me after we had spent some time together at his home and talked about what life on campus would look like if all those bright young people got their hands dirty with every opportunit"
pipeline_classif_phi2(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.6927809119224548}]

In [61]:
sample_text_fake = "\"Why do only rich kids get good schools?\" I was the founder and director of a part-time out-of-school college preparatory program. The questioner was a parent; herself a victim of a dulled urban education. The statement was more of an indictment than question, and I had no answer. \"Well, why can't this program be a school,\" she offered. The program sent 100 percent of our graduates to college. We served poor students who were the first generation in their families to attend college. We provided "
pipeline_classif_phi2(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.7440130710601807}]

In [64]:
sample_text_fake = "Brazil have returned to the top of the FIFA world rankings for the first time since the start of the pandemic. It is estimated that around 100,000 football players and coaches are currently self-isolating after testing positive for COVID-19. The government is trying to ensure that all of the country's footballers have been tested for the virus, and those that test positive are being quarantined in a number of specially-built isolation units. The government has been criticised for not doing enoug"
pipeline_classif_gpt2(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.9977840781211853}]

In [65]:
sample_text_fake = "Brazil have returned to the top of the FIFA world rankings for the first time since the start of the pandemic. It is estimated that around 100,000 football players and coaches are currently self-isolating after testing positive for COVID-19. The government is trying to ensure that all of the country's footballers have been tested for the virus, and those that test positive are being quarantined in a number of specially-built isolation units. The government has been criticised for not doing enoug"
pipeline_classif_gpt2(sample_text_fake)

[{'label': 'LABEL_0', 'score': 0.5806064605712891}]

# Full finetuning

# Adapter training 

In [7]:
detector_path = "FacebookAI/roberta-large"
config = AutoConfig.from_pretrained(detector_path)
model = RobertaForSequenceClassification(config)
bert_tokenizer = RobertaTokenizer.from_pretrained(detector_path)

In [8]:
model_path = "./saved_training_logs/roberta_large/fake_true_dataset_gpt2_10k/26_03_1841/saved_models/best_model.pt"
adapters.init(model)
config = adapters.BnConfig(mh_adapter=True, output_adapter=True, reduction_factor=16, non_linearity="relu")
model.add_adapter("fake_true_detection", config=config)
model.load_state_dict(torch.load(model_path))
model = model.to('cuda')

In [13]:
model.roberta.encoder.layer[0]

RobertaLayer(
  (attention): RobertaAttention(
    (self): RobertaSelfAttentionWithAdapters(
      (query): LoRALinear(
        in_features=1024, out_features=1024, bias=True
        (loras): ModuleDict()
      )
      (key): LoRALinear(
        in_features=1024, out_features=1024, bias=True
        (loras): ModuleDict()
      )
      (value): LoRALinear(
        in_features=1024, out_features=1024, bias=True
        (loras): ModuleDict()
      )
      (dropout): Dropout(p=0.1, inplace=False)
      (prefix_tuning): PrefixTuningLayer(
        (prefix_gates): ModuleDict()
        (pool): PrefixTuningPool(
          (prefix_tunings): ModuleDict()
        )
      )
    )
    (output): RobertaSelfOutputWithAdapters(
      (dense): Linear(in_features=1024, out_features=1024, bias=True)
      (LayerNorm): LayerNorm((1024,), eps=1e-05, elementwise_affine=True)
      (dropout): Dropout(p=0.1, inplace=False)
      (adapters): ModuleDict(
        (fake_true_detection): Adapter(
          (non_lin

# Weird results

In [2]:
config = RobertaConfig.from_pretrained('distilbert/distilroberta-base')
model_path = "saved_training_logs_experiment_2/distil_roberta-base/freeze_base/fake_true_dataset_gemma_10k/04_04_1004/saved_models/best_model.pt"
state_dict = torch.load(model_path)
model = RobertaForSequenceClassification(config)
model.load_state_dict(state_dict)

tokenizer = RobertaTokenizer.from_pretrained('distilbert/distilroberta-base')
pipeline_classif_gemma = pipeline('text-classification', model=model, tokenizer=tokenizer)

## Dick Cheney example

In [12]:
sample_text_true = "Former Vice President Dick Cheney on Sunday defended the Bush administration's economic record, the invasion of Iraq and the treatment of suspected terrorists, warning that reversing its anti-terrorism policies endangers Americans. \"We've accomplished nearly everything we set out to do,\" ex-Vice President Dick Cheney says Sunday about Iraq. In a wide-ranging interview with CNN's \"State of the Union,\" Cheney said the harsh interrogations of suspects and the use of warrantless electronic surveilla"
pipeline_classif_gemma(sample_text_true)

[{'label': 'LABEL_0', 'score': 0.8481298685073853}]

In [13]:
sample_text_fake_gemma = "Former Vice President Dick Cheney on Sunday defended the Bush administration’s decision to invade Iraq, arguing that the U.S. should have acted against Saddam Hussein in the wake of the 9\/11 terrorist attacks. “I think there was a good case for action,” Cheney said on NBC’s “Meet the Press.” “I think we did the right thing.” Cheney, who served as Vice President under George W. Bush, was asked about the president’s comments on Thursday, when he said that the U.S. should not have invaded Iraq and "
pipeline_classif_gemma(sample_text_fake_gemma)

  sample_text_fake = "Former Vice President Dick Cheney on Sunday defended the Bush administration’s decision to invade Iraq, arguing that the U.S. should have acted against Saddam Hussein in the wake of the 9\/11 terrorist attacks. “I think there was a good case for action,” Cheney said on NBC’s “Meet the Press.” “I think we did the right thing.” Cheney, who served as Vice President under George W. Bush, was asked about the president’s comments on Thursday, when he said that the U.S. should not have invaded Iraq and "


[{'label': 'LABEL_1', 'score': 0.9525690674781799}]

In [14]:
sample_text_fake_phi = "Former Vice President Dick Cheney on Sunday defended the Bush administration’s energy policy, saying it has “made a big difference.” In an interview with the “CBS Evening News” program, Cheney, who is currently on leave from his post as CEO of Halliburton, the oil and gas services company, said that “the energy policy of the Bush administration has been extremely successful.” The interview aired Sunday morning, but was not aired in its entirety on the CBS Evening News, which aired the interview"
pipeline_classif_gemma(sample_text_fake_phi)

[{'label': 'LABEL_1', 'score': 0.9780640602111816}]

In [15]:
sample_text_fake_mistral = "Former Vice President Dick Cheney on Sunday defended the Bush administration's decision to close Guantanamo Bay prison after his former boss was accused of ordering an attack against a U.S.-led coalition in Yemen, saying it would be \"shameful\" if there were no charges brought by that country over its alleged involvement with al Qaeda-linked militants who carried out attacks at US military bases and other places throughout the Middle East last year as well: -The United States has never been invol"
pipeline_classif_gemma(sample_text_fake)

[{'label': 'LABEL_1', 'score': 0.9946627616882324}]

In [16]:
sample_text_fake_gpt2 = "Former Vice President Dick Cheney on Sunday defended the Bush administration's actions in Iraq, saying they did not cause any harm to U.S.-led forces and that there was no need for more airstrikes against Islamic State targets near Baghdad after a series of air strikes over six months ago killed at least 21 Iraqi soldiers who had joined IS or were suspected terrorists by government officials as part (AFP Photo\/RUFA RUSSELL) A senior US official said Saturday he believes \"that it is possible\" Was"
pipeline_classif_gemma(sample_text_fake)

  sample_text_fake_gpt2 = "Former Vice President Dick Cheney on Sunday defended the Bush administration's actions in Iraq, saying they did not cause any harm to U.S.-led forces and that there was no need for more airstrikes against Islamic State targets near Baghdad after a series of air strikes over six months ago killed at least 21 Iraqi soldiers who had joined IS or were suspected terrorists by government officials as part (AFP Photo\/RUFA RUSSELL) A senior US official said Saturday he believes \"that it is possible\" Was"


[{'label': 'LABEL_1', 'score': 0.9777976274490356}]

## Four groups example

In [117]:
sample_text_true = "Four groups that advocate for immigrant rights said Thursday they will challenge Arizona's new immigration law, which allows police to ask anyone for proof of legal U.S. residency. The Mexican American Legal Defense and Educational Fund, the American Civil Liberties Union, the ACLU of Arizona and the National Immigration Law Center held a news conference Thursday in Phoenix to announce the legal challenge. \"The Arizona community can be assured that a vigorous and sophisticated legal challenge wi"
pipeline_classif_gemma(sample_text_true)

[{'label': 'LABEL_0', 'score': 0.9731037616729736}]

In [94]:
sample_text_fake_gemma = "Four groups that advocate for immigrant rights said Thursday they are suing the Trump administration over its new policy that blocks federal funding for legal representation to immigrants facing deportation. The groups, including the American Civil Liberties Union and the National Immigration Law Center, said they are filing a lawsuit in the U.S. District Court in Los Angeles. The lawsuit alleges that the Trump administration’s policy violates the 14th Amendment, which guarantees equal protectio"
pipeline_classif_gemma(sample_text_fake_gemma)

[{'label': 'LABEL_1', 'score': 0.8621445894241333}]

In [114]:
sample_text_fake_gemma = "Four groups that advocate for immigrant rights said Thursday they are suing the Trump administration over its new policy that blocks federal funding for legal representation to immigrants facing deportation. The groups, including the American Civil Liberties Union and the National Immigration Law Center, said they are filing a lawsuit in the U.S. District Court in Los Angeles. The lawsuit alleges that the Trump administration's policy violates the 14th Amendment, which guarantees equal protectio"
pipeline_classif_gemma(sample_text_fake_gemma)

[{'label': 'LABEL_1', 'score': 0.7527174353599548}]

In [156]:
sample_text_fake_gemma = "Four groups that advocate for immigrant rights said Thursday they are suing the Trump administration over its new policy. The lawsuit alleges that the Trump administration's policy violates the 14th Amendment, which guarantees equal protection."
pipeline_classif_gemma(sample_text_fake_gemma)

[{'label': 'LABEL_1', 'score': 0.759391188621521}]

In [None]:
sample_text_fake_trivial_true = "The news shocked the world, he did it again. As Chile celebrated the 100th Anniversary of its independence, the terrorist group attacked the festivities at the capital. The attacker's motive matched the police's investigation."
pipeline_classif_gemma(sample_text_fake_trivial_true)

In [62]:
prob_fake_dict = []
all_chars_list = [chr(i) for i in range(128)]
for char in all_chars_list:
    sample_text_fake_trivial = char

    res_scores = []
    for i in range(10):
        res = pipeline_classif_gemma(sample_text_fake_trivial)[0]
        res_label = res["label"]
        if res_label == "LABEL_0":
            res_scores.append(-res["score"])
        elif res_label == "LABEL_1":
            res_scores.append(res["score"])
        else:
            raise ValueError("Error")
    res_score_avg = sum(res_scores) / len(res_scores)
    prob_fake_dict.append({"char": char, "score" : res_score_avg})


In [63]:
import pandas as pd
prob_fake_dict_df = pd.DataFrame(prob_fake_dict)

In [65]:
prob_fake_dict_df.sort_values("score", ascending=True)

Unnamed: 0,char,score
39,',-0.942340
46,.,-0.920768
15,,-0.825839
1,,-0.823418
18,,-0.816708
...,...,...
43,+,0.491466
120,x,0.526440
60,<,0.591004
94,^,0.643556


In [68]:
top_20 = prob_fake_dict_df.sort_values("score", ascending=True)[:20]
top_20

Unnamed: 0,char,score
39,',-0.94234
46,.,-0.920768
15,,-0.825839
1,,-0.823418
18,,-0.816708
41,),-0.808557
28,,-0.774449
90,Z,-0.746635
98,b,-0.730442
63,?,-0.717379


In [92]:
all_words_list = []
with open("word_list.txt", "r") as f:
    words = f.readlines()
    words = [word.strip() for word in words]
    all_words_list.extend(words)  

In [93]:
all_words_list

['a',
 'AAA',
 'AAAS',
 'aardvark',
 'Aarhus',
 'Aaron',
 'ABA',
 'Ababa',
 'aback',
 'abacus',
 'abalone',
 'abandon',
 'abase',
 'abash',
 'abate',
 'abbas',
 'abbe',
 'abbey',
 'abbot',
 'Abbott',
 'abbreviate',
 'abc',
 'abdicate',
 'abdomen',
 'abdominal',
 'abduct',
 'Abe',
 'abed',
 'Abel',
 'Abelian',
 'Abelson',
 'Aberdeen',
 'Abernathy',
 'aberrant',
 'aberrate',
 'abet',
 'abetted',
 'abetting',
 'abeyance',
 'abeyant',
 'abhor',
 'abhorred',
 'abhorrent',
 'abide',
 'Abidjan',
 'Abigail',
 'abject',
 'abjure',
 'ablate',
 'ablaze',
 'able',
 'ablution',
 'abnegation',
 'Abner',
 'abnormal',
 'Abo',
 'aboard',
 'abode',
 'abolish',
 'abolition',
 'abominable',
 'abominate',
 'aboriginal',
 'aborigine',
 'aborning',
 'abort',
 'abound',
 'about',
 'above',
 'aboveboard',
 'aboveground',
 'abovementioned',
 'abrade',
 'Abraham',
 'Abram',
 'Abramson',
 'abrasion',
 'abrasive',
 'abreact',
 'abreast',
 'abridge',
 'abridgment',
 'abroad',
 'abrogate',
 'abrupt',
 'abscess',
 'a

In [96]:
from tqdm import tqdm
prob_fake_dict = []
for word in tqdm(all_words_list):
    sample_text_fake_trivial = word
    res_scores = []
    for i in range(5):
        res = pipeline_classif_gemma(sample_text_fake_trivial)[0]
        res_label = res["label"]
        if res_label == "LABEL_0":
            res_scores.append(-res["score"])
        elif res_label == "LABEL_1":
            res_scores.append(res["score"])
        else:
            raise ValueError("Error")
    res_score_avg = sum(res_scores) / len(res_scores)
    prob_fake_dict.append({"word": word, "score" : res_score_avg})

  0%|          | 1/25487 [00:00<49:43,  8.54it/s]

100%|██████████| 25487/25487 [38:25<00:00, 11.06it/s] 


In [97]:
prob_fake_dict_df = pd.DataFrame(prob_fake_dict)
top_20_true = prob_fake_dict_df.sort_values("score", ascending=True)[:20]
top_20_true

Unnamed: 0,word,score
7427,eavesdropping,-0.989576
13462,leapt,-0.967688
24903,where're,-0.957969
2051,basketry,-0.954982
509,ain't,-0.954606
188,achieve,-0.954331
10832,he'll,-0.954186
5847,c's,-0.950743
18663,q's,-0.950241
16900,parry,-0.950173


In [112]:
top_20_fake = prob_fake_dict_df.sort_values("score", ascending=False)[:20]
top_20_fake

Unnamed: 0,word,score
12485,irreclaimable,0.867342
13679,lightweight,0.826113
22736,Taurus,0.823779
3925,Caucasus,0.802326
24663,Warburton,0.789884
16077,nouveau,0.786104
23443,toxin,0.768726
21780,Stanford,0.764462
1110,A&P,0.763143
24507,Vladimir,0.762693


In [7]:
sample_text_fake_trivial_fake = "The news shocked the world, he did it again. As Chile celebrated the 100th Anniversary of its independence, the terrorist group attacked the festivities at the capital. The attacker’s motive matched the police’s investigation."
pipeline_classif_gemma(sample_text_fake_trivial_fake)

[{'label': 'LABEL_0', 'score': 0.5188333988189697}]

In [117]:
sample_text_fake_trivial_true = "The news shocked the world. He did it again. As Chile celebrated the 100th Anniversary of its independence, the terrorist group attacked the festivities at the capital. Truely shocking. I am speacheless. It is said that many of those killed were from rich countries. "
pipeline_classif_gemma(sample_text_fake_trivial_true)

[{'label': 'LABEL_0', 'score': 0.7145633697509766}]

In [114]:
sample_text_fake_trivial_true = "irreclaimable"
pipeline_classif_gemma(sample_text_fake_trivial_true)

[{'label': 'LABEL_1', 'score': 0.6598275303840637}]

In [128]:
sample_text_fake_phi = "Four groups that advocate for immigrant rights said Thursday they are working on a new bill that would give undocumented immigrants a path to citizenship, but they said they are still waiting for a final version of the immigration bill passed by the House in November. The bill, known as the American Dream and Promise Act, would allow undocumented immigrants who have lived in the United States for five years and meet other requirements to apply for temporary legal status, followed by a path to ci"
pipeline_classif_gemma(sample_text_fake_phi)

[{'label': 'LABEL_0', 'score': 0.5859024524688721}]

In [129]:
sample_text_fake_mistral = "Four groups that advocate for immigrant rights said Thursday they will fight to prevent a new law from being enacted. (Published Wednesday, June 18th 2017) — A group of four activists is asking the Supreme Court in an appeal filed on behalf and against one other court case involving undocumented immigrants who have been denied visas because their families are U-Hauled at home or if there's no way around it: The Immigrant Law Enforcement Coalition has requested this week $10 million dollars more "
pipeline_classif_gemma(sample_text_fake_mistral)

[{'label': 'LABEL_0', 'score': 0.9476719498634338}]

In [19]:
sample_text_fake_gpt2 = "Four groups that advocate for immigrant rights said Thursday they will hold a rally on Oct. 26 in Washington, D-C., to protest President Trump's executive order barring entry into the United States of citizens and residents from seven predominantly Muslim countries—Iran, Iraq\/ Syria & Yemen. (Jenny Starrs \/ The Seattle Times) More than 2 million people have signed an online petition calling attention against \"Trumpism\" at home by highlighting how America has been so divided since Donald J.(L.) t"
pipeline_classif_gemma(sample_text_fake_gpt2)

  sample_text_fake_gpt2 = "Four groups that advocate for immigrant rights said Thursday they will hold a rally on Oct. 26 in Washington, D-C., to protest President Trump's executive order barring entry into the United States of citizens and residents from seven predominantly Muslim countries—Iran, Iraq\/ Syria & Yemen. (Jenny Starrs \/ The Seattle Times) More than 2 million people have signed an online petition calling attention against \"Trumpism\" at home by highlighting how America has been so divided since Donald J.(L.) t"


[{'label': 'LABEL_0', 'score': 0.9917388558387756}]

# Test phi detector with prompt

In [23]:
from transformers import AutoTokenizer, AutoModelForCausalLM
import torch

model_id = "meta-llama/Meta-Llama-3-8B-Instruct"

tokenizer = AutoTokenizer.from_pretrained(model_id)

Special tokens have been added in the vocabulary, make sure the associated word embeddings are fine-tuned or trained.


In [19]:
tokenizer.encode("<pad>")

[128000, 8085, 329, 29]

In [25]:
tokenizer.decode([128000, 128000, 128006,   9125, 128007,    271,   2675,    527,    264,
         11190,  18328,     13, 128009, 128006,    882, 128007,    271,  24433,
           311,   3350,    420,   3754,   4652,     25,  14253,  30427,   6917,
         15469,  21254,  80556,  20192,   2680,    311,    264,   5068, 128009,
        128006,  78191, 128007,   1432,  42398,  30427,   6917,  15469,  21254,
         80556,  20192,   2680,    311,    264,   5068, 128009, 128009, 128009,
        128009, 128009, 128009, 128009, 128009, 128009, 128009, 128009, 128009,
        128009, 128009])

'<|begin_of_text|><|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\nYou are a helpful assistant.<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nContinue to write this news article: Harry Potter star Daniel Radcliffe gains access to a reported<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n\nHarry Potter star Daniel Radcliffe gains access to a reported<|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|><|eot_id|>'

In [27]:
tokenizer.decode([128000, 128000, 128006,   9125, 128007,    271,   2675,    527,    264,
         11190,  18328,     13, 128009, 128006,    882, 128007,    271,  24433,
           311,   3350,    420,   3754,   4652,     25,  14253,  30427,   6917,
         15469,  21254,  80556,  20192,   2680,    311,    264,   5068, 128009,
        128006,  78191, 128007,   1432,  42398,  30427,   6917,  15469,  21254,
         80556,  20192,   2680,    311,    264,   5068, 128009, 128009, 128009,
        128009])

'<|begin_of_text|><|begin_of_text|><|start_header_id|>system<|end_header_id|>\n\nYou are a helpful assistant.<|eot_id|><|start_header_id|>user<|end_header_id|>\n\nContinue to write this news article: Harry Potter star Daniel Radcliffe gains access to a reported<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n\nHarry Potter star Daniel Radcliffe gains access to a reported<|eot_id|><|eot_id|><|eot_id|><|eot_id|>'

In [28]:
text_test = "As he awaits a crucial progress report on Iraq, President Bush will try to put a twist on comparisons of the war to Vietnam by invoking the historical lessons of that conflict to argue against pulling out. President Bush pauses Tuesday during a news conference at the North American Leaders summit in Canada. On Wednesday in Kansas City, Missouri, Bush will tell members of the Veterans of Foreign Wars that \"then, as now, people argued that the real problem was America's presence and that if we wou"
tokenizer(text_test)