In [3]:
from google.colab import drive

# Mount Google Drive inside the Colab VM; the CSV paths used by this notebook
# all live under this mount point.
DRIVE_MOUNT_POINT = '/content/drive'
drive.mount(DRIVE_MOUNT_POINT)

Mounted at /content/drive


In [1]:
!pip install -q transformers torch pandas tqdm

In [9]:
import pandas as pd
import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification, pipeline
from tqdm import tqdm


In [11]:
# Path to the articles CSV on the shared drive
input_path = "/content/drive/Shareddrives/information project/Information Disorder Project/Fase 1 - Raccolta articoli OSINT/Prove Franci/google_news_svb_netflix_FINAL_CLEAN.csv"

articles_df = pd.read_csv(input_path)

# Multilingual model (the SAME one used for the tweets, per the original note)
model_name = "cardiffnlp/twitter-xlm-roberta-base-sentiment"

tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)

# Use the first CUDA GPU when the runtime has one; -1 is the pipeline's CPU index.
# NOTE: GPU and CPU scores can differ in the last decimals (floating point).
sentiment_device = 0 if torch.cuda.is_available() else -1

sentiment_pipeline = pipeline(
    "sentiment-analysis",
    model=model,
    tokenizer=tokenizer,
    device=sentiment_device,
)

# Same scoring function as the one used for the tweets (per the original note),
# hardened against blank text and over-long token sequences.
def get_sentiment_score(text):
    """Return a signed sentiment score for ``text``.

    The text is classified with the module-level ``sentiment_pipeline`` and the
    top prediction is mapped onto a single number:

    * label "positive" -> ``+score``
    * label "negative" -> ``-score``
    * any other label  -> ``0.0``

    Missing values (``None`` / NaN) and empty or whitespace-only text return
    ``0.0`` without calling the model.

    Args:
        text: The text to score; non-string values are converted with ``str``.

    Returns:
        float: ``score``, ``-score`` or ``0.0`` as described above, where
        ``score`` is the value reported by the pipeline for the top label.
    """
    if pd.isna(text):
        return 0.0

    # Keep the original 512-character cap so results stay unchanged for inputs
    # that already worked.
    snippet = str(text)[:512]
    if not snippet.strip():
        # Nothing to classify: the model's output on blank input is meaningless.
        return 0.0

    # The character cap does not bound the number of tokens, so also truncate at
    # the tokenizer level. max_length is passed explicitly rather than relying
    # on the tokenizer's configured default.
    result = sentiment_pipeline(snippet, truncation=True, max_length=512)[0]
    label = result["label"].lower()
    score = result["score"]

    if label == "positive":
        return score
    if label == "negative":
        return -score
    return 0.0

# Score every article title. Inference runs one title at a time, so register
# tqdm's pandas integration to get a progress bar while the column is computed.
tqdm.pandas(desc="XLM-R sentiment (titles)")
articles_df["xlm_score"] = articles_df["title"].progress_apply(get_sentiment_score)

articles_df.head(10)


Device set to use cpu


Unnamed: 0,case,title,source,published_utc,link,query,date,xlm_score
0,SVB,Silicon Valley Bank and Signature Bank taken o...,Norton Rose Fulbright,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMizwFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
1,SVB,"Silicon Valley Bank Closed by Regulators, FDIC...",The Wall Street Journal,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMizgNBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
2,SVB,Regulators take over Silicon Valley Bank - Ban...,Banking Dive,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMitwFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
3,SVB,Silicon Valley Bank has officially failed afte...,Fortune,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMiigFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.89701
4,SVB,Silicon Valley Bank shut down by regulators - ...,Fox Business,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMiiAFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.662338
5,SVB,"Regulators shut down Silicon Valley Bank, capp...",American Banker,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMiswFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.857818
6,SVB,US regulators shut down Silicon Valley Bank - ...,DW.com,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMiggFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.773473
7,SVB,Silicon Valley Bank is seized by U.S. after hi...,marketplace.org,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMimAFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.822898
8,SVB,Silicon Valley Bank Collapse Leaves Tech Indus...,Crunchbase News,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMicEFVX...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.732317
9,SVB,SVB is largest bank failure since 2008 financi...,Reuters,2023-03-10 08:00:00+00:00,https://news.google.com/rss/articles/CBMiigFBV...,"""SVB"" bank collapse",2023-03-10,-0.86688


In [13]:
# Remove the raw `published_utc` timestamp column from the frame.
# errors="ignore" keeps the cell idempotent: re-running it after the column is
# already gone no longer raises KeyError.
articles_df = articles_df.drop(columns=["published_utc"], errors="ignore")

In [14]:
# Preview the first 10 rows to check the frame after `published_utc` was dropped.
articles_df.head(10)

Unnamed: 0,case,title,source,link,query,date,xlm_score
0,SVB,Silicon Valley Bank and Signature Bank taken o...,Norton Rose Fulbright,https://news.google.com/rss/articles/CBMizwFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
1,SVB,"Silicon Valley Bank Closed by Regulators, FDIC...",The Wall Street Journal,https://news.google.com/rss/articles/CBMizgNBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
2,SVB,Regulators take over Silicon Valley Bank - Ban...,Banking Dive,https://news.google.com/rss/articles/CBMitwFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,0.0
3,SVB,Silicon Valley Bank has officially failed afte...,Fortune,https://news.google.com/rss/articles/CBMiigFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.89701
4,SVB,Silicon Valley Bank shut down by regulators - ...,Fox Business,https://news.google.com/rss/articles/CBMiiAFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.662338
5,SVB,"Regulators shut down Silicon Valley Bank, capp...",American Banker,https://news.google.com/rss/articles/CBMiswFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.857818
6,SVB,US regulators shut down Silicon Valley Bank - ...,DW.com,https://news.google.com/rss/articles/CBMiggFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.773473
7,SVB,Silicon Valley Bank is seized by U.S. after hi...,marketplace.org,https://news.google.com/rss/articles/CBMimAFBV...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.822898
8,SVB,Silicon Valley Bank Collapse Leaves Tech Indus...,Crunchbase News,https://news.google.com/rss/articles/CBMicEFVX...,"""Silicon Valley Bank"" regulators",2023-03-10,-0.732317
9,SVB,SVB is largest bank failure since 2008 financi...,Reuters,https://news.google.com/rss/articles/CBMiigFBV...,"""SVB"" bank collapse",2023-03-10,-0.86688


In [15]:
# Destination of the scored articles on the shared drive.
output_path = "/content/drive/Shareddrives/information project/Information Disorder Project/Fase 2 - Analisi del sentiment con finBERT e distilBERT/final clean/google_news_xlm_sentiment.csv"

# Persist the frame without the pandas index, then report where it was written.
articles_df.to_csv(output_path, index=False)
print("CSV articoli con sentiment salvato in:", output_path, sep="\n")


CSV articoli con sentiment salvato in:
/content/drive/Shareddrives/information project/Information Disorder Project/Fase 2 - Analisi del sentiment con finBERT e distilBERT/final clean/google_news_xlm_sentiment.csv
