# Analysis of LLM Labels

- Load LLM-labelled data
- Calculate the ratio of posts that are labelled prediction and non-prediction

In [1]:
import os
import sys

import pandas as pd

from tqdm import tqdm

# Get the current working directory of the notebook
# (assumes the kernel was started in the notebook's own folder — confirm if
# the notebook is launched from elsewhere).
notebook_dir = os.getcwd()
# Add the parent directory to the system path so the local modules imported
# below can be resolved. The path is normalised and only appended when it is
# not already present, so re-running this cell does not accumulate duplicate
# "<cwd>/../" entries in sys.path.
parent_dir = os.path.abspath(os.path.join(notebook_dir, os.pardir))
if parent_dir not in sys.path:
    sys.path.append(parent_dir)

from data_processing import DataProcessing
from text_generation_models import TextGenerationModelFactory

In [6]:
# Let text columns show up to 800 characters when a DataFrame is rendered, so
# long posts are not cut short in the outputs below.
# The fully qualified option key is used on purpose: abbreviated keys are
# pattern-matched by pandas and may become ambiguous if a similarly named
# option is introduced in a later version.
pd.set_option('display.max_colwidth', 800)

In [3]:
# Location of the LLM-labelled Bluesky data, written relative to the notebook directory.
path_to_data = "../data/open_measures/bluesky_all_llm_labels/bluesky-v10.json"
# Join the relative path onto notebook_dir (set in the setup cell) to get the file location.
full_path = os.path.join(notebook_dir, path_to_data)
# Parse the JSON file into a DataFrame.
df = pd.read_json(full_path)
# NOTE(review): the saved output appears to hold one row per (sentence, model) pair,
# and the `label` column contains 'safe' (from meta-llama/llama-guard-4-12b) next to
# 'prediction' / 'not a prediction' — confirm how such labels feed `majority_vote`.
# Bare last expression: renders the loaded frame as the cell output.
df

Unnamed: 0,sentence,model,label,meta_data,majority_vote
0,Wow! Nepal confirmed as one of 16 finalists fo...,gemma2-9b-it,not a prediction,"{'data_range_per_file': 0, '$type': 'app.bsky....",not a prediction
1,Wow! Nepal confirmed as one of 16 finalists fo...,llama-3.1-8b-instant,prediction,"{'data_range_per_file': 0, '$type': 'app.bsky....",not a prediction
2,Wow! Nepal confirmed as one of 16 finalists fo...,llama-3.3-70b-versatile,not a prediction,"{'data_range_per_file': 0, '$type': 'app.bsky....",not a prediction
3,Wow! Nepal confirmed as one of 16 finalists fo...,meta-llama/llama-guard-4-12b,safe,"{'data_range_per_file': 0, '$type': 'app.bsky....",not a prediction
4,Sad! AFC bans Nepal from U16 Asian Championshi...,gemma2-9b-it,not a prediction,"{'data_range_per_file': 1, '$type': 'app.bsky....",not a prediction
...,...,...,...,...,...
798,"3️⃣: Super Bowl LVII\n""Super Bowl LVII was an ...",meta-llama/llama-guard-4-12b,safe,"{'data_range_per_file': 198, '$type': 'app.bsk...",not a prediction
799,Where do Reid and Mahomes sit among QB/coachin...,gemma2-9b-it,prediction,"{'data_range_per_file': 199, '$type': 'app.bsk...",prediction
800,Where do Reid and Mahomes sit among QB/coachin...,llama-3.1-8b-instant,prediction,"{'data_range_per_file': 199, '$type': 'app.bsk...",prediction
801,Where do Reid and Mahomes sit among QB/coachin...,llama-3.3-70b-versatile,not a prediction,"{'data_range_per_file': 199, '$type': 'app.bsk...",prediction


In [7]:
# Boolean mask: True for every row whose majority vote across the models is 'prediction'.
filt_prediction = df['majority_vote'].eq('prediction')
# Show only the rows selected by the mask (rendered as the cell output).
df.loc[filt_prediction]

Unnamed: 0,sentence,model,label,meta_data,majority_vote
8,"2016 Super Bowl odds: Patriots, Cards begin playoffs as co-favorites http://www.cbssports.com/nfl/eye-on-football/25442860/super-bowl-odds-patriots-cardinals-begin-playoffs-as-co-favorites via @CBSSports",gemma2-9b-it,not a prediction,"{'data_range_per_file': 2, '$type': 'app.bsky.feed.post', 'author': 'did:plc:ahok3cgd4c7rhnwrnofapqls', 'authorProfile': '{'_id': 'did:plc:ahok3cgd4c7rhnwrnofapqls', '_index': 'smat-bluesky-users', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreic5yiylpra6qg2hpluhkktuiggzesdtc25s6xhhpitqueiicso27e@jpeg', 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreia47gyvqcq2mcndvv2dtkwkepudxmwfk6ca4rujpwfynwn6onibsa@jpeg', 'description': 'Find my profile at https://vivensjoachim.brandyourself.com/\nFind my community works at: https://mibaleavantou.com, or\nhttp://vjmvp.com/index.php, and some other works at: https://ntkvideo.com/\nBorn in Haiti in 1970. Migrated to the USA in 1994. Live in CT', 'did': 'did:plc:ahok3cg...",prediction
9,"2016 Super Bowl odds: Patriots, Cards begin playoffs as co-favorites http://www.cbssports.com/nfl/eye-on-football/25442860/super-bowl-odds-patriots-cardinals-begin-playoffs-as-co-favorites via @CBSSports",llama-3.1-8b-instant,prediction,"{'data_range_per_file': 2, '$type': 'app.bsky.feed.post', 'author': 'did:plc:ahok3cgd4c7rhnwrnofapqls', 'authorProfile': '{'_id': 'did:plc:ahok3cgd4c7rhnwrnofapqls', '_index': 'smat-bluesky-users', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreic5yiylpra6qg2hpluhkktuiggzesdtc25s6xhhpitqueiicso27e@jpeg', 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreia47gyvqcq2mcndvv2dtkwkepudxmwfk6ca4rujpwfynwn6onibsa@jpeg', 'description': 'Find my profile at https://vivensjoachim.brandyourself.com/\nFind my community works at: https://mibaleavantou.com, or\nhttp://vjmvp.com/index.php, and some other works at: https://ntkvideo.com/\nBorn in Haiti in 1970. Migrated to the USA in 1994. Live in CT', 'did': 'did:plc:ahok3cg...",prediction
10,"2016 Super Bowl odds: Patriots, Cards begin playoffs as co-favorites http://www.cbssports.com/nfl/eye-on-football/25442860/super-bowl-odds-patriots-cardinals-begin-playoffs-as-co-favorites via @CBSSports",llama-3.3-70b-versatile,prediction,"{'data_range_per_file': 2, '$type': 'app.bsky.feed.post', 'author': 'did:plc:ahok3cgd4c7rhnwrnofapqls', 'authorProfile': '{'_id': 'did:plc:ahok3cgd4c7rhnwrnofapqls', '_index': 'smat-bluesky-users', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreic5yiylpra6qg2hpluhkktuiggzesdtc25s6xhhpitqueiicso27e@jpeg', 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreia47gyvqcq2mcndvv2dtkwkepudxmwfk6ca4rujpwfynwn6onibsa@jpeg', 'description': 'Find my profile at https://vivensjoachim.brandyourself.com/\nFind my community works at: https://mibaleavantou.com, or\nhttp://vjmvp.com/index.php, and some other works at: https://ntkvideo.com/\nBorn in Haiti in 1970. Migrated to the USA in 1994. Live in CT', 'did': 'did:plc:ahok3cg...",prediction
11,"2016 Super Bowl odds: Patriots, Cards begin playoffs as co-favorites http://www.cbssports.com/nfl/eye-on-football/25442860/super-bowl-odds-patriots-cardinals-begin-playoffs-as-co-favorites via @CBSSports",meta-llama/llama-guard-4-12b,safe,"{'data_range_per_file': 2, '$type': 'app.bsky.feed.post', 'author': 'did:plc:ahok3cgd4c7rhnwrnofapqls', 'authorProfile': '{'_id': 'did:plc:ahok3cgd4c7rhnwrnofapqls', '_index': 'smat-bluesky-users', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreic5yiylpra6qg2hpluhkktuiggzesdtc25s6xhhpitqueiicso27e@jpeg', 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:ahok3cgd4c7rhnwrnofapqls/bafkreia47gyvqcq2mcndvv2dtkwkepudxmwfk6ca4rujpwfynwn6onibsa@jpeg', 'description': 'Find my profile at https://vivensjoachim.brandyourself.com/\nFind my community works at: https://mibaleavantou.com, or\nhttp://vjmvp.com/index.php, and some other works at: https://ntkvideo.com/\nBorn in Haiti in 1970. Migrated to the USA in 1994. Live in CT', 'did': 'did:plc:ahok3cg...",prediction
20,Is there a point to the rest of the #NFL season...or should we just get ready to cheer against the #Patriots in the Super Bowl?,gemma2-9b-it,prediction,"{'data_range_per_file': 5, '$type': 'app.bsky.feed.post', 'author': 'did:plc:fwb2rz5jbqoxaiccbonp5wff', 'authorProfile': '{'did': 'did:plc:fwb2rz5jbqoxaiccbonp5wff', 'handle': 'arrizzo.bsky.social', 'followers': 22, 'indexed_at': '2024-12-05T16:09:24.008Z', 'following': 48, 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:fwb2rz5jbqoxaiccbonp5wff/bafkreiewvtbog6idl7543u3ssd63jzilnfsfyu6xx73l2xzaxesxsjaxnu@jpeg', 'description': '#Bills #Yankees #Heat #Bonnies #Sabres? #Toffees #Griffs?\nMan of Pizzazz full of #HappyManTears\nFluent in #BeardLaw \nCello Lover\n#Goose \n#Phish', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:fwb2rz5jbqoxaiccbonp5wff/bafkreic2cybiqexoy74holnh3ilstntg6ogsihs3h7dx54wxkjpouvlwxy@jpeg', 'display_name': 'Anthony Rizzo', 'posts': 12574, 'lastse...",prediction
...,...,...,...,...,...
794,"Forgot to post this today. From 1982, Brimstone prepares for the Super Bowl. Disappointment follows.",meta-llama/llama-guard-4-12b,safe,"{'data_range_per_file': 197, '$type': 'app.bsky.feed.post', 'author': 'did:plc:w33kky5h2zepbv3xp6en5ohp', 'authorProfile': '{'_index': 'smat-bluesky-users', 'viewer_blocked_by': False, 'viewer_mute': False, 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:w33kky5h2zepbv3xp6en5ohp/bafkreihfwcqgzatkot77io2twtzbdbxbcokl5oc57cp5h4xrzfpc77hwci@jpeg', 'description': 'Writer & Enthusiast ‚Ä¢ Overthinking The Born Loser since 2008 ‚Ä¢ Bi ‚Ä¢ They/them\n\nAbout: https://www.tauycreek.com/p/about-the.html', '_op_type': 'index', 'handle': 'tauycreek.bsky.social', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:w33kky5h2zepbv3xp6en5ohp/bafkreicmmxaynx7ubi45oiftvrwhucbmkjpizjsgag63w7uyibrvn7hfvi@jpeg', 'display_name': 'Brian Hall', 'posts': 704, 'followers': 46, 'following': 122, '_id': ...",prediction
799,Where do Reid and Mahomes sit among QB/coaching duos for playoffs wins?,gemma2-9b-it,prediction,"{'data_range_per_file': 199, '$type': 'app.bsky.feed.post', 'author': 'did:plc:khnhnlclg7d347pphyr4ftjp', 'authorProfile': '{'_index': 'smat-bluesky-users', 'viewer_blocked_by': False, 'viewer_mute': False, 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreihhz6litbxizy5pqxwte6h7aayrqwhl27vfu676pfo5s6ndcc4vta@jpeg', 'description': 'KCC News brings you entertaining & up to date coverage of Kansas City Chiefs and the NFL üèà', '_op_type': 'index', 'handle': 'kccnews.bsky.social', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreigcoc262u7vc3k3ivaqmbfjo24h2jmqz4pilj4zbeff345wxjn2zq@jpeg', 'display_name': 'Kansas City Chiefs News', 'posts': 540, 'followers': 81, 'following': 0, '_id': 'did:plc:khnhnlclg7d347pphyr4ft...",prediction
800,Where do Reid and Mahomes sit among QB/coaching duos for playoffs wins?,llama-3.1-8b-instant,prediction,"{'data_range_per_file': 199, '$type': 'app.bsky.feed.post', 'author': 'did:plc:khnhnlclg7d347pphyr4ftjp', 'authorProfile': '{'_index': 'smat-bluesky-users', 'viewer_blocked_by': False, 'viewer_mute': False, 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreihhz6litbxizy5pqxwte6h7aayrqwhl27vfu676pfo5s6ndcc4vta@jpeg', 'description': 'KCC News brings you entertaining & up to date coverage of Kansas City Chiefs and the NFL üèà', '_op_type': 'index', 'handle': 'kccnews.bsky.social', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreigcoc262u7vc3k3ivaqmbfjo24h2jmqz4pilj4zbeff345wxjn2zq@jpeg', 'display_name': 'Kansas City Chiefs News', 'posts': 540, 'followers': 81, 'following': 0, '_id': 'did:plc:khnhnlclg7d347pphyr4ft...",prediction
801,Where do Reid and Mahomes sit among QB/coaching duos for playoffs wins?,llama-3.3-70b-versatile,not a prediction,"{'data_range_per_file': 199, '$type': 'app.bsky.feed.post', 'author': 'did:plc:khnhnlclg7d347pphyr4ftjp', 'authorProfile': '{'_index': 'smat-bluesky-users', 'viewer_blocked_by': False, 'viewer_mute': False, 'banner': 'https://cdn.bsky.app/img/banner/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreihhz6litbxizy5pqxwte6h7aayrqwhl27vfu676pfo5s6ndcc4vta@jpeg', 'description': 'KCC News brings you entertaining & up to date coverage of Kansas City Chiefs and the NFL üèà', '_op_type': 'index', 'handle': 'kccnews.bsky.social', 'avatar': 'https://cdn.bsky.app/img/avatar/plain/did:plc:khnhnlclg7d347pphyr4ftjp/bafkreigcoc262u7vc3k3ivaqmbfjo24h2jmqz4pilj4zbeff345wxjn2zq@jpeg', 'display_name': 'Kansas City Chiefs News', 'posts': 540, 'followers': 81, 'following': 0, '_id': 'did:plc:khnhnlclg7d347pphyr4ft...",prediction
