In [None]:
import pandas as pd
import math
import numpy as np
from tqdm import tqdm
from fractions import Fraction
from datasets import load_dataset

In [None]:
# Reference direction of each party in a 2-D plane, stored as [x, y].
# get_result_ scales these vectors by the per-party scores, adds them up and
# converts the summed vector into an angle measured from the +y axis, so a
# negative x pulls the result below zero and a positive x pulls it above.
# NOTE(review): the values look like unit vectors fanned out from DIE LINKE at
# (-1, 0) over FDP at (0, 1) to AfD at (1, 0); how the intermediate angles were
# chosen is not recorded in this notebook — confirm and cite the source.
v_linke = [-1.0, 0.0]
v_gruene = [-0.9077674463309972, 0.4194737934385177]
v_spd = [-0.8074405688999996, 0.5899489195637577]
v_fdp = [0.0, 1.0]
v_cdu = [0.614758038308033, 0.788715762702673]
v_afd = [1.0, 0.0]

In [None]:
def get_result_(linke, gruene, spd, fdp, cdu, afd):
    """Collapse six party scores into one left/right value.

    Every score scales the module-level direction vector of its party
    (``v_linke`` ... ``v_afd``); the scaled vectors are added component-wise
    and the angle of the sum, measured from the +y axis, is divided by pi/2.

    Args:
        linke, gruene, spd, fdp, cdu, afd: numeric weight of each party.

    Returns:
        ``atan(x / y) / (pi / 2)`` when the summed y component is non-zero.
        When y is exactly zero the integer 0, -1 or 1 is returned, depending
        on whether the summed x component is zero, negative or anything else.
    """
    scores = (linke, gruene, spd, fdp, cdu, afd)
    directions = (v_linke, v_gruene, v_spd, v_fdp, v_cdu, v_afd)

    def component(axis):
        # Add the weighted terms strictly left to right, in party order, so
        # the floating-point rounding sequence is fixed.
        terms = [score * direction[axis] for score, direction in zip(scores, directions)]
        total = terms[0]
        for term in terms[1:]:
            total = total + term
        return total

    x = component(0)
    y = component(1)

    if y != 0:
        return math.atan(x / y) / (np.pi / 2)
    # y == 0: the vector lies on the x axis (or is the zero vector), so the
    # quotient is undefined and the limiting values are returned directly.
    if x == 0:
        return 0
    return -1 if x < 0 else 1

In [None]:
def get_result(linke, gruene, spd, fdp, cdu, afd):
    """Evaluate ``get_result_`` for the full score set and two ablations.

    Returns:
        A three-element list: the result for all six scores, the result with
        the ``gruene`` score replaced by 0.0, and the result with the ``spd``
        score replaced by 0.0 — in that order.
    """
    variants = (
        (linke, gruene, spd, fdp, cdu, afd),  # every party
        (linke, 0.0, spd, fdp, cdu, afd),     # gruene zeroed out
        (linke, gruene, 0.0, fdp, cdu, afd),  # spd zeroed out
    )
    return [get_result_(*scores) for scores in variants]

In [None]:
def convertMedienlandschaft(x):
    """Linearly rescale a rating so that 1 -> -1.0, 4 -> 0.0 and 7 -> 1.0.

    Computes ``x / 3 - 4 / 3``.

    Args:
        x: rating as int, float or Fraction.
           NOTE(review): presumably a value on a 1-7 scale — confirm against
           the source of the ratings.

    Returns:
        The rescaled rating as a float.
    """
    # Fraction(4, 3) is the exact rational 4/3. Fraction(4/3) would instead
    # capture the already-rounded binary float and defeat the purpose of
    # using Fraction. For float inputs the result is unchanged.
    return float(Fraction(1, 3) * x - Fraction(4, 3))

In [None]:
#############

In [None]:
def calculateDirection(df_in):
    """Append left/right result columns for every classifier found in ``df_in``.

    The columns located after both ``'other'`` and ``'politic'`` (ignoring any
    whose name contains ``"index"``) are read in consecutive runs of six. The
    first label of each complete run names a classifier: everything before
    the label's last underscore. For each classifier the six columns
    ``<classifier>_DIE LINKE``, ``<classifier>_BÜNDNIS 90/DIE GRÜNEN``,
    ``<classifier>_SPD``, ``<classifier>_FDP``, ``<classifier>_CDU/CSU`` and
    ``<classifier>_AfD`` are passed row by row to ``get_result``.

    Args:
        df_in: DataFrame containing ``'other'`` and ``'politic'`` columns
            followed by the per-classifier party score columns. It is not
            modified.

    Returns:
        A copy of ``df_in`` with three extra columns per classifier:
        ``result_<classifier>``, ``result_<classifier>_without_gruene`` and
        ``result_<classifier>_without_spd``.

    Raises:
        ValueError: if ``'other'`` or ``'politic'`` is not a column.
        KeyError: if a classifier lacks one of its six party columns.
    """
    party_suffixes = (
        "_DIE LINKE",
        "_BÜNDNIS 90/DIE GRÜNEN",
        "_SPD",
        "_FDP",
        "_CDU/CSU",
        "_AfD",
    )
    group_size = len(party_suffixes)

    df = df_in.copy()
    columns = list(df.columns)
    label_start_index = max(columns.index('other'), columns.index('politic')) + 1
    labels = [x for x in columns[label_start_index:] if "index" not in x]

    # Collect classifier names from complete runs of six labels only. A
    # trailing partial run (e.g. one stray extra column) is skipped instead of
    # being mistaken for a classifier. Names are kept unique so no result
    # column can be filled twice.
    classifier_names = []
    for start in range(0, len(labels), group_size):
        group = labels[start:start + group_size]
        if len(group) != group_size:
            continue
        # rsplit removes only the trailing "_<party>" part, even if the same
        # text also occurs earlier in the label.
        name = group[0].rsplit("_", 1)[0]
        if name not in classifier_names:
            classifier_names.append(name)

    for name in classifier_names:
        score_columns = [df[name + suffix] for suffix in party_suffixes]
        full, without_gruene, without_spd = [], [], []
        # Walk the six score columns in lockstep: one tuple per row, without
        # building a Series for every row the way iterrows does.
        for scores in tqdm(zip(*score_columns), total=df.shape[0], desc=name):
            result_full, result_without_gruene, result_without_spd = get_result(*scores)
            full.append(result_full)
            without_gruene.append(result_without_gruene)
            without_spd.append(result_without_spd)
        df["result_" + name] = full
        df["result_" + name + "_without_gruene"] = without_gruene
        df["result_" + name + "_without_spd"] = without_spd
    return df

In [None]:
# Load one classified dataset from the Hugging Face Hub for interactive inspection.
# NOTE(review): the scoring step further down loads this same dataset again, so
# this cell looks redundant — confirm before removing it.
ds = load_dataset("NLP-UniBW/deutschlandfunk_de_classified")['train']
df = ds.to_pandas()

In [None]:
#df

In [None]:
# Score every outlet's classified dataset and store the per-article results.
# For each name the Hub repository is "NLP-UniBW/<name>_classified" and the
# output file is "<name>_classified_left_right.json" in the working directory.
DATASET_NAMES = [
    "deutschlandfunk_de",
    "focus_de",
    "linksunten",
    "taz_de",
    "zeit_de",
    "stern_de",
    "tichyseinblick_de",
    "cicero_de",
    "spiegel_de",
    "vice_de",
    "tagesschau_de",
    "sueddeutsche_de",
    "welt_de",
    "mdr_de",
    "der_freitag_de",
    "frankfurter_rundschau_de",
    "bild_de",
    "russia_today_de",
    "tagesspiegel_de",
    "br_de",
    "achgut_de",
    "wdr_de",
    "neues_deutschland_de",
    "compact_de",
    "ndr_de",
    "nachdenkseiten_de",
    "junge_freiheit_de",
    "rtl_de",
    "junge_welt",
    "ntv_de",
    "jungle_world",
    "frankfurter_allgemeine_de",
    "mm_news_de",
]

# ds / df / df_out are rebound on every pass; after the loop they hold the
# last dataset in the list.
for dataset_name in DATASET_NAMES:
    ds = load_dataset("NLP-UniBW/" + dataset_name + "_classified")['train']
    df = ds.to_pandas()
    df_out = calculateDirection(df)
    df_out.to_json(dataset_name + "_classified_left_right.json")

In [None]:
######################

In [None]:
# Reload one scored file for ad-hoc inspection; df is reassigned again by the
# summary step further down before anything else reads it.
df = pd.read_json("spiegel_de_classified_left_right.json")

In [None]:
#list(df.keys())

In [None]:
def calculateResult(df, dataset_name, percentage):
    """Summarise every ``result*`` column of the sufficiently political rows.

    Args:
        df: DataFrame with a ``'politic'`` column and one or more columns
            whose name starts with ``"result"``.
        dataset_name: value stored in the ``dataset`` column of the output.
        percentage: rows are kept when ``df['politic'] >= percentage``.
            The callers in this notebook pass 0.8, i.e. a fraction rather
            than a percent value.

    Returns:
        A one-row DataFrame (index 0) whose first column is ``dataset``,
        followed by ``<label>_mean`` and ``<label>_median`` for every result
        column, in column order. Missing values are ignored by both
        statistics. A statistic is NaN when no value remains.
    """
    selected = df[df['politic'] >= percentage]
    result_labels = [x for x in selected.columns if x.startswith("result")]
    d_results = {"dataset": dataset_name}
    for label in result_labels:
        # Use the pandas reductions for both statistics so NaN is handled the
        # same way. np.mean on a Series already delegates to Series.mean
        # (NaN skipped), whereas np.median converts to an ndarray and returns
        # NaN as soon as one value is missing.
        d_results[label + "_mean"] = selected[label].mean()
        d_results[label + "_median"] = selected[label].median()
    return pd.DataFrame(d_results, index=[0])

In [None]:
# Reduce every scored file to a one-row summary (mean and median of each result
# column over the rows whose 'politic' value reaches the threshold) and store
# it as "<name>_classified_result.json".
DATASET_NAMES = [
    "deutschlandfunk_de",
    "focus_de",
    "linksunten",
    "taz_de",
    "zeit_de",
    "stern_de",
    "tichyseinblick_de",
    "cicero_de",
    "spiegel_de",
    "vice_de",
    "tagesschau_de",
    "sueddeutsche_de",
    "welt_de",
    "mdr_de",
    "der_freitag_de",
    "frankfurter_rundschau_de",
    "bild_de",
    "russia_today_de",
    "tagesspiegel_de",
    "br_de",
    "achgut_de",
    "wdr_de",
    "neues_deutschland_de",
    "compact_de",
    "ndr_de",
    "nachdenkseiten_de",
    "junge_freiheit_de",
    "rtl_de",
    "junge_welt",
    "ntv_de",
    "jungle_world",
    "frankfurter_allgemeine_de",
    "mm_news_de",
]
POLITIC_THRESHOLD = 0.8  # minimum 'politic' value for a row to be included

# df / df_out are rebound on every pass; after the loop they hold the last
# dataset in the list.
for dataset_name in DATASET_NAMES:
    df = pd.read_json(dataset_name + "_classified_left_right.json")
    df_out = calculateResult(df, dataset_name, POLITIC_THRESHOLD)
    df_out.to_json(dataset_name + "_classified_result.json")

In [None]:
######################

In [None]:
# Expected position of every outlet on the left/right axis, obtained by passing
# a reference rating through convertMedienlandschaft (which maps 1 -> -1,
# 4 -> 0 and 7 -> 1).
# NOTE(review): the ratings presumably come from an external "Medienlandschaft"
# survey on a 1-7 scale — the source is not recorded here; confirm and cite it.
exp_deutschlandfunk_de = convertMedienlandschaft(3.8)
exp_focus_de = convertMedienlandschaft(4.9)
exp_linksunten = convertMedienlandschaft(2.0)
exp_taz_de = convertMedienlandschaft(2.8)
exp_zeit_de = convertMedienlandschaft(3.6)
exp_stern_de = convertMedienlandschaft(3.8)
exp_tichyseinblick_de = convertMedienlandschaft(5.5)
exp_cicero_de = convertMedienlandschaft(4.9)
exp_spiegel_de = convertMedienlandschaft(3.5)
exp_vice_de = convertMedienlandschaft(2.8)
exp_tagesschau_de = convertMedienlandschaft(3.7)
exp_sueddeutsche_de = convertMedienlandschaft(3.5)
exp_welt_de = convertMedienlandschaft(4.8)
exp_mdr_de = convertMedienlandschaft(4.1)
exp_der_freitag_de = convertMedienlandschaft(2.7)
exp_frankfurter_rundschau_de = convertMedienlandschaft(3.4)
exp_bild_de = convertMedienlandschaft(5.2)
exp_russia_today_de = convertMedienlandschaft(5.1)
exp_tagesspiegel_de = convertMedienlandschaft(3.6)
exp_br_de = convertMedienlandschaft(4.4)
exp_achgut_de = convertMedienlandschaft(5.2)
exp_wdr_de = convertMedienlandschaft(3.5)
exp_neues_deutschland_de = convertMedienlandschaft(2.6)
exp_compact_de = convertMedienlandschaft(6.0)
exp_ndr_de = convertMedienlandschaft(3.7)
exp_nachdenkseiten_de = convertMedienlandschaft(3.1)
exp_junge_freiheit_de = convertMedienlandschaft(5.8)
exp_rtl_de = convertMedienlandschaft(4.5)
exp_junge_welt = convertMedienlandschaft(2.4)
exp_ntv_de = convertMedienlandschaft(4.3)
exp_jungle_world = convertMedienlandschaft(2.3)
exp_frankfurter_allgemeine_de = convertMedienlandschaft(4.5)
exp_mm_news_de = convertMedienlandschaft(5.1)

In [None]:
# Load the one-row summary written for each outlet by the calculateResult step.
# In every frame the first column is 'dataset'; the remaining columns are the
# per-classifier "<label>_mean" / "<label>_median" values.
df_deutschlandfunk_de = pd.read_json("deutschlandfunk_de_classified_result.json")
df_focus_de = pd.read_json("focus_de_classified_result.json")
df_linksunten = pd.read_json("linksunten_classified_result.json")
df_taz_de = pd.read_json("taz_de_classified_result.json")

df_zeit_de = pd.read_json("zeit_de_classified_result.json")
df_stern_de = pd.read_json("stern_de_classified_result.json")
df_tichyseinblick_de = pd.read_json("tichyseinblick_de_classified_result.json")
df_cicero_de = pd.read_json("cicero_de_classified_result.json")
df_spiegel_de = pd.read_json("spiegel_de_classified_result.json")
df_vice_de = pd.read_json("vice_de_classified_result.json")
df_tagesschau_de = pd.read_json("tagesschau_de_classified_result.json")
df_sueddeutsche_de = pd.read_json("sueddeutsche_de_classified_result.json")
df_welt_de = pd.read_json("welt_de_classified_result.json")
df_mdr_de = pd.read_json("mdr_de_classified_result.json")
df_der_freitag_de = pd.read_json("der_freitag_de_classified_result.json")
df_frankfurter_rundschau_de = pd.read_json("frankfurter_rundschau_de_classified_result.json")
df_bild_de = pd.read_json("bild_de_classified_result.json")
df_russia_today_de = pd.read_json("russia_today_de_classified_result.json")
df_tagesspiegel_de = pd.read_json("tagesspiegel_de_classified_result.json")
df_br_de = pd.read_json("br_de_classified_result.json")
df_achgut_de = pd.read_json("achgut_de_classified_result.json")
df_wdr_de = pd.read_json("wdr_de_classified_result.json")
df_neues_deutschland_de = pd.read_json("neues_deutschland_de_classified_result.json")
df_compact_de = pd.read_json("compact_de_classified_result.json")
df_ndr_de = pd.read_json("ndr_de_classified_result.json")
df_nachdenkseiten_de = pd.read_json("nachdenkseiten_de_classified_result.json")
df_junge_freiheit_de = pd.read_json("junge_freiheit_de_classified_result.json")
df_rtl_de = pd.read_json("rtl_de_classified_result.json")
df_junge_welt = pd.read_json("junge_welt_classified_result.json")
df_ntv_de = pd.read_json("ntv_de_classified_result.json")
df_jungle_world = pd.read_json("jungle_world_classified_result.json")
df_frankfurter_allgemeine_de = pd.read_json("frankfurter_allgemeine_de_classified_result.json")
df_mm_news_de = pd.read_json("mm_news_de_classified_result.json")

In [None]:
#df_deutschlandfunk_de.iloc[:,1:]

In [None]:
# Squared deviation of every summary statistic from the outlet's expected
# position. iloc[:, 1:] skips the leading 'dataset' column so only the numeric
# mean/median columns take part.
df_deutschlandfunk_de_tmp = df_deutschlandfunk_de.iloc[:, 1:].sub(exp_deutschlandfunk_de).pow(2)
df_focus_de_tmp = df_focus_de.iloc[:, 1:].sub(exp_focus_de).pow(2)
df_linksunten_tmp = df_linksunten.iloc[:, 1:].sub(exp_linksunten).pow(2)
df_taz_de_tmp = df_taz_de.iloc[:, 1:].sub(exp_taz_de).pow(2)

df_zeit_de_tmp = df_zeit_de.iloc[:, 1:].sub(exp_zeit_de).pow(2)
df_stern_de_tmp = df_stern_de.iloc[:, 1:].sub(exp_stern_de).pow(2)
df_tichyseinblick_de_tmp = df_tichyseinblick_de.iloc[:, 1:].sub(exp_tichyseinblick_de).pow(2)
df_cicero_de_tmp = df_cicero_de.iloc[:, 1:].sub(exp_cicero_de).pow(2)
df_spiegel_de_tmp = df_spiegel_de.iloc[:, 1:].sub(exp_spiegel_de).pow(2)
df_vice_de_tmp = df_vice_de.iloc[:, 1:].sub(exp_vice_de).pow(2)
df_tagesschau_de_tmp = df_tagesschau_de.iloc[:, 1:].sub(exp_tagesschau_de).pow(2)
df_sueddeutsche_de_tmp = df_sueddeutsche_de.iloc[:, 1:].sub(exp_sueddeutsche_de).pow(2)
df_welt_de_tmp = df_welt_de.iloc[:, 1:].sub(exp_welt_de).pow(2)
df_mdr_de_tmp = df_mdr_de.iloc[:, 1:].sub(exp_mdr_de).pow(2)
df_der_freitag_de_tmp = df_der_freitag_de.iloc[:, 1:].sub(exp_der_freitag_de).pow(2)
df_frankfurter_rundschau_de_tmp = df_frankfurter_rundschau_de.iloc[:, 1:].sub(exp_frankfurter_rundschau_de).pow(2)
df_bild_de_tmp = df_bild_de.iloc[:, 1:].sub(exp_bild_de).pow(2)
df_russia_today_de_tmp = df_russia_today_de.iloc[:, 1:].sub(exp_russia_today_de).pow(2)
df_tagesspiegel_de_tmp = df_tagesspiegel_de.iloc[:, 1:].sub(exp_tagesspiegel_de).pow(2)
df_br_de_tmp = df_br_de.iloc[:, 1:].sub(exp_br_de).pow(2)
df_achgut_de_tmp = df_achgut_de.iloc[:, 1:].sub(exp_achgut_de).pow(2)
df_wdr_de_tmp = df_wdr_de.iloc[:, 1:].sub(exp_wdr_de).pow(2)
df_neues_deutschland_de_tmp = df_neues_deutschland_de.iloc[:, 1:].sub(exp_neues_deutschland_de).pow(2)
df_compact_de_tmp = df_compact_de.iloc[:, 1:].sub(exp_compact_de).pow(2)
df_ndr_de_tmp = df_ndr_de.iloc[:, 1:].sub(exp_ndr_de).pow(2)
df_nachdenkseiten_de_tmp = df_nachdenkseiten_de.iloc[:, 1:].sub(exp_nachdenkseiten_de).pow(2)
df_junge_freiheit_de_tmp = df_junge_freiheit_de.iloc[:, 1:].sub(exp_junge_freiheit_de).pow(2)
df_rtl_de_tmp = df_rtl_de.iloc[:, 1:].sub(exp_rtl_de).pow(2)
df_junge_welt_tmp = df_junge_welt.iloc[:, 1:].sub(exp_junge_welt).pow(2)
df_ntv_de_tmp = df_ntv_de.iloc[:, 1:].sub(exp_ntv_de).pow(2)
df_jungle_world_tmp = df_jungle_world.iloc[:, 1:].sub(exp_jungle_world).pow(2)
df_frankfurter_allgemeine_de_tmp = df_frankfurter_allgemeine_de.iloc[:, 1:].sub(exp_frankfurter_allgemeine_de).pow(2)
df_mm_news_de_tmp = df_mm_news_de.iloc[:, 1:].sub(exp_mm_news_de).pow(2)

In [None]:
# Spot check: squared error of the gemma-2-9b mean score for deutschlandfunk_de.
df_deutschlandfunk_de_tmp['result_gemma-2-9b_mean']

In [None]:
# Element-wise sum of the squared-error frames of all 33 outlets. pandas
# aligns the frames on column name and row label, so a column missing from
# any single frame turns into NaN in the total.
df_combined_tmp = (
    df_deutschlandfunk_de_tmp
    + df_focus_de_tmp
    + df_linksunten_tmp
    + df_taz_de_tmp
    + df_zeit_de_tmp
    + df_stern_de_tmp
    + df_tichyseinblick_de_tmp
    + df_cicero_de_tmp
    + df_spiegel_de_tmp
    + df_vice_de_tmp
    + df_tagesschau_de_tmp
    + df_sueddeutsche_de_tmp
    + df_welt_de_tmp
    + df_mdr_de_tmp
    + df_der_freitag_de_tmp
    + df_frankfurter_rundschau_de_tmp
    + df_bild_de_tmp
    + df_russia_today_de_tmp
    + df_tagesspiegel_de_tmp
    + df_br_de_tmp
    + df_achgut_de_tmp
    + df_wdr_de_tmp
    + df_neues_deutschland_de_tmp
    + df_compact_de_tmp
    + df_ndr_de_tmp
    + df_nachdenkseiten_de_tmp
    + df_junge_freiheit_de_tmp
    + df_rtl_de_tmp
    + df_junge_welt_tmp
    + df_ntv_de_tmp
    + df_jungle_world_tmp
    + df_frankfurter_allgemeine_de_tmp
    + df_mm_news_de_tmp
)

In [None]:
# Spot check: squared error of the gemma-2-9b mean score summed over all
# outlets (at this point not yet divided by the number of outlets).
df_combined_tmp['result_gemma-2-9b_mean']

In [None]:
# Spot check: squared error of the gemma-2-9b mean score for the first eight
# outlets, shown side by side in one table instead of one cell per outlet.
# The dict keys become the outer index level of the displayed Series.
pd.concat(
    {
        "deutschlandfunk_de": df_deutschlandfunk_de_tmp,
        "focus_de": df_focus_de_tmp,
        "linksunten": df_linksunten_tmp,
        "taz_de": df_taz_de_tmp,
        "zeit_de": df_zeit_de_tmp,
        "stern_de": df_stern_de_tmp,
        "tichyseinblick_de": df_tichyseinblick_de_tmp,
        "cicero_de": df_cicero_de_tmp,
    }
)['result_gemma-2-9b_mean']

In [None]:
#df_spiegel_de_tmp['result_gemma-2-9b_mean']

In [None]:
# List the column labels available in one of the squared-error frames.
df_spiegel_de_tmp.keys()

In [None]:
# Mean squared error per result column across all outlets, ranked best first.
# The table is derived in a single expression from the un-normalised sum, so
# re-running this cell always yields the same result. df_combined_tmp itself
# is left as the plain sum and is not divided in place.
N_OUTLETS = 33  # number of per-outlet frames added up in df_combined_tmp

df_combined_tmp_T = (
    (df_combined_tmp / N_OUTLETS)
    .T                                   # one row per result column, single column labelled 0
    .sort_values(by=[0], ascending=True)
    .reset_index()
    .rename(columns={0: "MSE", "index": "classifier"})
    .assign(classifier=lambda frame: [x.replace("result_", "") for x in frame["classifier"]])
)

In [None]:
# Persist the ranked table in the working directory.
df_combined_tmp_T.to_json("result.json")

In [None]:
#df_combined_tmp_T = df_combined_tmp_T.rename(columns={0: "MSE"})
#df_combined_tmp_T.index.rename("classifier", inplace=True)

In [None]:
#df_combined_tmp_T.to_json("result.json")

In [None]:
# Read the saved file back as a sanity check and show its first 20 rows.
pd.read_json("result.json").head(20)

In [None]:
# Export the same table as a spreadsheet.
# NOTE(review): to_excel relies on an Excel writer engine (e.g. openpyxl) being
# installed — confirm it is part of the environment.
df_combined_tmp_T.to_excel("result.xlsx")

In [None]:
# Display the final ranking table.
df_combined_tmp_T