In [None]:
import json
import pandas as pd
import matplotlib.pyplot as plt

# Plot overlaid histograms of response length (in characters) for the two
# sides of each comparison, restricted to rows where side A is a GPT-5 model,
# and save the figure to "response_length_hist.png".
with open("forensics-data/ff-model-personality/combined_ap.json", "r", encoding="utf-8") as f:
    data = json.load(f)

df = pd.DataFrame(data["comparisons"])

max_len = 10000  # lengths above this are lumped into the final "10000+" bin
num_bins = 15

# Derive per-side length and model columns from the nested response dicts.
# `or ""` also covers a key that is present but null, which `.get(key, "")`
# would pass through as None and crash `len()`.
for side in ("a", "b"):
    df[f"len_{side}"] = (
        df[f"response_{side}"]
        .apply(lambda resp: len(resp.get("text") or ""))
        .clip(upper=max_len)
    )
for side in ("a", "b"):
    df[f"model_{side}"] = df[f"response_{side}"].apply(lambda resp: resp.get("model") or "")

# Keep only comparisons where model A is GPT-5. The match is a literal
# substring test (not a regex). `.copy()` makes the result an independent
# frame so later column assignments do not hit SettingWithCopyWarning.
# NOTE(review): model_b is not filtered here, yet its histogram is labelled
# "GPT-4o" below -- confirm the dataset only pairs GPT-5 with GPT-4o.
is_gpt5 = df["model_a"].str.contains("gpt-5", regex=False, na=False)
df = df[is_gpt5].copy()

# Set dark style
plt.style.use('dark_background')

# Create figure with a GitHub-like dark background
background_color = '#0d1117'
fig, ax = plt.subplots(figsize=(6, 4))
fig.patch.set_facecolor(background_color)
ax.set_facecolor(background_color)

# Colors that read well on a dark background
gpt5_color = '#58a6ff'  # blue
gpt4o_color = '#f85149'  # red

# Both histograms share the same bin edges (0..max_len) so their bars are
# directly comparable; without an explicit range each call would pick edges
# from its own data's min/max.
hist_style = dict(
    bins=num_bins,
    range=(0, max_len),
    alpha=0.7,
    edgecolor='white',
    linewidth=0.5,
)
ax.hist(df["len_a"], label="GPT-5", color=gpt5_color, **hist_style)
ax.hist(df["len_b"], label="GPT-4o", color=gpt4o_color, **hist_style)

# Style the axes for dark mode
ax.set_xlabel("Response length (characters)", color='white', fontsize=12)
ax.set_ylabel("Number of responses", color='white', fontsize=12)
ax.tick_params(colors='white')
for spine in ax.spines.values():
    spine.set_color('white')

# Style the legend
legend = ax.legend(facecolor='#21262d', edgecolor='white', labelcolor='white')
legend.get_frame().set_alpha(0.9)

# Mark the last tick with "+" because the final bin also holds every
# response that was clipped down to max_len.
tick_positions = list(range(0, max_len + 1, 2000))
tick_labels = [str(pos) for pos in tick_positions[:-1]] + [f"{max_len}+"]
ax.set_xticks(tick_positions)
ax.set_xticklabels(tick_labels)

plt.tight_layout()
# Pass the figure's facecolor explicitly so the saved PNG uses the same
# background as the on-screen figure regardless of the active style's
# savefig.facecolor setting.
plt.savefig("response_length_hist.png", dpi=300, facecolor=fig.get_facecolor())
plt.show()

#df.head()
