# rewrite to be the same as the neo file

In [None]:

import json
import numpy as np
import matplotlib.pyplot as plt

# JSONL file read below; its name is derived from the LoRA rank (LORA_RANK is
# expected to be defined before this cell runs).
RESULTS_PATH = f"lora_rank{LORA_RANK}_inference_results.jsonl"

# One JSON record per line. Blank lines (for example a trailing empty line at
# the end of the file) are skipped, because json.loads raises JSONDecodeError
# on an empty string.
with open(RESULTS_PATH, 'r', encoding='utf-8') as f:
    results = [json.loads(line) for line in f if line.strip()]

print(f"Loaded {len(results)} responses")

# Measure every response two ways: number of whitespace-delimited words and
# number of tokens produced by the tokenizer (special tokens excluded).
response_texts = [record['response'] for record in results]

word_lengths = np.array([len(text.split()) for text in response_texts])
token_lengths = np.array(
    [len(tokenizer.encode(text, add_special_tokens=False)) for text in response_texts]
)

# Summary statistics: the same four figures are reported for each metric.
# std() is NumPy's default (population, ddof=0) standard deviation.
banner = "=" * 60
print(banner)
print(f"RESPONSE LENGTH STATISTICS (LoRA rank={LORA_RANK})")
print(banner)

for heading, lengths in (("Word Length", word_lengths), ("Token Length", token_lengths)):
    print(f"\n{heading}:")
    print(f"  Mean:   {lengths.mean():.2f}")
    print(f"  Stdev:  {lengths.std():.2f}")
    print(f"  Min:    {lengths.min()}")
    print(f"  Max:    {lengths.max()}")

print(banner)

# Histograms: one panel per length metric, each with a dashed red line at the mean.
fig, axes = plt.subplots(1, 2, figsize=(14, 5))

# (data, x-axis label, unit shown in the title, bar colour) for each panel
panels = (
    (word_lengths, 'Word Count', 'Words', 'steelblue'),
    (token_lengths, 'Token Count', 'Tokens', 'darkorange'),
)

for ax, (lengths, x_label, unit, bar_color) in zip(axes, panels):
    mean_length = lengths.mean()
    ax.hist(lengths, bins=30, edgecolor='black', alpha=0.7, color=bar_color)
    ax.axvline(mean_length, color='red', linestyle='--', linewidth=2, label=f'Mean: {mean_length:.1f}')
    ax.set_xlabel(x_label)
    ax.set_ylabel('Frequency')
    ax.set_title(f'Response Length Distribution - LoRA rank={LORA_RANK} ({unit})')
    ax.legend()

plt.tight_layout()
plt.show()

## Step 10: Side-by-Side Comparison (Optional)

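If neologism inference results are available (`short_inference_results.jsonl`), the cell below compares their word-count distribution with the LoRA results; otherwise it prints a reminder to run neologism inference first.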

# Load neologism results if available
import os  # imported locally so this cell does not rely on an earlier cell importing os

NEOLOGISM_RESULTS_PATH = "short_inference_results.jsonl"

if os.path.exists(NEOLOGISM_RESULTS_PATH):
    # One JSON record per line; blank lines are skipped because json.loads
    # raises JSONDecodeError on an empty string.
    with open(NEOLOGISM_RESULTS_PATH, 'r', encoding='utf-8') as f:
        neo_results = [json.loads(line) for line in f if line.strip()]

    # Whitespace-delimited word count of every neologism response.
    neo_word_lengths = np.array([len(r['response'].split()) for r in neo_results])

    print("=" * 60)
    print("COMPARISON: Neologism vs LoRA Fine-tuning")
    print("=" * 60)
    print(f"\nNeologism (~short):")
    print(f"  Mean word count: {neo_word_lengths.mean():.2f}")
    print(f"  Stdev: {neo_word_lengths.std():.2f}")

    print(f"\nLoRA (rank={LORA_RANK}):")
    print(f"  Mean word count: {word_lengths.mean():.2f}")
    print(f"  Stdev: {word_lengths.std():.2f}")

    # Positive value: LoRA responses are longer on average than neologism ones.
    print(f"\nDifference: {word_lengths.mean() - neo_word_lengths.mean():.2f} words")

    # Overlaid histogram. Both series are binned on the same 30 edges, computed
    # over the combined data; passing bins=30 to each hist() call separately
    # would give each series its own bin widths, making bar heights incomparable.
    shared_bins = np.histogram_bin_edges(
        np.concatenate([neo_word_lengths, word_lengths]), bins=30
    )
    plt.figure(figsize=(10, 6))
    plt.hist(neo_word_lengths, bins=shared_bins, alpha=0.5, label=f'Neologism (mean={neo_word_lengths.mean():.1f})', color='blue')
    plt.hist(word_lengths, bins=shared_bins, alpha=0.5, label=f'LoRA rank={LORA_RANK} (mean={word_lengths.mean():.1f})', color='orange')
    plt.xlabel('Word Count')
    plt.ylabel('Frequency')
    plt.title('Response Length: Neologism vs LoRA Fine-tuning')
    plt.legend()
    plt.show()
else:
    print(f"Neologism results not found at {NEOLOGISM_RESULTS_PATH}")
    print("Run neologism inference first to enable comparison.")