# Fix Submission Format Issue

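The submission failed because some values are missing the required `s` prefix (checked below in the `x`, `y`, and `deg` columns). Let's inspect the format to understand it better, add the missing prefixes, and save a corrected submission.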

In [None]:
import pandas as pd
import numpy as np
import os

# Load the original snapshot submission.
# Every column is read as text (dtype=str) so values keep their exact decimal
# digits. With dtype inference, an all-numeric column would be parsed as
# float64 and later stringified, which can drop digits or switch to
# scientific notation before the 's' prefix is added.
original_path = '/home/nonroot/snapshots/santa-2025/21145965159/submission/submission.csv'
df = pd.read_csv(original_path, dtype=str)
print(f'Total rows: {len(df)}')
print(f'Columns: {df.columns.tolist()}')
print(df.head(10))

In [None]:
# For each of the x, y and deg columns, count the values whose text form
# does not start with 's' and show up to three offending rows.
for col in ('x', 'y', 'deg'):
    has_prefix = df[col].astype(str).str.startswith('s')
    non_s = df[~has_prefix]
    n_missing = len(non_s)
    print(f'Column {col}: {n_missing} values without s prefix')
    if n_missing:
        print(non_s.head(3))

In [None]:
# Function to ensure 's' prefix
def ensure_s_prefix(val):
    """Return ``val`` as text that begins with the letter 's'.

    The value is converted with ``str()``. Text that already starts with
    's' is returned unchanged; otherwise a single 's' is prepended.
    """
    text = str(val)
    return text if text.startswith('s') else 's' + text

# Add the prefix to x, y and deg on a copy, leaving df itself untouched
df_fixed = df.copy()
for col in ('x', 'y', 'deg'):
    df_fixed[col] = df_fixed[col].apply(ensure_s_prefix)

# Repeat the prefix check on the fixed frame and report the counts
print('After fixing:')
for col in ('x', 'y', 'deg'):
    lacks_prefix = ~df_fixed[col].astype(str).str.startswith('s')
    non_s = df_fixed[lacks_prefix]
    print(f'Column {col}: {len(non_s)} values without s prefix')

print(df_fixed.head(10))

In [None]:
# Save the fixed submission
fixed_path = '/home/submission/submission.csv'
# Create the target directory first: to_csv does not create missing folders,
# and only the experiment folder below was being created before.
os.makedirs(os.path.dirname(fixed_path), exist_ok=True)
df_fixed.to_csv(fixed_path, index=False)
print(f'Saved fixed submission to {fixed_path}')

# Also save to experiment folder
experiment_dir = '/home/code/experiments/002_fixed_baseline'
os.makedirs(experiment_dir, exist_ok=True)
df_fixed.to_csv(os.path.join(experiment_dir, 'submission.csv'), index=False)

In [None]:
# Verify the score using our scoring script
import subprocess
import sys

# Run the scorer with the interpreter executing this notebook, so it does not
# depend on a 'python' executable being on PATH; fall back to 'python' only if
# the interpreter path is unavailable.
python_exe = sys.executable or 'python'
result = subprocess.run(
    [python_exe, '/home/code/score_submission.py', fixed_path],
    capture_output=True,
    text=True,
)
print(result.stdout)
print(result.stderr)
# Surface a failed run explicitly instead of leaving it implicit in stderr.
if result.returncode != 0:
    print(f'Scoring script exited with code {result.returncode}')