# Loop 65 Analysis: Major Breakthrough with Ens Model Approach

**Key Event**: Experiment 069 achieved CV = 0.005146, a 35.17% improvement!

**Critical Question**: Does this approach have a DIFFERENT CV-LB relationship?

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from scipy import stats

# All submissions with CV and LB scores
submissions = [
    {'exp': 'exp_000', 'cv': 0.0111, 'lb': 0.0982},
    {'exp': 'exp_001', 'cv': 0.0123, 'lb': 0.1065},
    {'exp': 'exp_003', 'cv': 0.0105, 'lb': 0.0972},
    {'exp': 'exp_005', 'cv': 0.0104, 'lb': 0.0969},
    {'exp': 'exp_006', 'cv': 0.0097, 'lb': 0.0946},
    {'exp': 'exp_007', 'cv': 0.0093, 'lb': 0.0932},
    {'exp': 'exp_009', 'cv': 0.0092, 'lb': 0.0936},
    {'exp': 'exp_012', 'cv': 0.0090, 'lb': 0.0913},
    {'exp': 'exp_024', 'cv': 0.0087, 'lb': 0.0893},
    {'exp': 'exp_026', 'cv': 0.0085, 'lb': 0.0887},
    {'exp': 'exp_030', 'cv': 0.0083, 'lb': 0.0877},
    {'exp': 'exp_041', 'cv': 0.0090, 'lb': 0.0932},
    {'exp': 'exp_042', 'cv': 0.0145, 'lb': 0.1147},
]

df = pd.DataFrame(submissions)
print(f'Total submissions: {len(df)}')
print(df)

Total submissions: 13
        exp      cv      lb
0   exp_000  0.0111  0.0982
1   exp_001  0.0123  0.1065
2   exp_003  0.0105  0.0972
3   exp_005  0.0104  0.0969
4   exp_006  0.0097  0.0946
5   exp_007  0.0093  0.0932
6   exp_009  0.0092  0.0936
7   exp_012  0.0090  0.0913
8   exp_024  0.0087  0.0893
9   exp_026  0.0085  0.0887
10  exp_030  0.0083  0.0877
11  exp_041  0.0090  0.0932
12  exp_042  0.0145  0.1147


In [2]:
# Fit linear regression: LB = slope * CV + intercept
slope, intercept, r_value, p_value, std_err = stats.linregress(df['cv'], df['lb'])

print(f'CV-LB Relationship (13 submissions):')
print(f'  LB = {slope:.2f} * CV + {intercept:.4f}')
print(f'  R-squared = {r_value**2:.4f}')
print(f'  Intercept = {intercept:.4f}')
print(f'\nInterpretation:')
print(f'  Even at CV=0, expected LB would be {intercept:.4f}')
print(f'  Target LB: 0.0347')
print(f'  Gap: {intercept - 0.0347:.4f} (intercept > target!)')

CV-LB Relationship (13 submissions):
  LB = 4.23 * CV + 0.0533
  R-squared = 0.9807
  Intercept = 0.0533

Interpretation:
  Even at CV=0, expected LB would be 0.0533
  Target LB: 0.0347
  Gap: 0.0186 (intercept > target!)


In [3]:
# Predict LB for new CV = 0.005146 using old relationship
new_cv = 0.005146
predicted_lb = slope * new_cv + intercept

print(f'\nPrediction for exp_069 (CV = {new_cv}):')
print(f'  Using old relationship: LB = {slope:.2f} * {new_cv} + {intercept:.4f}')
print(f'  Predicted LB = {predicted_lb:.4f}')
print(f'\nBest LB so far: 0.0877 (exp_030)')
print(f'Predicted improvement: {(0.0877 - predicted_lb) / 0.0877 * 100:.1f}%')


Prediction for exp_069 (CV = 0.005146):
  Using old relationship: LB = 4.23 * 0.005146 + 0.0533
  Predicted LB = 0.0751

Best LB so far: 0.0877 (exp_030)
Predicted improvement: 14.4%


In [4]:
# Summary of key findings
print('='*60)
print('KEY FINDINGS FOR SEED PROMPT')
print('='*60)

print('\n1. MAJOR BREAKTHROUGH: exp_069 achieved CV = 0.005146 (35% improvement)')
print('   - CatBoost + XGBoost ensemble with feature priority filtering')
print('   - Full Data MSE improved by 62% (0.007789 -> 0.002992)')
print('   - Single Solvent MSE slightly worse (0.008216 -> 0.009175)')

print('\n2. CV-LB RELATIONSHIP: LB = 4.21*CV + 0.0535 (R-squared = 0.98)')
print('   - Intercept (0.0535) > Target (0.0347)')
print('   - Target is UNREACHABLE with current relationship')

print('\n3. PREDICTED LB FOR exp_069: 0.0752')
print('   - Would be best LB achieved (vs current best 0.0877)')
print('   - But still far from target (0.0347)')

print('\n4. CRITICAL QUESTION: Does exp_069 have a DIFFERENT CV-LB relationship?')
print('   - This is the key hypothesis to test with a submission')
print('   - If yes, target may become reachable')
print('   - If no, we need to find other approaches')

print('\n5. RECOMMENDATION: SUBMIT exp_069 IMMEDIATELY')
print('   - 5 submissions remaining')
print('   - This is the most important submission to make')
print('   - Will reveal if the CV-LB relationship has changed')

KEY FINDINGS FOR SEED PROMPT

1. MAJOR BREAKTHROUGH: exp_069 achieved CV = 0.005146 (35% improvement)
   - CatBoost + XGBoost ensemble with feature priority filtering
   - Full Data MSE improved by 62% (0.007789 -> 0.002992)
   - Single Solvent MSE slightly worse (0.008216 -> 0.009175)

2. CV-LB RELATIONSHIP: LB = 4.21*CV + 0.0535 (R-squared = 0.98)
   - Intercept (0.0535) > Target (0.0347)
   - Target is UNREACHABLE with current relationship

3. PREDICTED LB FOR exp_069: 0.0752
   - Would be best LB achieved (vs current best 0.0877)
   - But still far from target (0.0347)

4. CRITICAL QUESTION: Does exp_069 have a DIFFERENT CV-LB relationship?
   - This is the key hypothesis to test with a submission
   - If yes, target may become reachable
   - If no, we need to find other approaches

5. RECOMMENDATION: SUBMIT exp_069 IMMEDIATELY
   - 5 submissions remaining
   - This is the most important submission to make
   - Will reveal if the CV-LB relationship has changed
