# Models Training Status

In this notebook there are scripts to check which models are there and which are missing.

In [1]:
base_path = "/loss_landscape/checkpoint/different_knobs_subset_10/"
sizes = ['small', 'baseline', 'large']
batch_sizes = [16, 32, 64, 128, 256, 512, 1024]
learning_rates = [0.1, 0.05, 0.025, 0.0125, 0.00625, 0.003125, 0.0015625]
precisions = [2, 3, 4, 5, 6, 7, 8, 9, 10, 11]

In [5]:
missing = []
for bs in batch_sizes:
    for lr in learning_rates:
        for precision in precisions:
            for size in sizes:
                print(f'BATCH SIZE: {bs} - LEARNING RATE {lr} - SIZE {size} - PRECISION {precision}')
                for exp in range(1, 3):
                    file_path = base_path + f'bs{bs}_lr{lr}/ECON_{precision}b/{size}/{size}_emd_{exp}.txt'
                    try:
                        with open(file_path, 'r') as file:
                            content = file.read()
                            print("AVG EMD: ", content)

                    except Exception as e:
                        missing.append((bs, lr, size))
                        continue


BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE small - PRECISION 2
AVG EMD:  [{'AVG_EMD': 7.402425289154053}]
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE baseline - PRECISION 2
AVG EMD:  [{'AVG_EMD': -0.5}]
AVG EMD:  [{'AVG_EMD': -0.5}]
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE large - PRECISION 2
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE small - PRECISION 3
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE baseline - PRECISION 3
AVG EMD:  [{'AVG_EMD': -0.5}]
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE large - PRECISION 3
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE small - PRECISION 4
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE baseline - PRECISION 4
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE large - PRECISION 4
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE small - PRECISION 5
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE baseline - PRECISION 5
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE large - PRECISION 5
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE small - PRECISION 6
BATCH SIZE: 16 - LEARNING RATE 0.1 - SIZE baselin

In [8]:
sorted_missing = sorted(missing, key=lambda x: x[2])

In [12]:
for tmp in set(sorted_missing):
    if tmp[0] == 1024:
        print(f'{tmp[0]}\t\t{tmp[1]}\t\t{tmp[2]}')


1024		0.05		baseline
1024		0.003125		baseline
1024		0.00625		large
1024		0.003125		small
1024		0.1		baseline
1024		0.1		large
1024		0.0015625		large
1024		0.003125		large
1024		0.025		large
1024		0.025		small


In [13]:
for tmp in set(sorted_missing):
    if tmp[0] == 512:
        print(f'{tmp[0]}\t\t{tmp[1]}\t\t{tmp[2]}')

512		0.0015625		small
512		0.003125		baseline
512		0.00625		baseline
512		0.00625		large
512		0.00625		small
512		0.05		large
512		0.1		baseline
512		0.1		large
512		0.1		small
512		0.0015625		large
512		0.003125		large
512		0.003125		small
512		0.025		baseline
512		0.025		large
512		0.025		small
512		0.0125		large
512		0.05		baseline
512		0.0015625		baseline


In [14]:

for tmp in set(missing):
    if tmp[0] == 256:
        print(tmp[0], tmp[1], tmp[2])

256 0.1 baseline
256 0.025 baseline
256 0.0125 baseline
256 0.00625 small
256 0.05 small
256 0.00625 large
256 0.05 baseline
256 0.1 small
256 0.05 large
256 0.0015625 small
256 0.1 large
256 0.0015625 baseline
256 0.025 small
256 0.0015625 large
256 0.0125 small
256 0.025 large
256 0.003125 small
256 0.0125 large
256 0.003125 baseline
256 0.00625 baseline
256 0.003125 large


In [15]:
for tmp in set(missing):
    if tmp[0] == 128:
        print(tmp[0], tmp[1], tmp[2])

128 0.05 baseline
128 0.05 large
128 0.025 small
128 0.0015625 small
128 0.025 large
128 0.0015625 large
128 0.00625 small
128 0.00625 large
128 0.1 small
128 0.1 large
128 0.025 baseline
128 0.0125 small
128 0.0015625 baseline
128 0.003125 small
128 0.003125 baseline
128 0.00625 baseline
128 0.003125 large
128 0.1 baseline
128 0.0125 baseline
128 0.0125 large
128 0.05 small


In [16]:
for tmp in set(missing):
    if tmp[0] == 64:
        print(tmp[0], tmp[1], tmp[2])

64 0.0125 large
64 0.00625 baseline
64 0.025 baseline
64 0.0125 baseline
64 0.003125 small
64 0.003125 large
64 0.05 small
64 0.003125 baseline
64 0.05 baseline
64 0.05 large
64 0.0015625 small
64 0.0015625 baseline
64 0.0015625 large
64 0.00625 small
64 0.00625 large
64 0.1 small
64 0.1 baseline
64 0.1 large
64 0.025 small
64 0.0125 small
64 0.025 large


In [17]:
for tmp in set(missing):
    if tmp[0] == 32:
        print(tmp[0], tmp[1], tmp[2])

32 0.0125 small
32 0.0125 baseline
32 0.0125 large
32 0.05 small
32 0.003125 baseline
32 0.05 large
32 0.00625 small
32 0.00625 large
32 0.05 baseline
32 0.025 small
32 0.0015625 small
32 0.025 large
32 0.0015625 large
32 0.00625 baseline
32 0.1 small
32 0.1 large
32 0.025 baseline
32 0.0015625 baseline
32 0.003125 small
32 0.003125 large
32 0.1 baseline


In [18]:
for tmp in set(missing):
    if tmp[0] == 16:
        print(tmp[0], tmp[1], tmp[2])

16 0.003125 baseline
16 0.05 small
16 0.0125 baseline
16 0.05 large
16 0.05 baseline
16 0.0015625 small
16 0.025 small
16 0.0015625 large
16 0.025 baseline
16 0.025 large
16 0.003125 small
16 0.00625 small
16 0.00625 baseline
16 0.003125 large
16 0.00625 large
16 0.1 small
16 0.1 baseline
16 0.1 large
16 0.0015625 baseline
16 0.0125 small
16 0.0125 large
