In [1]:
import re

In [3]:
def extract_metrics(data: str, ndigits: int = 4) -> str:
    """Extract recall/mrr/ndcg@k values from wandb-formatted text.

    Each line of ``data`` is searched for
    ``wandb: train/predict_<metric>@<k> <value>``. Lines that do not match,
    and metrics other than recall, mrr and ndcg, are ignored. When the same
    metric/k pair appears more than once, the last occurrence wins.

    Args:
        data: Multi-line text containing wandb-style metric lines.
        ndigits: Number of decimal places each value is rounded to.

    Returns:
        The rounded values joined with ", ": every recall@k first, then every
        mrr@k, then every ndcg@k, each group sorted by ascending k. Values are
        rendered with ``str``, so trailing zeros are not padded (0.1560 is
        rendered as "0.156"). An empty string is returned when nothing matches.
    """
    # The value group accepts an optional sign and exponent. A plain [\d.]+
    # group stops at the "e" of a value such as "2.5e-02" and reads it as 2.5.
    metric_line = re.compile(
        r'wandb:\s+train/predict_(\w+)@(\d+)\s+'
        r'([-+]?(?:\d+\.?\d*|\.\d+)(?:[eE][-+]?\d+)?)'
    )

    metrics = {"recall": {}, "mrr": {}, "ndcg": {}}

    for line in data.splitlines():
        match = metric_line.search(line)
        if match is None:
            continue
        metric, k, value = match.groups()
        if metric in metrics:
            metrics[metric][int(k)] = round(float(value), ndigits)

    # Output order: recall, mrr, ndcg; within each metric, ascending k.
    return ", ".join(
        str(metrics[metric][k])
        for metric in ("recall", "mrr", "ndcg")
        for k in sorted(metrics[metric])
    )

In [5]:
# 1 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.53936
wandb:              train/predict_mrr@1 0.02624
wandb:             train/predict_mrr@10 0.04874
wandb:             train/predict_mrr@20 0.05157
wandb:              train/predict_mrr@5 0.0431
wandb:             train/predict_mrr@50 0.05403
wandb:             train/predict_ndcg@1 0.02624
wandb:            train/predict_ndcg@10 0.06451
wandb:            train/predict_ndcg@20 0.07459
wandb:             train/predict_ndcg@5 0.05085
wandb:            train/predict_ndcg@50 0.08992
wandb:           train/predict_recall@1 0.02624
wandb:          train/predict_recall@10 0.11662
wandb:          train/predict_recall@20 0.15598
wandb:           train/predict_recall@5 0.07434
wandb:          train/predict_recall@50 0.23324
wandb:            train/predict_runtime 25.6633
wandb: train/predict_samples_per_second 26.731
wandb:   train/predict_steps_per_second 3.351
wandb:                       train_loss 7.62746
wandb:                    train_runtime 6074.3743
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0262, 0.0743, 0.1166, 0.156, 0.2332, 0.0262, 0.0431, 0.0487, 0.0516, 0.054, 0.0262, 0.0508, 0.0645, 0.0746, 0.0899


In [6]:
# 1 - 5e-7
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.3281
wandb:               train/predict_loss 7.64185
wandb:              train/predict_mrr@1 0.01895
wandb:             train/predict_mrr@10 0.03742
wandb:             train/predict_mrr@20 0.0397
wandb:              train/predict_mrr@5 0.03214
wandb:             train/predict_mrr@50 0.04171
wandb:             train/predict_ndcg@1 0.01895
wandb:            train/predict_ndcg@10 0.0526
wandb:            train/predict_ndcg@20 0.06127
wandb:             train/predict_ndcg@5 0.03957
wandb:            train/predict_ndcg@50 0.07455
wandb:           train/predict_recall@1 0.01895
wandb:          train/predict_recall@10 0.1035
wandb:          train/predict_recall@20 0.13848
wandb:           train/predict_recall@5 0.06268
wandb:          train/predict_recall@50 0.207
wandb:            train/predict_runtime 25.6917
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.019, 0.0627, 0.1035, 0.1385, 0.207, 0.019, 0.0321, 0.0374, 0.0397, 0.0417, 0.019, 0.0396, 0.0526, 0.0613, 0.0746


In [7]:
# 1 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                      train/epoch 1
wandb:                train/global_step 3343
wandb:                  train/grad_norm 45.71592
wandb:              train/learning_rate 1e-05
wandb:                       train/loss 6.3125
wandb:               train/predict_loss 7.46374
wandb:              train/predict_mrr@1 0.03061
wandb:             train/predict_mrr@10 0.05734
wandb:             train/predict_mrr@20 0.06105
wandb:              train/predict_mrr@5 0.05236
wandb:             train/predict_mrr@50 0.06351
wandb:             train/predict_ndcg@1 0.03061
wandb:            train/predict_ndcg@10 0.07532
wandb:            train/predict_ndcg@20 0.08891
wandb:             train/predict_ndcg@5 0.06313
wandb:            train/predict_ndcg@50 0.10424
wandb:           train/predict_recall@1 0.03061
wandb:          train/predict_recall@10 0.13411
wandb:          train/predict_recall@20 0.18805
wandb:           train/predict_recall@5 0.09621
wandb:          train/predict_recall@50 0.26531
wandb:            train/predict_runtime 25.9373
wandb: train/predict_samples_per_second 26.448
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0306, 0.0962, 0.1341, 0.188, 0.2653, 0.0306, 0.0524, 0.0573, 0.0611, 0.0635, 0.0306, 0.0631, 0.0753, 0.0889, 0.1042


In [8]:
# 2 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.2422
wandb:               train/predict_loss 7.57152
wandb:              train/predict_mrr@1 0.02041
wandb:             train/predict_mrr@10 0.04303
wandb:             train/predict_mrr@20 0.04576
wandb:              train/predict_mrr@5 0.03822
wandb:             train/predict_mrr@50 0.04751
wandb:             train/predict_ndcg@1 0.02041
wandb:            train/predict_ndcg@10 0.05915
wandb:            train/predict_ndcg@20 0.06933
wandb:             train/predict_ndcg@5 0.04742
wandb:            train/predict_ndcg@50 0.0807
wandb:           train/predict_recall@1 0.02041
wandb:          train/predict_recall@10 0.11224
wandb:          train/predict_recall@20 0.15306
wandb:           train/predict_recall@5 0.0758
wandb:          train/predict_recall@50 0.21137
wandb:            train/predict_runtime 25.05
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0204, 0.0758, 0.1122, 0.1531, 0.2114, 0.0204, 0.0382, 0.043, 0.0458, 0.0475, 0.0204, 0.0474, 0.0592, 0.0693, 0.0807


In [4]:
# 2 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.45445
wandb:              train/predict_mrr@1 0.03499
wandb:             train/predict_mrr@10 0.05964
wandb:             train/predict_mrr@20 0.06237
wandb:              train/predict_mrr@5 0.05345
wandb:             train/predict_mrr@50 0.06486
wandb:             train/predict_ndcg@1 0.03499
wandb:            train/predict_ndcg@10 0.07756
wandb:            train/predict_ndcg@20 0.08824
wandb:             train/predict_ndcg@5 0.06251
wandb:            train/predict_ndcg@50 0.10341
wandb:           train/predict_recall@1 0.03499
wandb:          train/predict_recall@10 0.13703
wandb:          train/predict_recall@20 0.18076
wandb:           train/predict_recall@5 0.09038
wandb:          train/predict_recall@50 0.25656
wandb:            train/predict_runtime 25.1426
wandb: train/predict_samples_per_second 27.284
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.035, 0.0904, 0.137, 0.1808, 0.2566, 0.035, 0.0534, 0.0596, 0.0624, 0.0649, 0.035, 0.0625, 0.0776, 0.0882, 0.1034


In [5]:
# 4 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                      train/epoch 0.9991
wandb:                train/global_step 835
wandb:                  train/grad_norm 32.22339
wandb:              train/learning_rate 0.0
wandb:                       train/loss 7.3672
wandb:               train/predict_loss 7.65561
wandb:              train/predict_mrr@1 0.01895
wandb:             train/predict_mrr@10 0.03445
wandb:             train/predict_mrr@20 0.0367
wandb:              train/predict_mrr@5 0.03034
wandb:             train/predict_mrr@50 0.03901
wandb:             train/predict_ndcg@1 0.01895
wandb:            train/predict_ndcg@10 0.04602
wandb:            train/predict_ndcg@20 0.05417
wandb:             train/predict_ndcg@5 0.03611
wandb:            train/predict_ndcg@50 0.0684
wandb:           train/predict_recall@1 0.01895
wandb:          train/predict_recall@10 0.08455
wandb:          train/predict_recall@20 0.11662
wandb:           train/predict_recall@5 0.05394
wandb:          train/predict_recall@50 0.18805
wandb:            train/predict_runtime 25.0011
wandb: train/predict_samples_per_second 27.439
wandb:   train/predict_steps_per_second 3.44
wandb:                       train_loss 7.92487
wandb:                    train_runtime 4894.9986
wandb:         train_samples_per_second 5.463
wandb:           train_steps_per_second 0.171
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.019, 0.0539, 0.0846, 0.1166, 0.188, 0.019, 0.0303, 0.0345, 0.0367, 0.039, 0.019, 0.0361, 0.046, 0.0542, 0.0684


In [6]:
# 4 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 6.9609
wandb:               train/predict_loss 7.47467
wandb:              train/predict_mrr@1 0.03353
wandb:             train/predict_mrr@10 0.05552
wandb:             train/predict_mrr@20 0.05807
wandb:              train/predict_mrr@5 0.04995
wandb:             train/predict_mrr@50 0.06101
wandb:             train/predict_ndcg@1 0.03353
wandb:            train/predict_ndcg@10 0.07238
wandb:            train/predict_ndcg@20 0.08185
wandb:             train/predict_ndcg@5 0.05877
wandb:            train/predict_ndcg@50 0.10029
wandb:           train/predict_recall@1 0.03353
wandb:          train/predict_recall@10 0.12828
wandb:          train/predict_recall@20 0.16618
wandb:           train/predict_recall@5 0.08601
wandb:          train/predict_recall@50 0.25948
wandb:            train/predict_runtime 25.1132
wandb: train/predict_samples_per_second 27.316
wandb:   train/predict_steps_per_second 3.424
wandb:                       train_loss 7.49882
wandb:                    train_runtime 4902.4247
wandb:         train_samples_per_second 5.454
wandb:           train_steps_per_second 0.17
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0335, 0.086, 0.1283, 0.1662, 0.2595, 0.0335, 0.05, 0.0555, 0.0581, 0.061, 0.0335, 0.0588, 0.0724, 0.0819, 0.1003


In [7]:
# 4 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.45882
wandb:              train/predict_mrr@1 0.03061
wandb:             train/predict_mrr@10 0.0561
wandb:             train/predict_mrr@20 0.05892
wandb:              train/predict_mrr@5 0.05022
wandb:             train/predict_mrr@50 0.06139
wandb:             train/predict_ndcg@1 0.03061
wandb:            train/predict_ndcg@10 0.07396
wandb:            train/predict_ndcg@20 0.08474
wandb:             train/predict_ndcg@5 0.05976
wandb:            train/predict_ndcg@50 0.10092
wandb:           train/predict_recall@1 0.03061
wandb:          train/predict_recall@10 0.13265
wandb:          train/predict_recall@20 0.17638
wandb:           train/predict_recall@5 0.08892
wandb:          train/predict_recall@50 0.25948
wandb:            train/predict_runtime 26.5689
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0306, 0.0889, 0.1326, 0.1764, 0.2595, 0.0306, 0.0502, 0.0561, 0.0589, 0.0614, 0.0306, 0.0598, 0.074, 0.0847, 0.1009


In [8]:
# 8 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.50784
wandb:              train/predict_mrr@1 0.03061
wandb:             train/predict_mrr@10 0.05312
wandb:             train/predict_mrr@20 0.05583
wandb:              train/predict_mrr@5 0.04798
wandb:             train/predict_mrr@50 0.05805
wandb:             train/predict_ndcg@1 0.03061
wandb:            train/predict_ndcg@10 0.06955
wandb:            train/predict_ndcg@20 0.07972
wandb:             train/predict_ndcg@5 0.05694
wandb:            train/predict_ndcg@50 0.09338
wandb:           train/predict_recall@1 0.03061
wandb:          train/predict_recall@10 0.12391
wandb:          train/predict_recall@20 0.16472
wandb:           train/predict_recall@5 0.08455
wandb:          train/predict_recall@50 0.23324
wandb:            train/predict_runtime 27.7107
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0306, 0.0846, 0.1239, 0.1647, 0.2332, 0.0306, 0.048, 0.0531, 0.0558, 0.058, 0.0306, 0.0569, 0.0696, 0.0797, 0.0934


In [5]:
# 8 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.45882
wandb:              train/predict_mrr@1 0.02478
wandb:             train/predict_mrr@10 0.05086
wandb:             train/predict_mrr@20 0.0547
wandb:              train/predict_mrr@5 0.04568
wandb:             train/predict_mrr@50 0.05676
wandb:             train/predict_ndcg@1 0.02478
wandb:            train/predict_ndcg@10 0.06797
wandb:            train/predict_ndcg@20 0.08221
wandb:             train/predict_ndcg@5 0.05531
wandb:            train/predict_ndcg@50 0.09476
wandb:           train/predict_recall@1 0.02478
wandb:          train/predict_recall@10 0.12391
wandb:          train/predict_recall@20 0.18076
wandb:           train/predict_recall@5 0.08455
wandb:          train/predict_recall@50 0.24344
wandb:            train/predict_runtime 27.3504
wandb: train/predict_samples_per_second 25.082
wandb:   train/predict_steps_per_second 3.144
wandb:                       train_loss 7.48349
wandb:                    train_runtime 5049.1253
wandb:         train_samples_per_second 5.296
wandb:           train_steps_per_second 0.083
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0248, 0.0846, 0.1239, 0.1808, 0.2434, 0.0248, 0.0457, 0.0509, 0.0547, 0.0568, 0.0248, 0.0553, 0.068, 0.0822, 0.0948


In [7]:
# 16 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.58856
wandb:              train/predict_mrr@1 0.02332
wandb:             train/predict_mrr@10 0.043
wandb:             train/predict_mrr@20 0.04605
wandb:              train/predict_mrr@5 0.03865
wandb:             train/predict_mrr@50 0.04832
wandb:             train/predict_ndcg@1 0.02332
wandb:            train/predict_ndcg@10 0.05614
wandb:            train/predict_ndcg@20 0.06697
wandb:             train/predict_ndcg@5 0.04571
wandb:            train/predict_ndcg@50 0.08134
wandb:           train/predict_recall@1 0.02332
wandb:          train/predict_recall@10 0.09913
wandb:          train/predict_recall@20 0.1414
wandb:           train/predict_recall@5 0.06706
wandb:          train/predict_recall@50 0.21429
wandb:            train/predict_runtime 26.6928
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0233, 0.0671, 0.0991, 0.1414, 0.2143, 0.0233, 0.0386, 0.043, 0.0461, 0.0483, 0.0233, 0.0457, 0.0561, 0.067, 0.0813


In [4]:
# 16 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                      train/epoch 0.99551
wandb:                train/global_step 208
wandb:                  train/grad_norm 14.48255
wandb:              train/learning_rate 1e-05
wandb:                       train/loss 7.208
wandb:               train/predict_loss 7.5246
wandb:              train/predict_mrr@1 0.02624
wandb:             train/predict_mrr@10 0.04704
wandb:             train/predict_mrr@20 0.05015
wandb:              train/predict_mrr@5 0.0421
wandb:             train/predict_mrr@50 0.05256
wandb:             train/predict_ndcg@1 0.02624
wandb:            train/predict_ndcg@10 0.06218
wandb:            train/predict_ndcg@20 0.07381
wandb:             train/predict_ndcg@5 0.05005
wandb:            train/predict_ndcg@50 0.08843
wandb:           train/predict_recall@1 0.02624
wandb:          train/predict_recall@10 0.11224
wandb:          train/predict_recall@20 0.15889
wandb:           train/predict_recall@5 0.07434
wandb:          train/predict_recall@50 0.23178
wandb:            train/predict_runtime 25.3082
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0262, 0.0743, 0.1122, 0.1589, 0.2318, 0.0262, 0.0421, 0.047, 0.0502, 0.0526, 0.0262, 0.05, 0.0622, 0.0738, 0.0884


In [4]:
# 2 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.48506
wandb:              train/predict_mrr@1 0.02478
wandb:             train/predict_mrr@10 0.04847
wandb:             train/predict_mrr@20 0.0528
wandb:              train/predict_mrr@5 0.04424
wandb:             train/predict_mrr@50 0.05548
wandb:             train/predict_ndcg@1 0.02478
wandb:            train/predict_ndcg@10 0.06479
wandb:            train/predict_ndcg@20 0.08061
wandb:             train/predict_ndcg@5 0.05447
wandb:            train/predict_ndcg@50 0.09736
wandb:           train/predict_recall@1 0.02478
wandb:          train/predict_recall@10 0.11808
wandb:          train/predict_recall@20 0.18076
wandb:           train/predict_recall@5 0.08601
wandb:          train/predict_recall@50 0.26531
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0248, 0.086, 0.1181, 0.1808, 0.2653, 0.0248, 0.0442, 0.0485, 0.0528, 0.0555, 0.0248, 0.0545, 0.0648, 0.0806, 0.0974


In [5]:
# 16 - 5e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.72631
wandb:              train/predict_mrr@1 0.00729
wandb:             train/predict_mrr@10 0.02231
wandb:             train/predict_mrr@20 0.02385
wandb:              train/predict_mrr@5 0.01866
wandb:             train/predict_mrr@50 0.02563
wandb:             train/predict_ndcg@1 0.00729
wandb:            train/predict_ndcg@10 0.03274
wandb:            train/predict_ndcg@20 0.03879
wandb:             train/predict_ndcg@5 0.02411
wandb:            train/predict_ndcg@50 0.04981
wandb:           train/predict_recall@1 0.00729
wandb:          train/predict_recall@10 0.06706
wandb:          train/predict_recall@20 0.09184
wandb:           train/predict_recall@5 0.04082
wandb:          train/predict_recall@50 0.14723
wandb:            train/predict_runtime 26.1123
wandb: train/predict_samples_per_second 26.271
wandb:   train/predict_steps_per_second 3.293
wandb:                       train_loss 7.85202
wandb:                    train_runtime 4812.0079
wandb:         train_samples_per_second 5.557
wandb:           train_steps_per_second 0.043
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0073, 0.0408, 0.0671, 0.0918, 0.1472, 0.0073, 0.0187, 0.0223, 0.0238, 0.0256, 0.0073, 0.0241, 0.0327, 0.0388, 0.0498


In [6]:
# 32 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.53754
wandb:              train/predict_mrr@1 0.01895
wandb:             train/predict_mrr@10 0.04241
wandb:             train/predict_mrr@20 0.04475
wandb:              train/predict_mrr@5 0.03785
wandb:             train/predict_mrr@50 0.0474
wandb:             train/predict_ndcg@1 0.01895
wandb:            train/predict_ndcg@10 0.0581
wandb:            train/predict_ndcg@20 0.0666
wandb:             train/predict_ndcg@5 0.04718
wandb:            train/predict_ndcg@50 0.08393
wandb:           train/predict_recall@1 0.01895
wandb:          train/predict_recall@10 0.10933
wandb:          train/predict_recall@20 0.14286
wandb:           train/predict_recall@5 0.0758
wandb:          train/predict_recall@50 0.23178
wandb:            train/predict_runtime 25.3417
wandb: train/predict_samples_per_second 27.07
wandb:   train/predict_steps_per_second 3.394
wandb:                       train_loss 7.75324
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.019, 0.0758, 0.1093, 0.1429, 0.2318, 0.019, 0.0379, 0.0424, 0.0447, 0.0474, 0.019, 0.0472, 0.0581, 0.0666, 0.0839


In [7]:
# 32 - 5e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.58582
wandb:              train/predict_mrr@1 0.02041
wandb:             train/predict_mrr@10 0.0396
wandb:             train/predict_mrr@20 0.04274
wandb:              train/predict_mrr@5 0.03671
wandb:             train/predict_mrr@50 0.04554
wandb:             train/predict_ndcg@1 0.02041
wandb:            train/predict_ndcg@10 0.05124
wandb:            train/predict_ndcg@20 0.06316
wandb:             train/predict_ndcg@5 0.0442
wandb:            train/predict_ndcg@50 0.0801
wandb:           train/predict_recall@1 0.02041
wandb:          train/predict_recall@10 0.08892
wandb:          train/predict_recall@20 0.13703
wandb:           train/predict_recall@5 0.06706
wandb:          train/predict_recall@50 0.22157
wandb:            train/predict_runtime 25.3675
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))


0.0204, 0.0671, 0.0889, 0.137, 0.2216, 0.0204, 0.0367, 0.0396, 0.0427, 0.0455, 0.0204, 0.0442, 0.0512, 0.0632, 0.0801


In [8]:
# 64 - 5e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.60313
wandb:              train/predict_mrr@1 0.0102
wandb:             train/predict_mrr@10 0.0279
wandb:             train/predict_mrr@20 0.0312
wandb:              train/predict_mrr@5 0.02306
wandb:             train/predict_mrr@50 0.03338
wandb:             train/predict_ndcg@1 0.0102
wandb:            train/predict_ndcg@10 0.04069
wandb:            train/predict_ndcg@20 0.05304
wandb:             train/predict_ndcg@5 0.02892
wandb:            train/predict_ndcg@50 0.06703
wandb:           train/predict_recall@1 0.0102
wandb:          train/predict_recall@10 0.08309
wandb:          train/predict_recall@20 0.13265
wandb:           train/predict_recall@5 0.04665
wandb:          train/predict_recall@50 0.20408
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0102, 0.0466, 0.0831, 0.1326, 0.2041, 0.0102, 0.0231, 0.0279, 0.0312, 0.0334, 0.0102, 0.0289, 0.0407, 0.053, 0.067


In [3]:
# New data (Qwen)

# 1 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.59157
wandb:              train/predict_mrr@1 0.01453
wandb:             train/predict_mrr@10 0.0379
wandb:             train/predict_mrr@20 0.04104
wandb:              train/predict_mrr@5 0.03275
wandb:             train/predict_mrr@50 0.04304
wandb:             train/predict_ndcg@1 0.01453
wandb:            train/predict_ndcg@10 0.05413
wandb:            train/predict_ndcg@20 0.06578
wandb:             train/predict_ndcg@5 0.04152
wandb:            train/predict_ndcg@50 0.0788
wandb:           train/predict_recall@1 0.01453
wandb:          train/predict_recall@10 0.10756
wandb:          train/predict_recall@20 0.15407
wandb:           train/predict_recall@5 0.06831
wandb:          train/predict_recall@50 0.22093
wandb:            train/predict_runtime 17.0051
wandb: train/predict_samples_per_second 40.459
wandb:   train/predict_steps_per_second 5.057
wandb:                       train_loss 7.74529
wandb:                    train_runtime 5272.1581
wandb:         train_samples_per_second 5.083
wandb:           train_steps_per_second 0.635
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0145, 0.0683, 0.1076, 0.1541, 0.2209, 0.0145, 0.0328, 0.0379, 0.041, 0.043, 0.0145, 0.0415, 0.0541, 0.0658, 0.0788


In [4]:
# 2 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                  train/grad_norm 26.937
wandb:              train/learning_rate 0.0
wandb:                       train/loss 7.9688
wandb:               train/predict_loss 7.63463
wandb:              train/predict_mrr@1 0.01308
wandb:             train/predict_mrr@10 0.0321
wandb:             train/predict_mrr@20 0.03421
wandb:              train/predict_mrr@5 0.02798
wandb:             train/predict_mrr@50 0.03659
wandb:             train/predict_ndcg@1 0.01308
wandb:            train/predict_ndcg@10 0.04466
wandb:            train/predict_ndcg@20 0.05261
wandb:             train/predict_ndcg@5 0.03473
wandb:            train/predict_ndcg@50 0.06797
wandb:           train/predict_recall@1 0.01308
wandb:          train/predict_recall@10 0.08576
wandb:          train/predict_recall@20 0.11773
wandb:           train/predict_recall@5 0.05523
wandb:          train/predict_recall@50 0.19622
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))



0.0131, 0.0552, 0.0858, 0.1177, 0.1962, 0.0131, 0.028, 0.0321, 0.0342, 0.0366, 0.0131, 0.0347, 0.0447, 0.0526, 0.068


In [4]:
# 4 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.4023
wandb:               train/predict_loss 7.68423
wandb:              train/predict_mrr@1 0.01599
wandb:             train/predict_mrr@10 0.02941
wandb:             train/predict_mrr@20 0.03166
wandb:              train/predict_mrr@5 0.02682
wandb:             train/predict_mrr@50 0.03348
wandb:             train/predict_ndcg@1 0.01599
wandb:            train/predict_ndcg@10 0.0386
wandb:            train/predict_ndcg@20 0.04647
wandb:             train/predict_ndcg@5 0.03269
wandb:            train/predict_ndcg@50 0.05796
wandb:           train/predict_recall@1 0.01599
wandb:          train/predict_recall@10 0.06831
wandb:          train/predict_recall@20 0.09884
wandb:           train/predict_recall@5 0.05087
wandb:          train/predict_recall@50 0.15698
wandb:            train/predict_runtime 16.7915
wandb: train/predict_samples_per_second 40.973
wandb:   train/predict_steps_per_second 5.122
wandb:                       train_loss 8.1028
wandb:                    train_runtime 2573.4131
wandb:         train_samples_per_second 10.414
wandb:           train_steps_per_second 0.325
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))


0.016, 0.0509, 0.0683, 0.0988, 0.157, 0.016, 0.0268, 0.0294, 0.0317, 0.0335, 0.016, 0.0327, 0.0386, 0.0465, 0.058


In [3]:
# 4 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:               train/predict_loss 7.48165
wandb:              train/predict_mrr@1 0.01163
wandb:             train/predict_mrr@10 0.03812
wandb:             train/predict_mrr@20 0.04116
wandb:              train/predict_mrr@5 0.03207
wandb:             train/predict_mrr@50 0.04376
wandb:             train/predict_ndcg@1 0.01163
wandb:            train/predict_ndcg@10 0.05664
wandb:            train/predict_ndcg@20 0.06817
wandb:             train/predict_ndcg@5 0.04176
wandb:            train/predict_ndcg@50 0.08412
wandb:           train/predict_recall@1 0.01163
wandb:          train/predict_recall@10 0.11773
wandb:          train/predict_recall@20 0.16424
wandb:           train/predict_recall@5 0.07122
wandb:          train/predict_recall@50 0.24419
wandb:            train/predict_runtime 16.2421
wandb: train/predict_samples_per_second 42.359
wandb:   train/predict_steps_per_second 5.295
wandb:                       train_loss 7.58607
wandb:                    train_runtime 2853.2199
wandb:         train_samples_per_second 9.393
wandb:           train_steps_per_second 0.293
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0116, 0.0712, 0.1177, 0.1642, 0.2442, 0.0116, 0.0321, 0.0381, 0.0412, 0.0438, 0.0116, 0.0418, 0.0566, 0.0682, 0.0841


In [9]:
# 8 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.4121
wandb:               train/predict_loss 7.51962
wandb:              train/predict_mrr@1 0.01453
wandb:             train/predict_mrr@10 0.03581
wandb:             train/predict_mrr@20 0.03887
wandb:              train/predict_mrr@5 0.02936
wandb:             train/predict_mrr@50 0.04134
wandb:             train/predict_ndcg@1 0.01453
wandb:            train/predict_ndcg@10 0.05228
wandb:            train/predict_ndcg@20 0.06359
wandb:             train/predict_ndcg@5 0.03645
wandb:            train/predict_ndcg@50 0.07911
wandb:           train/predict_recall@1 0.01453
wandb:          train/predict_recall@10 0.10756
wandb:          train/predict_recall@20 0.15262
wandb:           train/predict_recall@5 0.05814
wandb:          train/predict_recall@50 0.2311
wandb:            train/predict_runtime 17.9034
wandb: train/predict_samples_per_second 38.428
wandb:   train/predict_steps_per_second 4.804
wandb:                       train_loss 7.68341
wandb:                    train_runtime 2511.1749
wandb:         train_samples_per_second 10.672
wandb:           train_steps_per_second 0.166
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0145, 0.0581, 0.1076, 0.1526, 0.2311, 0.0145, 0.0294, 0.0358, 0.0389, 0.0413, 0.0145, 0.0365, 0.0523, 0.0636, 0.0791


In [3]:
# 8 - 1e-5
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:              train/learning_rate 1e-05
wandb:                       train/loss 7.3086
wandb:               train/predict_loss 7.49491
wandb:              train/predict_mrr@1 0.01163
wandb:             train/predict_mrr@10 0.03202
wandb:             train/predict_mrr@20 0.03641
wandb:              train/predict_mrr@5 0.02754
wandb:             train/predict_mrr@50 0.03891
wandb:             train/predict_ndcg@1 0.01163
wandb:            train/predict_ndcg@10 0.04695
wandb:            train/predict_ndcg@20 0.06307
wandb:             train/predict_ndcg@5 0.03612
wandb:            train/predict_ndcg@50 0.07864
wandb:           train/predict_recall@1 0.01163
wandb:          train/predict_recall@10 0.09593
wandb:          train/predict_recall@20 0.15988
wandb:           train/predict_recall@5 0.0625
wandb:          train/predict_recall@50 0.23837
wandb:            train/predict_runtime 17.384
wandb: train/predict_samples_per_second 39.577
wandb:   train/predict_steps_per_second 4.947
wandb:                       train_loss 7.57469
wandb:                    train_runtime 2727.7652
wandb:         train_samples_per_second 9.825
wandb:           train_steps_per_second 0.153
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0116, 0.0625, 0.0959, 0.1599, 0.2384, 0.0116, 0.0275, 0.032, 0.0364, 0.0389, 0.0116, 0.0361, 0.0469, 0.0631, 0.0786


In [4]:
## 0325 data update

# 1 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.7031
wandb:               train/predict_loss 7.65493
wandb:              train/predict_mrr@1 0.01306
wandb:             train/predict_mrr@10 0.02888
wandb:             train/predict_mrr@20 0.03255
wandb:              train/predict_mrr@5 0.02579
wandb:             train/predict_mrr@50 0.03502
wandb:             train/predict_ndcg@1 0.01306
wandb:            train/predict_ndcg@10 0.04045
wandb:            train/predict_ndcg@20 0.05396
wandb:             train/predict_ndcg@5 0.03295
wandb:            train/predict_ndcg@50 0.06966
wandb:           train/predict_recall@1 0.01306
wandb:          train/predict_recall@10 0.07837
wandb:          train/predict_recall@20 0.13208
wandb:           train/predict_recall@5 0.05515
wandb:          train/predict_recall@50 0.2119
wandb:            train/predict_runtime 17.2251
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))


0.0131, 0.0551, 0.0784, 0.1321, 0.2119, 0.0131, 0.0258, 0.0289, 0.0326, 0.035, 0.0131, 0.033, 0.0404, 0.054, 0.0697


In [5]:
# 1 - 5e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.
# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.6562
wandb:               train/predict_loss 7.56114
wandb:              train/predict_mrr@1 0.01742
wandb:             train/predict_mrr@10 0.03642
wandb:             train/predict_mrr@20 0.03954
wandb:              train/predict_mrr@5 0.03004
wandb:             train/predict_mrr@50 0.0426
wandb:             train/predict_ndcg@1 0.01742
wandb:            train/predict_ndcg@10 0.05175
wandb:            train/predict_ndcg@20 0.06361
wandb:             train/predict_ndcg@5 0.03655
wandb:            train/predict_ndcg@50 0.08328
wandb:           train/predict_recall@1 0.01742
wandb:          train/predict_recall@10 0.10305
wandb:          train/predict_recall@20 0.15094
wandb:           train/predict_recall@5 0.0566
wandb:          train/predict_recall@50 0.25109
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0174, 0.0566, 0.1031, 0.1509, 0.2511, 0.0174, 0.03, 0.0364, 0.0395, 0.0426, 0.0174, 0.0365, 0.0517, 0.0636, 0.0833


In [6]:
# 2 - 1e-6
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:                       train/loss 7.7109
wandb:               train/predict_loss 7.63253
wandb:              train/predict_mrr@1 0.01161
wandb:             train/predict_mrr@10 0.0281
wandb:             train/predict_mrr@20 0.03141
wandb:              train/predict_mrr@5 0.02242
wandb:             train/predict_mrr@50 0.03367
wandb:             train/predict_ndcg@1 0.01161
wandb:            train/predict_ndcg@10 0.04253
wandb:            train/predict_ndcg@20 0.05462
wandb:             train/predict_ndcg@5 0.0283
wandb:            train/predict_ndcg@50 0.06955
wandb:           train/predict_recall@1 0.01161
wandb:          train/predict_recall@10 0.09144
wandb:          train/predict_recall@20 0.13933
wandb:           train/predict_recall@5 0.04644
wandb:          train/predict_recall@50 0.21626
wandb:            train/predict_runtime 16.7603
wandb: train/predict_samples_per_second 41.109
wandb:   train/predict_steps_per_second 5.191
wandb:                       train_loss 7.87493
wandb:                    train_runtime 3137.4575
wandb:         train_samples_per_second 8.53
wandb:           train_steps_per_second 0.533
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0116, 0.0464, 0.0914, 0.1393, 0.2163, 0.0116, 0.0224, 0.0281, 0.0314, 0.0337, 0.0116, 0.0283, 0.0425, 0.0546, 0.0696


In [6]:
# New data (DeepSeek)

# 1 - 5e-7
# NOTE(review): run label as written by the author; what its two fields denote is not stated in this notebook - confirm.

# wandb-formatted metric lines for this run, pasted verbatim.
data = """
wandb:              train/learning_rate 0.0
wandb:                       train/loss 7.5156
wandb:               train/predict_loss 7.74729
wandb:              train/predict_mrr@1 0.01012
wandb:             train/predict_mrr@10 0.02332
wandb:             train/predict_mrr@20 0.02673
wandb:              train/predict_mrr@5 0.01879
wandb:             train/predict_mrr@50 0.02889
wandb:             train/predict_ndcg@1 0.01012
wandb:            train/predict_ndcg@10 0.0341
wandb:            train/predict_ndcg@20 0.04628
wandb:             train/predict_ndcg@5 0.02271
wandb:            train/predict_ndcg@50 0.05955
wandb:           train/predict_recall@1 0.01012
wandb:          train/predict_recall@10 0.07081
wandb:          train/predict_recall@20 0.1185
wandb:           train/predict_recall@5 0.03468
wandb:          train/predict_recall@50 0.18497
wandb:            train/predict_runtime 17.5363
wandb: train/predict_samples_per_second 39.461
wandb:   train/predict_steps_per_second 4.961
wandb:                       train_loss 7.971
wandb:                    train_runtime 3533.0826
wandb:         train_samples_per_second 7.597
wandb:           train_steps_per_second 0.95
"""

# Print recall@k, then mrr@k, then ndcg@k (ascending k) as one comma-separated line.
print(extract_metrics(data))

0.0101, 0.0347, 0.0708, 0.1185, 0.185, 0.0101, 0.0188, 0.0233, 0.0267, 0.0289, 0.0101, 0.0227, 0.0341, 0.0463, 0.0595


In [4]:
# Using the Qwen2.5-7B-Instruct model

# Pasted "wandb:"-prefixed summary lines for this run. extract_metrics() only
# matches the train/predict_<metric>@<k> rows for recall, mrr and ndcg; the
# predict_loss and predict_runtime rows are ignored.
data = """
wandb:               train/predict_loss 7.70203
wandb:              train/predict_mrr@1 0.01453
wandb:             train/predict_mrr@10 0.03198
wandb:             train/predict_mrr@20 0.03456
wandb:              train/predict_mrr@5 0.0272
wandb:             train/predict_mrr@50 0.03685
wandb:             train/predict_ndcg@1 0.01453
wandb:            train/predict_ndcg@10 0.04572
wandb:            train/predict_ndcg@20 0.05521
wandb:             train/predict_ndcg@5 0.03404
wandb:            train/predict_ndcg@50 0.06876
wandb:           train/predict_recall@1 0.01453
wandb:          train/predict_recall@10 0.09157
wandb:          train/predict_recall@20 0.12936
wandb:           train/predict_recall@5 0.05523
wandb:          train/predict_recall@50 0.19622
wandb:            train/predict_runtime 17.1406
"""

# Print one comma-separated line: recall values, then mrr, then ndcg, each in
# ascending k and rounded to 4 decimal places.
print(extract_metrics(data))



0.0145, 0.0552, 0.0916, 0.1294, 0.1962, 0.0145, 0.0272, 0.032, 0.0346, 0.0369, 0.0145, 0.034, 0.0457, 0.0552, 0.0688


In [3]:
# Updated data (0326)
# NOTE(review): "0326" is presumably the date 03-26 — confirm.

# Pasted "wandb:"-prefixed summary lines for this run. extract_metrics() only
# matches the train/predict_<metric>@<k> rows for recall, mrr and ndcg; the
# loss and runtime rows are ignored.
data = """
wandb:                       train/loss 7.125
wandb:               train/predict_loss 7.58543
wandb:              train/predict_mrr@1 0.01331
wandb:             train/predict_mrr@10 0.03431
wandb:             train/predict_mrr@20 0.03811
wandb:              train/predict_mrr@5 0.02848
wandb:             train/predict_mrr@50 0.04021
wandb:             train/predict_ndcg@1 0.01331
wandb:            train/predict_ndcg@10 0.05026
wandb:            train/predict_ndcg@20 0.06435
wandb:             train/predict_ndcg@5 0.03599
wandb:            train/predict_ndcg@50 0.07774
wandb:           train/predict_recall@1 0.01331
wandb:          train/predict_recall@10 0.10355
wandb:          train/predict_recall@20 0.15976
wandb:           train/predict_recall@5 0.05917
wandb:          train/predict_recall@50 0.22781
wandb:            train/predict_runtime 17.4182
"""

# Print one comma-separated line: recall values, then mrr, then ndcg, each in
# ascending k and rounded to 4 decimal places.
print(extract_metrics(data))


0.0133, 0.0592, 0.1036, 0.1598, 0.2278, 0.0133, 0.0285, 0.0343, 0.0381, 0.0402, 0.0133, 0.036, 0.0503, 0.0644, 0.0777


## 点击保留user + recommender

In [3]:
# 4 - 1e-6 - 1 epoch
# NOTE(review): the label above presumably encodes run hyperparameters
# (e.g. "<batch size> - <learning rate> - <epochs>") — confirm against the
# training config.

# Pasted "wandb:"-prefixed summary lines for this run. extract_metrics() only
# matches the train/predict_<metric>@<k> rows for recall, mrr and ndcg; the
# loss and runtime rows are ignored.
data = """
wandb:                       train/loss 7.6953
wandb:               train/predict_loss 7.79677
wandb:              train/predict_mrr@1 0.00824
wandb:             train/predict_mrr@10 0.01905
wandb:             train/predict_mrr@20 0.02135
wandb:              train/predict_mrr@5 0.01686
wandb:             train/predict_mrr@50 0.02358
wandb:             train/predict_ndcg@1 0.00824
wandb:            train/predict_ndcg@10 0.02611
wandb:            train/predict_ndcg@20 0.03465
wandb:             train/predict_ndcg@5 0.02058
wandb:            train/predict_ndcg@50 0.04882
wandb:           train/predict_recall@1 0.00824
wandb:          train/predict_recall@10 0.04945
wandb:          train/predict_recall@20 0.08352
wandb:           train/predict_recall@5 0.03187
wandb:          train/predict_recall@50 0.15549
wandb:            train/predict_runtime 46.6808
"""

# Print one comma-separated line: recall values, then mrr, then ndcg, each in
# ascending k and rounded to 4 decimal places.
print(extract_metrics(data))


0.0082, 0.0319, 0.0495, 0.0835, 0.1555, 0.0082, 0.0169, 0.0191, 0.0214, 0.0236, 0.0082, 0.0206, 0.0261, 0.0347, 0.0488


In [6]:
# NOTE(review): this cell carries no label describing which run/configuration
# the numbers below belong to — add one so the result can be traced.

# Pasted "wandb:"-prefixed summary lines for this run. extract_metrics() only
# matches the train/predict_<metric>@<k> rows for recall, mrr and ndcg; every
# other row (loss, runtime, throughput, ...) is ignored.
data = """
wandb:                       train/loss 7.9219
wandb:               train/predict_loss 7.78167
wandb:              train/predict_mrr@1 0.00397
wandb:             train/predict_mrr@10 0.01194
wandb:             train/predict_mrr@20 0.014
wandb:              train/predict_mrr@5 0.0094
wandb:             train/predict_mrr@50 0.01621
wandb:             train/predict_ndcg@1 0.00397
wandb:            train/predict_ndcg@10 0.01884
wandb:            train/predict_ndcg@20 0.02682
wandb:             train/predict_ndcg@5 0.01268
wandb:            train/predict_ndcg@50 0.04098
wandb:           train/predict_recall@1 0.00397
wandb:          train/predict_recall@10 0.04203
wandb:          train/predict_recall@20 0.07454
wandb:           train/predict_recall@5 0.023
wandb:          train/predict_recall@50 0.14671
wandb:            train/predict_runtime 33.9192
wandb: train/predict_samples_per_second 37.177
wandb:   train/predict_steps_per_second 4.658
wandb:                       train_loss 8.02426
wandb:                    train_runtime 1617.2116
"""

# Print one comma-separated line: recall values, then mrr, then ndcg, each in
# ascending k and rounded to 4 decimal places.
print(extract_metrics(data))

0.004, 0.023, 0.042, 0.0745, 0.1467, 0.004, 0.0094, 0.0119, 0.014, 0.0162, 0.004, 0.0127, 0.0188, 0.0268, 0.041


## 交互记录+偏好分析的匹配

### filter

In [4]:
# 4 5e-6 1 epoch gas=16
# NOTE(review): the label above presumably encodes run hyperparameters
# (batch size, learning rate, epochs; "gas" looks like gradient accumulation
# steps) — confirm against the training config.

# Pasted "wandb:"-prefixed summary lines for this run. extract_metrics() only
# matches the train/predict_<metric>@<k> rows for recall, mrr and ndcg; the
# loss and runtime rows are ignored.
data = """
wandb:                       train/loss 6.8115
wandb:               train/predict_loss 6.88039
wandb:              train/predict_mrr@1 0.07308
wandb:             train/predict_mrr@10 0.11907
wandb:             train/predict_mrr@20 0.12359
wandb:              train/predict_mrr@5 0.11089
wandb:             train/predict_mrr@50 0.12618
wandb:             train/predict_ndcg@1 0.07308
wandb:            train/predict_ndcg@10 0.14784
wandb:            train/predict_ndcg@20 0.16426
wandb:             train/predict_ndcg@5 0.12808
wandb:            train/predict_ndcg@50 0.18032
wandb:           train/predict_recall@1 0.07308
wandb:          train/predict_recall@10 0.24121
wandb:          train/predict_recall@20 0.30604
wandb:           train/predict_recall@5 0.18022
wandb:          train/predict_recall@50 0.38681
wandb:            train/predict_runtime 123.4255
"""

# Print one comma-separated line: recall values, then mrr, then ndcg, each in
# ascending k and rounded to 4 decimal places.
print(extract_metrics(data))

0.0731, 0.1802, 0.2412, 0.306, 0.3868, 0.0731, 0.1109, 0.1191, 0.1236, 0.1262, 0.0731, 0.1281, 0.1478, 0.1643, 0.1803
