# Patch: replaces the placeholder LAMB-era compliance keys for the closed
# llama31_8b benchmark with AdamW hyperparameter checks, and changes the
# eval_accuracy rule to require 'samples_count' metadata and a value in
# (0.0, 3.3].
#
# NOTE(review): line breaks were restored from a whitespace-collapsed copy.
#   The hunk line counts (46 old / 82 new) match the @@ header, but the YAML
#   indentation below is reconstructed -- confirm against the target file or
#   apply with whitespace-insensitive matching.
# NOTE(review): 'MAX_STEPS' is the only upper-case NAME in this hunk; every
#   other key is lower_snake_case -- confirm it matches the logged key string.
# NOTE(review): MAX_STEPS is pinned to 1200000 steps while
#   opt_learning_rate_decay_steps is pinned via steps * global_batch_size ==
#   1.2e6 -- confirm both are intended.
diff --git a/mlperf_logging/compliance_checker/training_5.1.0/closed_llama31_8b.yaml b/mlperf_logging/compliance_checker/training_5.1.0/closed_llama31_8b.yaml
index 3619827..b6335dc 100644
--- a/mlperf_logging/compliance_checker/training_5.1.0/closed_llama31_8b.yaml
+++ b/mlperf_logging/compliance_checker/training_5.1.0/closed_llama31_8b.yaml
@@ -4,46 +4,82 @@
     POST: >
         s['global_batch_size'] = v['value']
 
-# TODO: Update with official compliance requirements
+- KEY:
+    NAME: max_sequence_length
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 8192 "
+
+- KEY:
+    NAME: opt_name
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 'adamw' "
+
 - KEY:
     NAME: opt_base_learning_rate
     REQ: EXACTLY_ONE
 
 - KEY:
-    NAME: opt_lamb_epsilon
+    NAME: opt_end_learning_rate
     REQ: EXACTLY_ONE
 
 - KEY:
-    NAME: opt_learning_rate_training_steps
+    NAME: opt_learning_rate_decay_steps
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] * s['global_batch_size'] == 1.2e6 "
 
 - KEY:
     NAME: opt_learning_rate_warmup_steps
     REQ: EXACTLY_ONE
 
 - KEY:
-    NAME: num_warmup_steps
+    NAME: opt_learning_rate_decay_schedule
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 'cosine with linear warmup' "
+
+- KEY:
+    NAME: opt_adamw_beta_1
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 0.9 "
 
 - KEY:
-    NAME: start_warmup_step
+    NAME: opt_adamw_beta_2
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 0.95 "
 
 - KEY:
-    NAME: opt_lamb_beta_1
+    NAME: opt_adamw_epsilon
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 1e-05 "
 
 - KEY:
-    NAME: opt_lamb_beta_2
+    NAME: opt_adamw_weight_decay
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 0.1 "
 
 - KEY:
-    NAME: opt_lamb_weight_decay_rate
+    NAME: opt_gradient_clip_norm
     REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 1.0 "
+
+- KEY:
+    NAME: gradient_accumulation_steps
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] > 0 "
+
+- KEY:
+    NAME: eval_samples
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 1024 "
 
 - KEY:
     NAME: eval_accuracy
     REQ: AT_LEAST_ONE
     CHECK:
-        - "'epoch_num' in v['metadata']"
-    ATLEAST_ONE_CHECK: "(v['value'] >= 0.720) and v['value'] < 1.0"
+        - "'samples_count' in v['metadata']"
+    ATLEAST_ONE_CHECK: "(v['value'] <= 3.3) and v['value'] > 0.0"
+
+- KEY:
+    NAME: MAX_STEPS
+    REQ: EXACTLY_ONE
+    CHECK: " v['value'] == 1200000 "
+