Skip to content

Commit

Permalink
Merge pull request facebookresearch#2 from ustcwhy/patch-1
Browse files Browse the repository at this point in the history
Update fairseq_criterion.py
  • Loading branch information
shumingma committed Nov 14, 2023
2 parents 8069d60 + 87e6d91 commit 7b370e1
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions fairseq/criterions/fairseq_criterion.py
Original file line number Diff line number Diff line change
Expand Up @@ -164,6 +164,10 @@ class MoECriterion(FairseqCriterion):
"unused_expert2_count", # average number of 2nd experts which process no tokens
"all_to_all_cpu_time_ms", # CPU time spent in all to all calls in milliseconds
"all_to_all_cuda_time_ms", # CUDA time spent in all to all calls in milliseconds
"moe_second_expert_threshold",
"expert1_token",
"expert2_token",
"moe_expert_noise_threshold",
]
def __init__(self, task, moe_gate_loss_wt, moe_gate_loss_combine_method, moe_gate_loss_transform, sentence_avg):
super().__init__(task)
Expand Down

0 comments on commit 7b370e1

Please sign in to comment.