diff --git a/custom_ops/xpu_ops/src/ops/moe_expert_ffn.cc b/custom_ops/xpu_ops/src/ops/moe_expert_ffn.cc index 860fd850348..45868821440 100644 --- a/custom_ops/xpu_ops/src/ops/moe_expert_ffn.cc +++ b/custom_ops/xpu_ops/src/ops/moe_expert_ffn.cc @@ -441,7 +441,7 @@ std::vector MoeExpertFFN( const std::string& quant_method, const int hadamard_blocksize, const int valid_token_num) { - if (ffn_in.numel() == 0) { + if (ffn_in.numel() == 0 || valid_token_num == 0) { paddle::Tensor ffn2_out = paddle::empty_like(ffn_in, paddle::DataType::BFLOAT16); return {ffn2_out};