We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents dff1d0c + 9184714, commit 59e0f17 (Copy full SHA for 59e0f17)
1 file changed
src/maxtext/models/gemma4.py
@@ -370,7 +370,7 @@ def __call__(
370
371
next_layer_addition = mlp_lnx + residual
372
layer_output = next_layer_addition
373
- layer_output = layer_output * self.layer_scalar.value
+ layer_output = layer_output * jnp.asarray(self.layer_scalar.value, cfg.dtype)
374
375
layer_output = nn.with_logical_constraint(layer_output, self.activation_axis_names)
376
0 commit comments