diff --git a/src/transformers/integrations/hub_kernels.py b/src/transformers/integrations/hub_kernels.py index 112ac670e9a0..673780654872 100644 --- a/src/transformers/integrations/hub_kernels.py +++ b/src/transformers/integrations/hub_kernels.py @@ -71,6 +71,12 @@ layer_name="RMSNorm", ) }, + "npu": { + Mode.INFERENCE: LayerRepository( + repo_id="kernels-community/liger_kernels", + layer_name="LigerRMSNorm", + ) + }, }, "MLP": { "cuda": LayerRepository(