Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
73 changes: 46 additions & 27 deletions src/parallax/sglang/monkey_patch.py
Original file line number Diff line number Diff line change
@@ -1,35 +1,54 @@
from parallax.sglang.monkey_patch_utils.glm4_moe_model import (
apply_glm4_moe_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.gpt_oss_model import apply_gpt_oss_monkey_patch
from parallax.sglang.monkey_patch_utils.minimax_m2_model import (
apply_minimax_m2_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.model_parallel import (
apply_model_parallel_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.qwen3_next_config import (
apply_qwen3_next_config_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.qwen3_next_model import (
apply_qwen3_next_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.triton_backend import (
apply_triton_backend_init_monkey_patch,
)
from parallax.sglang.monkey_patch_utils.weight_loader_filter import (
apply_weight_loader_filter_patch,
)


## Here are some patch functions for sglang.
## Hopefully, once sglang supports pipeline parallelism natively, we can remove these patches.
"""
Here are some patch functions for sglang.
Hopefully, once sglang supports pipeline parallelism natively, we can remove these patches.
"""


def apply_parallax_sglang_monkey_patch():
    """Apply all Parallax monkey patches for sglang, in a fixed order.

    Each patch helper is imported inside this function immediately before
    it is called, and each helper is called exactly once.

    The order is: model parallel, triton backend init, weight loader
    filter, qwen3_next config, qwen3_next model, gpt_oss, minimax_m2,
    glm4_moe.

    Returns:
        None. The function is called only for the side effects of the
        individual patch helpers.
    """
    # NOTE: a helper must never be called above its function-local import.
    # The local ``from ... import`` makes the name local to this function,
    # so an earlier call raises UnboundLocalError even when the same name
    # is also imported at module level.
    from parallax.sglang.monkey_patch_utils.model_parallel import (
        apply_model_parallel_monkey_patch,
    )

    apply_model_parallel_monkey_patch()

    from parallax.sglang.monkey_patch_utils.triton_backend import (
        apply_triton_backend_init_monkey_patch,
    )

    apply_triton_backend_init_monkey_patch()

    from parallax.sglang.monkey_patch_utils.weight_loader_filter import (
        apply_weight_loader_filter_patch,
    )

    apply_weight_loader_filter_patch()

    # The qwen3_next config patch is applied before the qwen3_next model patch.
    from parallax.sglang.monkey_patch_utils.qwen3_next_config import (
        apply_qwen3_next_config_monkey_patch,
    )

    apply_qwen3_next_config_monkey_patch()

    from parallax.sglang.monkey_patch_utils.qwen3_next_model import (
        apply_qwen3_next_monkey_patch,
    )

    apply_qwen3_next_monkey_patch()

    from parallax.sglang.monkey_patch_utils.gpt_oss_model import (
        apply_gpt_oss_monkey_patch,
    )

    apply_gpt_oss_monkey_patch()

    from parallax.sglang.monkey_patch_utils.minimax_m2_model import (
        apply_minimax_m2_monkey_patch,
    )

    apply_minimax_m2_monkey_patch()

    from parallax.sglang.monkey_patch_utils.glm4_moe_model import (
        apply_glm4_moe_monkey_patch,
    )

    apply_glm4_moe_monkey_patch()