|
1 | | -from parallax.sglang.monkey_patch_utils.glm4_moe_model import ( |
2 | | - apply_glm4_moe_monkey_patch, |
3 | | -) |
4 | | -from parallax.sglang.monkey_patch_utils.gpt_oss_model import apply_gpt_oss_monkey_patch |
5 | | -from parallax.sglang.monkey_patch_utils.minimax_m2_model import ( |
6 | | - apply_minimax_m2_monkey_patch, |
7 | | -) |
8 | | -from parallax.sglang.monkey_patch_utils.model_parallel import ( |
9 | | - apply_model_parallel_monkey_patch, |
10 | | -) |
11 | | -from parallax.sglang.monkey_patch_utils.qwen3_next_config import ( |
12 | | - apply_qwen3_next_config_monkey_patch, |
13 | | -) |
14 | | -from parallax.sglang.monkey_patch_utils.qwen3_next_model import ( |
15 | | - apply_qwen3_next_monkey_patch, |
16 | | -) |
17 | | -from parallax.sglang.monkey_patch_utils.triton_backend import ( |
18 | | - apply_triton_backend_init_monkey_patch, |
19 | | -) |
20 | | -from parallax.sglang.monkey_patch_utils.weight_loader_filter import ( |
21 | | - apply_weight_loader_filter_patch, |
22 | | -) |
23 | | - |
24 | | - |
25 | | -## Here is some patch func for sglang |
26 | | -## Hopefully, when sglang support pipeline parallelism natively, we can remove these patches |
| 1 | +""" |
 | 2 | +Here are some patch functions for sglang.
 | 3 | +Hopefully, once sglang supports pipeline parallelism natively, we can remove these patches.
| 4 | +""" |
| 5 | + |
| 6 | + |
27 | 7 | def apply_parallax_sglang_monkey_patch(): |
| 8 | + from parallax.sglang.monkey_patch_utils.model_parallel import ( |
| 9 | + apply_model_parallel_monkey_patch, |
| 10 | + ) |
| 11 | + |
28 | 12 | apply_model_parallel_monkey_patch() |
| 13 | + |
| 14 | + from parallax.sglang.monkey_patch_utils.triton_backend import ( |
| 15 | + apply_triton_backend_init_monkey_patch, |
| 16 | + ) |
| 17 | + |
29 | 18 | apply_triton_backend_init_monkey_patch() |
| 19 | + |
| 20 | + from parallax.sglang.monkey_patch_utils.weight_loader_filter import ( |
| 21 | + apply_weight_loader_filter_patch, |
| 22 | + ) |
| 23 | + |
30 | 24 | apply_weight_loader_filter_patch() |
31 | | - apply_qwen3_next_monkey_patch() |
| 25 | + |
| 26 | + from parallax.sglang.monkey_patch_utils.qwen3_next_config import ( |
| 27 | + apply_qwen3_next_config_monkey_patch, |
| 28 | + ) |
| 29 | + |
32 | 30 | apply_qwen3_next_config_monkey_patch() |
| 31 | + |
| 32 | + from parallax.sglang.monkey_patch_utils.qwen3_next_model import ( |
| 33 | + apply_qwen3_next_monkey_patch, |
| 34 | + ) |
| 35 | + |
| 36 | + apply_qwen3_next_monkey_patch() |
| 37 | + |
| 38 | + from parallax.sglang.monkey_patch_utils.gpt_oss_model import ( |
| 39 | + apply_gpt_oss_monkey_patch, |
| 40 | + ) |
| 41 | + |
33 | 42 | apply_gpt_oss_monkey_patch() |
| 43 | + |
| 44 | + from parallax.sglang.monkey_patch_utils.minimax_m2_model import ( |
| 45 | + apply_minimax_m2_monkey_patch, |
| 46 | + ) |
| 47 | + |
34 | 48 | apply_minimax_m2_monkey_patch() |
| 49 | + |
| 50 | + from parallax.sglang.monkey_patch_utils.glm4_moe_model import ( |
| 51 | + apply_glm4_moe_monkey_patch, |
| 52 | + ) |
| 53 | + |
35 | 54 | apply_glm4_moe_monkey_patch() |
0 commit comments