From b4b1274bd0fc7743368843f11e0b0549e1285a2e Mon Sep 17 00:00:00 2001 From: Jintao Huang Date: Thu, 18 Jun 2026 16:35:31 +0800 Subject: [PATCH 1/3] fix moe_router_load_balancing_type --- src/mcore_bridge/config/model_config.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/mcore_bridge/config/model_config.py b/src/mcore_bridge/config/model_config.py index 257f16b..42e0331 100644 --- a/src/mcore_bridge/config/model_config.py +++ b/src/mcore_bridge/config/model_config.py @@ -173,8 +173,7 @@ class ModelConfig(TransformerConfig): moe_router_bias_update_rate: float = 1e-3 moe_router_enable_expert_bias: bool = False moe_router_topk_scaling_factor: Optional[float] = None - moe_router_load_balancing_type: Literal['aux_loss', 'seq_aux_loss', 'global_aux_loss', 'sinkhorn', - 'none'] = 'aux_loss' + moe_router_load_balancing_type: Union[str, List[str]] = "aux_loss" moe_shared_expert_gate: bool = False # mla From 08023a297f41d1283bd0f2adff3596cba6987c48 Mon Sep 17 00:00:00 2001 From: Jintao Huang Date: Thu, 18 Jun 2026 18:06:48 +0800 Subject: [PATCH 2/3] lint pass --- src/mcore_bridge/config/model_config.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/mcore_bridge/config/model_config.py b/src/mcore_bridge/config/model_config.py index 42e0331..12d2b31 100644 --- a/src/mcore_bridge/config/model_config.py +++ b/src/mcore_bridge/config/model_config.py @@ -173,7 +173,7 @@ class ModelConfig(TransformerConfig): moe_router_bias_update_rate: float = 1e-3 moe_router_enable_expert_bias: bool = False moe_router_topk_scaling_factor: Optional[float] = None - moe_router_load_balancing_type: Union[str, List[str]] = "aux_loss" + moe_router_load_balancing_type: Union[str, List[str]] = 'aux_loss' moe_shared_expert_gate: bool = False # mla From 40317158d8cbba614fad2ed52d2a774f01d7b332 Mon Sep 17 00:00:00 2001 From: Jintao Huang Date: Mon, 22 Jun 2026 11:10:02 +0800 Subject: [PATCH 3/3] update --- src/mcore_bridge/config/model_config.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/mcore_bridge/config/model_config.py b/src/mcore_bridge/config/model_config.py index 12d2b31..ce07979 100644 --- a/src/mcore_bridge/config/model_config.py +++ b/src/mcore_bridge/config/model_config.py @@ -173,6 +173,7 @@ class ModelConfig(TransformerConfig): moe_router_bias_update_rate: float = 1e-3 moe_router_enable_expert_bias: bool = False moe_router_topk_scaling_factor: Optional[float] = None + # 'aux_loss', 'seq_aux_loss', 'global_aux_loss', 'sinkhorn', 'none' moe_router_load_balancing_type: Union[str, List[str]] = 'aux_loss' moe_shared_expert_gate: bool = False