diff --git a/examples/auto_deploy/model_registry/models.yaml b/examples/auto_deploy/model_registry/models.yaml index e71fef61adaa..fe948e349efb 100644 --- a/examples/auto_deploy/model_registry/models.yaml +++ b/examples/auto_deploy/model_registry/models.yaml @@ -310,10 +310,9 @@ models: # - name: deepseek-ai/DeepSeek-R1 # config_id: deepseek_r1 # yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'deepseek-r1.yaml', 'enable_sharder_ir.yaml'] -# OOM during AutoDeploy run. -# - name: deepseek-ai/DeepSeek-R1-0528 -# config_id: deepseek_r1 -# yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'deepseek-r1.yaml', 'enable_sharder_ir.yaml'] +- name: deepseek-ai/DeepSeek-R1-0528 + config_id: deepseek_r1 + yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'deepseek-r1.yaml', 'enable_sharder_ir.yaml'] # OOM during AutoDeploy run. # - name: deepseek-ai/DeepSeek-Coder-V2-Instruct # config_id: deepseek_v2_ep @@ -374,14 +373,12 @@ models: # config_id: default_ws_4 # yaml_extra: ['dashboard_default.yaml', 'world_size_4.yaml'] # --- Qwen3.5 MoE (Feb 2026) --- -# tensorrt_llm.executor.utils.RequestError: Ran into a kwarg keyword mismatch. -# - name: Qwen/Qwen3.5-35B-A3B -# config_id: qwen3_5_moe_35b -# yaml_extra: ['dashboard_default.yaml', 'world_size_2.yaml', 'qwen3.5_moe_35b.yaml', 'enable_sharder_ir.yaml'] -# OOM during AutoDeploy run. -# - name: Qwen/Qwen3.5-397B-A17B -# config_id: qwen3_5_moe_400b -# yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'qwen3.5_moe_400b.yaml', 'enable_sharder_ir.yaml'] +- name: Qwen/Qwen3.5-35B-A3B + config_id: qwen3_5_moe_35b + yaml_extra: ['dashboard_default.yaml', 'world_size_2.yaml', 'qwen3.5_moe_35b.yaml', 'enable_sharder_ir.yaml'] +- name: Qwen/Qwen3.5-397B-A17B + config_id: qwen3_5_moe_400b + yaml_extra: ['dashboard_default.yaml', 'world_size_8.yaml', 'qwen3.5_moe_400b.yaml', 'enable_sharder_ir.yaml'] # --- GLM-5 (Feb 2026) --- - name: zai-org/GLM-5 config_id: glm_5