end

MrZ20 · MrZ20 · commit 3a0e746b49b5 · 2026-01-06T17:35:08.000+08:00
Signed-off-by: MrZ20 <2609716663@qq.com>
diff --git a/.github/workflows/nightly_test_a3.yaml b/.github/workflows/nightly_test_a3.yaml
@@ -74,11 +74,11 @@ jobs:
           - name: multi-node-qwenw8a8-2node-longseq
             config_file_path: Qwen3-235B-W8A8-longseq.yaml
             size: 2
-          - name: multi-node-qwen3-235b-a22b-pd
-            config_file_path: Qwen3-235B-A22B-pd.yaml
+          - name: multi-node-qwen-disagg-pd
+            config_file_path: Qwen3-235B-disagg-pd.yaml
             size: 2
-          - name: multi-node-qwen3-vl-235b-a22b-instruct
-            config_file_path: Qwen3-VL-235B-A22B-Instruct.yaml
+          - name: multi-node-qwen-vl-disagg-pd
+            config_file_path: Qwen3-VL-235B-disagg-pd.yaml
             size: 2
     uses: ./.github/workflows/_e2e_nightly_multi_node.yaml
     with:
diff --git a/tests/e2e/nightly/multi_node/config/Qwen3-235B-disagg-pd.yaml b/tests/e2e/nightly/multi_node/config/Qwen3-235B-disagg-pd.yaml
@@ -1,4 +1,4 @@
-test_name: "test Qwen3-235B-A22B pd online"
+test_name: "test Qwen3-235B-A22B disaggregated_prefill"
 model: "Qwen/Qwen3-235B-A22B"
 num_nodes: 2
 npu_per_node: 16
diff --git a/tests/e2e/nightly/multi_node/config/Qwen3-VL-235B-disagg-pd.yaml b/tests/e2e/nightly/multi_node/config/Qwen3-VL-235B-disagg-pd.yaml
@@ -1,4 +1,4 @@
-test_name: "test qwen3-vl-235b-a22b disaggregated_prefill on A3"
+test_name: "test Qwen3-VL-235B-A22B disaggregated_prefill"
 model: "Qwen/Qwen3-VL-235B-A22B-Instruct"
 num_nodes: 2
 npu_per_node: 16
@@ -11,7 +11,6 @@ env_common:
   HCCL_OP_EXPANSION_MODE: "AIV"
   TASK_QUEUE_ENABLE: 1
   PYTORCH_NPU_ALLOC_CONF: expandable_segments:True
-  DISAGGREGATED_PREFILL_PROXY_SCRIPT: "examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py"
 
 disaggregated_prefill:
   enabled: true
diff --git a/vllm_ascend/ascend_config.py b/vllm_ascend/ascend_config.py
@@ -102,8 +102,12 @@ def __init__(self, vllm_config: "VllmConfig"):
                     decode_tp_size = min(decode_tp_size, num_kv_head)
                     self.pd_head_ratio = prefill_tp_size // decode_tp_size
                 except Exception:
-                    raise AssertionError(
-                        "Can not get num_key_value_heads from model_config")
+                    raise ValueError(
+                        "The text_config extracted from the model config does not have "
+                        "`num_key_value_heads` attribute. This indicates a mismatch "
+                        "between the model config and vLLM's expectations. Please "
+                        "ensure that the model config is compatible with vLLM."
+                    )
 
             if self.pd_tp_ratio == 0:
                 raise AssertionError(

Original file line number	Diff line number	Diff line change
`@@ -1,4 +1,4 @@`
`1`		`-test_name: "test Qwen3-235B-A22B pd online"`
	`1`	`+test_name: "test Qwen3-235B-A22B disaggregated_prefill"`
`2`	`2`	`model: "Qwen/Qwen3-235B-A22B"`
`3`	`3`	`num_nodes: 2`
`4`	`4`	`npu_per_node: 16`