Skip to content

Commit 3a0e746

Browse files
committed
end
Signed-off-by: MrZ20 <[email protected]>
1 parent f596c07 commit 3a0e746

File tree

4 files changed

+12
-9
lines changed

4 files changed

+12
-9
lines changed

.github/workflows/nightly_test_a3.yaml

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -74,11 +74,11 @@ jobs:
74 74
- name: multi-node-qwenw8a8-2node-longseq
75 75
config_file_path: Qwen3-235B-W8A8-longseq.yaml
76 76
size: 2
77-
- name: multi-node-qwen3-235b-a22b-pd
78-
config_file_path: Qwen3-235B-A22B-pd.yaml
77+
- name: multi-node-qwen-disagg-pd
78+
config_file_path: Qwen3-235B-disagg-pd.yaml
79 79
size: 2
80-
- name: multi-node-qwen3-vl-235b-a22b-instruct
81-
config_file_path: Qwen3-VL-235B-A22B-Instruct.yaml
80+
- name: multi-node-qwen-vl-disagg-pd
81+
config_file_path: Qwen3-VL-235B-disagg-pd.yaml
82 82
size: 2
83 83
uses: ./.github/workflows/_e2e_nightly_multi_node.yaml
84 84
with:

tests/e2e/nightly/multi_node/config/Qwen3-235B-A22B-pd.yaml renamed to tests/e2e/nightly/multi_node/config/Qwen3-235B-disagg-pd.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
test_name: "test Qwen3-235B-A22B pd online"
1+
test_name: "test Qwen3-235B-A22B disaggregated_prefill"
2 2
model: "Qwen/Qwen3-235B-A22B"
3 3
num_nodes: 2
4 4
npu_per_node: 16

tests/e2e/nightly/multi_node/config/Qwen3-VL-235B-A22B-Instruct.yaml renamed to tests/e2e/nightly/multi_node/config/Qwen3-VL-235B-disagg-pd.yaml

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
test_name: "test qwen3-vl-235b-a22b disaggregated_prefill on A3"
1+
test_name: "test Qwen3-VL-235B-A22B disaggregated_prefill"
2 2
model: "Qwen/Qwen3-VL-235B-A22B-Instruct"
3 3
num_nodes: 2
4 4
npu_per_node: 16
@@ -11,7 +11,6 @@ env_common:
11 11
HCCL_OP_EXPANSION_MODE: "AIV"
12 12
TASK_QUEUE_ENABLE: 1
13 13
PYTORCH_NPU_ALLOC_CONF: expandable_segments:True
14-
DISAGGREGATED_PREFILL_PROXY_SCRIPT: "examples/disaggregated_prefill_v1/load_balance_proxy_server_example.py"
15 14

16 15
disaggregated_prefill:
17 16
enabled: true

vllm_ascend/ascend_config.py

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -102,8 +102,12 @@ def __init__(self, vllm_config: "VllmConfig"):
102 102
decode_tp_size = min(decode_tp_size, num_kv_head)
103 103
self.pd_head_ratio = prefill_tp_size // decode_tp_size
104 104
except Exception:
105-
raise AssertionError(
106-
"Can not get num_key_value_heads from model_config")
105+
raise ValueError(
106+
"The text_config extracted from the model config does not have "
107+
"`num_key_value_heads` attribute. This indicates a mismatch "
108+
"between the model config and vLLM's expectations. Please "
109+
"ensure that the model config is compatible with vLLM."
110+
)
107 111

108 112
if self.pd_tp_ratio == 0:
109 113
raise AssertionError(

0 commit comments

Comments
 (0)