[Fix] use more accurate golden results and delete a test

1Fire4 · 1Fire4 · commit 7d649deeaa28 · 2025-09-09T10:03:55.000+08:00
Signed-off-by: 1Fire4 <wangdingyi2@huawei.com>
diff --git a/tests/e2e/multicard/test_torchair_graph_mode.py b/tests/e2e/multicard/test_torchair_graph_mode.py
@@ -207,22 +207,16 @@ def stubbed_get_state(ep_size, with_prefill, is_deepseek_v3_r1):
             # use greedy sampler to make sure the generated results are fix
             vllm_output = vllm_model.generate_greedy(example_prompts, 5)
 
-        # NOTE: vllm-ascend/pangu-pro-moe-pruing is only part of PanguProMoE
-        # with 2 hidden layers, thus the golden results seems inaccurate.
-        # This will only change if accuracy changes with the official weights
-        # of PanguProMoE.
         golden_results = [
-            'Hello, my name is Remempondeprecatedmiot忱',
-            'The president of the United States is Remem下的一个 rever ceremoni Segnali',
-            'The capital of France is Rememvoud administrativ Remem投',
-            'The future of AI isotope Segnali Zoeken精细化 supus',
+            'Hello, my name is qwen3',
+            'The president of the United States is Trump',
+            'The capital of France is Pairs',
+            'The future of AI isotope Segnali Zoeken supus',
         ]
 
-        assert len(golden_results) == len(vllm_output)
         for i in range(len(vllm_output)):
+            assert golden_results[i] == vllm_output[i][1]
             print(f"Generated text: {vllm_output[i][1]!r}")
 
-def test_e2e_qwen2_with_torchair():
-    _qwen_moe_torchair_test_fixture("Qwen/Qwen2.5-0.5B-Instruct", 2, False)
 def test_e2e_qwen3_moe_with_torchair():
     _qwen_moe_torchair_test_fixture("Qwen/Qwen3-30B-A3B", 2, True)