vllm-project · MrZ20 · Nov 18, 2025 · Nov 18, 2025 · Nov 19, 2025 · MengqingCao
diff --git a/.github/workflows/vllm_ascend_test_nightly_a2.yaml b/.github/workflows/vllm_ascend_test_nightly_a2.yaml
@@ -114,12 +114,15 @@ jobs:
               - Qwen3-VL-8B-Instruct
               - Qwen2.5-Omni-7B
               - Meta-Llama-3.1-8B-Instruct
+              - Mistral-7B-Instruct-v0.1
+              - Phi-4-mini-instruct
           - os: linux-aarch64-a2-2
             model_list:
               - Qwen3-30B-A3B
               - Qwen3-VL-30B-A3B-Instruct
               - DeepSeek-V2-Lite
               - Qwen3-30B-A3B-W8A8
+              - ERNIE-4.5-21B-A3B-PT
           - os: linux-aarch64-a2-4
             model_list:
               - Qwen3-Next-80B-A3B-Instruct

diff --git a/tests/e2e/models/configs/ERNIE-4.5-21B-A3B-PT.yaml b/tests/e2e/models/configs/ERNIE-4.5-21B-A3B-PT.yaml
@@ -0,0 +1,15 @@
+model_name: 'PaddlePaddle/ERNIE-4.5-21B-A3B-PT'
+hardware: 'Atlas A2 Series'
+tasks:
+  - name: 'gsm8k'
+    metrics:
+      - name: 'exact_match,flexible-extract'
+        value: 0.72
+  - name: 'ceval-valid'
+    metrics:
+      - name: 'acc,none'
+        value: 0.85
+num_fewshot: 5
+tensor_parallel_size: 2
+batch_size: 16
+gpu_memory_utilization: 0.6
diff --git a/tests/e2e/models/configs/Mistral-7B-Instruct-v0.1.yaml b/tests/e2e/models/configs/Mistral-7B-Instruct-v0.1.yaml
@@ -0,0 +1,11 @@
+model_name: "mistralai/Mistral-7B-Instruct-v0.1"
+hardware: "Atlas A2 Series"
+tasks:
+- name: "gsm8k"
+  metrics:
+  - name: "exact_match,strict-match"
+    value: 0.35
+  - name: "exact_match,flexible-extract"
+    value: 0.38
+trust_remote_code: true
+num_fewshot: 5
diff --git a/tests/e2e/models/configs/Phi-4-mini-instruct.yaml b/tests/e2e/models/configs/Phi-4-mini-instruct.yaml
@@ -0,0 +1,13 @@
+model_name: "LLM-Research/Phi-4-mini-instruct"
+hardware: "Atlas A2 Series"
+tasks:
+- name: "gsm8k"
+  metrics:
+  - name: "exact_match,strict-match"
+    value: 0.81
+  - name: "exact_match,flexible-extract"
+    value: 0.81
+trust_remote_code: true
+num_fewshot: 5
+batch_size: 32
+gpu_memory_utilization: 0.8
diff --git a/tests/e2e/models/configs/accuracy.txt b/tests/e2e/models/configs/accuracy.txt
@@ -1,4 +1,9 @@
 DeepSeek-V2-Lite.yaml
+ERNIE-4.5-21B-A3B-PT.yaml
+InternVL3_5-8B.yaml
+Meta-Llama-3.1-8B-Instruct.yaml
+Mistral-7B-Instruct-v0.1.yaml
+Phi-4-mini-instruct.yaml
 Qwen2.5-VL-7B-Instruct.yaml
 Qwen3-30B-A3B.yaml
 Qwen3-8B.yaml
@@ -8,5 +13,3 @@ Qwen2-Audio-7B-Instruct.yaml
 Qwen3-VL-30B-A3B-Instruct.yaml
 Qwen3-VL-8B-Instruct.yaml
 Qwen2.5-Omni-7B.yaml
-Meta-Llama-3.1-8B-Instruct.yaml
-InternVL3_5-8B.yaml