diff --git a/.github/workflows/vllm_ascend_test_nightly_a2.yaml b/.github/workflows/vllm_ascend_test_nightly_a2.yaml index 4baa3332c8a..7589f63d99e 100644 --- a/.github/workflows/vllm_ascend_test_nightly_a2.yaml +++ b/.github/workflows/vllm_ascend_test_nightly_a2.yaml @@ -114,12 +114,15 @@ jobs: - Qwen3-VL-8B-Instruct - Qwen2.5-Omni-7B - Meta-Llama-3.1-8B-Instruct + - Mistral-7B-Instruct-v0.1 + - Phi-4-mini-instruct - os: linux-aarch64-a2-2 model_list: - Qwen3-30B-A3B - Qwen3-VL-30B-A3B-Instruct - DeepSeek-V2-Lite - Qwen3-30B-A3B-W8A8 + - ERNIE-4.5-21B-A3B-PT - os: linux-aarch64-a2-4 model_list: - Qwen3-Next-80B-A3B-Instruct diff --git a/tests/e2e/models/configs/ERNIE-4.5-21B-A3B-PT.yaml b/tests/e2e/models/configs/ERNIE-4.5-21B-A3B-PT.yaml new file mode 100644 index 00000000000..75bdacb40be --- /dev/null +++ b/tests/e2e/models/configs/ERNIE-4.5-21B-A3B-PT.yaml @@ -0,0 +1,15 @@ +model_name: "PaddlePaddle/ERNIE-4.5-21B-A3B-PT" +hardware: "Atlas A2 Series" +tasks: +- name: "gsm8k" + metrics: + - name: "exact_match,flexible-extract" + value: 0.72 +- name: "ceval-valid" + metrics: + - name: "acc,none" + value: 0.85 +num_fewshot: 5 +tensor_parallel_size: 2 +batch_size: 16 +gpu_memory_utilization: 0.6 diff --git a/tests/e2e/models/configs/Mistral-7B-Instruct-v0.1.yaml b/tests/e2e/models/configs/Mistral-7B-Instruct-v0.1.yaml new file mode 100644 index 00000000000..bf3c1618dba --- /dev/null +++ b/tests/e2e/models/configs/Mistral-7B-Instruct-v0.1.yaml @@ -0,0 +1,11 @@ +model_name: "mistralai/Mistral-7B-Instruct-v0.1" +hardware: "Atlas A2 Series" +tasks: +- name: "gsm8k" + metrics: + - name: "exact_match,strict-match" + value: 0.35 + - name: "exact_match,flexible-extract" + value: 0.38 +trust_remote_code: True +num_fewshot: 5 diff --git a/tests/e2e/models/configs/Phi-4-mini-instruct.yaml b/tests/e2e/models/configs/Phi-4-mini-instruct.yaml new file mode 100644 index 00000000000..162768666d2 --- /dev/null +++ b/tests/e2e/models/configs/Phi-4-mini-instruct.yaml @@ -0,0 +1,13 @@ +model_name: "LLM-Research/Phi-4-mini-instruct" +hardware: "Atlas A2 Series" +tasks: +- name: "gsm8k" + metrics: + - name: "exact_match,strict-match" + value: 0.81 + - name: "exact_match,flexible-extract" + value: 0.81 +trust_remote_code: True +num_fewshot: 5 +batch_size: 32 +gpu_memory_utilization: 0.8 diff --git a/tests/e2e/models/configs/accuracy.txt b/tests/e2e/models/configs/accuracy.txt index daa23e97639..071d1504e27 100644 --- a/tests/e2e/models/configs/accuracy.txt +++ b/tests/e2e/models/configs/accuracy.txt @@ -1,4 +1,9 @@ DeepSeek-V2-Lite.yaml +ERNIE-4.5-21B-A3B-PT.yaml +InternVL3_5-8B.yaml +Meta-Llama-3.1-8B-Instruct.yaml +Mistral-7B-Instruct-v0.1.yaml +Phi-4-mini-instruct.yaml Qwen2.5-VL-7B-Instruct.yaml Qwen3-30B-A3B.yaml Qwen3-8B.yaml @@ -8,5 +13,3 @@ Qwen2-Audio-7B-Instruct.yaml Qwen3-VL-30B-A3B-Instruct.yaml Qwen3-VL-8B-Instruct.yaml Qwen2.5-Omni-7B.yaml -Meta-Llama-3.1-8B-Instruct.yaml -InternVL3_5-8B.yaml \ No newline at end of file