add qwen3 30b a3b to vllm-benchmark-models (#5280)

This commit is contained in:
Peter Park
2025-09-09 17:41:11 -04:00
committed by GitHub
parent 3c37ae88f0
commit 05a66f75fe

View File

@@ -78,7 +78,11 @@ vllm_benchmark:
model_repo: Qwen/QwQ-32B
url: https://huggingface.co/Qwen/QwQ-32B
precision: float16
tunableop: true
# Model entry for Qwen3 30B A3B: display name, mad_tag, Hugging Face
# repository id, model page URL, and precision.
# NOTE(review): the preceding entry sets `tunableop: true`; this entry has
# no tunableop key -- confirm the omission is intentional.
- model: Qwen3 30B A3B
mad_tag: pyt_vllm_qwen3-30b-a3b
model_repo: Qwen/Qwen3-30B-A3B
url: https://huggingface.co/Qwen/Qwen3-30B-A3B
precision: float16
- group: Microsoft Phi
tag: phi
models: