Add SGLang inference benchmark doc w/ initial support for DeepSeek-R1-Distill-Qwen-32B (#4870)

2026-01-08 22:28:06 -05:00 · 2025-07-25 12:42:40 -04:00
parent 2c9c3d0ba1
commit cc5bc5a882
6 changed files with 328 additions and 0 deletions
--- a/docs/sphinx/_toc.yml.in
+++ b/docs/sphinx/_toc.yml.in
@@ -82,6 +82,8 @@ subtrees:
            title: vLLM inference performance testing
          - file: how-to/rocm-for-ai/inference/benchmark-docker/pytorch-inference.rst
            title: PyTorch inference performance testing
+          - file: how-to/rocm-for-ai/inference/benchmark-docker/sglang.rst
+            title: SGLang inference performance testing
          - file: how-to/rocm-for-ai/inference/deploy-your-model.rst
            title: Deploy your model