Patch summary: point qwen3.5-fp4-mi355x-sglang at the rocm/sgl-dev image, set
the tp: 4 conc-end bound to 16 in both search-spaces touched below, and record
the change in perf-changelog.yaml.
NOTE(review): this patch arrived collapsed onto a single line. Line breaks and
YAML indentation were reconstructed from the hunk headers; confirm them against
the target files before applying.
NOTE(review): the perf-changelog hunk gains one description line (new-side
count 9 to 10), so the post-image blob id 6dd675bb4 on its index line is stale.

diff --git a/.github/configs/amd-master.yaml b/.github/configs/amd-master.yaml
index 89318004b..461cdfa33 100644
--- a/.github/configs/amd-master.yaml
+++ b/.github/configs/amd-master.yaml
@@ -204,7 +204,7 @@ qwen3.5-fp8-mi355x-sglang:
     - { tp: 8, conc-start: 4, conc-end: 64 }
 
 qwen3.5-fp4-mi355x-sglang:
-  image: lmsysorg/sglang:v0.5.10-rocm720-mi35x
+  image: rocm/sgl-dev:v0.5.10rc0-rocm720-mi35x-20260413
   model: amd/Qwen3.5-397B-A17B-MXFP4
   model-prefix: qwen3.5
   runner: mi355x
@@ -216,12 +216,12 @@ qwen3.5-fp4-mi355x-sglang:
     osl: 1024
     search-space:
     - { tp: 2, conc-start: 4, conc-end: 256 }
-    - { tp: 4, conc-start: 4, conc-end: 4 }
+    - { tp: 4, conc-start: 4, conc-end: 16 }
   - isl: 8192
     osl: 1024
     search-space:
     - { tp: 2, conc-start: 4, conc-end: 256 }
-    - { tp: 4, conc-start: 4, conc-end: 32 }
+    - { tp: 4, conc-start: 4, conc-end: 16 }
 
 qwen3.5-fp8-mi300x-sglang:
   image: lmsysorg/sglang:v0.5.10-rocm720-mi30x
diff --git a/perf-changelog.yaml b/perf-changelog.yaml
index 6721dbb1e..6dd675bb4 100644
--- a/perf-changelog.yaml
+++ b/perf-changelog.yaml
@@ -1,3 +1,10 @@
+- config-keys:
+    - qwen3.5-fp4-mi355x-sglang
+  description:
+    - "Update SGLang image from 'lmsysorg/sglang:v0.5.10-rocm720-mi35x' to 'rocm/sgl-dev:v0.5.10rc0-rocm720-mi35x-20260413'"
+    - "Set tp=4 search-space conc-end to 16 (was 4 in the seq-len config preceding isl=8192/osl=1024, and 32 in isl=8192/osl=1024)"
+  pr-link: https://github.com/SemiAnalysisAI/InferenceX/pull/1041
+
 - config-keys:
     - kimik2.5-int4-mi300x-vllm
   description: