From e868d0b60eb2d435c5599165f787bca06bdc9c3d Mon Sep 17 00:00:00 2001 From: lizamd <161388580+lizamd@users.noreply.github.com> Date: Thu, 6 Feb 2025 21:08:06 -0800 Subject: [PATCH] update waves_per_eu to 1 (#3356) --- .../sglang/srt/layers/attention/triton_ops/extend_attention.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/layers/attention/triton_ops/extend_attention.py b/python/sglang/srt/layers/attention/triton_ops/extend_attention.py index e070bc3a9..9fe1e1b60 100644 --- a/python/sglang/srt/layers/attention/triton_ops/extend_attention.py +++ b/python/sglang/srt/layers/attention/triton_ops/extend_attention.py @@ -351,7 +351,7 @@ def extend_attention_fwd( extra_kargs = {} if is_hip_: - extra_kargs = {"waves_per_eu": 4, "matrix_instr_nonkdim": 16, "kpack": 2} + extra_kargs = {"waves_per_eu": 1, "matrix_instr_nonkdim": 16, "kpack": 2} _fwd_kernel[grid]( q_extend,