support qwen3_next blackwell (#10403)

2025-09-13 17:18:26 +08:00
parent 31e9d3a5aa
commit 297d374510
4 changed files with 26 additions and 3 deletions
--- a/python/sglang/srt/mem_cache/memory_pool.py
+++ b/python/sglang/srt/mem_cache/memory_pool.py
@@ -728,6 +728,9 @@ class HybridLinearKVPool(KVCache):
            layer_id_override=layer_id,
        )

+    def get_v_head_dim(self):  # size of the last axis of the full-attention pool's value buffer
+        return self.full_kv_pool.get_value_buffer(0).shape[-1]  # NOTE(review): probes index 0 only; presumably the last axis is the V head dim and is the same for every layer — confirm
+

 class SWAKVPool(KVCache):
    """KV cache with separate pools for full and SWA attention layers."""