support qwen3_next blackwell (#10403)

This commit is contained in:
Yi Zhang
2025-09-13 17:18:26 +08:00
committed by GitHub
parent 31e9d3a5aa
commit 297d374510
4 changed files with 26 additions and 3 deletions

View File

@@ -728,6 +728,9 @@ class HybridLinearKVPool(KVCache):
layer_id_override=layer_id,
)
def get_v_head_dim(self):
    """Return the size of the last dimension of the value buffer.

    The buffer is obtained from ``self.full_kv_pool.get_value_buffer(0)``
    and the final entry of its ``shape`` is returned.
    """
    # NOTE(review): the argument 0 is presumably a layer id and the last
    # axis presumably the V head dimension -- confirm against full_kv_pool.
    value_buffer = self.full_kv_pool.get_value_buffer(0)
    return value_buffer.shape[-1]
class SWAKVPool(KVCache):
"""KV cache with separate pools for full and SWA attention layers."""