Fix nightly CI GSM8K test & fix FlashInfer backend KV cache quantization (#4147)

This commit is contained in:
yinfan98
2025-03-07 03:50:07 +08:00
committed by GitHub
parent bc1534ff32
commit ab7fba0ece

View File

@@ -904,6 +904,7 @@ class FlashInferIndicesUpdaterPrefill:
self.head_dim,
1,
q_data_type=self.q_data_type,
kv_data_type=self.data_type,
custom_mask=custom_mask,
non_blocking=True,
)