[Feature]Support ragged prefill in flashinfer mla backend (#3967)
Co-authored-by: Yineng Zhang <me@zhyncs.com> Co-authored-by: pankajroark <pankajroark@users.noreply.github.com>
This commit is contained in:
@@ -23,6 +23,7 @@ suites = {
|
||||
"test_gguf.py",
|
||||
"test_input_embeddings.py",
|
||||
"test_mla.py",
|
||||
"test_mla_flashinfer.py",
|
||||
"test_mla_fp8.py",
|
||||
"test_json_constrained.py",
|
||||
"test_large_max_new_tokens.py",
|
||||
|
||||
Reference in New Issue
Block a user