Add unit tests for page_size > 1 and MLA, and an integration test for Flash Attention 3 (#4760)

This commit is contained in:
Yubo Wang
2025-04-07 23:20:51 -07:00
committed by GitHub
parent a7c3f74bec
commit 804d9f2e4c
6 changed files with 733 additions and 224 deletions

View File

@@ -28,6 +28,7 @@ suites = {
TestFile("test_chunked_prefill.py", 336),
TestFile("test_eagle_infer.py", 500),
TestFile("test_ebnf_constrained.py"),
TestFile("test_fa3.py", 5),
TestFile("test_fp8_kernel.py", 8),
TestFile("test_embedding_openai_server.py", 36),
TestFile("test_hidden_states.py", 55),