Fix Triton decode kernel & ut (#1819)

This commit is contained in:
Ke Bao
2024-10-28 01:54:38 +08:00
committed by GitHub
parent 51c81e339b
commit c77762d57f
5 changed files with 218 additions and 42 deletions

View File

@@ -26,7 +26,8 @@ suites = {
"test_srt_endpoint.py",
"test_torch_compile.py",
"test_torchao.py",
-"test_triton_attn_backend.py",
+"test_triton_attention_kernels.py",
+"test_triton_attention_backend.py",
"test_update_weights.py",
"test_vision_openai_server.py",
],