Fix memory leak for chunked prefill 2 (#1858)

Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com>
This commit is contained in:
Lianmin Zheng
2024-10-31 14:51:51 -07:00
committed by GitHub
parent 8ce202a493
commit a2e0424abf
7 changed files with 138 additions and 30 deletions

View File

@@ -19,6 +19,7 @@ suites = {
"test_openai_server.py",
"test_overlap_schedule.py",
"test_pytorch_sampling_backend.py",
"test_radix_attention.py",
"test_retract_decode.py",
"test_server_args.py",
"test_skip_tokenizer_init.py",