Feature DeepSeek V3/R1 INT8 Quantization (block-wise) (#3730)

Co-authored-by: HandH1998 <1335248067@qq.com>
This commit is contained in:
laixin
2025-02-24 21:43:35 +08:00
committed by GitHub
parent b110084654
commit 1a6e97577a
9 changed files with 1092 additions and 5 deletions

View File

@@ -55,6 +55,7 @@ suites = {
"test_vision_openai_server.py",
"test_w8a8_quantization.py",
"test_fp8_kernel.py",
"test_block_int8.py",
],
"nightly": [
"test_nightly_gsm8k_eval.py",