[Misc] clean up vllm in sgl-kernel test (#5189)

2025-04-09 16:22:13 +08:00
parent 61970b08d8
commit d2e507df3c
4 changed files with 25 additions and 40 deletions
--- a/sgl-kernel/tests/test_awq_dequant.py
+++ b/sgl-kernel/tests/test_awq_dequant.py
@@ -4,7 +4,6 @@ from typing import Optional, Tuple
 import pytest
 import torch
 from sgl_kernel import awq_dequantize
-from vllm import _custom_ops as ops


 def reverse_awq_order(t: torch.Tensor):
@@ -58,12 +57,6 @@ def awq_dequantize_torch(
    return (iweights - zeros) * scales


-def vllm_awq_dequantize(
-    qweight: torch.Tensor, scales: torch.Tensor, qzeros: torch.Tensor
-) -> torch.Tensor:
-    return ops.awq_dequantize(qweight, scales, qzeros, 0, 0, 0)
-
-
 def sglang_awq_dequantize(
    qweight: torch.Tensor, scales: torch.Tensor, qzeros: torch.Tensor
 ) -> torch.Tensor:
@@ -110,7 +103,6 @@ def test_awq_dequant_compare_implementations(
    )

    # Run both implementations
-    vllm_out = vllm_awq_dequantize(qweight, scales.to(torch.float16), qzeros)
    torch_out = awq_dequantize_torch(qweight, scales, qzeros, group_size)
    sglang_out = sglang_awq_dequantize(qweight, scales, qzeros)

@@ -118,13 +110,6 @@ def test_awq_dequant_compare_implementations(
    torch.testing.assert_close(
        torch_out.to(torch.float32), sglang_out.to(torch.float32), rtol=1e-3, atol=1e-5
    )
-    if not is_bf16_act:
-        torch.testing.assert_close(
-            vllm_out.to(torch.float32),
-            sglang_out.to(torch.float32),
-            rtol=1e-3,
-            atol=1e-5,
-        )


 if __name__ == "__main__":