[CI] Add deepep tests to CI (#7872)
This commit is contained in:
@@ -6,6 +6,7 @@ import triton
|
||||
|
||||
from sglang.srt.layers.quantization.fp8_kernel import per_token_group_quant_fp8
|
||||
from sglang.srt.utils import ceil_div, dispose_tensor, is_cuda
|
||||
from sglang.utils import is_in_ci
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
@@ -1058,7 +1059,7 @@ def ep_gather(
|
||||
input_index: torch.Tensor,
|
||||
output_tensor: torch.Tensor,
|
||||
):
|
||||
BLOCK_D = 1024 # block size of quantization
|
||||
BLOCK_D = 1024 if not is_in_ci() else 128 # block size of quantization
|
||||
num_warps = 2
|
||||
num_tokens = output_tensor.shape[0]
|
||||
hidden_size = input_tensor.shape[1]
|
||||
|
||||
Reference in New Issue
Block a user