fix e2e rejection-sampler error (#5341)
### What this PR does / why we need it?
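Fixes a CI failure in
vllm-ascend/tests/e2e/nightly/ops/triton/test_rejection_sampler.py.
Error: test_rejection_sampler_block_verify_triton_kernel: duplicate
parametrization of 'vocab_size'.
Cause: the decorator intended to parametrize 'batch_size' was mistakenly
named 'vocab_size', so pytest saw 'vocab_size' parametrized twice; this
change renames it to 'batch_size'.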
- vLLM version: release/v0.13.0
- vLLM main:
bc0a5a0c08
Signed-off-by: chenaoxuan <cax1165@163.com>
This commit is contained in:
@@ -61,7 +61,7 @@ IS_GREEDY = torch.zeros(NUM_TOKENS, dtype=torch.bool, device=DEVICE)
|
||||
@pytest.mark.parametrize("bonus_token_ids", [BONUS_TOKEN_IDS])
|
||||
@pytest.mark.parametrize("uniform_probs", [UNIFORM_PROBS])
|
||||
@pytest.mark.parametrize("is_greedy", [IS_GREEDY])
|
||||
-@pytest.mark.parametrize("vocab_size", [BATCH_SIZE])
|
||||
+@pytest.mark.parametrize("batch_size", [BATCH_SIZE])
|
||||
@pytest.mark.parametrize("max_spec_len", [MAX_SPEC_LEN])
|
||||
@pytest.mark.parametrize("vocab_size", [VOCAB_SIZE])
|
||||
@torch.inference_mode()
|
||||
|
||||
Reference in New Issue
Block a user