### What this PR does / why we need it?
Add some uts for files in folder /multistream
### Does this PR introduce _any_ user-facing change?
No
- vLLM version: v0.9.2
- vLLM main:
b77c7d327f
Signed-off-by: lwq <liwenquan5@huawei.com>
Co-authored-by: lwq <liwenquan5@huawei.com>
33 lines
1.5 KiB
Python
33 lines
1.5 KiB
Python
from tests.ut.base import TestBase
|
|
from vllm_ascend.multistream.base import (MSAttentionMetadataSplitConfig,
|
|
MSEventKey)
|
|
|
|
|
|
class Testbase(TestBase):
|
|
|
|
def test_ms_event_key(self):
|
|
self.assertEqual(MSEventKey.ATTN_COM_FINISH.value, 0)
|
|
self.assertEqual(MSEventKey.ATTN_AR_FINISH.value, 1)
|
|
self.assertEqual(MSEventKey.FFN_COM_FINISH.value, 2)
|
|
self.assertEqual(MSEventKey.FFN_AR_FINISH.value, 3)
|
|
self.assertEqual(MSEventKey.MOE_BEFORE_COMM.value, 4)
|
|
self.assertEqual(MSEventKey.MOE_AFTER_COMM.value, 5)
|
|
self.assertEqual(MSEventKey.MOE_SE_COMM_FINISH.value, 6)
|
|
self.assertEqual(MSEventKey.MOE_SE_COMP_FINISH.value, 7)
|
|
self.assertEqual(MSEventKey.MOE_GATE_FINISH.value, 8)
|
|
|
|
def test_ms_attention_metadata_split_config_default(self):
|
|
config = MSAttentionMetadataSplitConfig()
|
|
self.assertEqual(config.num_micro_batches, 2)
|
|
self.assertEqual(config.min_total_tokens_to_split, 256)
|
|
self.assertEqual(config.min_prefill_tokens_to_split, 64)
|
|
|
|
def test_ms_attention_metadata_split_config_custom(self):
|
|
config = MSAttentionMetadataSplitConfig(
|
|
num_micro_batches=4,
|
|
min_total_tokens_to_split=512,
|
|
min_prefill_tokens_to_split=128)
|
|
self.assertEqual(config.num_micro_batches, 4)
|
|
self.assertEqual(config.min_total_tokens_to_split, 512)
|
|
self.assertEqual(config.min_prefill_tokens_to_split, 128)
|