[UT]: refactoring 310p ops ut (#6296)

### What this PR does / why we need it?
Refactor the swiglu and rms_norm unit test cases for 310P and 910B.
Use the attention_v1 `get_kv_cache_shape` and metadata-build paths on all
platforms.
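
The refactored test below pins down the expected cache layout: `AscendAttentionBackend.get_kv_cache_shape(10, 20, 30, 40)` must return `(2, 10, 20, 30, 40)`. As an illustration only (the real implementation lives in `vllm_ascend/attention/attention_v1.py` and is not reproduced here), a platform-agnostic shape helper consistent with that assertion could look like the sketch below; the class and parameter names are assumptions:

```python
# Sketch only: mirrors the (2, num_blocks, block_size, num_kv_heads, head_size)
# layout asserted in the unit test; not the actual vllm_ascend implementation.
from typing import Tuple


class KVCacheShapeSketch:

    @staticmethod
    def get_kv_cache_shape(num_blocks: int, block_size: int,
                           num_kv_heads: int, head_size: int) -> Tuple[int, ...]:
        # The leading 2 holds the K cache and the V cache side by side.
        return (2, num_blocks, block_size, num_kv_heads, head_size)


# Matches the assertion in the refactored unit test.
assert KVCacheShapeSketch.get_kv_cache_shape(10, 20, 30, 40) == (2, 10, 20, 30, 40)
```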

### Does this PR introduce _any_ user-facing change?
No.
### How was this patch tested?
Covered by CI unit tests.
- vLLM version: v0.14.1
- vLLM main: dc917cceb8

---------

Signed-off-by: pu-zhe <zpuaa@outlook.com>
Author: pu-zhe
Date: 2026-01-27 16:31:51 +08:00
Committed by: GitHub
Commit: 21b6779a33 (parent 57fd6e4bd9)
3 changed files with 80 additions and 62 deletions


@@ -41,9 +41,7 @@ class TestAscendAttentionBackend(TestBase):
         self.assertEqual(AscendAttentionBackend.get_builder_cls(),
                          AscendAttentionMetadataBuilder)
-    @patch('vllm_ascend.utils.get_ascend_device_type',
-           return_value=AscendDeviceType.A3)
-    def test_get_kv_cache_shape_not_310p(self, mock_soc_version):
+    def test_get_kv_cache_shape_not(self):
         result = AscendAttentionBackend.get_kv_cache_shape(10, 20, 30, 40)
         self.assertEqual(result, (2, 10, 20, 30, 40))
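
For context on the mechanics being removed: when `unittest.mock.patch` is applied as a decorator, it substitutes the target for the duration of the test and injects the resulting mock as an extra positional argument, which is why `mock_soc_version` disappears from the signature along with the device-type patch. A minimal, self-contained sketch of that pattern (all names below are illustrative, not taken from vllm_ascend):

```python
import unittest
from unittest.mock import patch


# Stand-in for a module-level helper such as a device-type query;
# purely illustrative, not the real vllm_ascend function.
def get_device_type() -> str:
    return "A3"


class TestPatchInjection(unittest.TestCase):

    # Used as a decorator, patch() replaces the target for the duration of
    # the test and passes the created mock as an extra argument.
    @patch(f"{__name__}.get_device_type", return_value="310P")
    def test_device_specific_branch(self, mock_device_type):
        self.assertEqual(get_device_type(), "310P")
        mock_device_type.assert_called_once()

    # Without the decorator, the test exercises the unpatched behaviour and
    # takes no mock argument, mirroring the refactored tests above.
    def test_default_branch(self):
        self.assertEqual(get_device_type(), "A3")


if __name__ == "__main__":
    unittest.main()
```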
@@ -92,9 +90,7 @@ class TestAscendAttentionMetadataBuilder(TestBase):
         self.assertFalse(result)
     @patch('vllm_ascend.attention.attention_v1.AscendMetadata')
-    @patch('vllm_ascend.utils.get_ascend_device_type',
-           return_value=AscendDeviceType.A3)
-    def test_build_non_310p(self, mock_soc_version, mock_ascend_metadata):
+    def test_build(self, mock_ascend_metadata):
         common_attn_metadata = AscendCommonAttentionMetadata(
             query_start_loc=torch.tensor([0, 2, 5, 9]),
             query_start_loc_cpu=torch.tensor([0, 2, 5, 9]),