Remove unused imports from rocm mla kernel. (#3963)
This commit is contained in:
committed by
GitHub
parent
e3e0bc50a9
commit
77a6c9d229
@@ -20,19 +20,12 @@ It supports page size = 1.
|
|||||||
# https://github.com/ModelTC/lightllm/blob/96353e868a840db4d103138caf15ed9dbea8c186/lightllm/models/deepseek2/triton_kernel/gqa_flash_decoding_stage1.py
|
# https://github.com/ModelTC/lightllm/blob/96353e868a840db4d103138caf15ed9dbea8c186/lightllm/models/deepseek2/triton_kernel/gqa_flash_decoding_stage1.py
|
||||||
# https://github.com/ModelTC/lightllm/blob/96353e868a840db4d103138caf15ed9dbea8c186/lightllm/models/deepseek2/triton_kernel/gqa_flash_decoding_stage2.py
|
# https://github.com/ModelTC/lightllm/blob/96353e868a840db4d103138caf15ed9dbea8c186/lightllm/models/deepseek2/triton_kernel/gqa_flash_decoding_stage2.py
|
||||||
|
|
||||||
import argparse
|
|
||||||
import logging
|
|
||||||
import sys
|
|
||||||
|
|
||||||
import pytest
|
|
||||||
import torch
|
|
||||||
import triton
|
import triton
|
||||||
import triton.language as tl
|
import triton.language as tl
|
||||||
|
|
||||||
from sglang.srt.layers.attention.triton_ops.decode_attention import (
|
from sglang.srt.layers.attention.triton_ops.decode_attention import (
|
||||||
_decode_softmax_reducev_fwd,
|
_decode_softmax_reducev_fwd,
|
||||||
)
|
)
|
||||||
from sglang.srt.layers.rotary_embedding import DeepseekScalingRotaryEmbedding
|
|
||||||
|
|
||||||
|
|
||||||
def is_hip():
|
def is_hip():
|
||||||
|
|||||||
Reference in New Issue
Block a user