DP Enhancement (#8280)
This commit is contained in:
@@ -12,14 +12,16 @@
|
||||
# limitations under the License.
|
||||
# ==============================================================================
|
||||
"""Radix attention."""
|
||||
from __future__ import annotations
|
||||
|
||||
from enum import Enum
|
||||
from typing import Optional
|
||||
from typing import TYPE_CHECKING, Optional
|
||||
|
||||
from torch import nn
|
||||
|
||||
from sglang.srt.layers.quantization.base_config import QuantizationConfig
|
||||
from sglang.srt.model_executor.forward_batch_info import ForwardBatch
|
||||
if TYPE_CHECKING:
|
||||
from sglang.srt.layers.quantization.base_config import QuantizationConfig
|
||||
from sglang.srt.model_executor.forward_batch_info import ForwardBatch
|
||||
|
||||
|
||||
class AttentionType(Enum):
|
||||
|
||||
Reference in New Issue
Block a user