Fix LoRA FlashInfer import bug on ROCm (#3312)

This commit is contained in:
Baizhou Zhang
2025-02-05 00:36:49 -08:00
committed by GitHub
parent 7ab84948d8
commit 76fa2d152c

View File

@@ -1,10 +1,13 @@
from typing import Tuple from typing import Tuple
import torch import torch
from flashinfer import SegmentGEMMWrapper
from sglang.srt.lora.backend import BaseLoraBackend from sglang.srt.lora.backend import BaseLoraBackend
from sglang.srt.lora.lora import LoraBatchInfo from sglang.srt.lora.lora import LoraBatchInfo
from sglang.srt.utils import is_flashinfer_available
if is_flashinfer_available():
from flashinfer import SegmentGEMMWrapper
class FlashInferLoraBackend(BaseLoraBackend): class FlashInferLoraBackend(BaseLoraBackend):