Organize Attention Backends (#1547)

This commit is contained in:
Liangsheng Yin
2024-09-30 15:54:18 -07:00
committed by GitHub
parent 0f4fb19bc8
commit 99ec439da4
12 changed files with 229 additions and 205 deletions

View File

@@ -4,7 +4,9 @@ import unittest
import numpy as np
import torch
-from sglang.srt.layers.flashinfer_utils import create_flashinfer_kv_indices_triton
+from sglang.srt.layers.attention.flashinfer_utils import (
+    create_flashinfer_kv_indices_triton,
+)
class TestCreateKvIndices(unittest.TestCase):