[Minor] move triton attention kernels into a separate folder (#1379)

2024-09-10 15:15:08 -07:00
parent fbb4754cb8
commit 3a6e8b6d78
13 changed files with 24 additions and 15 deletions
--- a/python/sglang/bench_latency.py
+++ b/python/sglang/bench_latency.py
@@ -57,9 +57,9 @@ import pandas as pd
 import torch
 import torch.distributed as dist

+from sglang.srt.configs.model_config import ModelConfig
 from sglang.srt.hf_transformers_utils import get_tokenizer
 from sglang.srt.managers.schedule_batch import Req, ScheduleBatch
-from sglang.srt.model_config import ModelConfig
 from sglang.srt.model_executor.model_runner import ModelRunner
 from sglang.srt.sampling.sampling_params import SamplingParams
 from sglang.srt.server_args import ServerArgs