# Build backend used to produce the sdist and wheel.
[build-system]
requires = ["setuptools>=61.0", "wheel"]
build-backend = "setuptools.build_meta"

# Core package metadata.
[project]
name = "sglang"
version = "0.4.3"
description = "SGLang is yet another fast serving framework for large language models and vision language models."
readme = "README.md"
requires-python = ">=3.8"
license = { file = "LICENSE" }
classifiers = [
    "Programming Language :: Python :: 3",
    "License :: OSI Approved :: Apache Software License",
]
# Installed with the base package; the extras declared in
# [project.optional-dependencies] layer additional packages on top.
dependencies = ["requests", "tqdm", "numpy", "IPython", "setproctitle"]

[project.optional-dependencies]
# Packages shared by every srt* runtime extra in this table
# (each of them lists "sglang[runtime_common]").
runtime_common = [
    "aiohttp",
    "decord",
    "fastapi",
    "hf_transfer",
    "huggingface_hub",
    "interegular",
    "modelscope",
    "orjson",
    "packaging",
    "pillow",
    "prometheus-client>=0.20.0",
    "psutil",
    "pydantic",
    "python-multipart",
    "pyzmq>=25.1.2",
    "torchao>=0.7.0",
    "uvicorn",
    "uvloop",
    "xgrammar==0.1.10",
    "ninja",
]
# Runtime extra without a hardware suffix: the shared runtime packages
# plus cuda-python, sgl-kernel, torch, vllm, flashinfer and outlines.
srt = [
    "sglang[runtime_common]",
    "cuda-python",
    "sgl-kernel>=0.0.3.post6",
    "torch",
    "vllm>=0.6.4.post1,<=0.7.2",
    "flashinfer_python>=0.2.1.post1",
    "outlines>=0.0.44,<=0.1.11",
]

# HIP (Heterogeneous-computing Interface for Portability) for AMD.
# Based on the docker image rocm/vllm-dev:20241022; vllm is taken from
# that image, not from the public vllm wheel.
srt_hip = [
    "sglang[runtime_common]",
    "torch",
    "vllm==0.6.7.dev2",
    "outlines==0.1.11",
    "sgl-kernel>=0.0.3.post1",
]
# XPU is not enabled in the public vllm and torch wheels; follow
# https://docs.vllm.ai/en/latest/getting_started/xpu-installation.html
# to install vllm.
srt_xpu = ["sglang[runtime_common]", "outlines>=0.0.44,<0.1.0"]
# For Intel Gaudi (device: hpu), follow the installation guide:
# https://docs.vllm.ai/en/latest/getting_started/gaudi-installation.html
srt_hpu = ["sglang[runtime_common]", "outlines>=0.0.44,<0.1.0"]
# CPU: currently, there are no pre-built vllm wheels for CPU.
# To install vllm for CPU, please follow the instructions here:
# https://docs.vllm.ai/en/latest/getting_started/installation/cpu/index.html
srt_cpu = ["sglang[runtime_common]", "torch", "outlines>=0.0.44,<0.1.0"]

# Single-purpose extras, each pulling in one third-party integration.
openai = ["openai>=1.0", "tiktoken"]
anthropic = ["anthropic>=0.20.0"]
litellm = ["litellm>=1.0.0"]
torch_memory_saver = ["torch_memory_saver"]
# Extra packages pulled in by the dev* extras via "sglang[test]".
test = [
    "jsonlines",
    "matplotlib",
    "pandas",
    "sentence_transformers",
    "accelerate",
    "peft",
]
# Aggregate extras: one srt* runtime variant plus the openai,
# anthropic and litellm extras.
all = ["sglang[srt]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_hip = ["sglang[srt_hip]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_xpu = ["sglang[srt_xpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_hpu = ["sglang[srt_hpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_cpu = ["sglang[srt_cpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]

# Development extras: the matching all* aggregate plus the test extra.
dev = ["sglang[all]", "sglang[test]"]
dev_hip = ["sglang[all_hip]", "sglang[test]"]
dev_xpu = ["sglang[all_xpu]", "sglang[test]"]
dev_hpu = ["sglang[all_hpu]", "sglang[test]"]
dev_cpu = ["sglang[all_cpu]", "sglang[test]"]

# Project links; each key is the label shown for the URL.
[project.urls]
Homepage = "https://github.com/sgl-project/sglang"
"Bug Tracker" = "https://github.com/sgl-project/sglang/issues"

# Non-Python files shipped inside the "sglang" package: JSON config
# files matched by these globs (paths are relative to the package).
[tool.setuptools.package-data]
sglang = [
    "srt/layers/moe/fused_moe_triton/configs/*.json",
    "srt/layers/quantization/configs/*.json",
]

# Package discovery: skip directories matching these patterns so they
# are not picked up as importable packages.
[tool.setuptools.packages.find]
exclude = [
    "assets*",
    "benchmark*",
    "docs*",
    "dist*",
    "playground*",
    "scripts*",
    "tests*",
]

# Same exclusion patterns as [tool.setuptools.packages.find].
# NOTE(review): it is unclear which tool, if any, reads a [tool.wheel]
# table; confirm it has an effect before relying on it.
[tool.wheel]
exclude = [
    "assets*",
    "benchmark*",
    "docs*",
    "dist*",
    "playground*",
    "scripts*",
    "tests*",
]