Files
sglang/python/pyproject.toml

129 lines
3.6 KiB
TOML
Raw Normal View History

[build-system]
2025-03-24 09:50:28 -07:00
requires = ["setuptools>=61.0", "wheel"]
build-backend = "setuptools.build_meta"
[project]
name = "sglang"
2025-03-26 19:58:00 -07:00
version = "0.4.4.post2"
description = "SGLang is yet another fast serving framework for large language models and vision language models."
readme = "README.md"
requires-python = ">=3.8"
2024-10-21 15:01:21 -07:00
license = { file = "LICENSE" }
classifiers = [
"Programming Language :: Python :: 3",
"License :: OSI Approved :: Apache Software License",
]
dependencies = ["aiohttp", "requests", "tqdm", "numpy", "IPython", "setproctitle"]
[project.optional-dependencies]
runtime_common = [
"datasets",
2025-02-24 03:50:58 -08:00
"decord",
"fastapi",
"hf_transfer",
"huggingface_hub",
"interegular",
"llguidance>=0.6.15",
2025-02-24 03:50:58 -08:00
"modelscope",
"ninja",
2025-02-24 03:50:58 -08:00
"orjson",
"packaging",
"pillow",
"prometheus-client>=0.20.0",
"psutil",
"pydantic",
"python-multipart",
"pyzmq>=25.1.2",
2025-03-25 11:08:40 +08:00
"soundfile==0.13.1",
2025-02-24 03:50:58 -08:00
"torchao>=0.7.0",
"transformers==4.50.0",
2025-02-24 03:50:58 -08:00
"uvicorn",
"uvloop",
"compressed-tensors",
2025-03-27 00:21:59 -07:00
"xgrammar==0.1.17",
]
2025-03-04 21:23:47 -08:00
srt = [
2025-02-24 03:50:58 -08:00
"sglang[runtime_common]",
2025-03-17 14:49:56 -07:00
"sgl-kernel==0.0.5.post3",
"flashinfer_python==0.2.3",
2025-02-24 03:50:58 -08:00
"torch==2.5.1",
"cuda-python",
"outlines>=0.0.44,<=0.1.11",
"partial_json_parser",
"einops",
]
# HIP (Heterogeneous-computing Interface for Portability) for AMD
# => base docker rocm/vllm-dev:20250114, not from public vllm whl
srt_hip = ["sglang[runtime_common]", "torch", "vllm==0.6.7.dev2", "outlines==0.1.11"]
2025-02-24 03:50:58 -08:00
# xpu is not enabled in public vllm and torch whl,
# need to follow https://docs.vllm.ai/en/latest/getting_started/xpu-installation.htmlinstall vllm
srt_xpu = ["sglang[runtime_common]", "outlines>=0.0.44,<=0.1.11"]
2025-02-24 03:50:58 -08:00
# For Intel Gaudi(device : hpu) follow the installation guide
# https://docs.vllm.ai/en/latest/getting_started/gaudi-installation.html
srt_hpu = ["sglang[runtime_common]", "outlines>=0.0.44,<=0.1.11"]
2025-01-17 13:22:53 +08:00
# CPU: currently, there are no pre-built vllm wheels for CPU.
# To install vllm for CPU, please follow the instruction here:
# https://docs.vllm.ai/en/latest/getting_started/installation/cpu/index.html
2025-02-24 03:50:58 -08:00
srt_cpu = ["sglang[runtime_common]", "outlines>=0.0.44,<=0.1.11", "torch"]
openai = ["openai>=1.0", "tiktoken"]
anthropic = ["anthropic>=0.20.0"]
2024-06-08 03:24:28 +08:00
litellm = ["litellm>=1.0.0"]
torch_memory_saver = ["torch_memory_saver>=0.0.3"]
2024-10-21 15:01:21 -07:00
test = [
"jsonlines",
"matplotlib",
"pandas",
"sentence_transformers",
"accelerate",
"peft",
]
2024-06-08 03:24:28 +08:00
all = ["sglang[srt]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_hip = ["sglang[srt_hip]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_xpu = ["sglang[srt_xpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
all_hpu = ["sglang[srt_hpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
2025-01-17 13:22:53 +08:00
all_cpu = ["sglang[srt_cpu]", "sglang[openai]", "sglang[anthropic]", "sglang[litellm]"]
2024-12-09 06:30:35 -08:00
dev = ["sglang[all]", "sglang[test]"]
dev_hip = ["sglang[all_hip]", "sglang[test]"]
dev_xpu = ["sglang[all_xpu]", "sglang[test]"]
dev_hpu = ["sglang[all_hpu]", "sglang[test]"]
2025-01-17 13:22:53 +08:00
dev_cpu = ["sglang[all_cpu]", "sglang[test]"]
2024-01-15 01:15:53 -08:00
[project.urls]
"Homepage" = "https://github.com/sgl-project/sglang"
"Bug Tracker" = "https://github.com/sgl-project/sglang/issues"
2024-12-27 00:16:48 +08:00
[tool.setuptools.package-data]
"sglang" = [
"srt/layers/moe/fused_moe_triton/configs/*.json",
"srt/layers/quantization/configs/*.json",
]
2024-12-27 00:16:48 +08:00
[tool.setuptools.packages.find]
2024-10-21 15:01:21 -07:00
exclude = [
"assets*",
"benchmark*",
"docs*",
"dist*",
"playground*",
"scripts*",
"tests*",
]
[tool.wheel]
2024-10-21 15:01:21 -07:00
exclude = [
"assets*",
"benchmark*",
"docs*",
"dist*",
"playground*",
"scripts*",
"tests*",
]