2024-12-31 11:04:01 +08:00
|
|
|
#!/bin/bash
|
2024-12-01 18:55:26 +08:00
|
|
|
# Install the dependencies in CI.
|
2025-03-28 10:34:10 -07:00
|
|
|
# Strict mode, spelled out with long option names:
#   errexit  - stop at the first command that exits non-zero
#   nounset  - treat expansion of an unset variable as an error
#   xtrace   - print each command before it is executed
#   pipefail - a pipeline fails if any stage in it fails
set -o errexit -o nounset -o xtrace -o pipefail
|
2024-10-30 02:49:08 -07:00
|
|
|
|
2025-03-28 10:34:10 -07:00
|
|
|
# The flashinfer wheel index may be supplied through the environment (it is
# passed in from GitHub Actions). When FLASHINFER_REPO is unset or empty, fall
# back to the default index below.
: "${FLASHINFER_REPO:=https://flashinfer.ai/whl/cu124/torch2.5/flashinfer-python}"
|
2024-12-01 18:55:26 +08:00
|
|
|
|
|
|
|
|
# Absolute path of the directory that contains this script.
# CDPATH is cleared for the `cd` so that a relative directory name cannot be
# resolved against a user-set CDPATH (which would also make `cd` print the
# directory and pollute the captured output). `--` keeps a path that begins
# with a dash from being parsed as an option.
SCRIPT_DIR="$(CDPATH='' cd -- "$(dirname -- "${BASH_SOURCE[0]}")" && pwd)"
|
|
|
|
|
# Run the helper script that sits next to this one before touching any
# installed packages (presumably it stops leftover sglang processes; confirm
# in killall_sglang.sh).
bash "${SCRIPT_DIR}"/killall_sglang.sh
|
2024-11-30 00:24:30 -08:00
|
|
|
|
2025-04-03 17:45:05 +08:00
|
|
|
# Clean up existing installations.
# Every step in this section is best-effort: a failure here must not stop the
# script before the fresh install below.

# Remove previously installed copies; a non-zero exit is deliberately ignored.
pip uninstall -y flashinfer flashinfer_python sgl-kernel sglang vllm || true

# `pip cache purge` exits non-zero when pip's cache is disabled (for example
# when PIP_NO_CACHE_DIR is set). Under `set -e` that would abort the whole
# script, so the failure is ignored like the uninstall above.
pip cache purge || true

# Delete the flashinfer directory under root's cache and any flashinfer /
# sgl_kernel entries left in dist-packages. The globs are intentionally
# unquoted so the shell expands them.
# NOTE: the dist-packages path is hard-coded for Python 3.10.
rm -rf /root/.cache/flashinfer
rm -rf /usr/local/lib/python3.10/dist-packages/flashinfer*
rm -rf /usr/local/lib/python3.10/dist-packages/sgl_kernel*
|
|
|
|
|
|
|
|
|
|
# Bring pip itself up to date before installing anything else.
pip install -U pip
|
2024-12-01 01:47:30 -08:00
|
|
|
|
2025-04-03 17:45:05 +08:00
|
|
|
# Install flashinfer and sgl-kernel, both pinned to exact versions.
# FLASHINFER_REPO is quoted so its value reaches pip as a single argument even
# if it contains whitespace or glob characters. --no-cache-dir tells pip not
# to use its cache for these two installs.
pip install flashinfer_python==0.2.3 --find-links "${FLASHINFER_REPO}" --no-cache-dir
pip install sgl-kernel==0.0.8 --no-cache-dir
|
2025-02-14 08:50:14 +08:00
|
|
|
|
2025-04-03 17:45:05 +08:00
|
|
|
# Install the main package in editable mode with its "all" extra.
# "python" is a relative path, so this must run from the directory that
# contains it (presumably the repository root; confirm in the CI workflow).
# FLASHINFER_REPO is quoted so it is always passed to pip as one argument.
pip install -e "python[all]" --find-links "${FLASHINFER_REPO}"
|
|
|
|
|
|
|
|
|
|
# Install additional dependencies
pip install torch_memory_saver

# Second batch, installed in a single pip invocation. transformers and
# accelerate are pinned to exact versions; the others are left unpinned.
pip install \
  transformers==4.51.0 \
  sentence_transformers \
  accelerate==1.4.0 \
  peft \
  pandas \
  datasets \
  timm \
  torchaudio
|
2024-12-01 01:47:30 -08:00
|
|
|
|
|
|
|
|
# For compiling xgrammar kernels
pip install \
  cuda-python \
  nvidia-cuda-nvrtc-cu12
|