29 lines
912 B
Bash
Executable File
29 lines
912 B
Bash
Executable File
#!/bin/bash
|
|
set -euxo pipefail
|
|
|
|
# Install the dependency in CI.
|
|
|
|
# Use repo from environment variable, passed from GitHub Actions
|
|
FLASHINFER_REPO="${FLASHINFER_REPO:-https://flashinfer.ai/whl/cu124/torch2.4/flashinfer}"
|
|
|
|
SCRIPT_DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
|
|
bash "${SCRIPT_DIR}/killall_sglang.sh"
|
|
|
|
pip install --upgrade pip
|
|
pip install -e "python[all]" --find-links https://flashinfer.ai/whl/cu124/torch2.4/flashinfer/
|
|
|
|
# Force reinstall flashinfer and torch_memory_saver
|
|
pip install flashinfer==0.1.6 --find-links ${FLASHINFER_REPO} --force-reinstall --no-deps
|
|
pip install torch_memory_saver --force-reinstall
|
|
|
|
pip install transformers==4.45.2 sentence_transformers accelerate peft
|
|
|
|
# For compling eagle kernels
|
|
pip install cutex
|
|
|
|
# For compling xgrammar kernels
|
|
pip install cuda-python nvidia-cuda-nvrtc-cu12
|
|
|
|
# reinstall sgl-kernel
|
|
pip install sgl-kernel --force-reinstall --no-deps
|