# Dockerfile: vllm/vllm-openai image extended with SGLang, Triton nightly, and FlashInfer.
# Start from the vllm/vllm-openai image; the pip steps below add SGLang,
# a nightly Triton wheel, and FlashInfer on top of it.
#
# The base tag is a build argument so a build can be pinned to a known release:
#   docker build --build-arg VLLM_TAG=<tag> .
# The default ("latest") is what the previously untagged reference resolved to.
ARG VLLM_TAG=latest
FROM vllm/vllm-openai:${VLLM_TAG}

# Every pip install below passes --no-cache-dir so pip's download/wheel cache
# is not stored in the image layers.

# Upgrade pip itself before installing the packages below.
RUN pip install --no-cache-dir --upgrade pip

# SGLang with its "all" extras.
RUN pip install --no-cache-dir "sglang[all]"

# Remove any installed Triton (stable or nightly), then install the nightly
# wheel from the Triton-Nightly package feed. --no-deps stops pip from
# installing triton-nightly's dependencies alongside it.
RUN pip uninstall -y triton triton-nightly \
    && pip install --no-cache-dir --no-deps \
        --index-url https://aiinfra.pkgs.visualstudio.com/PublicPackages/_packaging/Triton-Nightly/pypi/simple/ \
        triton-nightly

# FlashInfer from its own wheel index. The index path names cu121/torch2.3
# (presumably CUDA 12.1 / PyTorch 2.3) -- TODO confirm the selected base image
# tag ships matching CUDA and torch versions.
RUN pip install --no-cache-dir flashinfer -i https://flashinfer.ai/whl/cu121/torch2.3/