Files
enginex-bi_series-vllm/Dockerfile

16 lines
626 B
Docker
Raw Permalink Normal View History

2025-10-24 15:45:06 +08:00
# Base image, pulled from the git.modelhub.org.cn:9443 registry and pinned to
# tag v1.2.3 (tag only; no digest is specified here).
# NOTE(review): judging by the image name this is presumably an Iluvatar BI100
# inference image on Ubuntu 20.04 / Python 3.10 — confirm against the registry.
FROM git.modelhub.org.cn:9443/enginex-iluvatar/bi100-3.2.3-x86-ubuntu20.04-py3.10-poc-llm-infer:v1.2.3
2025-08-05 19:02:46 +08:00
# Install triton pinned to 2.1.0 with pip; --no-cache-dir keeps pip's download
# cache out of the image layer.
RUN pip install --no-cache-dir triton==2.1.0
# Copy the triton tree and its 2.1.0+corex.4.1.2 dist-info from the build
# context (pkgs/) into the corex dist-packages directory.
# NOTE(review): presumably this vendor build is meant to take precedence over
# the pip-installed package above — confirm which site-packages directory pip
# writes to in the base image and which one wins on sys.path.
COPY pkgs/triton /usr/local/corex/lib64/python3/dist-packages/triton
COPY pkgs/triton-2.1.0+corex.4.1.2.dist-info /usr/local/corex/lib64/python3/dist-packages/triton-2.1.0+corex.4.1.2.dist-info
2025-10-24 15:45:06 +08:00
# Place two files from the build context at fixed paths inside the vllm package
# under the corex dist-packages directory; COPY replaces any file already
# present at the destination path.
# NOTE(review): presumably these override modules shipped with the base
# image's vllm — confirm they match the vllm version installed there.
COPY paged_attn.py /usr/local/corex/lib64/python3/dist-packages/vllm/attention/ops/paged_attn.py
COPY __init__.py /usr/local/corex/lib64/python3/dist-packages/vllm/triton_utils/__init__.py
2025-08-05 19:02:46 +08:00
# Use /workspace as the working directory. WORKDIR creates the directory when
# it does not exist, so no separate `RUN mkdir` is needed (a plain `mkdir`
# without -p would also fail the build if the base image already ships
# /workspace, and it adds an extra layer).
WORKDIR /workspace
# Copy launch_service from the build context into the working directory.
COPY ./launch_service /workspace/launch_service