From ad2f32a5859e715391c7a12d092d5a72992b9340 Mon Sep 17 00:00:00 2001
From: i-peixingyu
Date: Tue, 19 May 2026 18:36:27 +0800
Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0=20K100-vLLM-Patched-v2.0/Doc?=
 =?UTF-8?q?kerfile?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
Note: this revision restores the patch's line structure, translates the
Dockerfile comments to English and ends the file with a newline. The blob
id on the "index" line below predates those edits.

 K100-vLLM-Patched-v2.0/Dockerfile | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 K100-vLLM-Patched-v2.0/Dockerfile

diff --git a/K100-vLLM-Patched-v2.0/Dockerfile b/K100-vLLM-Patched-v2.0/Dockerfile
new file mode 100644
index 0000000..9da2c4c
--- /dev/null
+++ b/K100-vLLM-Patched-v2.0/Dockerfile
@@ -0,0 +1,27 @@
+# K100 vLLM patched image (v2.0): layers build-time patches and runtime helper
+# scripts on top of the enginex-hygon vLLM 0.9.2 base image.
+FROM git.modelhub.org.cn:9443/enginex-hygon/vllm:0.9.2
+
+# Fix 1: library-level patch for transformers (executed once at build time).
+COPY patch.py /tmp/patch.py
+RUN python3 /tmp/patch.py
+
+# Fix 2: bypass the head_size validation in the Triton backend on the ROCm
+# platform (executed once at build time).
+COPY patch_triton.py /tmp/patch_triton.py
+RUN python3 /tmp/patch_triton.py
+
+# Fix 3: runtime tokenizer configuration repair scripts. They are only
+# installed here; presumably entrypoint.sh invokes them -- confirm there.
+COPY detect_tokenizer.py /opt/detect_tokenizer.py
+COPY fix_tokenizer.py /opt/fix_tokenizer.py
+
+# Fix 4: head_size detection used to switch the attention backend
+# automatically (installed only; not run during the build).
+COPY detect_head_size.py /opt/detect_head_size.py
+
+# Install the container entrypoint and make sure it is executable.
+COPY entrypoint.sh /opt/entrypoint.sh
+RUN chmod +x /opt/entrypoint.sh
+
+ENTRYPOINT ["/opt/entrypoint.sh"]