# Base image: enginex-metax/vllm at tag 0.9.1, pulled from the
# git.modelhub.org.cn:9443 registry.
FROM git.modelhub.org.cn:9443/enginex-metax/vllm:0.9.1

# Every relative path below, and the container's starting directory,
# resolves to /workspace.
WORKDIR /workspace

# Install the Python dependencies before the application code is copied, so
# this layer is reused from cache when only server.py changes.
# --no-cache-dir keeps pip's download cache out of the image layer.
COPY requirements.txt ./
RUN pip install --no-cache-dir --requirement requirements.txt

# Place the application module in the working directory (/workspace).
COPY server.py ./

# Record the port the server is started on; EXPOSE is metadata only and does
# not publish the port by itself.
EXPOSE 8000

# Start uvicorn with the `app` object from the `server` module, bound to all
# interfaces on port 8000. Exec (JSON-array) form: no shell wraps the process.
CMD ["uvicorn", "server:app", "--host", "0.0.0.0", "--port", "8000"]
