Add a two-stage MUSA Dockerfile for llama-cli and record the synced upstream tag in the README.
NOTE(review): the Dockerfile post-image blob id on the index line predates the
edits in this patch; regenerate the patch with git if an exact id is required.

diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..2a450b3
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,16 @@
+# Build stage: configure and compile the project with the MUSA backend enabled.
+FROM mthreads/musa:rc4.3.0-devel-ubuntu22.04-amd64 AS builder
+# Value passed to -DMUSA_ARCHITECTURES; override with --build-arg MUSA_ARCH=<n>.
+ARG MUSA_ARCH=22
+COPY . /src
+WORKDIR /src
+RUN cmake -B build \
+    -DGGML_MUSA=ON -DLLAMA_OPENSSL=OFF -DGGML_CUDA_NO_VMM=ON -DMUSA_ARCHITECTURES=${MUSA_ARCH:-22} \
+    -DCMAKE_BUILD_TYPE=Release && \
+    cmake --build build -j "$(nproc)"
+
+# Runtime stage: copy only the build output directory onto the runtime image.
+FROM mthreads/musa:rc4.3.0-runtime-ubuntu22.04-amd64
+COPY --from=builder /src/build/bin /app
+WORKDIR /app
+ENTRYPOINT [ "/app/llama-cli" ]
diff --git a/README.md b/README.md
index d1e65c7..44540f4 100644
--- a/README.md
+++ b/README.md
@@ -1,6 +1,6 @@
 # llama.cpp
 
-> Sync from upstream `llama.cpp` repository
+> Sync from upstream `llama.cpp` repository tag `b7516`
 
 ![llama](https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png)
 