first container code (#52)

This commit is contained in:
Benson Wong
2025-02-14 10:39:25 -08:00
committed by GitHub
parent 13d4552edc
commit ab93460a8b
3 changed files with 75 additions and 0 deletions

View File

@@ -0,0 +1,15 @@
# Builds on the llama.cpp image at the tag given by BASE_TAG and adds the
# llama-swap binary on top. Override with --build-arg BASE_TAG=<tag>.
ARG BASE_TAG=server-cuda
FROM ghcr.io/ggerganov/llama.cpp:${BASE_TAG}

# llama-swap release version to download. An ARG declared before FROM is only
# visible to FROM itself, so this one has to be declared inside the stage.
ARG LS_VER=89
WORKDIR /app

# Download the release tarball, unpack it into /app, and delete the archive in
# the same layer so it does not persist in the image.
# --fail makes curl exit non-zero on an HTTP error (e.g. an LS_VER that has no
# release) instead of saving the error page and letting tar fail on it later.
RUN \
    curl --fail --location --remote-name \
        https://github.com/mostlygeek/llama-swap/releases/download/v"${LS_VER}"/llama-swap_"${LS_VER}"_linux_amd64.tar.gz && \
    tar -zxf llama-swap_"${LS_VER}"_linux_amd64.tar.gz && \
    rm llama-swap_"${LS_VER}"_linux_amd64.tar.gz

# Start llama-swap with the configuration at /config.yaml.
# NOTE(review): nothing in the visible lines adds /config.yaml to the image,
# so it presumably has to be mounted at run time - confirm.
ENTRYPOINT [ "/app/llama-swap", "--config", "/config.yaml" ]