# Dockerfile: installs a llama-swap release binary on top of a llama.cpp base image.
# Tag of the llama.cpp base image to build on. Declared before FROM so it can
# be referenced in the FROM line; override with `--build-arg BASE_TAG=...`.
ARG BASE_TAG=server-cuda
FROM ghcr.io/ggerganov/llama.cpp:${BASE_TAG}

# llama-swap release number to install. This ARG has to come after FROM: an
# ARG declared before FROM is only visible to FROM lines, not inside the stage.
ARG LS_VER=89

# The release tarball is unpacked here; ENTRYPOINT expects /app/llama-swap.
WORKDIR /app

# Download the selected llama-swap release tarball, unpack it into the working
# directory and delete the archive in the same layer so it never ends up in
# the image.
# curl flags: -f fails the build on an HTTP error instead of saving the error
# page as the tarball, -sS hides the progress meter but keeps error messages,
# -L follows redirects, -O keeps the remote file name.
# NOTE(review): the download is not checksum-verified — consider pinning a
# sha256 for the release asset.
RUN curl -fsSLO "https://github.com/mostlygeek/llama-swap/releases/download/v${LS_VER}/llama-swap_${LS_VER}_linux_amd64.tar.gz" && \
    tar -zxf "llama-swap_${LS_VER}_linux_amd64.tar.gz" && \
    rm "llama-swap_${LS_VER}_linux_amd64.tar.gz"

# Exec (JSON-array) form so llama-swap is started directly rather than through
# a shell. /config.yaml is not added by this Dockerfile — presumably it has to
# be mounted at run time (TODO confirm).
ENTRYPOINT ["/app/llama-swap", "--config", "/config.yaml"]