add docs and container build improvements #43

This commit is contained in:
Benson Wong
2025-02-14 12:20:07 -08:00
parent 7a97c38828
commit f20f2c9b7a
4 changed files with 93 additions and 23 deletions

View File

@@ -0,0 +1,17 @@
# Example configuration: two model entries, each started through
# /app/llama-server and reached via a local proxy URL.

# NOTE(review): unit is not stated here (presumably seconds) - confirm
# against the consumer's documentation.
healthCheckTimeout: 300
logRequests: true

models:
  # Each key under `models` is a model name; its mapping carries the proxy
  # URL and the command line for that model.
  # NOTE(review): both entries use port 9999 in `proxy` and in `--port`;
  # presumably the two must match within an entry - confirm before changing.
  "qwen2.5":
    proxy: "http://127.0.0.1:9999"
    # Folded scalar: the lines below are joined with single spaces into one
    # command line (a single trailing newline is kept by `>`).
    cmd: >
      /app/llama-server
      -hf bartowski/Qwen2.5-0.5B-Instruct-GGUF:Q4_K_M
      --port 9999

  "smollm2":
    proxy: "http://127.0.0.1:9999"
    # Folded scalar: joined into a single command line, as above.
    cmd: >
      /app/llama-server
      -hf bartowski/SmolLM2-135M-Instruct-GGUF:Q4_K_M
      --port 9999