support environment variables

This commit is contained in:
Benson Wong
2024-10-04 11:55:27 -07:00
parent 43119e807f
commit d682589fb1
6 changed files with 40 additions and 7 deletions

View File

@@ -18,6 +18,9 @@ healthCheckTimeout: 60
# define models
models:
"llama":
env:
- "CUDA_VISIBLE_DEVICES=0"
cmd: "llama-server --port 8999 -m Llama-3.2-1B-Instruct-Q4_K_M.gguf"
# address where llama-server can be reached
@@ -31,7 +34,6 @@ models:
"qwen":
cmd: "llama-server --port 8999 -m path/to/Qwen2.5-1.5B-Instruct-Q4_K_M.gguf"
proxy: "http://127.0.0.1:8999"
aliases:
```
## Testing with curl