- Add token and performance metrics for v1/chat/completions - Add Activity Page in UI - Add /api/metrics endpoint Contributed by @g2mt
18 lines
386 B
YAML
18 lines
386 B
YAML
# Global settings.
# NOTE(review): the unit of healthCheckTimeout is not visible in this file;
# presumably seconds -- confirm against the consumer's documentation.
healthCheckTimeout: 300
logRequests: true
# NOTE(review): presumably an upper bound on metrics entries kept in memory;
# confirm against the consumer's documentation.
metricsMaxInMemory: 1000

# Model definitions, keyed by model name. Each entry pairs the upstream URL
# (`proxy`) with the command (`cmd`) that launches the server for that model.
# Both entries use port 9999 for `proxy` and for `--port`.
models:
  "qwen2.5":
    proxy: "http://127.0.0.1:9999"
    # Folded scalar (`>`): the indented lines below are joined with single
    # spaces into one command line. Keep them indented deeper than `cmd`.
    cmd: >
      /app/llama-server
      -hf bartowski/Qwen2.5-0.5B-Instruct-GGUF:Q4_K_M
      --port 9999

  "smollm2":
    proxy: "http://127.0.0.1:9999"
    # Folded scalar (`>`): joined into one command line, as above.
    cmd: >
      /app/llama-server
      -hf bartowski/SmolLM2-135M-Instruct-GGUF:Q4_K_M
      --port 9999