Add metrics logging for chat completion requests (#195)

- Add token and performance metrics for v1/chat/completions
- Add Activity Page in UI
- Add /api/metrics endpoint

Contributed by @g2mt
2025-07-21 22:19:55 -07:00
parent 307e619521
commit 87dce5f8f6
15 changed files with 576 additions and 31 deletions
--- a/config.example.yaml
+++ b/config.example.yaml
@@ -15,6 +15,12 @@ healthCheckTimeout: 500
 # - Valid log levels: debug, info, warn, error
 logLevel: info

+# metricsMaxInMemory: maximum number of metrics entries to keep in memory
+# - optional, default: 1000
+# - once this limit is reached, older metrics are discarded
+# - lower this value to limit memory usage when handling large volumes of requests
+metricsMaxInMemory: 1000
+
 # startPort: sets the starting port number for the automatic ${PORT} macro.
 # - optional, default: 5800
 # - the ${PORT} macro can be used in model.cmd and model.proxy settings
@@ -200,4 +206,4 @@ groups:
    members:
      - "forever-modelA"
      - "forever-modelB"
-      - "forever-modelc"
+      - "forever-modelc"