support v1/rerank endpoint

This commit is contained in:
Benson Wong
2024-12-17 21:22:25 -08:00
parent 9b4e3f307e
commit 9c8860471e
5 changed files with 42 additions and 4 deletions

View File

@@ -26,6 +26,8 @@ models:
aliases:
- gpt-3.5-turbo
# Embedding example with Nomic
# https://huggingface.co/nomic-ai/nomic-embed-text-v1.5-GGUF
"nomic":
proxy: http://127.0.0.1:9005
cmd: >
@@ -38,6 +40,17 @@ models:
-ngl 99
--embeddings
# Reranking example with bge-reranker
# https://huggingface.co/gpustack/bge-reranker-v2-m3-GGUF
"bge-reranker":
# Local address for this model's server; the port (9006) matches the
# --port value passed in cmd below.
# NOTE(review): presumably the upstream that requests are forwarded to - confirm.
proxy: http://127.0.0.1:9006
# Launch command for the model server. The folded scalar (>) joins the
# following lines with spaces into one command line, so do not put comments
# inside it - they would become part of the command.
# --reranking is presumably what enables the v1/rerank endpoint - confirm
# against the llama-server documentation.
cmd: >
models/llama-server-osx --port 9006
-m models/bge-reranker-v2-m3-Q4_K_M.gguf
--ctx-size 8192
--reranking
"simple":
# example of setting environment variables
env: