-
Notifications
You must be signed in to change notification settings - Fork 5
/
Taskfile.reranker.yml
37 lines (32 loc) · 1017 Bytes
/
Taskfile.reranker.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
# https://taskfile.dev
#
# Tasks for running a local reranking server with llama-server and the
# bge-reranker-v2-m3 model (Q4_K_M GGUF build), plus a smoke-test request.

version: "3"

tasks:
  server:
    desc: Start llama-server in reranking mode on port 9082
    # The model file must exist before the server can load it.
    deps: [download-model]
    cmds:
      # Folded scalar: the lines below are joined into a single command line.
      - >-
        llama-server
        --port 9082
        --log-disable
        --reranking
        --model ./models/bge-reranker-v2-m3.gguf

  download-model:
    desc: Download the bge-reranker-v2-m3 GGUF model into ./models
    cmds:
      - mkdir -p models
      # --fail makes curl exit non-zero on HTTP errors instead of saving the
      # error page as the model; --show-error keeps failures visible despite
      # --silent. The download goes to a ".part" file first so an interrupted
      # or failed transfer never leaves a file that satisfies `status` below.
      # The URL is quoted because it contains "?", a shell glob character.
      - >-
        curl --fail --silent --show-error --location
        --output models/bge-reranker-v2-m3.gguf.part
        'https://huggingface.co/gpustack/bge-reranker-v2-m3-GGUF/resolve/main/bge-reranker-v2-m3-Q4_K_M.gguf?download=true'
      - mv models/bge-reranker-v2-m3.gguf.part models/bge-reranker-v2-m3.gguf
    # Skip the download when the model file is already present.
    status:
      - test -f models/bge-reranker-v2-m3.gguf

  test:
    desc: Send a sample rerank request to the server on localhost:9082
    cmds:
      # Literal scalar: newlines and the trailing backslashes are passed to
      # the shell as written. Expects the `server` task to be running already.
      - |
        curl http://localhost:9082/v1/rerank \
          -H "Content-Type: application/json" \
          -d '{
            "model": "bge-reranker-v2-m3",
            "query": "What is panda?",
            "top_n": 3,
            "documents": [
              "hi",
              "it is a bear",
              "The giant panda (Ailuropoda melanoleuca), sometimes called a panda bear or simply panda, is a bear species endemic to China."
            ]
          }'