-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathrerank.py
More file actions
37 lines (32 loc) · 997 Bytes
/
rerank.py
File metadata and controls
37 lines (32 loc) · 997 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
from fastapi import APIRouter, Depends, HTTPException, Request

from backend.config import get_settings
from backend.middleware.auth import require_auth
from backend.services.llm_service import llm_proxy_rerank, llm_proxy_score
# Router on which this module's POST endpoints are registered.
router = APIRouter()
# Settings are fetched once at import time; the handlers below read
# ``otela_head_addr`` from this object to build the upstream endpoint URL.
settings = get_settings()
@router.post("/v1/rerank")
async def rerank(
    request: Request,
    token: str = Depends(require_auth),
):
    """Forward a rerank request to the upstream LLM service.

    The JSON request body is passed through unchanged as ``payload``; its
    ``"model"`` key (or ``"unknown"`` when absent) is passed as ``model``.

    Args:
        request: Incoming HTTP request whose body must be a JSON object.
        token: Value produced by the ``require_auth`` dependency; forwarded
            to the upstream call as ``api_key``.

    Returns:
        The ``data`` attribute of the result of ``llm_proxy_rerank``.

    Raises:
        HTTPException: 400 if the body is not valid JSON or is not a JSON
            object.
    """
    try:
        data = await request.json()
    except ValueError as exc:
        # json.JSONDecodeError and UnicodeDecodeError are both ValueError
        # subclasses; a malformed body is a client error, not a server fault.
        raise HTTPException(
            status_code=400, detail="Request body must be valid JSON"
        ) from exc

    # ``data.get`` below needs a mapping; a JSON list/string/number would
    # otherwise surface as an AttributeError (HTTP 500).
    if not isinstance(data, dict):
        raise HTTPException(
            status_code=400, detail="Request body must be a JSON object"
        )

    response = await llm_proxy_rerank(
        endpoint=settings.otela_head_addr + "/v1/service/llm/v1/",
        api_key=token,
        payload=data,
        model=data.get("model", "unknown"),
    )
    return response.data
@router.post("/v1/score")
async def score(
    request: Request,
    token: str = Depends(require_auth),
):
    """Forward a score request to the upstream LLM service.

    The JSON request body is passed through unchanged as ``payload``; its
    ``"model"`` key (or ``"unknown"`` when absent) is passed as ``model``.

    Args:
        request: Incoming HTTP request whose body must be a JSON object.
        token: Value produced by the ``require_auth`` dependency; forwarded
            to the upstream call as ``api_key``.

    Returns:
        The ``data`` attribute of the result of ``llm_proxy_score``.

    Raises:
        HTTPException: 400 if the body is not valid JSON or is not a JSON
            object.
    """
    try:
        data = await request.json()
    except ValueError as exc:
        # json.JSONDecodeError and UnicodeDecodeError are both ValueError
        # subclasses; a malformed body is a client error, not a server fault.
        raise HTTPException(
            status_code=400, detail="Request body must be valid JSON"
        ) from exc

    # ``data.get`` below needs a mapping; a JSON list/string/number would
    # otherwise surface as an AttributeError (HTTP 500).
    if not isinstance(data, dict):
        raise HTTPException(
            status_code=400, detail="Request body must be a JSON object"
        )

    response = await llm_proxy_score(
        endpoint=settings.otela_head_addr + "/v1/service/llm/v1/",
        api_key=token,
        payload=data,
        model=data.get("model", "unknown"),
    )
    return response.data