-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathresponses.py
More file actions
33 lines (28 loc) · 954 Bytes
/
responses.py
File metadata and controls
33 lines (28 loc) · 954 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
from fastapi import APIRouter, Request, Depends
from fastapi.responses import StreamingResponse
from backend.middleware.auth import require_auth
from backend.services.llm_service import llm_proxy_responses, response_generator_raw
from backend.config import get_settings
router = APIRouter()
settings = get_settings()
@router.post("/v1/responses")
async def create_response(
request: Request,
token: str = Depends(require_auth),
):
data = await request.json()
stream = data.get("stream", False)
response = await llm_proxy_responses(
endpoint=settings.otela_head_addr + "/v1/service/llm/v1/",
api_key=token,
payload=data,
stream=stream,
model=data.get("model", "unknown"),
)
if stream:
return StreamingResponse(
response_generator_raw(response),
media_type="text/event-stream",
headers=response.headers,
)
return response.data