Skip to content

Commit b90f0aa

Browse files
committed
feat(models): convert get capabilities of a provider with standard forward request method
1 parent e1aeacb commit b90f0aa

33 files changed

Lines changed: 1231 additions & 2647 deletions

api/clients/model/__init__.py

Lines changed: 0 additions & 8 deletions
This file was deleted.

api/clients/model/_albertmodelprovider.py

Lines changed: 0 additions & 68 deletions
This file was deleted.

api/clients/model/_mistralmodelprovider.py

Lines changed: 0 additions & 68 deletions
This file was deleted.

api/clients/model/_openaimodelprovider.py

Lines changed: 0 additions & 67 deletions
This file was deleted.

api/clients/model/_teimodelprovider.py

Lines changed: 0 additions & 63 deletions
This file was deleted.

api/clients/model/_vllmmodelprovider.py

Lines changed: 0 additions & 67 deletions
This file was deleted.

api/dependencies.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -2,6 +2,7 @@
22
from contextvars import ContextVar
33

44
from fastapi import Depends
5+
from redis.asyncio import Redis as AsyncRedis
56
from sqlalchemy.ext.asyncio import AsyncSession
67

78
from api.domain.key import KeyRepository
@@ -43,6 +44,14 @@ async def get_postgres_session() -> AsyncGenerator[AsyncSession]:
4344
raise
4445

4546

47+
async def get_redis_client() -> AsyncGenerator[AsyncRedis]:
    """Yield a Redis client backed by the shared connection pool.

    The client is created on ``global_context.redis_pool`` and is closed
    once the consumer is finished with it.

    Yields:
        An ``AsyncRedis`` client using ``global_context.redis_pool``.
    """
    client = AsyncRedis(connection_pool=global_context.redis_pool)
    try:
        yield client
    finally:
        # An exception raised by the consumer (or early generator close)
        # re-enters at the ``yield``; ``finally`` guarantees the client is
        # still closed in that case instead of being skipped.
        await client.aclose()
53+
54+
4655
# repositories
4756
def _router_repository(session: AsyncSession) -> PostgresRouterRepository:
4857
return PostgresRouterRepository(postgres_session=session, app_title=configuration.settings.app_title)

api/endpoints/chat.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -58,6 +58,7 @@ async def chat_completions(
5858
request_context: ContextVar[RequestContext] = Depends(get_request_context),
5959
) -> JSONResponse | StreamingResponseWithStatusCode:
6060
"""Creates a model response for the given chat conversation."""
61+
6162
model_provider = await model_registry.get_model_provider(
6263
model=body.model,
6364
endpoint=EndpointRoute.CHAT_COMPLETIONS,

0 commit comments

Comments
 (0)