@@ -75,6 +75,8 @@ class DefaultModelSuppliers(str, Enum):
7575 MISTRAL = "mistral"
7676 GROQ = "groq"
7777 GEMINI = "gemini"
78+ ASTRAFLOW = "astraflow"
79+ ASTRAFLOW_CN = "astraflow_cn"
7880
7981
8082class LLMConfig (QuivrBaseConfig ):
@@ -275,6 +277,39 @@ class LLMModelConfig:
275277 tokenizer_hub = "Quivr/gemini-tokenizer" ,
276278 ),
277279 },
280+ # Astraflow (UCloud / 优刻得) — OpenAI-compatible aggregation platform
281+ # supporting 200+ models.
282+ # Global endpoint: https://api-us-ca.umodelverse.ai/v1 (env: ASTRAFLOW_API_KEY)
283+ # China endpoint: https://api.modelverse.cn/v1 (env: ASTRAFLOW_CN_API_KEY)
284+ DefaultModelSuppliers .ASTRAFLOW : {
285+ "gpt-4o" : LLMConfig (
286+ max_context_tokens = 128000 ,
287+ max_output_tokens = 16384 ,
288+ tokenizer_hub = "Quivr/gpt-4o" ,
289+ ),
290+ "gpt-4o-mini" : LLMConfig (
291+ max_context_tokens = 128000 ,
292+ max_output_tokens = 16384 ,
293+ tokenizer_hub = "Quivr/gpt-4o" ,
294+ ),
295+ "claude-3-5-sonnet" : LLMConfig (
296+ max_context_tokens = 200000 ,
297+ max_output_tokens = 8192 ,
298+ tokenizer_hub = "Quivr/claude-tokenizer" ,
299+ ),
300+ },
301+ DefaultModelSuppliers .ASTRAFLOW_CN : {
302+ "gpt-4o" : LLMConfig (
303+ max_context_tokens = 128000 ,
304+ max_output_tokens = 16384 ,
305+ tokenizer_hub = "Quivr/gpt-4o" ,
306+ ),
307+ "gpt-4o-mini" : LLMConfig (
308+ max_context_tokens = 128000 ,
309+ max_output_tokens = 16384 ,
310+ tokenizer_hub = "Quivr/gpt-4o" ,
311+ ),
312+ },
278313 }
279314
280315 @classmethod
0 commit comments