Skip to content

Commit e09510c

Browse files
committed
feat: Enable groq support for PTB
This commit enables support for standard model usage on Groq (i.e., chat completions and models with industry-standard token-usage pricing rates). Future work will add PTB support for the following model types on Groq: (1) STT; (2) tool use (GPT-OSS and Groq compound models only).
1 parent 80ebad6 commit e09510c

File tree

32 files changed

+1596
-41
lines changed

32 files changed

+1596
-41
lines changed

bifrost/lib/clients/jawnTypes/public.ts

Lines changed: 10 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -414,6 +414,10 @@ export interface paths {
414414
post: operations["GetCostsOverTime"];
415415
};
416416
"/v1/public/model-registry/models": {
417+
/**
418+
* Returns a comprehensive list of all AI models with their configurations, pricing, and capabilities
419+
* @description Get all available models from the registry
420+
*/
417421
get: operations["GetModelRegistry"];
418422
};
419423
"/v1/public/compare/models": {
@@ -2756,7 +2760,7 @@ Json: JsonObject;
27562760
/** @enum {string} */
27572761
ModelProviderName: "anthropic" | "openai" | "bedrock" | "vertex" | "azure" | "perplexity" | "groq" | "deepseek" | "cohere" | "xai" | "google-ai-studio";
27582762
/** @enum {string} */
2759-
AuthorName: "anthropic" | "openai" | "perplexity" | "deepseek" | "cohere" | "xai" | "google" | "meta-llama" | "mistralai" | "amazon" | "microsoft" | "nvidia" | "qwen" | "moonshotai" | "passthrough";
2763+
AuthorName: "anthropic" | "openai" | "perplexity" | "deepseek" | "cohere" | "xai" | "google" | "meta-llama" | "mistralai" | "amazon" | "microsoft" | "nvidia" | "qwen" | "moonshotai" | "alibaba" | "passthrough";
27602764
/** @enum {string} */
27612765
StandardParameter: "max_tokens" | "temperature" | "top_p" | "top_k" | "stop" | "stream" | "frequency_penalty" | "presence_penalty" | "repetition_penalty" | "seed" | "tools" | "tool_choice" | "functions" | "function_call" | "reasoning" | "include_reasoning" | "thinking" | "response_format" | "json_mode" | "truncate" | "min_p" | "logit_bias" | "logprobs" | "top_logprobs" | "structured_outputs" | "verbosity";
27622766
ModelPricing: {
@@ -6348,9 +6352,13 @@ export interface operations {
63486352
};
63496353
};
63506354
};
6355+
/**
6356+
* Returns a comprehensive list of all AI models with their configurations, pricing, and capabilities
6357+
* @description Get all available models from the registry
6358+
*/
63516359
GetModelRegistry: {
63526360
responses: {
6353-
/** @description Ok */
6361+
/** @description Complete model registry with models and filter options */
63546362
200: {
63556363
content: {
63566364
"application/json": components["schemas"]["Result_ModelRegistryResponse.string_"];

docs/swagger.json

Lines changed: 79 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -7578,6 +7578,7 @@
75787578
"nvidia",
75797579
"qwen",
75807580
"moonshotai",
7581+
"alibaba",
75817582
"passthrough"
75827583
]
75837584
},
@@ -18221,16 +18222,93 @@
1822118222
"operationId": "GetModelRegistry",
1822218223
"responses": {
1822318224
"200": {
18224-
"description": "Ok",
18225+
"description": "Complete model registry with models and filter options",
1822518226
"content": {
1822618227
"application/json": {
1822718228
"schema": {
1822818229
"$ref": "#/components/schemas/Result_ModelRegistryResponse.string_"
18230+
},
18231+
"examples": {
18232+
"Example 1": {
18233+
"value": {
18234+
"models": [
18235+
{
18236+
"id": "claude-opus-4-1",
18237+
"name": "Anthropic: Claude Opus 4.1",
18238+
"author": "anthropic",
18239+
"contextLength": 200000,
18240+
"endpoints": [
18241+
{
18242+
"provider": "anthropic",
18243+
"providerSlug": "anthropic",
18244+
"supportsPtb": true,
18245+
"pricing": {
18246+
"prompt": 15,
18247+
"completion": 75,
18248+
"cacheRead": 1.5,
18249+
"cacheWrite": 18.75
18250+
}
18251+
}
18252+
],
18253+
"maxOutput": 32000,
18254+
"trainingDate": "2025-08-05",
18255+
"description": "Most capable Claude model with extended context",
18256+
"inputModalities": [
18257+
null
18258+
],
18259+
"outputModalities": [
18260+
null
18261+
],
18262+
"supportedParameters": [
18263+
null,
18264+
null,
18265+
null,
18266+
null,
18267+
null,
18268+
null,
18269+
null
18270+
]
18271+
}
18272+
],
18273+
"total": 150,
18274+
"filters": {
18275+
"providers": [
18276+
{
18277+
"name": "anthropic",
18278+
"displayName": "Anthropic"
18279+
},
18280+
{
18281+
"name": "openai",
18282+
"displayName": "OpenAI"
18283+
},
18284+
{
18285+
"name": "google",
18286+
"displayName": "Google"
18287+
}
18288+
],
18289+
"authors": [
18290+
"anthropic",
18291+
"openai",
18292+
"google",
18293+
"meta"
18294+
],
18295+
"capabilities": [
18296+
"audio",
18297+
"image",
18298+
"thinking",
18299+
"caching",
18300+
"reasoning"
18301+
]
18302+
}
18303+
}
18304+
}
1822918305
}
1823018306
}
1823118307
}
1823218308
}
1823318309
},
18310+
"description": "Get all available models from the registry",
18311+
"summary": "Returns a comprehensive list of all AI models with their configurations, pricing, and capabilities",
1823418312
"tags": [
1823518313
"Model Registry"
1823618314
],

0 commit comments

Comments
 (0)