|
408 | 408 | }, |
409 | 409 | "responses": { |
410 | 410 | "200": { |
411 | | - "description": "Generated Text", |
| 411 | + "description": "Generated Chat Completion", |
412 | 412 | "content": { |
413 | 413 | "application/json": { |
| 414 | + "schema": { |
| 415 | + "$ref": "#/components/schemas/ChatCompletion" |
| 416 | + } |
| 417 | + }, |
| 418 | + "text/event-stream": { |
414 | 419 | "schema": { |
415 | 420 | "$ref": "#/components/schemas/ChatCompletionChunk" |
416 | 421 | } |
|
492 | 497 | }, |
493 | 498 | "responses": { |
494 | 499 | "200": { |
495 | | - "description": "Generated Text", |
| 500 | + "description": "Generated Completion", |
496 | 501 | "content": { |
497 | 502 | "application/json": { |
498 | 503 | "schema": { |
499 | | - "$ref": "#/components/schemas/ChatCompletionChunk" |
| 504 | + "$ref": "#/components/schemas/Completion" |
| 505 | + } |
| 506 | + }, |
| 507 | + "text/event-stream": { |
| 508 | + "schema": { |
| 509 | + "$ref": "#/components/schemas/CompletionCompleteChunk" |
500 | 510 | } |
501 | 511 | } |
502 | 512 | } |
|
930 | 940 | "tool_prompt": { |
931 | 941 | "type": "string", |
932 | 942 | "description": "A prompt to be inserted before the tools", |
933 | | - "example": "\"Based on the conversation, please choose the most appropriate tool to use: \"", |
| 943 | + "example": "\"You will be presented with a JSON schema representing a set of tools.\nIf the user request lacks sufficient information to make a precise tool selection: Do not invent any tool's properties, instead notify with an error message.\n\nJSON Schema:\n\"", |
934 | 944 | "nullable": true |
935 | 945 | }, |
936 | 946 | "tools": { |
|
1071 | 1081 | "example": "mistralai/Mistral-7B-Instruct-v0.2" |
1072 | 1082 | }, |
1073 | 1083 | "prompt": { |
1074 | | - "type": "string", |
| 1084 | + "type": "array", |
| 1085 | + "items": { |
| 1086 | + "type": "string" |
| 1087 | + }, |
1075 | 1088 | "description": "The prompt to generate completions for.", |
1076 | 1089 | "example": "What is Deep Learning?" |
1077 | 1090 | }, |
|
1234 | 1247 | "type": "object", |
1235 | 1248 | "required": [ |
1236 | 1249 | "name", |
1237 | | - "parameters" |
| 1250 | + "arguments" |
1238 | 1251 | ], |
1239 | 1252 | "properties": { |
| 1253 | + "arguments": {}, |
1240 | 1254 | "description": { |
1241 | 1255 | "type": "string", |
1242 | 1256 | "nullable": true |
1243 | 1257 | }, |
1244 | 1258 | "name": { |
1245 | 1259 | "type": "string" |
1246 | | - }, |
1247 | | - "parameters": {} |
| 1260 | + } |
1248 | 1261 | } |
1249 | 1262 | }, |
1250 | 1263 | "GenerateParameters": { |
|
1260 | 1273 | }, |
1261 | 1274 | "decoder_input_details": { |
1262 | 1275 | "type": "boolean", |
1263 | | - "default": "true" |
| 1276 | + "default": "false" |
1264 | 1277 | }, |
1265 | 1278 | "details": { |
1266 | 1279 | "type": "boolean", |
|
1285 | 1298 | "$ref": "#/components/schemas/GrammarType" |
1286 | 1299 | } |
1287 | 1300 | ], |
| 1301 | + "default": "null", |
1288 | 1302 | "nullable": true |
1289 | 1303 | }, |
1290 | 1304 | "max_new_tokens": { |
|
1478 | 1492 | "max_batch_total_tokens", |
1479 | 1493 | "max_waiting_tokens", |
1480 | 1494 | "validation_workers", |
| 1495 | + "max_client_batch_size", |
1481 | 1496 | "version" |
1482 | 1497 | ], |
1483 | 1498 | "properties": { |
|
1503 | 1518 | "example": "2", |
1504 | 1519 | "minimum": 0 |
1505 | 1520 | }, |
| 1521 | + "max_client_batch_size": { |
| 1522 | + "type": "integer", |
| 1523 | + "example": "32", |
| 1524 | + "minimum": 0 |
| 1525 | + }, |
1506 | 1526 | "max_concurrent_requests": { |
1507 | 1527 | "type": "integer", |
1508 | 1528 | "description": "Router Parameters", |
|
0 commit comments