From ea790a6582cd06658532f7248446b9324d42eea7 Mon Sep 17 00:00:00 2001 From: mdlinville <7674613+mdlinville@users.noreply.github.com> Date: Mon, 20 Apr 2026 10:09:46 +0000 Subject: [PATCH] chore: Update Training API documentation --- training/api-reference/openapi.json | 187 +++++++++++----------------- 1 file changed, 71 insertions(+), 116 deletions(-) diff --git a/training/api-reference/openapi.json b/training/api-reference/openapi.json index eefe8dee79..5ae55fdcb6 100644 --- a/training/api-reference/openapi.json +++ b/training/api-reference/openapi.json @@ -2030,28 +2030,6 @@ "title": "Request Id", "description": "The request_id related to this request. If the caller does not set it, a random_uuid will be generated. This id is used through out the inference process and return in response." }, - "logits_processors": { - "anyOf": [ - { - "items": { - "anyOf": [ - { - "type": "string" - }, - { - "$ref": "#/components/schemas/LogitsProcessorConstructor" - } - ] - }, - "type": "array" - }, - { - "type": "null" - } - ], - "title": "Logits Processors", - "description": "A list of either qualified names of logits processors, or constructor objects, to apply when sampling. A constructor is a JSON object with a required 'qualname' field specifying the qualified name of the processor class/factory, and optional 'args' and 'kwargs' fields containing positional and keyword arguments. For example: {'qualname': 'my_module.MyLogitsProcessor', 'args': [1, 2], 'kwargs': {'param': 'value'}}." - }, "return_tokens_as_token_ids": { "anyOf": [ { @@ -2141,6 +2119,17 @@ ], "title": "Vllm Xargs", "description": "Additional request parameters with (list of) string or numeric values, used by custom extensions." + }, + "repetition_detection": { + "anyOf": [ + { + "$ref": "#/components/schemas/RepetitionDetectionParams" + }, + { + "type": "null" + } + ], + "description": "Parameters for detecting repetitive N-gram patterns in output tokens. If such repetition is detected, generation will be ended early. LLMs can sometimes generate repetitive, unhelpful token patterns, stopping only when they hit the maximum output length (e.g. 'abcdabcdabcd...' or '\\emoji \\emoji \\emoji ...'). This feature can detect such behavior and terminate early, saving time and tokens." } }, "additionalProperties": true, @@ -2458,7 +2447,7 @@ "default": "function" }, "function": { - "$ref": "#/components/schemas/vllm__entrypoints__openai__engine__protocol__FunctionDefinition" + "$ref": "#/components/schemas/FunctionDefinition" } }, "additionalProperties": true, @@ -2591,17 +2580,6 @@ } ], "title": "Reasoning" - }, - "reasoning_content": { - "anyOf": [ - { - "type": "string" - }, - { - "type": "null" - } - ], - "title": "Reasoning Content" } }, "additionalProperties": true, @@ -3342,6 +3320,43 @@ ], "title": "FunctionCall" }, + "FunctionDefinition": { + "properties": { + "name": { + "type": "string", + "title": "Name" + }, + "description": { + "anyOf": [ + { + "type": "string" + }, + { + "type": "null" + } + ], + "title": "Description" + }, + "parameters": { + "anyOf": [ + { + "additionalProperties": true, + "type": "object" + }, + { + "type": "null" + } + ], + "title": "Parameters" + } + }, + "additionalProperties": true, + "type": "object", + "required": [ + "name" + ], + "title": "FunctionDefinition" + }, "HTTPValidationError": { "properties": { "detail": { @@ -3585,44 +3600,6 @@ "title": "LogRequest", "description": "Schema for logging trajectories." }, - "LogitsProcessorConstructor": { - "properties": { - "qualname": { - "type": "string", - "title": "Qualname" - }, - "args": { - "anyOf": [ - { - "items": {}, - "type": "array" - }, - { - "type": "null" - } - ], - "title": "Args" - }, - "kwargs": { - "anyOf": [ - { - "additionalProperties": true, - "type": "object" - }, - { - "type": "null" - } - ], - "title": "Kwargs" - } - }, - "additionalProperties": false, - "type": "object", - "required": [ - "qualname" - ], - "title": "LogitsProcessorConstructor" - }, "Logprob": { "properties": { "logprob": { @@ -3913,6 +3890,28 @@ "type": "object", "title": "PromptTokenUsageInfo" }, + "RepetitionDetectionParams": { + "properties": { + "max_pattern_size": { + "type": "integer", + "title": "Max Pattern Size", + "default": 0 + }, + "min_pattern_size": { + "type": "integer", + "title": "Min Pattern Size", + "default": 0 + }, + "min_count": { + "type": "integer", + "title": "Min Count", + "default": 0 + } + }, + "type": "object", + "title": "RepetitionDetectionParams", + "description": "Parameters for detecting repetitive N-gram patterns in output tokens." + }, "ResponseFormat": { "properties": { "type": { @@ -4489,13 +4488,6 @@ "type": { "type": "string", "title": "Error Type" - }, - "input": { - "title": "Input" - }, - "ctx": { - "type": "object", - "title": "Context" } }, "type": "object", @@ -4553,43 +4545,6 @@ "name" ], "title": "FunctionDefinition" - }, - "vllm__entrypoints__openai__engine__protocol__FunctionDefinition": { - "properties": { - "name": { - "type": "string", - "title": "Name" - }, - "description": { - "anyOf": [ - { - "type": "string" - }, - { - "type": "null" - } - ], - "title": "Description" - }, - "parameters": { - "anyOf": [ - { - "additionalProperties": true, - "type": "object" - }, - { - "type": "null" - } - ], - "title": "Parameters" - } - }, - "additionalProperties": true, - "type": "object", - "required": [ - "name" - ], - "title": "FunctionDefinition" } }, "securitySchemes": {