2023-11-06 06:38:29 +01:00
import json
import time
2025-05-08 17:30:27 +02:00
from typing import Dict , List , Optional
2023-11-06 06:38:29 +01:00
2025-08-11 21:39:18 +02:00
from pydantic import BaseModel , Field , model_validator , validator
2023-11-06 06:38:29 +01:00
class GenerationOptions(BaseModel):
    """Sampling/generation parameters shared by the completion and chat endpoints.

    Mixed into request models (e.g. CompletionRequest) via multiple inheritance.
    Defaults mirror the backend's neutral values (1 = no effect for multiplicative
    penalties, 0 = disabled for thresholds/counts).
    """
    preset: str | None = Field(default=None, description="The name of a file under text-generation-webui/user_data/presets (without the .yaml extension). The sampling parameters that get overwritten by this option are the keys in the default_preset() function in modules/presets.py.")
    dynatemp_low: float = 1
    dynatemp_high: float = 1
    dynatemp_exponent: float = 1
    smoothing_factor: float = 0
    smoothing_curve: float = 1
    min_p: float = 0
    top_k: int = 0
    typical_p: float = 1
    xtc_threshold: float = 0.1
    xtc_probability: float = 0
    epsilon_cutoff: float = 0
    eta_cutoff: float = 0
    tfs: float = 1
    top_a: float = 0
    top_n_sigma: float = 0
    dry_multiplier: float = 0
    dry_allowed_length: int = 2
    dry_base: float = 1.75
    repetition_penalty: float = 1
    encoder_repetition_penalty: float = 1
    no_repeat_ngram_size: int = 0
    repetition_penalty_range: int = 1024
    penalty_alpha: float = 0
    guidance_scale: float = 1
    mirostat_mode: int = 0
    mirostat_tau: float = 5
    mirostat_eta: float = 0.1
    prompt_lookup_num_tokens: int = 0
    max_tokens_second: int = 0
    do_sample: bool = True
    dynamic_temperature: bool = False
    temperature_last: bool = False
    auto_max_new_tokens: bool = False
    ban_eos_token: bool = False
    add_bos_token: bool = True
    enable_thinking: bool = True
    reasoning_effort: str = "medium"
    skip_special_tokens: bool = True
    static_cache: bool = False
    truncation_length: int = 0
    seed: int = -1
    sampler_priority: List[str] | str | None = Field(default=None, description="List of samplers where the first items will appear first in the stack. Example: [\"top_k\", \"temperature\", \"top_p\"].")
    custom_token_bans: str = ""
    negative_prompt: str = ''
    # Default breakers for the DRY sampler, expressed as a comma-separated list
    # of JSON-quoted strings: "\n", ":", "\"", "*"
    dry_sequence_breakers: str = '"\\n", ":", "\\"", "*"'
    grammar_string: str = ""
2025-05-08 17:30:27 +02:00
class ToolDefinition(BaseModel):
    """OpenAI-style tool descriptor: a typed wrapper around one function signature."""
    function: 'ToolFunction'  # forward reference; ToolFunction is declared below
    type: str
class ToolFunction(BaseModel):
    """Signature of a callable tool as advertised to the model."""
    description: str
    name: str
    parameters: 'ToolParameters'  # forward reference; ToolParameters is declared below
class ToolParameters(BaseModel):
    """JSON-schema-like description of a tool function's parameters."""
    properties: Optional[Dict[str, 'ToolProperty']] = None  # per-argument schemas, keyed by name
    required: Optional[list[str]] = None  # names of mandatory arguments
    type: str  # typically "object"
    description: Optional[str] = None
class ToolProperty(BaseModel):
    """Schema of a single tool argument. Both fields are optional because
    we are faced with definitions like anyOf, e.g. {'type': 'function', 'function': {'name': 'git_create_branch', 'description': 'Creates a new branch from an optional base branch', 'parameters': {'type': 'object', 'properties': {'repo_path': {'title': 'Repo Path', 'type': 'string'}, 'branch_name': {'title': 'Branch Name', 'type': 'string'}, 'base_branch': {'anyOf': [{'type': 'string'}, {'type': 'null'}], 'default': None, 'title': 'Base Branch'}}, 'required': ['repo_path', 'branch_name'], 'title': 'GitCreateBranch'}}}
    """
    description: Optional[str] = None
    type: Optional[str] = None
class FunctionCall(BaseModel):
    """A tool/function invocation emitted by the model.

    At least one of 'arguments' or 'parameters' must be provided.
    """
    name: str
    arguments: Optional[str] = None
    parameters: Optional[str] = None

    @model_validator(mode='after')
    def checkPropertyArgsOrParams(self):
        # A field-level @validator('arguments') cannot do this check: field
        # validators run in declaration order, so 'parameters' (declared after
        # 'arguments') is never present in `values`, and the validator is
        # skipped entirely when 'arguments' is omitted. An 'after' model
        # validator sees both fields and always runs.
        if not self.arguments and not self.parameters:
            raise ValueError("At least one of 'arguments' or 'parameters' must be provided as property in FunctionCall type")
        return self
class ToolCall(BaseModel):
    """One tool-call entry attached to an assistant message."""
    id: str
    index: int
    type: str
    function: FunctionCall
2023-11-06 18:55:36 +01:00
class CompletionRequestParams(BaseModel):
    """OpenAI-compatible /v1/completions request fields (sampling options are
    mixed in separately via GenerationOptions)."""
    model: str | None = Field(default=None, description="Unused parameter. To change the model, use the /v1/internal/model/load endpoint.")
    prompt: str | List[str] | None = Field(default=None, description="Text prompt for completion. Can also use 'messages' format for multimodal.")
    messages: List[dict] | None = Field(default=None, description="OpenAI messages format for multimodal support. Alternative to 'prompt'.")
    best_of: int | None = Field(default=1, description="Unused parameter.")
    echo: bool | None = False
    frequency_penalty: float | None = 0
    logit_bias: dict | None = None
    logprobs: int | None = None
    max_tokens: int | None = 512
    n: int | None = Field(default=1, description="Unused parameter.")
    presence_penalty: float | None = 0
    stop: str | List[str] | None = None
    stream: bool | None = False
    suffix: str | None = None
    temperature: float | None = 1
    top_p: float | None = 1
    user: str | None = Field(default=None, description="Unused parameter.")

    @model_validator(mode='after')
    def validate_prompt_or_messages(self):
        # Exactly one input channel is required; reject requests carrying neither.
        if self.prompt is None and self.messages is None:
            raise ValueError("Either 'prompt' or 'messages' must be provided")
        return self
2025-08-09 04:31:16 +02:00
2023-11-06 06:38:29 +01:00
2023-11-06 18:55:36 +01:00
class CompletionRequest(GenerationOptions, CompletionRequestParams):
    """Full /v1/completions request: endpoint parameters plus sampling options."""
    pass
2023-11-06 06:38:29 +01:00
class CompletionResponse(BaseModel):
    """OpenAI-compatible /v1/completions response body."""
    id: str
    choices: List[dict]
    # default_factory: evaluate the timestamp per response; a plain
    # `int(time.time())` default would be frozen once at import time.
    created: int = Field(default_factory=lambda: int(time.time()))
    model: str
    object: str = "text_completion"
    usage: dict
2023-11-06 18:55:36 +01:00
class ChatCompletionRequestParams(BaseModel):
    """OpenAI-compatible /v1/chat/completions request fields, plus
    text-generation-webui extensions (mode, templates, character fields)."""
    messages: List[dict]
    model: str | None = Field(default=None, description="Unused parameter. To change the model, use the /v1/internal/model/load endpoint.")
    frequency_penalty: float | None = 0
    function_call: str | dict | None = Field(default=None, description="Unused parameter.")
    functions: List[dict] | None = Field(default=None, description="Unused parameter.")
    tools: List[dict] | None = Field(default=None, description="Tools signatures passed via MCP.")
    logit_bias: dict | None = None
    max_tokens: int | None = None
    n: int | None = Field(default=1, description="Unused parameter.")
    presence_penalty: float | None = 0
    stop: str | List[str] | None = None
    stream: bool | None = False
    temperature: float | None = 1
    top_p: float | None = 1
    user: str | None = Field(default=None, description="Unused parameter.")

    mode: str = Field(default='instruct', description="Valid options: instruct, chat, chat-instruct.")

    instruction_template: str | None = Field(default=None, description="An instruction template defined under text-generation-webui/user_data/instruction-templates. If not set, the correct template will be automatically obtained from the model metadata.")
    instruction_template_str: str | None = Field(default=None, description="A Jinja2 instruction template. If set, will take precedence over everything else.")

    character: str | None = Field(default=None, description="A character defined under text-generation-webui/user_data/characters. If not set, the default \"Assistant\" character will be used.")
    bot_name: str | None = Field(default=None, description="Overwrites the value set by character field.", alias="name2")
    context: str | None = Field(default=None, description="Overwrites the value set by character field.")
    greeting: str | None = Field(default=None, description="Overwrites the value set by character field.")
    user_name: str | None = Field(default=None, description="Your name (the user). By default, it's \"You\".", alias="name1")
    user_bio: str | None = Field(default=None, description="The user description/personality.")
    chat_template_str: str | None = Field(default=None, description="Jinja2 template for chat.")

    # Prompt wrapper used in chat-instruct mode; <|character|> and <|prompt|>
    # are placeholders substituted by the backend.
    chat_instruct_command: str | None = "Continue the chat dialogue below. Write a single reply for the character \"<|character|>\".\n\n<|prompt|>"

    continue_: bool = Field(default=False, description="Makes the last bot message in the history be continued instead of starting a new message.")
2023-11-06 18:55:36 +01:00
class ChatCompletionRequest(GenerationOptions, ChatCompletionRequestParams):
    """Full /v1/chat/completions request: endpoint parameters plus sampling options."""
    pass
2023-11-06 06:38:29 +01:00
class ChatCompletionResponse(BaseModel):
    """OpenAI-compatible /v1/chat/completions response body."""
    id: str
    choices: List[dict]
    # default_factory: evaluate the timestamp per response; a plain
    # `int(time.time())` default would be frozen once at import time.
    created: int = Field(default_factory=lambda: int(time.time()))
    model: str
    object: str = "chat.completion"
    usage: dict
2024-04-19 05:24:46 +02:00
class ChatPromptResponse(BaseModel):
    """Response carrying the fully rendered chat prompt string."""
    prompt: str
2023-11-19 04:35:22 +01:00
class EmbeddingsRequest(BaseModel):
    """OpenAI-compatible /v1/embeddings request body."""
    # Accepts a single string, a batch of strings, or pre-tokenized input(s).
    input: str | List[str] | List[int] | List[List[int]]
    model: str | None = Field(default=None, description="Unused parameter. To change the model, set the OPENEDAI_EMBEDDING_MODEL and OPENEDAI_EMBEDDING_DEVICE environment variables before starting the server.")
    encoding_format: str = Field(default="float", description="Can be float or base64.")
    user: str | None = Field(default=None, description="Unused parameter.")
class EmbeddingsResponse(BaseModel):
    """One embedding entry in an /v1/embeddings response."""
    index: int
    embedding: List[float]
    object: str = "embedding"
2023-11-08 04:05:36 +01:00
class EncodeRequest(BaseModel):
    """Request body for /v1/internal/encode (tokenize text)."""
    text: str
2023-11-19 03:19:31 +01:00
class EncodeResponse(BaseModel):
    """Token ids for the encoded text plus their count."""
    tokens: List[int]
    length: int
2023-11-08 04:05:36 +01:00
2023-11-19 03:19:31 +01:00
class DecodeRequest(BaseModel):
    """Request body for /v1/internal/decode (detokenize ids)."""
    tokens: List[int]
class DecodeResponse(BaseModel):
    """Decoded text for the submitted token ids."""
    text: str
class TokenCountResponse(BaseModel):
    """Number of tokens in the submitted text."""
    length: int
2023-11-19 03:19:31 +01:00
class LogitsRequestParams(BaseModel):
    """Parameters for the /v1/internal/logits endpoint."""
    prompt: str
    use_samplers: bool = False  # when True, report logits after sampling transforms
    top_logits: int | None = 50  # how many top tokens to return
    frequency_penalty: float | None = 0
    max_tokens: int | None = 512
    presence_penalty: float | None = 0
    temperature: float | None = 1
    top_p: float | None = 1
class LogitsRequest(GenerationOptions, LogitsRequestParams):
    """Full logits request: endpoint parameters plus sampling options."""
    pass
class LogitsResponse(BaseModel):
    """Mapping of token string -> logit/probability value."""
    logits: Dict[str, float]
2023-11-19 03:19:31 +01:00
2023-11-08 03:59:02 +01:00
class ModelInfoResponse(BaseModel):
    """Currently loaded model name and active LoRAs."""
    model_name: str
    lora_names: List[str]
2023-11-19 04:35:22 +01:00
class ModelListResponse(BaseModel):
    """Names of all available models."""
    model_names: List[str]
2023-11-08 05:58:06 +01:00
class LoadModelRequest(BaseModel):
    """Request body for /v1/internal/model/load."""
    model_name: str
    args: dict | None = None      # loader arguments (overrides)
    settings: dict | None = None  # generation settings (overrides)
2023-11-19 04:35:22 +01:00
class LoraListResponse(BaseModel):
    """Names of all available LoRAs."""
    lora_names: List[str]
2023-11-10 16:34:27 +01:00
2023-11-19 04:35:22 +01:00
class LoadLorasRequest(BaseModel):
    """Request body for loading a set of LoRAs."""
    lora_names: List[str]
2023-11-10 16:34:27 +01:00
2025-12-05 02:34:17 +01:00
class ImageGenerationRequest(BaseModel):
    """Image-specific parameters for generation."""
    prompt: str
    negative_prompt: str = ""
    size: str = Field(default="1024x1024", description="'WIDTHxHEIGHT'")
    steps: int = Field(default=9, ge=1)
    cfg_scale: float = Field(default=0.0, ge=0.0)
    image_seed: int = Field(default=-1, description="-1 for random")
    batch_size: int | None = Field(default=None, ge=1, description="Parallel batch size (VRAM heavy)")
    n: int = Field(default=1, ge=1, description="Alias for batch_size (OpenAI compatibility)")
    batch_count: int = Field(default=1, ge=1, description="Sequential batch count")

    # OpenAI compatibility (unused)
    model: str | None = None
    response_format: str = "b64_json"
    user: str | None = None

    @model_validator(mode='after')
    def resolve_batch_size(self):
        # 'n' is the OpenAI-compatible alias; it only applies when batch_size is unset.
        if self.batch_size is None:
            self.batch_size = self.n
        return self

    def get_width_height(self) -> tuple[int, int]:
        """Parse 'WIDTHxHEIGHT' from `size`; fall back to 1024x1024 on malformed input."""
        try:
            parts = self.size.lower().split('x')
            return int(parts[0]), int(parts[1])
        except (ValueError, IndexError):
            return 1024, 1024
class ImageGenerationResponse(BaseModel):
    """Response body for image generation."""
    # default_factory: evaluate the timestamp per response; a plain
    # `int(time.time())` default would be frozen once at import time.
    created: int = Field(default_factory=lambda: int(time.time()))
    data: List[dict]
2023-11-06 06:38:29 +01:00
def to_json(obj):
    """Serialize an object's attribute dictionary to a pretty-printed JSON string."""
    return json.dumps(vars(obj), indent=4)
def to_dict(obj):
    """Return the object's attribute dictionary (the live dict, not a copy)."""
    return vars(obj)