API: Remove deprecated "settings" parameter from model load endpoint

This commit is contained in:
oobabooga 2026-04-04 11:00:14 -07:00
parent 9183dc444e
commit 2eef90a323
3 changed files with 5 additions and 30 deletions

View file

@@ -1,5 +1,4 @@
from modules import loaders, shared
from modules.logging_colors import logger
from modules.LoRA import add_lora_to_model
from modules.models import load_model, unload_model
from modules.models_settings import get_model_metadata, update_model_parameters
@@ -42,8 +41,7 @@ def model_info_dict(model_name: str) -> dict:
def _load_model(data):
model_name = data["model_name"]
args = data["args"]
settings = data["settings"]
args = data.get("args")
unload_model()
model_settings = get_model_metadata(model_name)
@@ -71,16 +69,6 @@ def _load_model(data):
shared.model, shared.tokenizer = load_model(model_name)
# Update shared.settings with custom generation defaults
if settings:
for k in settings:
if k in shared.settings:
shared.settings[k] = settings[k]
if k == 'truncation_length':
logger.info(f"CONTEXT LENGTH (UPDATED): {shared.settings['truncation_length']}")
elif k == 'instruction_template':
logger.info(f"INSTRUCTION TEMPLATE (UPDATED): {shared.settings['instruction_template']}")
def list_loras():
return {'lora_names': get_available_loras()[1:]}

View file

@@ -475,10 +475,8 @@ async def handle_list_models():
@app.post("/v1/internal/model/load", dependencies=check_admin_key)
async def handle_load_model(request_data: LoadModelRequest):
'''
This endpoint is experimental and may change in the future.
The "args" parameter can be used to modify flags like "--load-in-4bit"
or "--n-gpu-layers" before loading a model. Example:
The "args" parameter can be used to modify loader flags before loading
a model. Example:
```
"args": {
@@ -487,18 +485,8 @@ async def handle_load_model(request_data: LoadModelRequest):
}
```
Note that those settings will remain after loading the model. So you
may need to change them back to load a second model.
The "settings" parameter is also a dict but with keys for the
shared.settings object. It can be used to modify the default instruction
template like this:
```
"settings": {
"instruction_template": "Alpaca"
}
```
Loader args are reset to their startup defaults between loads, so
settings from a previous load do not leak into the next one.
'''
try:

View file

@@ -271,7 +271,6 @@ class ModelListResponse(BaseModel):
class LoadModelRequest(BaseModel):
model_name: str
args: dict | None = None
settings: dict | None = None
class LoraListResponse(BaseModel):