mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2026-04-07 23:53:40 +00:00
TensorRT-LLM: Migrate from ModelRunner to LLM API, add concurrent API request support
This commit is contained in:
parent
9824c82cb6
commit
f52d9336e5
7 changed files with 50 additions and 89 deletions
|
|
@ -157,7 +157,6 @@ def list_model_elements():
|
|||
'enable_tp',
|
||||
'tp_backend',
|
||||
'cfg_cache',
|
||||
'cpp_runner',
|
||||
'no_use_fast',
|
||||
'model_draft',
|
||||
'draft_max',
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue