mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2026-04-04 22:27:29 +00:00
Add slider for --ubatch-size for llama.cpp loader, change defaults for better MoE performance (#7316)
This commit is contained in:
parent
8f0048663d
commit
400bb0694b
5 changed files with 6 additions and 1 deletions
|
|
@ -317,6 +317,7 @@ class LlamaServer:
|
|||
"--ctx-size", str(shared.args.ctx_size),
|
||||
"--gpu-layers", str(shared.args.gpu_layers),
|
||||
"--batch-size", str(shared.args.batch_size),
|
||||
"--ubatch-size", str(shared.args.ubatch_size),
|
||||
"--port", str(self.port),
|
||||
"--no-webui",
|
||||
"--flash-attn", "on",
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue