mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2026-03-18 03:14:39 +01:00
llama.cpp: Use --fit-ctx 8192 when --fit on is used
This sets the minimum acceptable context length that --fit may select to 8192; the llama.cpp default is 4096.
This commit is contained in:
parent
5763cab3c4
commit
9119ce0680
|
|
@ -378,6 +378,7 @@ class LlamaServer:
|
|||
cmd += ["--gpu-layers", str(shared.args.gpu_layers), "--fit", "off"]
|
||||
else:
|
||||
cmd += ["--fit", "on"]
|
||||
cmd += ["--fit-ctx", "8192"]
|
||||
if shared.args.fit_target:
|
||||
cmd += ["--fit-target", shared.args.fit_target]
|
||||
|
||||
|
|
|
|||
Loading…
Reference in a new issue