Use --ctx-size to specify the context size for all loaders

Old flags are still recognized as alternatives.
This commit is contained in:
oobabooga 2025-04-25 16:59:03 -07:00
parent faababc4ea
commit d4b1e31c49
12 changed files with 39 additions and 45 deletions

View file

@@ -254,7 +254,7 @@ class LlamaServer:
cmd = [
self.server_path,
"--model", self.model_path,
- "--ctx-size", str(shared.args.n_ctx),
+ "--ctx-size", str(shared.args.ctx_size),
"--n-gpu-layers", str(shared.args.n_gpu_layers),
"--batch-size", str(shared.args.batch_size),
"--port", str(self.port),