Estimate the VRAM for GGUF models + autoset gpu-layers (#6980)

This commit is contained in:
oobabooga 2025-05-16 00:07:37 -03:00 committed by GitHub
parent c4a715fd1e
commit 5534d01da0
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
6 changed files with 193 additions and 4 deletions

View file

@@ -71,7 +71,6 @@ def llama_cpp_server_loader(model_name):
else:
model_file = sorted(Path(f'{shared.args.model_dir}/{model_name}').glob('*.gguf'))[0]
logger.info(f"llama.cpp weights detected: \"{model_file}\"")
try:
model = LlamaServer(model_file)
return model, model