From fa9be444fa0b3e18763b1cd3d0dd07ad565ac1bb Mon Sep 17 00:00:00 2001
From: oobabooga <112222186+oobabooga@users.noreply.github.com>
Date: Sat, 9 Aug 2025 07:26:59 -0700
Subject: [PATCH] Use ExLlamav3 instead of ExLlamav3_HF by default for EXL3 models

---
 modules/models_settings.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/modules/models_settings.py b/modules/models_settings.py
index 729d5dd1..d3bf4a36 100644
--- a/modules/models_settings.py
+++ b/modules/models_settings.py
@@ -211,11 +211,11 @@ def infer_loader(model_name, model_settings, hf_quant_method=None):
     elif re.match(r'.*\.gguf', model_name.lower()):
         loader = 'llama.cpp'
     elif hf_quant_method == 'exl3':
-        loader = 'ExLlamav3_HF'
+        loader = 'ExLlamav3'
     elif hf_quant_method in ['exl2', 'gptq']:
         loader = 'ExLlamav2_HF'
     elif re.match(r'.*exl3', model_name.lower()):
-        loader = 'ExLlamav3_HF'
+        loader = 'ExLlamav3'
     elif re.match(r'.*exl2', model_name.lower()):
         loader = 'ExLlamav2_HF'
     else: