Autodetect llamacpp_HF loader when tokenizer exists

2026-04-04 22:27:29 +00:00 · 2024-02-16 09:29:26 -08:00 · 2024-02-16 09:29:26 -08:00 · 4039999be5
commit 4039999be5
parent 76d28eaa9e
2 changed files with 4 additions and 2 deletions
--- a/modules/models_settings.py
+++ b/modules/models_settings.py
@ -153,6 +153,8 @@ def infer_loader(model_name, model_settings):
        loader = 'ExLlamav2_HF'
    elif (path_to_model / 'quant_config.json').exists() or re.match(r'.*-awq', model_name.lower()):
        loader = 'AutoAWQ'
+    elif len(list(path_to_model.glob('*.gguf'))) > 0 and path_to_model.is_dir() and (path_to_model / 'tokenizer_config.json').exists():
+        loader = 'llamacpp_HF'
    elif len(list(path_to_model.glob('*.gguf'))) > 0:
        loader = 'llama.cpp'
    elif re.match(r'.*\.gguf', model_name.lower()):
@ -225,7 +227,7 @@ def apply_model_settings_to_state(model, state):
        loader = model_settings.pop('loader')

        # If the user is using an alternative loader for the same model type, let them keep using it
-        if not (loader == 'ExLlamav2_HF' and state['loader'] in ['GPTQ-for-LLaMa', 'ExLlamav2', 'AutoGPTQ']) and not (loader == 'llama.cpp' and state['loader'] in ['llamacpp_HF', 'ctransformers']):
+        if not (loader == 'ExLlamav2_HF' and state['loader'] in ['GPTQ-for-LLaMa', 'ExLlamav2', 'AutoGPTQ']) and not (loader == 'llama.cpp' and state['loader'] in ['ctransformers']):
            state['loader'] = loader

    for k in model_settings: