Split by rows instead of layers for llama.cpp multi-gpu (#5435)

2026-04-05 06:35:15 +00:00 · 2024-02-05 02:36:40 +00:00 · 2024-02-05 02:36:40 +00:00 · 2a45620c85
commit 2a45620c85
parent 3df7e151f7
6 changed files with 9 additions and 2 deletions
--- a/modules/ui.py
+++ b/modules/ui.py
@@ -93,6 +93,7 @@ def list_model_elements():
        'numa',
        'logits_all',
        'no_offload_kqv',
+        'row_split',
        'tensorcores',
        'hqq_backend',
    ]