Add StreamingLLM for llamacpp & llamacpp_HF (2nd attempt) (#5669)

2026-04-06 07:03:37 +00:00 · 2024-03-09 00:25:33 -03:00 · 2024-03-09 00:25:33 -03:00 · afb51bd5d6
commit afb51bd5d6
parent 9271e80914
7 changed files with 147 additions and 0 deletions
--- a/modules/ui.py
+++ b/modules/ui.py
@@ -97,6 +97,8 @@ def list_model_elements():
        'no_offload_kqv',
        'row_split',
        'tensorcores',
+        'streaming_llm',
+        'attention_sink_size',
        'hqq_backend',
    ]
    if is_torch_xpu_available():