Bump llama-cpp-python to 0.2.69, add --flash-attn option

oobabooga 2024-05-03 04:31:22 -07:00
parent 0476f9fe70
commit e61055253c
15 changed files with 66 additions and 58 deletions

@@ -104,6 +104,7 @@ def list_model_elements():
         'no_offload_kqv',
         'row_split',
         'tensorcores',
+        'flash_attn',
         'streaming_llm',
         'attention_sink_size',
         'hqq_backend',
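
For context, a minimal sketch of how a `--flash-attn` flag like this one typically flows from the CLI into llama-cpp-python. The surrounding plumbing (the parser setup, the model path) is illustrative and not taken from this commit; `flash_attn` itself is a real keyword argument on llama-cpp-python's `Llama` constructor as of this version range.

```python
# Hypothetical sketch: wiring a --flash-attn CLI flag through to llama-cpp-python.
# The flag name matches this commit; everything else is illustrative.
import argparse

from llama_cpp import Llama

parser = argparse.ArgumentParser()
# argparse stores '--flash-attn' as args.flash_attn, which matches the
# underscored 'flash_attn' key added to list_model_elements() above.
parser.add_argument('--flash-attn', action='store_true',
                    help='Use flash attention in the llama.cpp backend.')
args = parser.parse_args()

llm = Llama(
    model_path='models/model.gguf',  # placeholder path, not from this commit
    flash_attn=args.flash_attn,      # real Llama() keyword in llama-cpp-python
)
```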