Add back my llama-cpp-python wheels, bump to 0.2.65 (#5964)

2026-04-11 09:33:40 +00:00 · 2024-04-30 09:11:31 -03:00 · 2024-04-30 09:11:31 -03:00 · 51fb766bea
commit 51fb766bea
parent 5770e06c48
18 changed files with 330 additions and 56 deletions
--- a/modules/llama_cpp_python_hijack.py
+++ b/modules/llama_cpp_python_hijack.py
@ -1,11 +1,25 @@
 from typing import Sequence

-import llama_cpp
 from tqdm import tqdm

 from modules import shared
 from modules.cache_utils import process_llamacpp_cache

+try:
+    import llama_cpp
+except Exception:  # optional backend: any import/load failure means "unavailable"
+    llama_cpp = None
+
+try:
+    import llama_cpp_cuda
+except Exception:  # Exception (not bare except) so Ctrl-C / SystemExit still propagate
+    llama_cpp_cuda = None
+
+try:
+    import llama_cpp_cuda_tensorcores
+except Exception:  # left as None; the patch loop below skips None entries
+    llama_cpp_cuda_tensorcores = None
+

 def eval_with_progress(self, tokens: Sequence[int]):
    """
@ -67,7 +81,7 @@ def monkey_patch_generate(lib):
    lib.Llama.generate = my_generate


-for lib in [llama_cpp]:
+for lib in [llama_cpp, llama_cpp_cuda, llama_cpp_cuda_tensorcores]:
    if lib is not None:
        lib.Llama.eval = eval_with_progress
        monkey_patch_generate(lib)