llama.cpp: Remove the timeout while loading models (closes #6907)

This commit is contained in:
oobabooga 2025-04-27 21:22:21 -07:00
parent bbcaec75b4
commit c6c2855c80

View file

@@ -340,9 +340,7 @@ class LlamaServer:
         # Wait for server to be healthy
         health_url = f"http://127.0.0.1:{self.port}/health"
-        start_time = time.time()
-        timeout = 3600 * 8  # 8 hours
-        while time.time() - start_time < timeout:
+        while True:
             # Check if process is still alive
             if self.process.poll() is not None:
                 # Process has terminated
@@ -357,8 +355,6 @@ class LlamaServer:
                 pass
             time.sleep(1)
-        else:
-            raise TimeoutError(f"Server health check timed out after {timeout} seconds")
         # Server is now healthy, get model info
         self._get_vocabulary_size()