Fix thinking block parsing for GPT-OSS under llama.cpp

This commit is contained in:
oobabooga 2025-08-05 15:36:20 -07:00
parent 498778b8ac
commit 0e42575c57

View file

@@ -146,19 +146,23 @@ def extract_thinking_block(string):
alt_end_pos = string.find(ALT_END)
alt_content_pos = string.find(ALT_CONTENT_START)
# Check if start tag or end tag is found
if alt_start_pos != -1 or alt_end_pos != -1:
if alt_start_pos == -1:
thought_start = 0
else:
thought_start = alt_start_pos + len(ALT_START)
# If no explicit end tag but content start exists, use content start as end
if alt_end_pos == -1:
thought_end = len(string)
content_start = len(string)
if alt_content_pos != -1:
thought_end = alt_content_pos
content_start = alt_content_pos + len(ALT_CONTENT_START)
else:
thought_end = len(string)
content_start = len(string)
else:
thought_end = alt_end_pos
content_start = alt_content_pos + len(ALT_CONTENT_START) if alt_content_pos != -1 else len(string)
content_start = alt_content_pos + len(ALT_CONTENT_START) if alt_content_pos != -1 else alt_end_pos + len(ALT_END)
thinking_content = string[thought_start:thought_end]
remaining_content = string[content_start:]