Better parsing of the gpt-oss template

2026-03-03 12:04:28 +01:00 · 2025-08-05 11:56:00 -07:00 · 2025-08-05 11:56:00 -07:00 · 9f28f53cfc
parent 3b28dc1821
commit 9f28f53cfc
1 changed file with 8 additions and 1 deletion
--- a/modules/chat.py
+++ b/modules/chat.py
@@ -108,7 +108,14 @@ def get_generation_prompt(renderer, impersonate=False, strip_trailing_spaces=Tru

    suffix_plus_prefix = prompt.split("<<|user-message-1|>>")[1].split("<<|user-message-2|>>")[0]
    suffix = prompt.split("<<|user-message-2|>>")[1]
-    prefix = suffix_plus_prefix[len(suffix):]
+
+    # Remove the message suffix. The first case handles the GPT-OSS model
+    # in a way that is likely to not interfere with previous models.
+    if '<|start|>user' in suffix_plus_prefix or '<|start|>assistant' in suffix_plus_prefix:
+        start_index = suffix_plus_prefix.rindex('<|start|>')
+        prefix = suffix_plus_prefix[start_index:]
+    else:
+        prefix = suffix_plus_prefix[len(suffix):]

    if strip_trailing_spaces:
        prefix = prefix.rstrip(' ')