Let callers control tokenizer options in the ExLlama encode() wrappers.

exllamav2: encode() now forwards **kwargs; add_bos and encode_special_tokens
default to True and may be overridden by the caller.
exllamav3: drops a comment only; behavior is unchanged.
NOTE(review): the post-image blob hash on the exllamav2.py index line predates
the revised encode() body below; regenerate with `git diff` if it matters.

diff --git a/modules/exllamav2.py b/modules/exllamav2.py
index 6bb422ea..5d5c5b56 100644
--- a/modules/exllamav2.py
+++ b/modules/exllamav2.py
@@ -135,7 +135,10 @@ class Exllamav2Model:
         return result, result
 
     def encode(self, string, **kwargs):
-        return self.tokenizer.encode(string, add_bos=True, encode_special_tokens=True)
+        # Merge defaults with caller kwargs so an explicit add_bos or
+        # encode_special_tokens overrides the default instead of colliding.
+        options = {'add_bos': True, 'encode_special_tokens': True, **kwargs}
+        return self.tokenizer.encode(string, **options)
 
     def decode(self, ids, **kwargs):
         if isinstance(ids, list):
diff --git a/modules/exllamav3.py b/modules/exllamav3.py
index 268a64ec..9201801c 100644
--- a/modules/exllamav3.py
+++ b/modules/exllamav3.py
@@ -316,7 +316,6 @@ class Exllamav3Model:
         return output
 
     def encode(self, string, **kwargs):
-        # Default add_bos to True for consistency with exllamav2 behavior
         add_bos = kwargs.pop('add_bos', True)
         return self.tokenizer.encode(string, add_bos=add_bos, **kwargs)
 