Update tokenizer.py

transliterates -> transliterate
This commit is contained in:
Ikko Eltociear Ashimine 2023-06-09 03:06:51 +09:00 committed by GitHub
parent d22ba29eca
commit 03fa6922ed
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23

View file

@@ -132,7 +132,7 @@ def basic_cleaners(text):
def transliteration_cleaners(text):
'''Pipeline for non-English text that transliterates to ASCII.'''
'''Pipeline for non-English text that transliterate to ASCII.'''
text = convert_to_ascii(text)
text = lowercase(text)
text = collapse_whitespace(text)
@@ -190,4 +190,4 @@ class VoiceBpeTokenizer:
txt = txt.replace('[SPACE]', ' ')
txt = txt.replace('[STOP]', '')
txt = txt.replace('[UNK]', '')
return txt
return txt