Skip to content

Commit f93b74e

Browse files
committed
refactor(xtts): use existing cleaners
1 parent a5044cd commit f93b74e

File tree

1 file changed

+1
-17
lines changed

1 file changed

+1
-17
lines changed

TTS/tts/layers/xtts/tokenizer.py

+1 -17
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,7 @@
1515
from tokenizers import Tokenizer
1616

1717
from TTS.tts.layers.xtts.zh_num2words import TextNorm as zh_num2words
18+
from TTS.tts.utils.text.cleaners import collapse_whitespace, lowercase
1819

1920
logger = logging.getLogger(__name__)
2021

@@ -72,8 +73,6 @@ def split_sentence(text, lang, text_split_length=250):
7273
return text_splits
7374

7475

75-
_whitespace_re = re.compile(r"\s+")
76-
7776
# List of (regular expression, replacement) pairs for abbreviations:
7877
_abbreviations = {
7978
"en": [
@@ -564,14 +563,6 @@ def expand_numbers_multilingual(text, lang="en"):
564563
return text
565564

566565

567-
def lowercase(text):
568-
return text.lower()
569-
570-
571-
def collapse_whitespace(text):
572-
return re.sub(_whitespace_re, " ", text)
573-
574-
575566
def multilingual_cleaners(text, lang):
576567
text = text.replace('"', "")
577568
if lang == "tr":
@@ -586,13 +577,6 @@ def multilingual_cleaners(text, lang):
586577
return text
587578

588579

589-
def basic_cleaners(text):
590-
"""Basic pipeline that lowercases and collapses whitespace without transliteration."""
591-
text = lowercase(text)
592-
text = collapse_whitespace(text)
593-
return text
594-
595-
596580
def chinese_transliterate(text):
597581
try:
598582
import pypinyin

0 commit comments

Comments
 (0)