Skip to content
Merged
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 9 additions & 0 deletions speechbrain/utils/text_to_sequence.py
Original file line number Diff line number Diff line change
Expand Up @@ -213,6 +213,13 @@ def basic_cleaners(text):
return text


def german_cleaners(text):
    """Cleaner pipeline for German text.

    The only step applied is ``collapse_whitespace``; unlike
    ``transliteration_cleaners``, no transliteration to ASCII is performed
    in this pipeline.

    Arguments
    ---------
    text
        The text to clean.

    Returns
    -------
    The value returned by ``collapse_whitespace(text)``.
    """
    return collapse_whitespace(text)


def transliteration_cleaners(text):
"""Pipeline for non-English text that transliterates to ASCII.
"""
Expand Down Expand Up @@ -285,6 +292,8 @@ def _clean_text(text, cleaner_names):
cleaner = transliteration_cleaners
if name == "basic_cleaners":
cleaner = basic_cleaners
if name == "german_cleaners":
cleaner = german_cleaners
if not cleaner:
raise Exception("Unknown cleaner: %s" % name)
text = cleaner(text)
Expand Down