Merge pull request #5 from microsoft/bugfix/german_umlaut_fix

Temporary fix for German umlauts
This commit is contained in:
Timm Walz 2022-01-06 13:47:29 +01:00 коммит произвёл GitHub
Родитель ff4f2349d6 3687537482
Коммит 7fa165a369
Не найден ключ, соответствующий данной подписи
Идентификатор ключа GPG: 4AEE18F83AFDEB23
1 изменённых файлов: 8 добавлений и 1 удалений

Просмотреть файл

@ -138,6 +138,12 @@ def bandpass_filter(audio, low_freq, high_freq, sample_rate, order=5):
filtered_audio = lfilter(numerator, denominator, audio)
return filtered_audio
def replace_umlaut_in_string(text, args_dict=None):
    """Replace German umlauts in *text* with ASCII digraphs.

    Args:
        text: String in which the replacements are made.
        args_dict: Optional mapping of substring -> replacement. Each value
            is passed through ``str()`` before it is inserted. When omitted
            or ``None``, the default table is used: ä->ae, ö->oe, ü->ue and
            the capitalised forms Ä->Ae, Ö->Oe, Ü->Ue.

    Returns:
        The string with every occurrence of each key replaced. Replacements
        are applied one key at a time, in the mapping's iteration order.
    """
    if args_dict is None:
        # Built per call so no mutable object is shared through the
        # function's default argument.
        args_dict = {
            'ä': 'ae', 'ö': 'oe', 'ü': 'ue',
            'Ä': 'Ae', 'Ö': 'Oe', 'Ü': 'Ue',
        }
    for umlaut, replacement in args_dict.items():
        text = text.replace(umlaut, str(replacement))
    return text
def convert_with_telephone_filter(output_directory, fname):
"""Apply telephone-like filter on the generated training data
Args:
@ -168,8 +174,9 @@ def main(df, output_directory, custom=True, telephone=True):
os.makedirs(f'{output_directory}/tts_generated/', exist_ok=True)
audio_synth = []
for index, row in df.iterrows():
# Temporary workaround for umlaut
try:
app = TextToSpeech(pa.tts_key, pa.tts_language, pa.tts_font, pa.tts_region, row['text'])
app = TextToSpeech(pa.tts_key, pa.tts_language, pa.tts_font, pa.tts_region, replace_umlaut_in_string(row['text']))
app.get_token(pa.tts_region, pa.tts_key)
fname = app.save_audio(pa.tts_region, pa.tts_resource_name, output_directory, pa.tts_language, pa.tts_font)
if custom: