(pad_value=0, pad_to_multiple=1) + + +AUDIO_SAMPLE_RATE = 16000 +MAX_INPUT_AUDIO_LENGTH = 10 # in seconds + + +def remove_prosody_tokens_from_text(text): + # filter out prosody tokens, there is only emphasis '*', and pause '=' + text = text.replace("*", "")....