From e76480482e284f2c1ab2b75aaa13c52d08dbeafd Mon Sep 17 00:00:00 2001 From: "jiaqi.sjq" Date: Fri, 24 Feb 2023 11:00:40 +0800 Subject: [PATCH] [to #41669377] fix pipeline output wav being 32-bit float instead of the expected 16-bit int Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/11765670 --- modelscope/models/audio/tts/sambert_hifi.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/modelscope/models/audio/tts/sambert_hifi.py b/modelscope/models/audio/tts/sambert_hifi.py index b930da85..0c5da33f 100644 --- a/modelscope/models/audio/tts/sambert_hifi.py +++ b/modelscope/models/audio/tts/sambert_hifi.py @@ -218,5 +218,6 @@ class SambertHifigan(Model): for line in texts: line = line.strip().split('\t') audio = self.__synthesis_one_sentences(voice, line[1]) - audio_total = np.append(audio_total, audio, axis=0) + audio = 32768.0 * audio + audio_total = np.append(audio_total, audio.astype('int16'), axis=0) return ndarray_pcm_to_wav(self.__sample_rate, audio_total)