From 5fe9d0682e566aec6defb3fa4f2743c58fac9833 Mon Sep 17 00:00:00 2001 From: "wucong.lyb" Date: Tue, 14 Feb 2023 08:42:19 +0000 Subject: [PATCH] support multi audio types Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/11657396 * support multi audio format * SUPPORT_AUDIO_TYPE_SETS add . --- modelscope/utils/audio/audio_utils.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/modelscope/utils/audio/audio_utils.py b/modelscope/utils/audio/audio_utils.py index c0189171..d95fd279 100644 --- a/modelscope/utils/audio/audio_utils.py +++ b/modelscope/utils/audio/audio_utils.py @@ -12,6 +12,7 @@ import numpy as np from modelscope.fileio.file import HTTPStorage SEGMENT_LENGTH_TRAIN = 16000 +SUPPORT_AUDIO_TYPE_SETS = ('.flac', '.mp3', '.ogg', '.opus', '.wav', '.pcm') class TtsTrainType(object): @@ -176,7 +177,7 @@ def generate_scp_from_url(url: str, key: str = None): wav_scp_path = url return wav_scp_path, raw_inputs # for local wav file inputs - if os.path.exists(url) and (url.lower().endswith('.wav')): + if os.path.exists(url) and (url.lower().endswith(SUPPORT_AUDIO_TYPE_SETS)): wav_scp_path = url return wav_scp_path, raw_inputs # for wav url, download bytes data @@ -228,8 +229,7 @@ def generate_scp_for_sv(url: str, key: str = None): wav_scp_path = url return wav_scp_path # for local wav file inputs - if os.path.exists(url) and (url.lower().endswith('.wav') - or url.lower().endswith('.pcm')): + if os.path.exists(url) and (url.lower().endswith(SUPPORT_AUDIO_TYPE_SETS)): wav_path = url work_dir = tempfile.TemporaryDirectory().name if not os.path.exists(work_dir):