Files
modelscope/tests/pipelines/test_speech_separation.py
2023-08-24 16:49:22 +08:00

50 lines
1.8 KiB
Python

# Copyright (c) Alibaba, Inc. and its affiliates.
import os.path
import unittest
import numpy
from modelscope.outputs import OutputKeys
from modelscope.pipelines import pipeline
from modelscope.utils.constant import Tasks
from modelscope.utils.test_utils import test_level
# Path of the mixed-speech input audio. The tests join it with os.getcwd(),
# so it is resolved relative to the directory the tests are launched from.
MIX_SPEECH_FILE = 'data/test/audios/mix_speech.wav'
class SpeechSeparationTest(unittest.TestCase):
    """Smoke tests for the speech-separation pipelines.

    Every test builds a ``Tasks.speech_separation`` pipeline for one model
    id, runs it on ``MIX_SPEECH_FILE`` and checks the shape of the result.
    """

    def setUp(self) -> None:
        pass

    def _separate_and_save(self, model_id: str) -> None:
        """Run the separation pipeline for ``model_id`` and save its output.

        Asserts that the result contains ``OutputKeys.OUTPUT_PCM_LIST`` with
        exactly two entries, then writes each entry to
        ``output_spk{i}.wav`` in the current working directory.

        Args:
            model_id: Identifier of the model handed to ``pipeline``.
        """
        # Imported lazily so that merely importing this module does not
        # require soundfile to be installed.
        import soundfile as sf

        separation = pipeline(Tasks.speech_separation, model=model_id)
        result = separation(os.path.join(os.getcwd(), MIX_SPEECH_FILE))

        # assertIn reports the missing key and the container on failure,
        # unlike assertTrue(key in result) which only says "False is not
        # true".
        self.assertIn(OutputKeys.OUTPUT_PCM_LIST, result)
        pcm_list = result[OutputKeys.OUTPUT_PCM_LIST]
        self.assertEqual(len(pcm_list), 2)

        # NOTE: the file names do not depend on the model, so each test
        # overwrites the files written by the previous one.
        for i, signal in enumerate(pcm_list):
            save_file = f'output_spk{i}.wav'
            # Each entry is interpreted as raw int16 samples and written
            # with a sample rate of 8000.
            samples = numpy.frombuffer(signal, dtype=numpy.int16)
            sf.write(save_file, samples, 8000)

    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
    def test_normal(self):
        """Check the MossFormer separation model."""
        self._separate_and_save(
            'damo/speech_mossformer_separation_temporal_8k')

    @unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
    def test_mossformer2(self):
        """Check the MossFormer2 separation model."""
        self._separate_and_save(
            'damo/speech_mossformer2_separation_temporal_8k')
# Allow running this test module directly as a script.
if __name__ == '__main__':
    unittest.main()