mirror of
https://github.com/modelscope/modelscope.git
synced 2025-12-23 11:39:26 +01:00
Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/10371244 Link: https://code.alibaba-inc.com/Ali-MaaS/MaaS-lib/codereview/10371244
82 lines
3.5 KiB
Python
82 lines
3.5 KiB
Python
# Copyright (c) Alibaba, Inc. and its affiliates.
|
|
|
|
import unittest
|
|
|
|
# NOTICE: Tensorflow 1.15 seems not so compatible with pytorch.
|
|
# A segmentation fault may be raise by pytorch cpp library
|
|
# if 'import tensorflow' in front of 'import torch'.
|
|
# Puting a 'import torch' here can bypass this incompatibility.
|
|
import torch
|
|
from scipy.io.wavfile import write
|
|
|
|
from modelscope.models import Model
|
|
from modelscope.outputs import OutputKeys
|
|
from modelscope.pipelines import pipeline
|
|
from modelscope.utils.constant import Tasks
|
|
from modelscope.utils.demo_utils import DemoCompatibilityCheck
|
|
from modelscope.utils.logger import get_logger
|
|
from modelscope.utils.test_utils import test_level
|
|
|
|
import tensorflow as tf # isort:skip
|
|
|
|
logger = get_logger()
|
|
|
|
|
|
class TextToSpeechSambertHifigan16kPipelineTest(unittest.TestCase,
|
|
DemoCompatibilityCheck):
|
|
|
|
def setUp(self) -> None:
|
|
self.task = Tasks.text_to_speech
|
|
self.zhcn_text = '今天北京天气怎么样'
|
|
self.en_text = 'How is the weather in Beijing?'
|
|
self.zhcn_voices = [
|
|
'zhitian_emo', 'zhizhe_emo', 'zhiyan_emo', 'zhibei_emo', 'zhcn'
|
|
]
|
|
self.zhcn_models = [
|
|
'damo/speech_sambert-hifigan_tts_zhitian_emo_zh-cn_16k',
|
|
'damo/speech_sambert-hifigan_tts_zhizhe_emo_zh-cn_16k',
|
|
'damo/speech_sambert-hifigan_tts_zhiyan_emo_zh-cn_16k',
|
|
'damo/speech_sambert-hifigan_tts_zhibei_emo_zh-cn_16k',
|
|
'damo/speech_sambert-hifigan_tts_zh-cn_16k'
|
|
]
|
|
self.en_voices = ['luca', 'luna', 'andy', 'annie', 'engb', 'enus']
|
|
self.en_models = [
|
|
'damo/speech_sambert-hifigan_tts_luca_en-gb_16k',
|
|
'damo/speech_sambert-hifigan_tts_luna_en-gb_16k',
|
|
'damo/speech_sambert-hifigan_tts_andy_en-us_16k',
|
|
'damo/speech_sambert-hifigan_tts_annie_en-us_16k',
|
|
'damo/speech_sambert-hifigan_tts_en-gb_16k',
|
|
'damo/speech_sambert-hifigan_tts_en-us_16k'
|
|
]
|
|
|
|
@unittest.skipUnless(test_level() >= 0, 'skip test in current test level')
|
|
def test_pipeline(self):
|
|
for i in range(len(self.zhcn_voices)):
|
|
logger.info('test %s' % self.zhcn_voices[i])
|
|
model = Model.from_pretrained(
|
|
model_name_or_path=self.zhcn_models[i], revision='pytorch_am')
|
|
sambert_hifigan_tts = pipeline(task=self.task, model=model)
|
|
self.assertTrue(sambert_hifigan_tts is not None)
|
|
output = sambert_hifigan_tts(input=self.zhcn_text)
|
|
self.assertIsNotNone(output[OutputKeys.OUTPUT_PCM])
|
|
pcm = output[OutputKeys.OUTPUT_PCM]
|
|
write('output_%s.wav' % self.zhcn_voices[i], 16000, pcm)
|
|
for i in range(len(self.en_voices)):
|
|
logger.info('test %s' % self.en_voices[i])
|
|
model = Model.from_pretrained(
|
|
model_name_or_path=self.en_models[i], revision='pytorch_am')
|
|
sambert_hifigan_tts = pipeline(task=self.task, model=model)
|
|
self.assertTrue(sambert_hifigan_tts is not None)
|
|
output = sambert_hifigan_tts(input=self.en_text)
|
|
self.assertIsNotNone(output[OutputKeys.OUTPUT_PCM])
|
|
pcm = output[OutputKeys.OUTPUT_PCM]
|
|
write('output_%s.wav' % self.en_voices[i], 16000, pcm)
|
|
|
|
@unittest.skip('demo compatibility test is only enabled on a needed-basis')
|
|
def test_demo_compatibility(self):
|
|
self.compatibility_check()
|
|
|
|
|
|
if __name__ == '__main__':
|
|
unittest.main()
|