diff --git a/tests/pipelines/test_automatic_speech_recognition.py b/tests/pipelines/test_automatic_speech_recognition.py index c37a6a3f..b6532868 100644 --- a/tests/pipelines/test_automatic_speech_recognition.py +++ b/tests/pipelines/test_automatic_speech_recognition.py @@ -80,164 +80,141 @@ class AutomaticSpeechRecognitionTest(unittest.TestCase, all_models_info = [ { - 'model_group': 'damo', 'model_id': - 'speech_paraformer_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1', + 'damo/speech_paraformer_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', - 'model_id': 'speech_paraformer_asr_nat-aishell1-pytorch', + 'model_id': 'damo/speech_paraformer_asr_nat-aishell1-pytorch', + 'wav_path': 'data/test/audios/asr_example.wav' + }, + { + 'model_id': 'damo/speech_paraformer_asr_nat-aishell2-pytorch', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1', + 'damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8358-tensorflow1', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_paraformer_asr_nat-zh-cn-8k-common-vocab8358-tensorflow1', + 'damo/speech_paraformer_asr_nat-zh-cn-8k-common-vocab8358-tensorflow1', 'wav_path': 'data/test/audios/asr_example_8K.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-zh-cn-8k-common-vocab8358-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-zh-cn-8k-common-vocab8358-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_8K.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-zh-cn-8k-common-vocab8358-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-zh-cn-8k-common-vocab8358-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_8K.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR-large_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-offline', + 'damo/speech_UniASR-large_asr_2pass-zh-cn-16k-common-vocab8358-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-cn-en-moe-16k-vocab8358-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-cn-en-moe-16k-vocab8358-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_cn_en.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-cn-en-moe-16k-vocab8358-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-cn-en-moe-16k-vocab8358-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_cn_en.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-cn-dialect-16k-vocab8358-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-cn-dialect-16k-vocab8358-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_cn_dialect.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-cn-dialect-16k-vocab8358-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-cn-dialect-16k-vocab8358-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_cn_dialect.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_paraformer_asr_nat-zh-cn-16k-common-vocab3444-tensorflow1-online', + 'damo/speech_paraformer_asr_nat-zh-cn-16k-common-vocab3444-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_paraformer_asr_nat-zh-cn-8k-common-vocab3444-tensorflow1-online', + 'damo/speech_paraformer_asr_nat-zh-cn-8k-common-vocab3444-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_8K.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-en-16k-common-vocab1080-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-en-16k-common-vocab1080-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_en.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-en-16k-common-vocab1080-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-en-16k-common-vocab1080-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_en.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ru-16k-common-vocab1664-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-ru-16k-common-vocab1664-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_ru.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ru-16k-common-vocab1664-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-ru-16k-common-vocab1664-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_ru.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-es-16k-common-vocab3445-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-es-16k-common-vocab3445-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_es.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-es-16k-common-vocab3445-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-es-16k-common-vocab3445-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_es.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ko-16k-common-vocab6400-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-ko-16k-common-vocab6400-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_ko.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ko-16k-common-vocab6400-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-ko-16k-common-vocab6400-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_ko.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ja-16k-common-vocab93-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-ja-16k-common-vocab93-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_ja.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-ja-16k-common-vocab93-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-ja-16k-common-vocab93-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_ja.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-id-16k-common-vocab1067-tensorflow1-online', + 'damo/speech_UniASR_asr_2pass-id-16k-common-vocab1067-tensorflow1-online', 'wav_path': 'data/test/audios/asr_example_id.wav' }, { - 'model_group': 'damo', 'model_id': - 'speech_UniASR_asr_2pass-id-16k-common-vocab1067-tensorflow1-offline', + 'damo/speech_UniASR_asr_2pass-id-16k-common-vocab1067-tensorflow1-offline', 'wav_path': 'data/test/audios/asr_example_id.wav' }, ] @@ -404,7 +381,7 @@ class AutomaticSpeechRecognitionTest(unittest.TestCase, logger.info('Run ASR test with all models') for item in self.all_models_info: - model_id = item['model_group'] + '/' + item['model_id'] + model_id = item['model_id'] wav_path = item['wav_path'] rec_result = self.run_pipeline( model_id=model_id, audio_in=wav_path)