Merge 8a70a2ffd0c0b81af31c912b5dcce535dcdb6268 into 08d627c3338173c3229286d8787060d6559fe0f8

This commit is contained in:
DayDaySpeed 2026-06-01 20:02:09 +08:00 committed by GitHub
commit 5a8f5cbd36
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -22,29 +22,36 @@ def only_asr(input_file, language):
def create_model(language="zh"): def create_model(language="zh"):
if language in funasr_models:
return funasr_models[language]
if language == "zh": if language == "zh":
path_vad = "tools/asr/models/speech_fsmn_vad_zh-cn-16k-common-pytorch" path_vad = "tools/asr/models/speech_fsmn_vad_zh-cn-16k-common-pytorch"
path_punc = "tools/asr/models/punc_ct-transformer_zh-cn-common-vocab272727-pytorch" path_punc = "tools/asr/models/punc_ct-transformer_zh-cn-common-vocab272727-pytorch"
path_asr = "tools/asr/models/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch" path_asr = "tools/asr/models/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch"
if not os.path.isdir(path_vad):
snapshot_download( snapshot_download(
"iic/speech_fsmn_vad_zh-cn-16k-common-pytorch", "iic/speech_fsmn_vad_zh-cn-16k-common-pytorch",
local_dir="tools/asr/models/speech_fsmn_vad_zh-cn-16k-common-pytorch", local_dir=path_vad,
) )
if not os.path.isdir(path_punc):
snapshot_download( snapshot_download(
"iic/punc_ct-transformer_zh-cn-common-vocab272727-pytorch", "iic/punc_ct-transformer_zh-cn-common-vocab272727-pytorch",
local_dir="tools/asr/models/punc_ct-transformer_zh-cn-common-vocab272727-pytorch", local_dir=path_punc,
) )
if not os.path.isdir(path_asr):
snapshot_download( snapshot_download(
"iic/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch", "iic/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch",
local_dir="tools/asr/models/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch", local_dir=path_asr,
) )
model_revision = "v2.0.4" model_revision = "v2.0.4"
vad_model_revision = punc_model_revision = "v2.0.4" vad_model_revision = punc_model_revision = "v2.0.4"
elif language == "yue": elif language == "yue":
path_asr = "tools/asr/models/speech_UniASR_asr_2pass-cantonese-CHS-16k-common-vocab1468-tensorflow1-online" path_asr = "tools/asr/models/speech_UniASR_asr_2pass-cantonese-CHS-16k-common-vocab1468-tensorflow1-online"
if not os.path.isdir(path_asr):
snapshot_download( snapshot_download(
"iic/speech_UniASR_asr_2pass-cantonese-CHS-16k-common-vocab1468-tensorflow1-online", "iic/speech_UniASR_asr_2pass-cantonese-CHS-16k-common-vocab1468-tensorflow1-online",
local_dir="tools/asr/models/speech_UniASR_asr_2pass-cantonese-CHS-16k-common-vocab1468-tensorflow1-online", local_dir=path_asr,
) )
path_vad = path_punc = None path_vad = path_punc = None
vad_model_revision = punc_model_revision = "" vad_model_revision = punc_model_revision = ""
@@ -52,9 +59,6 @@ def create_model(language="zh"):
else: else:
raise ValueError(f"{language} is not supported") raise ValueError(f"{language} is not supported")
if language in funasr_models:
return funasr_models[language]
else:
model = AutoModel( model = AutoModel(
model=path_asr, model=path_asr,
model_revision=model_revision, model_revision=model_revision,