From 9a80963ae35de0624c6179cc065166671dbf6af2 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E5=88=98=E6=82=A6?= Date: Sat, 3 Feb 2024 11:37:11 +0800 Subject: [PATCH] =?UTF-8?q?=E6=B7=BB=E5=8A=A0=E5=8F=82=E8=80=83=E9=9F=B3?= =?UTF-8?q?=E9=A2=91=E7=B4=A2=E5=BC=95=E4=B8=8B=E6=8B=89=E5=88=97=E8=A1=A8?= =?UTF-8?q?=E5=8A=9F=E8=83=BD?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit 添加参考音频索引下拉列表功能 --- GPT_SoVITS/inference_webui.py | 42 ++++++++++++++++++++++++++++++++++- 1 file changed, 41 insertions(+), 1 deletion(-) diff --git a/GPT_SoVITS/inference_webui.py b/GPT_SoVITS/inference_webui.py index 1868a122..2d2e3b3e 100644 --- a/GPT_SoVITS/inference_webui.py +++ b/GPT_SoVITS/inference_webui.py @@ -135,6 +135,43 @@ if is_half == True: else: ssl_model = ssl_model.to(device) +# 初始化引导音频列表 + +def init_wav_list(sovits_path): + + wav_path = "./output/slicer_opt" + match = re.search(r'([a-zA-Z]+)_e\d+_s\d+\.pth',sovits_path) + if match: + result = match.group(1) + wav_path = f"./logs/{result}/5-wav32k/" + + res = ["请选择参考音频"] + + # 遍历目录 + for file_path in os.listdir(wav_path): + # 检查当前file_path是否为文件 + if os.path.isfile(os.path.join(wav_path, file_path)): + # 将文件名添加到列表中 + res.append(file_path) + + print(res) + + return res + +reference_wavs = init_wav_list(sovits_path) + + +# 切换参考音频 + +def change_wav(audio_name): + + wav_path = f"./output/slicer_opt/{audio_name}" + match = re.search(r'([a-zA-Z]+)_e\d+_s\d+\.pth',sovits_path) + if match: + result = match.group(1) + wav_path = f"./logs/{result}/5-wav32k/{audio_name}" + + return wav_path def change_sovits_weights(sovits_path): global vq_model, hps @@ -158,6 +195,7 @@ def change_sovits_weights(sovits_path): print(vq_model.load_state_dict(dict_s2["weight"], strict=False)) with open("./sweight.txt", "w", encoding="utf-8") as f: f.write(sovits_path) + return init_wav_list(sovits_path) change_sovits_weights(sovits_path) @@ -574,9 +612,10 @@ with gr.Blocks(title="GPT-SoVITS WebUI") as app: with gr.Row(): GPT_dropdown = gr.Dropdown(label=i18n("GPT模型列表"), choices=sorted(GPT_names, key=custom_sort_key), value=gpt_path, interactive=True) SoVITS_dropdown = gr.Dropdown(label=i18n("SoVITS模型列表"), choices=sorted(SoVITS_names, key=custom_sort_key), value=sovits_path, interactive=True) + wavs_dropdown = gr.Dropdown(label=i18n("参考音频列表"), choices=reference_wavs,value="请选择参考音频",interactive=True) refresh_button = gr.Button(i18n("刷新模型路径"), variant="primary") refresh_button.click(fn=change_choices, inputs=[], outputs=[SoVITS_dropdown, GPT_dropdown]) - SoVITS_dropdown.change(change_sovits_weights, [SoVITS_dropdown], []) + SoVITS_dropdown.change(change_sovits_weights, [SoVITS_dropdown], [wavs_dropdown]) GPT_dropdown.change(change_gpt_weights, [GPT_dropdown], []) gr.Markdown(value=i18n("*请上传并填写参考信息")) with gr.Row(): @@ -585,6 +624,7 @@ with gr.Blocks(title="GPT-SoVITS WebUI") as app: prompt_language = gr.Dropdown( label=i18n("参考音频的语种"), choices=[i18n("中文"), i18n("英文"), i18n("日文")], value=i18n("中文") ) + wavs_dropdown.change(change_wav,[wavs_dropdown],[inp_ref]) gr.Markdown(value=i18n("*请填写需要合成的目标文本。中英混合选中文,日英混合选日文,中日混合暂不支持,非目标语言文本自动遗弃。")) with gr.Row(): text = gr.Textbox(label=i18n("需要合成的文本"), value="")