From 0c8832727e704b42ebf6483fc03cca0826c49567 Mon Sep 17 00:00:00 2001 From: RVC-Boss <129054828+RVC-Boss@users.noreply.github.com> Date: Mon, 12 Feb 2024 16:47:30 +0800 Subject: [PATCH 1/4] Update inference_webui.py --- GPT_SoVITS/inference_webui.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/GPT_SoVITS/inference_webui.py b/GPT_SoVITS/inference_webui.py index 566985a4..9c5197a7 100644 --- a/GPT_SoVITS/inference_webui.py +++ b/GPT_SoVITS/inference_webui.py @@ -624,15 +624,15 @@ with gr.Blocks(title="GPT-SoVITS WebUI") as app: interactive=True, ) with gr.Row(): - top_k = gr.Slider(minimum=1,maximum=100,step=1,label=i18n("top_k"),value=20,interactive=True) - top_p = gr.Slider(minimum=0,maximum=1,step=0.05,label=i18n("top_p"),value=0.6,interactive=True) - temperature = gr.Slider(minimum=0,maximum=1,step=0.05,label=i18n("temperature"),value=0.6,interactive=True) + top_k = gr.Slider(minimum=1,maximum=100,step=1,label=i18n("top_k"),value=5,interactive=True) + top_p = gr.Slider(minimum=0,maximum=1,step=0.05,label=i18n("top_p"),value=1,interactive=True) + temperature = gr.Slider(minimum=0,maximum=1,step=0.05,label=i18n("temperature"),value=1,interactive=True) inference_button = gr.Button(i18n("合成语音"), variant="primary") output = gr.Audio(label=i18n("输出的语音")) inference_button.click( get_tts_wav, - [inp_ref, prompt_text, prompt_language, text, text_language, how_to_cut], + [inp_ref, prompt_text, prompt_language, text, text_language, how_to_cut,top_k,top_p,temperature], [output], ) From 3bf71d3790076042ea888fb07d91e0b518f68992 Mon Sep 17 00:00:00 2001 From: RVC-Boss <129054828+RVC-Boss@users.noreply.github.com> Date: Mon, 12 Feb 2024 16:47:43 +0800 Subject: [PATCH 2/4] Update t2s_model.py --- GPT_SoVITS/AR/models/t2s_model.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/GPT_SoVITS/AR/models/t2s_model.py b/GPT_SoVITS/AR/models/t2s_model.py index d3e550d1..aaeace98 100644 --- a/GPT_SoVITS/AR/models/t2s_model.py +++ b/GPT_SoVITS/AR/models/t2s_model.py @@ -402,7 +402,7 @@ class Text2SemanticDecoder(nn.Module): if(idx==0):###第一次跑不能EOS否则没有了 logits = logits[:, :-1] ###刨除1024终止符号的概率 samples = sample( - logits[0], y, top_k=top_k, top_p=top_p, repetition_penalty=1.05, temperature=temperature + logits[0], y, top_k=top_k, top_p=top_p, repetition_penalty=1.35, temperature=temperature )[0].unsqueeze(0) if early_stop_num != -1 and (y.shape[1] - prefix_len) > early_stop_num: print("use early stop num:", early_stop_num) From 2fa74ecb941db27d9015583a9be6962898d66730 Mon Sep 17 00:00:00 2001 From: RVC-Boss <129054828+RVC-Boss@users.noreply.github.com> Date: Mon, 12 Feb 2024 17:00:31 +0800 Subject: [PATCH 3/4] Update fasterwhisper_asr.py --- tools/asr/fasterwhisper_asr.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/tools/asr/fasterwhisper_asr.py b/tools/asr/fasterwhisper_asr.py index 70557117..5f49de70 100644 --- a/tools/asr/fasterwhisper_asr.py +++ b/tools/asr/fasterwhisper_asr.py @@ -1,5 +1,6 @@ import argparse import os +os.environ["HF_ENDPOINT"]="https://hf-mirror.com" import traceback import requests from glob import glob @@ -103,4 +104,4 @@ if __name__ == '__main__': model_size = cmd.model_size, language = cmd.language, precision = cmd.precision, - ) \ No newline at end of file + ) From d82f6bbb98ba725e6725dcee99b80ce71fb0bf28 Mon Sep 17 00:00:00 2001 From: RVC-Boss <129054828+RVC-Boss@users.noreply.github.com> Date: Mon, 12 Feb 2024 18:03:40 +0800 Subject: [PATCH 4/4] Update funasr_asr.py --- tools/asr/funasr_asr.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tools/asr/funasr_asr.py b/tools/asr/funasr_asr.py index 106d7d17..6aa30381 100644 --- a/tools/asr/funasr_asr.py +++ b/tools/asr/funasr_asr.py @@ -43,7 +43,7 @@ def execute_asr(input_folder, output_folder, model_size, language): text = model.generate(input="%s/%s"%(input_folder, name))[0]["text"] output.append(f"{input_folder}/{name}|{output_file_name}|{language.upper()}|{text}") except: - return print(traceback.format_exc()) + print(traceback.format_exc()) output_folder = output_folder or "output/asr_opt" os.makedirs(output_folder, exist_ok=True) @@ -73,4 +73,4 @@ if __name__ == '__main__': output_folder = cmd.output_folder, model_size = cmd.model_size, language = cmd.language, - ) \ No newline at end of file + )