From db5cedf966d35ea02fea3953003f50db163a2137 Mon Sep 17 00:00:00 2001 From: ChasonJiang <1440499136@qq.com> Date: Sun, 30 Mar 2025 20:28:56 +0800 Subject: [PATCH] =?UTF-8?q?=E6=B8=85=E7=90=86=E6=97=A0=E7=94=A8=E4=BB=A3?= =?UTF-8?q?=E7=A0=81?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- GPT_SoVITS/TTS_infer_pack/TTS.py | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/GPT_SoVITS/TTS_infer_pack/TTS.py b/GPT_SoVITS/TTS_infer_pack/TTS.py index af3a182..5cd618e 100644 --- a/GPT_SoVITS/TTS_infer_pack/TTS.py +++ b/GPT_SoVITS/TTS_infer_pack/TTS.py @@ -1124,9 +1124,6 @@ class TTS: else: if parallel_infer: print(f"{i18n('并行合成中')}...") - # for i, idx in enumerate(tqdm(idx_list)): - # phones = batch_phones[i].unsqueeze(0).to(self.configs.device) - # _pred_semantic = (pred_semantic_list[i][-idx:].unsqueeze(0).unsqueeze(0)) # .unsqueeze(0)#mq要多unsqueeze一次 audio_fragments = self.v3_synthesis_batched_infer( idx_list, pred_semantic_list, @@ -1278,7 +1275,7 @@ class TTS: ref_audio = ref_audio.mean(0).unsqueeze(0) if ref_sr!=24000: ref_audio=resample(ref_audio, ref_sr, self.configs.device) - # print("ref_audio",ref_audio.abs().mean())W + mel2 = mel_fn(ref_audio) mel2 = norm_spec(mel2) T_min = min(mel2.shape[2], fea_ref.shape[2])