fix: 修复prompt_cache里面没有cache住ref_audio_path,导致每次TTS推理都需要加载一遍reference_audio的bug【首次音频帧从3.2s -> 1.7s】 (#1235)

This commit is contained in:
bstr9 2024-06-26 22:26:20 +08:00 committed by GitHub
parent e4b17c40bf
commit afbcf4007a
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -360,7 +360,11 @@ class TTS:
'''
self._set_prompt_semantic(ref_audio_path)
self._set_ref_spec(ref_audio_path)
self._set_ref_audio_path(ref_audio_path)
def _set_ref_audio_path(self, ref_audio_path):
self.prompt_cache["ref_audio_path"] = ref_audio_path
def _set_ref_spec(self, ref_audio_path):
audio = load_audio(ref_audio_path, int(self.configs.sampling_rate))
audio = torch.FloatTensor(audio)