mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-04-06 03:57:44 +08:00
Merge 134098cc4babc9af2f428fb138c8b010e9601130 into 5dfce9a3f0def7f1ee1e075df569b0b2d41df9e3
This commit is contained in:
commit
4d5bb3042a
25
GPT_SoVITS/process_dataset.py
Normal file
25
GPT_SoVITS/process_dataset.py
Normal file
@ -0,0 +1,25 @@
|
|||||||
|
import os
|
||||||
|
|
||||||
|
|
||||||
|
# Supporting third-party datasets with the format where each audio file corresponds to a text file.
|
||||||
|
# For example, voice01.wav -> voice01.txt.
|
||||||
|
def convert_dataset(input_folder, output_file, language='zh'):
    """Build an annotation list from a folder of paired audio/text files.

    Every ``*.wav`` file directly inside ``input_folder`` is expected to
    have a transcript next to it with the same base name and a ``.txt``
    extension (``voice01.wav`` -> ``voice01.txt``). One line is written to
    ``output_file`` per audio file, in the form::

        <audio path>|<speaker name>|<language>|<text>

    where the speaker name is the audio file name without its extension
    and the text is the transcript with all newlines removed.

    Args:
        input_folder: Directory holding the ``.wav`` / ``.txt`` pairs.
            Sub-directories are not scanned.
        output_file: Path of the list file to create (overwritten if it
            already exists), written as UTF-8.
        language: Language tag stored in the third column of every line.

    Raises:
        FileNotFoundError: If ``input_folder`` does not exist or an audio
            file has no matching transcript.
    """
    # os.listdir() yields entries in arbitrary order; sort so the generated
    # list is reproducible across runs and platforms.
    audio_files = sorted(
        name for name in os.listdir(input_folder) if name.endswith('.wav')
    )

    with open(output_file, 'w', encoding='utf-8') as output:
        for audio_file in audio_files:
            audio_path = os.path.join(input_folder, audio_file)

            # Swap only the trailing extension. str.replace() would also
            # rewrite any earlier '.wav' inside the name (for example
            # 'a.wav_take.wav') and point at a transcript that isn't there.
            text_name = audio_file[:-len('.wav')] + '.txt'
            text_file = os.path.join(input_folder, text_name)

            with open(text_file, 'r', encoding='utf-8') as text_content:
                # Each entry must fit on one line of the list file.
                text = text_content.read().replace('\n', '')

            speaker_name = os.path.splitext(audio_file)[0]

            output.write(f'{audio_path}|{speaker_name}|{language}|{text}\n')
|
||||||
|
|
Loading…
x
Reference in New Issue
Block a user