diff --git a/GPT_SoVITS/prepare_datasets/1-get-text.py b/GPT_SoVITS/prepare_datasets/1-get-text.py index 88c9d858..d9c53228 100644 --- a/GPT_SoVITS/prepare_datasets/1-get-text.py +++ b/GPT_SoVITS/prepare_datasets/1-get-text.py @@ -79,7 +79,7 @@ if os.path.exists(txt_path) == False: return phone_level_feature.T def process(data, res): - for name, text, lan in data: + for name, text, lan in tqdm(data, desc="Processing"): try: name = os.path.basename(name) phones, word2ph, norm_text = clean_text( diff --git a/GPT_SoVITS/prepare_datasets/2-get-hubert-wav32k.py b/GPT_SoVITS/prepare_datasets/2-get-hubert-wav32k.py index b8355dd4..bd9a1953 100644 --- a/GPT_SoVITS/prepare_datasets/2-get-hubert-wav32k.py +++ b/GPT_SoVITS/prepare_datasets/2-get-hubert-wav32k.py @@ -1,6 +1,9 @@ # -*- coding: utf-8 -*- import sys,os + +from tqdm import tqdm + inp_text= os.environ.get("inp_text") inp_wav_dir= os.environ.get("inp_wav_dir") exp_name= os.environ.get("exp_name") @@ -94,26 +97,26 @@ def name2go(wav_name,wav_path): with open(inp_text,"r",encoding="utf8")as f: lines=f.read().strip("\n").split("\n") -for line in lines[int(i_part)::int(all_parts)]: +for line in tqdm(lines[int(i_part)::int(all_parts)], desc="Processing"): try: # wav_name,text=line.split("\t") wav_name, spk_name, language, text = line.split("|") - if (inp_wav_dir !=None): + if inp_wav_dir is not None: wav_name = os.path.basename(wav_name) - wav_path = "%s/%s"%(inp_wav_dir, wav_name) + wav_path = "%s/%s" % (inp_wav_dir, wav_name) else: - wav_path=wav_name + wav_path = wav_name wav_name = os.path.basename(wav_name) - name2go(wav_name,wav_path) + name2go(wav_name, wav_path) except: - print(line,traceback.format_exc()) + print(line, traceback.format_exc()) if(len(nan_fails)>0 and is_half==True): - is_half=False - model=model.float() + is_half = False + model = model.float() for wav_name in nan_fails: try: name2go(wav_name) except: - print(wav_name,traceback.format_exc()) + print(wav_name, traceback.format_exc()) diff --git a/GPT_SoVITS/prepare_datasets/3-get-semantic.py b/GPT_SoVITS/prepare_datasets/3-get-semantic.py index 9ab56a48..be7067e0 100644 --- a/GPT_SoVITS/prepare_datasets/3-get-semantic.py +++ b/GPT_SoVITS/prepare_datasets/3-get-semantic.py @@ -81,7 +81,7 @@ if os.path.exists(semantic_path) == False: lines = f.read().strip("\n").split("\n") lines1 = [] - for line in lines[int(i_part) :: int(all_parts)]: + for line in tqdm(lines[int(i_part) :: int(all_parts)], desc="Processing"): # print(line) try: # wav_name,text=line.split("\t")