mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-04-25 11:06:41 +08:00
[ASR] 修复FasterWhisper遍历输入路径失败 (#956)
* remove glob * rename * reset mirror pos
This commit is contained in:
parent
cb776229bb
commit
3124fcf497
@ -1,18 +1,16 @@
|
|||||||
import argparse
|
import argparse
|
||||||
import os
|
import os
|
||||||
os.environ["HF_ENDPOINT"]="https://hf-mirror.com"
|
|
||||||
import traceback
|
import traceback
|
||||||
import requests
|
|
||||||
from glob import glob
|
|
||||||
import torch
|
|
||||||
|
|
||||||
|
os.environ["HF_ENDPOINT"] = "https://hf-mirror.com"
|
||||||
|
os.environ["KMP_DUPLICATE_LIB_OK"] = "TRUE"
|
||||||
|
|
||||||
|
import torch
|
||||||
from faster_whisper import WhisperModel
|
from faster_whisper import WhisperModel
|
||||||
from tqdm import tqdm
|
from tqdm import tqdm
|
||||||
|
|
||||||
from tools.asr.config import check_fw_local_models
|
from tools.asr.config import check_fw_local_models
|
||||||
|
|
||||||
os.environ["KMP_DUPLICATE_LIB_OK"]="TRUE"
|
|
||||||
|
|
||||||
language_code_list = [
|
language_code_list = [
|
||||||
"af", "am", "ar", "as", "az",
|
"af", "am", "ar", "as", "az",
|
||||||
"ba", "be", "bg", "bn", "bo",
|
"ba", "be", "bg", "bn", "bo",
|
||||||
@ -50,17 +48,18 @@ def execute_asr(input_folder, output_folder, model_size, language,precision):
|
|||||||
model = WhisperModel(model_path, device=device, compute_type=precision)
|
model = WhisperModel(model_path, device=device, compute_type=precision)
|
||||||
except:
|
except:
|
||||||
return print(traceback.format_exc())
|
return print(traceback.format_exc())
|
||||||
|
|
||||||
|
input_file_names = os.listdir(input_folder)
|
||||||
|
input_file_names.sort()
|
||||||
|
|
||||||
output = []
|
output = []
|
||||||
output_file_name = os.path.basename(input_folder)
|
output_file_name = os.path.basename(input_folder)
|
||||||
output_file_path = os.path.abspath(f'{output_folder}/{output_file_name}.list')
|
|
||||||
|
|
||||||
if not os.path.exists(output_folder):
|
for file_name in tqdm(input_file_names):
|
||||||
os.makedirs(output_folder)
|
|
||||||
|
|
||||||
for file in tqdm(glob(os.path.join(input_folder, '**/*.wav'), recursive=True)):
|
|
||||||
try:
|
try:
|
||||||
|
file_path = os.path.join(input_folder, file_name)
|
||||||
segments, info = model.transcribe(
|
segments, info = model.transcribe(
|
||||||
audio = file,
|
audio = file_path,
|
||||||
beam_size = 5,
|
beam_size = 5,
|
||||||
vad_filter = True,
|
vad_filter = True,
|
||||||
vad_parameters = dict(min_silence_duration_ms=700),
|
vad_parameters = dict(min_silence_duration_ms=700),
|
||||||
@ -68,18 +67,23 @@ def execute_asr(input_folder, output_folder, model_size, language,precision):
|
|||||||
text = ''
|
text = ''
|
||||||
|
|
||||||
if info.language == "zh":
|
if info.language == "zh":
|
||||||
print("检测为中文文本,转funasr处理")
|
print("检测为中文文本, 转 FunASR 处理")
|
||||||
if("only_asr"not in globals()):
|
if("only_asr"not in globals()):
|
||||||
from tools.asr.funasr_asr import only_asr##如果用英文就不需要导入下载模型
|
from tools.asr.funasr_asr import \
|
||||||
text = only_asr(file)
|
only_asr # #如果用英文就不需要导入下载模型
|
||||||
|
text = only_asr(file_path)
|
||||||
|
|
||||||
if text == '':
|
if text == '':
|
||||||
for segment in segments:
|
for segment in segments:
|
||||||
text += segment.text
|
text += segment.text
|
||||||
output.append(f"{file}|{output_file_name}|{info.language.upper()}|{text}")
|
output.append(f"{file_path}|{output_file_name}|{info.language.upper()}|{text}")
|
||||||
except:
|
except:
|
||||||
return print(traceback.format_exc())
|
return print(traceback.format_exc())
|
||||||
|
|
||||||
|
output_folder = output_folder or "output/asr_opt"
|
||||||
|
os.makedirs(output_folder, exist_ok=True)
|
||||||
|
output_file_path = os.path.abspath(f'{output_folder}/{output_file_name}.list')
|
||||||
|
|
||||||
with open(output_file_path, "w", encoding="utf-8") as f:
|
with open(output_file_path, "w", encoding="utf-8") as f:
|
||||||
f.write("\n".join(output))
|
f.write("\n".join(output))
|
||||||
print(f"ASR 任务完成->标注文件路径: {output_file_path}\n")
|
print(f"ASR 任务完成->标注文件路径: {output_file_path}\n")
|
||||||
|
@ -38,10 +38,11 @@ def execute_asr(input_folder, output_folder, model_size, language):
|
|||||||
output = []
|
output = []
|
||||||
output_file_name = os.path.basename(input_folder)
|
output_file_name = os.path.basename(input_folder)
|
||||||
|
|
||||||
for name in tqdm(input_file_names):
|
for file_name in tqdm(input_file_names):
|
||||||
try:
|
try:
|
||||||
text = model.generate(input="%s/%s"%(input_folder, name))[0]["text"]
|
file_path = os.path.join(input_folder, file_name)
|
||||||
output.append(f"{input_folder}/{name}|{output_file_name}|{language.upper()}|{text}")
|
text = model.generate(input=file_path)[0]["text"]
|
||||||
|
output.append(f"{file_path}|{output_file_name}|{language.upper()}|{text}")
|
||||||
except:
|
except:
|
||||||
print(traceback.format_exc())
|
print(traceback.format_exc())
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user