mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-10-08 16:00:01 +08:00
增强了功能,增加了List合并小工具
This commit is contained in:
parent
9125424f3a
commit
28d3a5bfa5
@ -1,4 +1,5 @@
|
|||||||
import srt
|
import srt
|
||||||
|
import shutil
|
||||||
|
|
||||||
def parse_srt_with_lib(content):
|
def parse_srt_with_lib(content):
|
||||||
|
|
||||||
@ -87,10 +88,47 @@ def slice_audio_with_lib(audio_path, save_folder, format, subtitles, pre_preserv
|
|||||||
try:
|
try:
|
||||||
audio = pydub.AudioSegment.from_file(audio_path)
|
audio = pydub.AudioSegment.from_file(audio_path)
|
||||||
sliced_audio = audio[int(start * 1000):int(end * 1000)]
|
sliced_audio = audio[int(start * 1000):int(end * 1000)]
|
||||||
file_name = f'{i + 1:03d}.{format}'
|
file_name = f'{character}_{i + 1:03d}.{format}'
|
||||||
save_path = os.path.join(save_folder, file_name)
|
save_path = os.path.join(save_folder, file_name)
|
||||||
sliced_audio.export(save_path, format=format)
|
sliced_audio.export(save_path, format=format)
|
||||||
f.write(f"{file_name}|{character}|{language}|{subtitle.content}\n")
|
f.write(f"{file_name}|{character}|{language}|{subtitle.content}\n")
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
raise e
|
raise e
|
||||||
|
|
||||||
|
def merge_list_folders(first_list_file, second_list_file, character, first_folder, second_folder):
|
||||||
|
merged_lines = []
|
||||||
|
character1 = ""
|
||||||
|
filenames = set()
|
||||||
|
with open(first_list_file, 'r', encoding="utf-8") as f:
|
||||||
|
first_list = f.readlines()
|
||||||
|
for line in first_list:
|
||||||
|
filename, character1, language, content = line.split('|')
|
||||||
|
filenames.add(filename)
|
||||||
|
if character=="" or character is None:
|
||||||
|
character = character1
|
||||||
|
new_line = f"{filename}|{character}|{language}|{content}"
|
||||||
|
merged_lines.append(new_line)
|
||||||
|
with open(second_list_file, 'r', encoding="utf-8") as f:
|
||||||
|
second_list = f.readlines()
|
||||||
|
for line in second_list:
|
||||||
|
filename, _, language, content = line.split('|')
|
||||||
|
orig_filename = filename
|
||||||
|
num = 1
|
||||||
|
while filename in filenames:
|
||||||
|
filename = f"{filename.rsplit('.', 1)[0]}_{num}.{filename.rsplit('.', 1)[1]}"
|
||||||
|
num += 1
|
||||||
|
try:
|
||||||
|
os.rename(os.path.join(second_folder, orig_filename), os.path.join(first_folder, filename))
|
||||||
|
except Exception as e:
|
||||||
|
raise e
|
||||||
|
new_line = f"{filename}|{character}|{language}|{content}"
|
||||||
|
merged_lines.append(new_line)
|
||||||
|
os.remove(second_list_file)
|
||||||
|
if not os.listdir(second_folder):
|
||||||
|
os.rmdir(second_folder)
|
||||||
|
with open(first_list_file, 'w', encoding="utf-8") as f:
|
||||||
|
f.writelines(merged_lines)
|
||||||
|
return "\n".join(merged_lines)
|
||||||
|
|
||||||
|
|
||||||
|
|
@ -1,9 +1,18 @@
|
|||||||
import gradio as gr
|
import gradio as gr
|
||||||
|
|
||||||
import sys
|
import sys
|
||||||
|
import os
|
||||||
|
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '..')))
|
||||||
|
sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), '../..')))
|
||||||
sys.path.append('.')
|
sys.path.append('.')
|
||||||
sys.path.append('..')
|
from srt_utils import (
|
||||||
from tools.srt_slicer.srt_utils import merge_subtitles_with_lib, parse_srt_with_lib, generate_srt_with_lib, slice_audio_with_lib, count_words_multilang
|
merge_subtitles_with_lib,
|
||||||
|
parse_srt_with_lib,
|
||||||
|
generate_srt_with_lib,
|
||||||
|
slice_audio_with_lib,
|
||||||
|
count_words_multilang,
|
||||||
|
merge_list_folders
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
from i18n.i18n import I18nAuto
|
from i18n.i18n import I18nAuto
|
||||||
@ -19,7 +28,6 @@ def merge_srt(input_text, output_text, short_interval=0.1, max_interval=1, max_t
|
|||||||
return output_text
|
return output_text
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
def slice_audio(
|
def slice_audio(
|
||||||
input_audio,
|
input_audio,
|
||||||
save_folder,
|
save_folder,
|
||||||
@ -46,6 +54,7 @@ def slice_audio(
|
|||||||
os.makedirs(character_folder, exist_ok=True)
|
os.makedirs(character_folder, exist_ok=True)
|
||||||
subtitles = parse_srt_with_lib(output_text)
|
subtitles = parse_srt_with_lib(output_text)
|
||||||
try:
|
try:
|
||||||
|
gr.Info(f"{i18n('正在切分音频')} {input_audio} {i18n('到')} {character_folder}")
|
||||||
slice_audio_with_lib(
|
slice_audio_with_lib(
|
||||||
input_audio,
|
input_audio,
|
||||||
character_folder,
|
character_folder,
|
||||||
@ -58,6 +67,7 @@ def slice_audio(
|
|||||||
language,
|
language,
|
||||||
character,
|
character,
|
||||||
)
|
)
|
||||||
|
gr.Info(f"{i18n('切分完成')} ")
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
gr.Warning(f"Can't Slice, Error: {e}")
|
gr.Warning(f"Can't Slice, Error: {e}")
|
||||||
|
|
||||||
@ -152,6 +162,39 @@ def save_srt_to_file(srt_text, save_folder, character):
|
|||||||
with open(srt_file, "w", encoding="utf-8") as f:
|
with open(srt_file, "w", encoding="utf-8") as f:
|
||||||
f.write(srt_text)
|
f.write(srt_text)
|
||||||
|
|
||||||
|
def scan_list_folders(folder):
|
||||||
|
if not os.path.exists(folder):
|
||||||
|
os.makedirs(folder, exist_ok=True)
|
||||||
|
list_folders = []
|
||||||
|
for list_folder in os.listdir(folder):
|
||||||
|
if os.path.isdir(os.path.join(folder, list_folder)):
|
||||||
|
list_folders.append(get_relative_path(os.path.join(folder, list_folder), folder))
|
||||||
|
first_list_folder = ""
|
||||||
|
second_list_folder = ""
|
||||||
|
if len(list_folders) > 0:
|
||||||
|
first_list_folder = second_list_folder = list_folders[0]
|
||||||
|
if len(list_folders) > 1:
|
||||||
|
second_list_folder = list_folders[1]
|
||||||
|
return gr.Dropdown(list_folders, value=first_list_folder), gr.Dropdown(list_folders, value=second_list_folder)
|
||||||
|
|
||||||
|
def preview_merged_list(first_list_folder, second_list_folder, merge_list_character_name, save_folder):
|
||||||
|
if first_list_folder == "" or second_list_folder == "":
|
||||||
|
return ""
|
||||||
|
if first_list_folder == second_list_folder:
|
||||||
|
gr.Warning(i18n("两个文件夹不能相同!!!"))
|
||||||
|
return ""
|
||||||
|
first_list_folder = os.path.join(save_folder, first_list_folder)
|
||||||
|
second_list_folder = os.path.join(save_folder, second_list_folder)
|
||||||
|
print(f"first_list_folder: {first_list_folder}, second_list_folder: {second_list_folder}")
|
||||||
|
first_list = os.path.join(first_list_folder, [file for file in os.listdir(first_list_folder) if file.lower().endswith(".list")][0])
|
||||||
|
second_list = os.path.join(second_list_folder, [file for file in os.listdir(second_list_folder) if file.lower().endswith(".list")][0])
|
||||||
|
try:
|
||||||
|
return merge_list_folders(first_list, second_list, merge_list_character_name, first_list_folder, second_list_folder)
|
||||||
|
except Exception as e:
|
||||||
|
gr.Warning(f"Can't Merge, Error: {e}")
|
||||||
|
return ""
|
||||||
|
|
||||||
|
|
||||||
from datetime import datetime
|
from datetime import datetime
|
||||||
|
|
||||||
def change_character_name(input_audio):
|
def change_character_name(input_audio):
|
||||||
@ -178,63 +221,79 @@ with gr.Blocks() as app:
|
|||||||
<li>{i18n("根据面板合并短句并过滤你不希望出现的句子。")}</li>
|
<li>{i18n("根据面板合并短句并过滤你不希望出现的句子。")}</li>
|
||||||
<li>{i18n("随后保存成切分好的音频与list文件。")}</li>
|
<li>{i18n("随后保存成切分好的音频与list文件。")}</li>
|
||||||
</ol>""")
|
</ol>""")
|
||||||
|
with gr.Tabs():
|
||||||
|
with gr.Tab(i18n("SRT编辑界面")):
|
||||||
|
with gr.Row():
|
||||||
|
with gr.Column(scale=2) as input_col:
|
||||||
|
with gr.Tabs():
|
||||||
|
with gr.Tab(i18n("读取本地文件")):
|
||||||
|
input_folder = gr.Textbox("input/srt_and_audios", label=i18n("文件夹路径"),interactive=True)
|
||||||
|
scan_button = gr.Button(i18n("扫描文件夹"), variant="secondary",interactive=True)
|
||||||
|
srt_files_list = gr.Dropdown([], label=i18n("SRT文件"),interactive=True)
|
||||||
|
audio_files_list = gr.Dropdown([], label=i18n("音频文件"),interactive=True)
|
||||||
|
srt_read_button = gr.Button(i18n("读取文件"), variant="secondary",interactive=True)
|
||||||
|
with gr.Tab(i18n("上传文件")):
|
||||||
|
input_srt_file = gr.File(label=i18n("上传SRT文件"), type="filepath", file_types=["srt"])
|
||||||
|
upload_audio = gr.Audio(type="filepath",label=i18n("音频文件"))
|
||||||
|
# input_audio_file = gr.File(label=i18n("上传音频文件"), type="audio", file_types=["mp3", "wav", "ogg"])
|
||||||
|
with gr.Tabs():
|
||||||
|
with gr.Tab(i18n("内容预览")):
|
||||||
|
input_audio = gr.Textbox("", label=i18n("音频文件"),interactive=False)
|
||||||
|
input_text = gr.Textbox("", lines=20, max_lines=30, label=i18n("srt文件内容"))
|
||||||
|
input_srt_file.change(load_srt_from_file, [input_srt_file], [input_text])
|
||||||
|
with gr.Column(scale=1) as control_col:
|
||||||
|
with gr.Tabs():
|
||||||
|
with gr.Tab(i18n("合并字幕设置")):
|
||||||
|
merge_zero_interval = gr.Checkbox(label=i18n("提前合并时间间隔很短的字幕"),interactive=True, value=True)
|
||||||
|
short_interval = gr.Slider(value=0.05, minimum=0, maximum=0.5, step=0.005, label=i18n("判定为短间隔时长"),interactive=True,visible=True)
|
||||||
|
max_interval = gr.Slider(value=0.8, minimum=0.1, maximum=10, step=0.1, label=i18n("最大间隔时间"),interactive=True)
|
||||||
|
max_text_length = gr.Slider(value=50,minimum=5,maximum=200,step=1, label=i18n("最长允许单句长度"),interactive=True)
|
||||||
|
add_period = gr.Checkbox(label=i18n("句末加句号"),interactive=True, value=True)
|
||||||
|
merge_button = gr.Button(i18n("合并字幕"), variant="primary")
|
||||||
|
|
||||||
|
with gr.Tab(i18n("过滤设置")):
|
||||||
|
min_length = gr.Slider(value=5, minimum=0, maximum=20, step=1, label=i18n("允许最短长度"),interactive=True)
|
||||||
|
filter_english = gr.Checkbox(label=i18n("过滤带有英文的"),interactive=True)
|
||||||
|
filter_words = gr.Textbox("", label=i18n("过滤词语,一行一个"),lines=5,max_lines=10,interactive=True)
|
||||||
|
filter_button = gr.Button(i18n("过滤字幕"), variant="primary",interactive=False)
|
||||||
|
with gr.Tab(i18n("切分与保存")):
|
||||||
|
with gr.Group():
|
||||||
|
pre_preserve_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("前置保留时间"),interactive=True)
|
||||||
|
post_preserve_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("后置保留时间"),interactive=True)
|
||||||
|
pre_silence_time = gr.Slider(value=0.05, minimum=0, maximum=1, step=0.01, label=i18n("前置添加静音时间"),interactive=True,visible=False)
|
||||||
|
post_silence_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("后置添加静音时间"),interactive=True,visible=False)
|
||||||
|
with gr.Group():
|
||||||
|
language = gr.Dropdown([i18n(i) for i in ["auto", "zh", "en", "ja", "all_zh", "all_ja"]], value="auto", label=i18n("语言"),interactive=True)
|
||||||
|
audio_format = gr.Dropdown(["mp3", "wav", "ogg"], value="wav", label=i18n("音频格式"),interactive=True)
|
||||||
|
with gr.Group():
|
||||||
|
save_folder = gr.Textbox("output/sliced_audio", label=i18n("保存文件夹"),interactive=True)
|
||||||
|
character = gr.Textbox("character", label=i18n("保存子文件夹名称"),interactive=True)
|
||||||
|
character_warning = gr.Textbox(i18n("注意:该文件夹已存在"), label=i18n("提示"),interactive=False,visible=False)
|
||||||
|
save_srt_button = gr.Button(i18n("保存合并后字幕"),variant="secondary",interactive=True)
|
||||||
|
slice_audio_button = gr.Button(i18n("切分并保存音频、list"), variant="primary",interactive=False)
|
||||||
|
|
||||||
with gr.Row():
|
with gr.Column(scale=2) as output_col:
|
||||||
with gr.Column(scale=2) as input_col:
|
with gr.Tabs():
|
||||||
with gr.Tabs():
|
with gr.Tab(i18n("合并后srt文本")):
|
||||||
with gr.Tab(i18n("读取本地文件")):
|
output_text = gr.Textbox("", lines=20, max_lines=30, label="Sliced SRT")
|
||||||
input_folder = gr.Textbox("input/srt_and_audios", label=i18n("文件夹路径"),interactive=True)
|
with gr.Tab(i18n("切分预览")):
|
||||||
scan_button = gr.Button(i18n("扫描文件夹"), variant="secondary",interactive=True)
|
gr.Textbox(i18n("正在建设,敬请期待"), label=i18n("提示"),interactive=False)
|
||||||
srt_files_list = gr.Dropdown([], label=i18n("SRT文件"),interactive=True)
|
with gr.Tab(i18n("List 合并小工具")):
|
||||||
audio_files_list = gr.Dropdown([], label=i18n("音频文件"),interactive=True)
|
with gr.Row():
|
||||||
srt_read_button = gr.Button(i18n("读取文件"), variant="secondary",interactive=True)
|
with gr.Column(scale=2):
|
||||||
with gr.Tab(i18n("上传文件")):
|
scan_list_folder = gr.Textbox("output/sliced_audio", label=i18n("文件夹路径"),interactive=True)
|
||||||
input_srt_file = gr.File(label=i18n("上传SRT文件"), type="filepath", file_types=["srt"])
|
scan_list_button = gr.Button(i18n("扫描文件夹"), variant="secondary")
|
||||||
upload_audio = gr.Audio(type="filepath",label=i18n("音频文件"))
|
first_list_folder = gr.Dropdown([], label=i18n("主文件夹"),interactive=True)
|
||||||
# input_audio_file = gr.File(label=i18n("上传音频文件"), type="audio", file_types=["mp3", "wav", "ogg"])
|
second_list_folder = gr.Dropdown([], label=i18n("次文件夹"),interactive=True)
|
||||||
with gr.Tabs():
|
merge_list_character_name = gr.Textbox("", label=i18n("角色名称,留空使用主文件夹的"),interactive=True)
|
||||||
with gr.Tab(i18n("内容预览")):
|
merge_list_button = gr.Button(i18n("合并文件夹与List"), variant="primary")
|
||||||
input_audio = gr.Textbox("", label=i18n("音频文件"),interactive=False)
|
with gr.Column(scale=2):
|
||||||
input_text = gr.Textbox("", lines=20, max_lines=30, label=i18n("srt文件内容"))
|
list_preview = gr.Textbox("", lines=20, max_lines=30, label=i18n("合并后的List"))
|
||||||
input_srt_file.change(load_srt_from_file, [input_srt_file], [input_text])
|
|
||||||
with gr.Column(scale=1) as control_col:
|
|
||||||
with gr.Tabs():
|
|
||||||
with gr.Tab(i18n("合并字幕设置")):
|
|
||||||
merge_zero_interval = gr.Checkbox(label=i18n("提前合并时间间隔很短的字幕"),interactive=True, value=True)
|
|
||||||
short_interval = gr.Slider(value=0.05, minimum=0, maximum=0.5, step=0.005, label=i18n("判定为短间隔时长"),interactive=True,visible=True)
|
|
||||||
max_interval = gr.Slider(value=0.8, minimum=0.1, maximum=10, step=0.1, label=i18n("最大间隔时间"),interactive=True)
|
|
||||||
max_text_length = gr.Slider(value=50,minimum=5,maximum=200,step=1, label=i18n("最长允许单句长度"),interactive=True)
|
|
||||||
add_period = gr.Checkbox(label=i18n("句末加句号"),interactive=True, value=True)
|
|
||||||
merge_button = gr.Button(i18n("合并字幕"), variant="primary")
|
|
||||||
|
|
||||||
with gr.Tab(i18n("过滤设置")):
|
scan_list_button.click(scan_list_folders, [scan_list_folder], [first_list_folder, second_list_folder])
|
||||||
min_length = gr.Slider(value=5, minimum=0, maximum=20, step=1, label=i18n("允许最短长度"),interactive=True)
|
merge_list_button.click(preview_merged_list, [first_list_folder, second_list_folder, merge_list_character_name, scan_list_folder], [list_preview])
|
||||||
filter_english = gr.Checkbox(label=i18n("过滤带有英文的"),interactive=True)
|
save_folder.change(lambda x:gr.Textbox(value=x), [save_folder], [scan_list_folder])
|
||||||
filter_words = gr.Textbox("", label=i18n("过滤词语,一行一个"),lines=5,max_lines=10,interactive=True)
|
scan_list_folder.change(lambda x:gr.Textbox(value=x), [scan_list_folder], [save_folder])
|
||||||
filter_button = gr.Button(i18n("过滤字幕"), variant="primary",interactive=False)
|
|
||||||
with gr.Tab(i18n("切分与保存")):
|
|
||||||
with gr.Group():
|
|
||||||
pre_preserve_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("前置保留时间"),interactive=True)
|
|
||||||
post_preserve_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("后置保留时间"),interactive=True)
|
|
||||||
pre_silence_time = gr.Slider(value=0.05, minimum=0, maximum=1, step=0.01, label=i18n("前置添加静音时间"),interactive=True,visible=False)
|
|
||||||
post_silence_time = gr.Slider(value=0.1, minimum=0, maximum=1, step=0.01, label=i18n("后置添加静音时间"),interactive=True,visible=False)
|
|
||||||
with gr.Group():
|
|
||||||
language = gr.Dropdown([i18n(i) for i in ["auto", "zh", "en", "ja", "all_zh", "all_ja"]], value="auto", label=i18n("语言"),interactive=True)
|
|
||||||
audio_format = gr.Dropdown(["mp3", "wav", "ogg"], value="wav", label=i18n("音频格式"),interactive=True)
|
|
||||||
with gr.Group():
|
|
||||||
save_folder = gr.Textbox("output/sliced_audio", label=i18n("保存文件夹"),interactive=True)
|
|
||||||
character = gr.Textbox("character", label=i18n("保存子文件夹名称"),interactive=True)
|
|
||||||
character_warning = gr.Textbox(i18n("注意:该文件夹已存在"), label=i18n("提示"),interactive=False,visible=False)
|
|
||||||
save_srt_button = gr.Button(i18n("保存合并后字幕"),variant="secondary",interactive=True)
|
|
||||||
slice_audio_button = gr.Button(i18n("切分并保存音频、list"), variant="primary",interactive=False)
|
|
||||||
|
|
||||||
with gr.Column(scale=2) as output_col:
|
|
||||||
with gr.Tabs():
|
|
||||||
with gr.Tab(i18n("合并后srt文本")):
|
|
||||||
output_text = gr.Textbox("", lines=20, max_lines=30, label="Sliced SRT")
|
|
||||||
with gr.Tab(i18n("切分预览")):
|
|
||||||
gr.Textbox(i18n("正在建设,敬请期待"), label=i18n("提示"),interactive=False)
|
|
||||||
scan_button.click(get_srt_and_audio_files, [input_folder], [srt_files_list, audio_files_list])
|
scan_button.click(get_srt_and_audio_files, [input_folder], [srt_files_list, audio_files_list])
|
||||||
merge_zero_interval.change(lambda x: gr.update(visible=x), [merge_zero_interval],[short_interval])
|
merge_zero_interval.change(lambda x: gr.update(visible=x), [merge_zero_interval],[short_interval])
|
||||||
srt_files_list.change(change_srt_file, [input_folder, srt_files_list], [audio_files_list])
|
srt_files_list.change(change_srt_file, [input_folder, srt_files_list], [audio_files_list])
|
||||||
|
Loading…
x
Reference in New Issue
Block a user