Merge pull request #95 from KakaruHayate/patch-1

使用librosa加载音频避免ffmpeg.probe读取metadata的错误
This commit is contained in:
RVC-Boss 2024-01-22 18:39:06 +08:00 committed by GitHub
commit ca5b67002b
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -5,7 +5,8 @@ from tools.i18n.i18n import I18nAuto
i18n = I18nAuto() i18n = I18nAuto()
logger = logging.getLogger(__name__) logger = logging.getLogger(__name__)
import ffmpeg import librosa
import soundfile as sf
import torch import torch
import sys import sys
from mdxnet import MDXNetDereverb from mdxnet import MDXNetDereverb
@@ -54,16 +55,17 @@ def uvr(model_name, inp_root, save_root_vocal, paths, save_root_ins, agg, format
need_reformat = 1 need_reformat = 1
done = 0 done = 0
try: try:
info = ffmpeg.probe(inp_path, cmd="ffprobe") y, sr = librosa.load(inp_path, sr=None)
if ( info = sf.info(inp_path)
info["streams"][0]["channels"] == 2 channels = info.channels
and info["streams"][0]["sample_rate"] == "44100" if channels == 2 and sr == 44100:
):
need_reformat = 0 need_reformat = 0
pre_fun._path_audio_( pre_fun._path_audio_(
inp_path, save_root_ins, save_root_vocal, format0, is_hp3=is_hp3 inp_path, save_root_ins, save_root_vocal, format0, is_hp3=is_hp3
) )
done = 1 done = 1
else:
need_reformat = 1
except: except:
need_reformat = 1 need_reformat = 1
traceback.print_exc() traceback.print_exc()
@@ -72,10 +74,8 @@ def uvr(model_name, inp_root, save_root_vocal, paths, save_root_ins, agg, format
os.path.join(os.environ["TEMP"]), os.path.join(os.environ["TEMP"]),
os.path.basename(inp_path), os.path.basename(inp_path),
) )
os.system( y_resampled = librosa.resample(y, sr, 44100)
"ffmpeg -i %s -vn -acodec pcm_s16le -ac 2 -ar 44100 %s -y" sf.write(tmp_path, y_resampled, 44100, "PCM_16")
% (inp_path, tmp_path)
)
inp_path = tmp_path inp_path = tmp_path
try: try:
if done == 0: if done == 0:
@@ -183,4 +183,4 @@ app.queue(concurrency_count=511, max_size=1022).launch(
share=is_share, share=is_share,
server_port=webui_port_uvr5, server_port=webui_port_uvr5,
quiet=True, quiet=True,
) )