mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-09-22 20:19:58 +08:00
fix
This commit is contained in:
commit
7bf0088b05
@ -17,7 +17,7 @@ RUN apt-get update && \
|
|||||||
# Copy only requirements.txt initially to leverage Docker cache
|
# Copy only requirements.txt initially to leverage Docker cache
|
||||||
WORKDIR /workspace
|
WORKDIR /workspace
|
||||||
COPY requirements.txt /workspace/
|
COPY requirements.txt /workspace/
|
||||||
RUN pip install --no-cache-dir -r requirements.txt
|
RUN CMAKE_POLICY_VERSION_MINIMUM=3.5 pip install --no-cache-dir -r requirements.txt
|
||||||
|
|
||||||
# Define a build-time argument for image type
|
# Define a build-time argument for image type
|
||||||
ARG IMAGE_TYPE=full
|
ARG IMAGE_TYPE=full
|
||||||
|
13
api.py
13
api.py
@ -173,6 +173,9 @@ import config as global_config
|
|||||||
import logging
|
import logging
|
||||||
import subprocess
|
import subprocess
|
||||||
|
|
||||||
|
import nltk
|
||||||
|
nltk.download('averaged_perceptron_tagger_eng')
|
||||||
|
|
||||||
|
|
||||||
class DefaultRefer:
|
class DefaultRefer:
|
||||||
def __init__(self, path, text, language):
|
def __init__(self, path, text, language):
|
||||||
@ -1086,9 +1089,10 @@ async def tts_endpoint(request: Request):
|
|||||||
|
|
||||||
@app.get("/")
|
@app.get("/")
|
||||||
async def tts_endpoint(
|
async def tts_endpoint(
|
||||||
refer_wav_path: str = None,
|
refer_wav_path: str = "saotome/saotome-6s.wav",
|
||||||
prompt_text: str = None,
|
prompt_text: str = "今日は友達と一緒に映画を見に行く予定ですが、天気が悪くて少し心配です。",
|
||||||
prompt_language: str = None,
|
prompt_language: str = "all_ja",
|
||||||
|
character: str = "saotome",
|
||||||
text: str = None,
|
text: str = None,
|
||||||
text_language: str = None,
|
text_language: str = None,
|
||||||
cut_punc: str = None,
|
cut_punc: str = None,
|
||||||
@ -1096,10 +1100,11 @@ async def tts_endpoint(
|
|||||||
top_p: float = 1.0,
|
top_p: float = 1.0,
|
||||||
temperature: float = 1.0,
|
temperature: float = 1.0,
|
||||||
speed: float = 1.0,
|
speed: float = 1.0,
|
||||||
inp_refs: list = Query(default=[]),
|
inp_refs: list = Query(default=["saotome/saotome-10s.wav", "saotome/refs/ref1.wav", "saotome/refs/ref2.wav", "saotome/refs/ref3.wav", "saotome/refs/ref4.wav"]),
|
||||||
sample_steps: int = 32,
|
sample_steps: int = 32,
|
||||||
if_sr: bool = False
|
if_sr: bool = False
|
||||||
):
|
):
|
||||||
|
print(f"the base path is {refer_wav_path}")
|
||||||
return handle(refer_wav_path, prompt_text, prompt_language, text, text_language, cut_punc, top_k, top_p, temperature, speed, inp_refs, sample_steps, if_sr)
|
return handle(refer_wav_path, prompt_text, prompt_language, text, text_language, cut_punc, top_k, top_p, temperature, speed, inp_refs, sample_steps, if_sr)
|
||||||
|
|
||||||
|
|
||||||
|
@ -1,42 +1,40 @@
|
|||||||
numpy==1.23.4
|
numpy==1.23.4
|
||||||
scipy
|
scipy==1.13.1
|
||||||
tensorboard
|
tensorboard==2.19.0
|
||||||
librosa==0.9.2
|
librosa==0.9.2
|
||||||
numba==0.56.4
|
numba==0.56.4
|
||||||
pytorch-lightning
|
pytorch-lightning==2.5.1
|
||||||
gradio>=4.0,<=4.24.0
|
gradio==4.24.0
|
||||||
ffmpeg-python
|
ffmpeg-python==0.2.0
|
||||||
onnxruntime; sys_platform == 'darwin'
|
onnxruntime==1.19.2 #(for macOS)
|
||||||
onnxruntime-gpu; sys_platform != 'darwin'
|
onnxruntime-gpu==1.19.2 #(for non-macOS)
|
||||||
tqdm
|
tqdm==4.67.1
|
||||||
funasr==1.0.27
|
funasr==1.0.27
|
||||||
torch<2.4
|
cn2an==0.5.23
|
||||||
cn2an
|
pypinyin==0.53.0
|
||||||
pypinyin
|
pyopenjtalk==0.4.0
|
||||||
pyopenjtalk>=0.3.4
|
g2p-en==2.1.0
|
||||||
g2p_en
|
torchaudio==2.6.0
|
||||||
torchaudio
|
|
||||||
modelscope==1.10.0
|
modelscope==1.10.0
|
||||||
sentencepiece
|
sentencepiece==0.2.0
|
||||||
transformers>=4.43
|
transformers==4.50.0
|
||||||
peft
|
peft==0.15.0
|
||||||
chardet
|
chardet==5.2.0
|
||||||
PyYAML
|
PyYAML==6.0.2
|
||||||
psutil
|
psutil==7.0.0
|
||||||
jieba_fast
|
jieba_fast==0.53
|
||||||
jieba
|
jieba==0.42.1
|
||||||
split-lang
|
split-lang==2.1.0
|
||||||
fast_langdetect>=0.3.0
|
fast-langdetect==0.3.1
|
||||||
Faster_Whisper
|
faster-whisper==1.1.1
|
||||||
wordsegment
|
wordsegment==1.3.1
|
||||||
rotary_embedding_torch
|
rotary-embedding-torch==0.8.6
|
||||||
ToJyutping
|
ToJyutping==3.2.0
|
||||||
g2pk2
|
g2pk2==0.0.3
|
||||||
ko_pron
|
ko-pron==1.3
|
||||||
opencc; sys_platform != 'linux'
|
opencc==1.1.1 #(for Linux)
|
||||||
opencc==1.1.1; sys_platform == 'linux'
|
python-mecab-ko==1.3.7 #(not for Windows)
|
||||||
python_mecab_ko; sys_platform != 'win32'
|
fastapi==0.112.1 # (since <0.112.2)
|
||||||
fastapi<0.112.2
|
x-transformers==2.1.37
|
||||||
x_transformers
|
torchmetrics==1.5.0
|
||||||
torchmetrics<=1.5
|
attrdict==2.0.1
|
||||||
attrdict
|
|
||||||
|
BIN
saotome/refs/ref1.wav
Normal file
BIN
saotome/refs/ref1.wav
Normal file
Binary file not shown.
BIN
saotome/refs/ref2.wav
Normal file
BIN
saotome/refs/ref2.wav
Normal file
Binary file not shown.
BIN
saotome/refs/ref3.wav
Normal file
BIN
saotome/refs/ref3.wav
Normal file
Binary file not shown.
BIN
saotome/refs/ref4.wav
Normal file
BIN
saotome/refs/ref4.wav
Normal file
Binary file not shown.
BIN
saotome/saotome-10s.wav
Normal file
BIN
saotome/saotome-10s.wav
Normal file
Binary file not shown.
BIN
saotome/saotome-6s.wav
Normal file
BIN
saotome/saotome-6s.wav
Normal file
Binary file not shown.
Loading…
x
Reference in New Issue
Block a user