mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-04-05 04:22:46 +08:00
Merge 47bc83bd5fc171bde797e10c64cbc31617d21764 into 9da7e17efe05041e31d3c3f42c8730ae890397f2
This commit is contained in:
commit
41de0d1cc3
65
api_v2.py
65
api_v2.py
@ -23,7 +23,8 @@ POST:
|
||||
{
|
||||
"text": "", # str.(required) text to be synthesized
|
||||
"text_lang: "", # str.(required) language of the text to be synthesized
|
||||
"ref_audio_path": "", # str.(required) reference audio path
|
||||
"ref_audio_path": "", # str.(optional) reference audio path, required if `ref_audio` not set
|
||||
"ref_audio": "" # str.(optional) reference audio encoded as base64, required if `ref_audio_path` not set
|
||||
"aux_ref_audio_paths": [], # list.(optional) auxiliary reference audio paths for multi-speaker tone fusion
|
||||
"prompt_text": "", # str.(optional) prompt text for the reference audio
|
||||
"prompt_lang": "", # str.(required) language of the prompt text for the reference audio
|
||||
@ -44,6 +45,53 @@ POST:
|
||||
}
|
||||
```
|
||||
|
||||
#### 使用base64发送reference audio示例代码
|
||||
```python
|
||||
import requests
|
||||
import base64
|
||||
import json
|
||||
|
||||
# 定义音频文件路径和文本内容
|
||||
audio_file_path = "/src/GPT-SoVITS/reference/news_reporter.wav"
|
||||
audio_text = "系统内随后发售的其它车次车票依然十分抢手,仅个别车次仍有余票。"
|
||||
|
||||
# 读取音频文件并进行Base64编码
|
||||
with open(audio_file_path, "rb") as audio_file:
|
||||
audio_data = audio_file.read()
|
||||
audio_base64 = base64.b64encode(audio_data).decode('utf-8')
|
||||
|
||||
# 构建请求数据
|
||||
payload = {
|
||||
"text": "四渡赤水中,毛泽东险些辞职。因为他的一个打法,违反了最基本的战场原则——先弱后强,遭到了所有人的反对。但在周恩来的支持下,其他人还是按他说的打了。果然,这不仅避开了蒋中正的陷阱,还让红军找到了生机。",
|
||||
"text_lang": "zh",
|
||||
"ref_audio": audio_base64,
|
||||
"prompt_text": audio_text,
|
||||
"prompt_lang": "zh",
|
||||
"top_k": 15,
|
||||
"top_p": 0.7,
|
||||
"temperature": 0.85,
|
||||
"text_split_method": "cut5",
|
||||
"batch_size": 1,
|
||||
"media_type": "wav",
|
||||
"streaming_mode": False,
|
||||
"speed_factor": 1.1
|
||||
}
|
||||
|
||||
# 发送POST请求
|
||||
url = 'http://localhost:9880/tts'
|
||||
headers = {'Content-Type': 'application/json'}
|
||||
response = requests.post(url, headers=headers, data=json.dumps(payload))
|
||||
|
||||
# 检查响应状态码
|
||||
if response.status_code == 200:
|
||||
with open('output.wav', 'wb') as output_file:
|
||||
output_file.write(response.content)
|
||||
print("音频文件已保存为 output.wav")
|
||||
else:
|
||||
print(f"请求失败,状态码: {response.status_code}")
|
||||
print(f"响应内容: {response.text}")
|
||||
```
|
||||
|
||||
RESP:
|
||||
成功: 直接返回 wav 音频流, http code 200
|
||||
失败: 返回包含错误信息的 json, http code 400
|
||||
@ -101,6 +149,8 @@ import os
|
||||
import sys
|
||||
import traceback
|
||||
from typing import Generator
|
||||
import base64
|
||||
import tempfile
|
||||
|
||||
now_dir = os.getcwd()
|
||||
sys.path.append(now_dir)
|
||||
@ -149,6 +199,7 @@ class TTS_Request(BaseModel):
|
||||
text: str = None
|
||||
text_lang: str = None
|
||||
ref_audio_path: str = None
|
||||
ref_audio: str = None
|
||||
aux_ref_audio_paths: list = None
|
||||
prompt_lang: str = None
|
||||
prompt_text: str = ""
|
||||
@ -250,8 +301,8 @@ def check_params(req:dict):
|
||||
prompt_lang:str = req.get("prompt_lang", "")
|
||||
text_split_method:str = req.get("text_split_method", "cut5")
|
||||
|
||||
if ref_audio_path in [None, ""]:
|
||||
return JSONResponse(status_code=400, content={"message": "ref_audio_path is required"})
|
||||
if ref_audio_path in [None, ""] and ref_audio in [None, ""]:
|
||||
return JSONResponse(status_code=400, content={"message": "ref_audio_path or ref_audio is required"})
|
||||
if text in [None, ""]:
|
||||
return JSONResponse(status_code=400, content={"message": "text is required"})
|
||||
if (text_lang in [None, ""]) :
|
||||
@ -377,6 +428,7 @@ async def tts_get_endpoint(
|
||||
sample_steps:int =32,
|
||||
super_sampling:bool = False
|
||||
):
|
||||
|
||||
req = {
|
||||
"text": text,
|
||||
"text_lang": text_lang.lower(),
|
||||
@ -407,6 +459,13 @@ async def tts_get_endpoint(
|
||||
@APP.post("/tts")
|
||||
async def tts_post_endpoint(request: TTS_Request):
|
||||
req = request.dict()
|
||||
if req['ref_audio']:
|
||||
print(req['ref_audio'])
|
||||
# 上传了以base64编码的参考音频,解码后存入临时文件并将文件路径赋值给ref_audio_path
|
||||
decoded_audio = base64.b64decode(req['ref_audio'])
|
||||
with tempfile.NamedTemporaryFile(delete=False) as temp_file:
|
||||
temp_file.write(decoded_audio)
|
||||
req['ref_audio_path'] = temp_file.name
|
||||
return await tts_handle(req)
|
||||
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user