Merge 60414d25a39f3786a392523297734c144d1c59a9 into ea2d2a81667239d37615697e8f0056e35bab2db6

Update README.md
Update Documentation (#2768 )
2026-04-29 21:00:42 +08:00 · 2026-04-19 14:16:06 +01:00 · 2026-04-19 21:02:57 +08:00 · 2026-04-18 22:33:55 +08:00 · 2026-04-18 19:01:11 +08:00 · 2026-04-18 17:33:53 +08:00
25 changed files with 2231 additions and 66 deletions
--- a/GPT_SoVITS/AR/models/utils.py
+++ b/GPT_SoVITS/AR/models/utils.py
@ -262,7 +262,7 @@ def make_reject_y(y_o, y_lens):
    reject_y = []
    reject_y_lens = []
    for b in range(bs):
-        process_item_idx = torch.randint(0, 1, size=(1,))[0]
+        process_item_idx = torch.randint(0, 2, size=(1,))[0]
        if process_item_idx == 0:
            new_y = repeat_P(y_o[b])
            reject_y.append(new_y)
--- a/GPT_SoVITS/AR/modules/patched_mha_with_cache_onnx.py
+++ b/GPT_SoVITS/AR/modules/patched_mha_with_cache_onnx.py
@ -8,30 +8,30 @@ def multi_head_attention_forward_patched(
    query,
    key,
    value,
-    embed_dim_to_check: int,
-    num_heads: int,
+    embed_dim_to_check,
+    num_heads,
    in_proj_weight,
-    in_proj_bias: Optional[Tensor],
-    bias_k: Optional[Tensor],
-    bias_v: Optional[Tensor],
-    add_zero_attn: bool,
-    dropout_p: float,
-    out_proj_weight: Tensor,
-    out_proj_bias: Optional[Tensor],
-    training: bool = True,
-    key_padding_mask: Optional[Tensor] = None,
-    need_weights: bool = True,
-    attn_mask: Optional[Tensor] = None,
-    use_separate_proj_weight: bool = False,
-    q_proj_weight: Optional[Tensor] = None,
-    k_proj_weight: Optional[Tensor] = None,
-    v_proj_weight: Optional[Tensor] = None,
-    static_k: Optional[Tensor] = None,
-    static_v: Optional[Tensor] = None,
-    average_attn_weights: bool = True,
-    is_causal: bool = False,
+    in_proj_bias,
+    bias_k,
+    bias_v,
+    add_zero_attn,
+    dropout_p,
+    out_proj_weight,
+    out_proj_bias,
+    training=True,
+    key_padding_mask=None,
+    need_weights=True,
+    attn_mask=None,
+    use_separate_proj_weight=False,
+    q_proj_weight=None,
+    k_proj_weight=None,
+    v_proj_weight=None,
+    static_k=None,
+    static_v=None,
+    average_attn_weights=True,
+    is_causal=False,
    cache=None,
-) -> Tuple[Tensor, Optional[Tensor]]:
+):
    # set up shape vars
    _, _, embed_dim = query.shape
    attn_mask = _canonical_mask(
--- a/GPT_SoVITS/VoiceSave/init.py
+++ b/GPT_SoVITS/VoiceSave/init.py
@ -0,0 +1,178 @@
+import zipfile
+from . import file_lib as fl
+from . import time_lib as tl
+from . import info_lib as il
+import os
+from typing import Union
+import numpy as np
+import torch
+
+POOL:set = set() 
+def get_unique_name(name,MySet:set=set()):
+    _id = 1
+    if name not in POOL and name not in MySet:
+        POOL.add(name)
+        return name
+    while name in POOL or name in MySet:
+        _id += 1
+        name = f'{name}_{_id}'
+    POOL.add(name)
+    return name
+
+TEMP_DIR = fl.merge_dir_txt2(fl.get_my_dir(), "Temp")
+TEMP_ZIP_DIR = fl.merge_dir_txt2(TEMP_DIR, "ZipTemp")
+def _tensor_to_numpy(tensor: torch.Tensor) -> np.ndarray:
+    cloned = tensor.clone().detach()
+    np_array = cloned.cpu().numpy()
+    return np_array
+
+def save_np(path: str, np_array: np.ndarray) -> None:
+    np.save(path, np_array)
+
+class ZIP_File:
+    def __init__(self, path: str,name:str,MySet:set=set()):
+        self.path = path
+        if not os.path.exists(self.path):
+            with zipfile.ZipFile(self.path, 'w') as zipf:
+                pass
+        self.name = get_unique_name(name,MySet=MySet)#MySet用于补充命名集合，防止文件夹混淆
+        self.temp_write = fl.merge_dir_txt2(TEMP_ZIP_DIR, self.name)
+
+        if not os.path.exists(self.temp_write):
+            os.makedirs(self.temp_write)
+
+    def release(self):
+        '''relaese the zip file, extract it to temp dir'''
+        if os.path.exists(self.temp_write):
+            fl.delete_dir(self.temp_write)
+            fl.create_dir(self.temp_write)
+        with zipfile.ZipFile(self.path, 'r') as zipf:
+            zipf.extractall(self.temp_write)
+        #fl.delete_file(self.path)
+    def create_dir(self, dir_:str):
+        dir_path = fl.merge_dir_txt2(self.temp_write, dir_)
+        if not os.path.exists(dir_path):
+            os.makedirs(dir_path,exist_ok=True)
+
+    def create_file(self, file_name:str,location:str=''):
+        if location == '':
+            file_path = fl.merge_dir_txt2(self.temp_write,file_name)
+        else:
+            file_path = fl.merge_dir_txt2(self.temp_write, location, file_name)
+        if not os.path.exists(file_path):
+            os.makedirs(os.path.dirname(file_path),exist_ok=True)
+        with open(file_path, 'w') as f:
+            pass
+
+    def get_file_path(self, file_name:str,location:str=''):
+        if location == '':
+            file_path = fl.merge_dir_txt2(self.temp_write,file_name)
+        else:
+            file_path = fl.merge_dir_txt2(self.temp_write, location, file_name)
+        if not os.path.exists(file_path):
+            raise FileNotFoundError(f"File {file_path} does not exist.")
+        return file_path
+    
+    def get_file_obj(self, file_name:str,location:str='',mode:str='r'):
+        if location == '':
+            file_path = fl.merge_dir_txt2(self.temp_write,file_name)
+        else:
+            file_path = fl.merge_dir_txt2(self.temp_write, location, file_name)
+        if not os.path.exists(file_path):
+            raise FileNotFoundError(f"File {file_path} does not exist.")
+        return open(file_path, mode)
+    
+    def save_file(self, obj):
+        obj.close()
+    
+    def save_zip(self):
+        with zipfile.ZipFile(self.path, 'w', zipfile.ZIP_DEFLATED) as zipf:
+            for root, dirs, files in os.walk(self.temp_write):
+                for file in files:
+                    file_path = os.path.join(root, file)
+                    arcname = os.path.relpath(file_path, self.temp_write)
+                    zipf.write(file_path, arcname)
+        #fl.delete_dir(self.temp_write)
+
+    def close(self):
+        self.save_zip()
+        fl.delete_dir(self.temp_write)
+        POOL.remove(self.name)
+
+def save_tensor(path: str,
+                 tensors: Union[torch.Tensor, list],
+                 name:str,
+                 MySet:set=set(),
+                 file_names:Union[str,list,None]=None,
+                 **info_save,) -> None:
+    if isinstance(tensors, torch.Tensor):
+        tensors = [tensors]
+    if not file_names:
+        return
+    if isinstance(file_names, str):
+        files = [file_names]
+    else:
+        files = file_names
+
+    print(f"length of tensors: {len(tensors)}, length of files: {len(files)}")
+    if len(tensors) != len(files):
+        raise ValueError("The number of tensors and files must be the same.")
+    np_arrays = []
+    for tensor in tensors:
+        np_array = _tensor_to_numpy(tensor)
+        np_arrays.append(np_array)
+    zf = ZIP_File(path, name, MySet=MySet)
+    zf.create_file("voice.json")
+    info = {'name': name}
+    info.update(info_save)
+    il.save_info(info, str(zf.get_file_path("voice.json")))
+    for i in range(len(files)):
+        file_name = files[i]
+        np_array = np_arrays[i]
+        zf.create_file(file_name)
+        save_np(str(zf.get_file_path(file_name)), np_array)
+    zf.close()
+    del zf
+
+def load_tensor(path: str,
+               name:str,
+               find_func,
+               MySet:set=set(),) -> list[torch.Tensor]:
+    zf = ZIP_File(path, name, MySet=MySet)
+    zf.release()
+    voice_path = find_func(zf,il)
+    tensors = []
+    for i in range(len(voice_path)):
+        v = voice_path[i]
+        np_array = np.load(v,allow_pickle=True)
+        tensor = torch.from_numpy(np_array)
+        tensors.append(tensor)
+    zf.close()
+    del zf
+    return tensors
+
+def add_tensor(add:list[torch.Tensor],
+               path: str,
+               name:str,
+               find_func,
+               MySet:set=set(),
+               file_names:Union[str,list,None]=None,
+               **info_save,):
+    tensors = load_tensor(path,name,find_func,MySet=MySet)
+    tensors.extend(add)
+    save_tensor(path,tensors,name,MySet=MySet,file_names=file_names,**info_save)
+    
+def __find_func__(zf,il):
+    f = zf.get_file_path("voice.json")
+    info = il.load_info(f)
+    if info is None:
+        return None
+    list_names = info["access_list"]
+    ret = []
+    for name in list_names:
+        try:
+            a = zf.get_file_path(name)
+            ret.append(a)
+        except FileNotFoundError:
+            continue
+    return ret
--- a/GPT_SoVITS/VoiceSave/file_lib.py
+++ b/GPT_SoVITS/VoiceSave/file_lib.py
@ -0,0 +1,35 @@
+import os
+import shutil
+from pathlib import Path
+
+def get_my_dir():
+    return os.path.dirname(os.path.abspath(__file__))
+
+def get_parent_dir(dir_path,depth=1):
+    parent_path = Path(dir_path)
+    for _ in range(depth):
+        parent_path = parent_path.parent
+    return parent_path
+
+def merge_dir_txt(a,b):
+    c=os.path.join(a,b)
+    return c
+def merge_dir_txt2(*TXT):
+    return Path(os.path.join(*TXT))
+def create_dir(path: Path, overwrite=False) -> bool:
+    if overwrite and path.exists():
+        shutil.rmtree(path)
+    path = Path(path)
+    path.mkdir(parents=True, exist_ok=True)
+    return path.exists()
+def get_dir_children_dirs(path: Path):
+    return [item for item in path.iterdir() if item.is_dir()]
+def get_dir_children_files(path: Path):
+    return [item for item in path.iterdir() if item.is_file()]
+def delete_dir(path: Path):
+    return shutil.rmtree(path)
+def delete_file(path: Path):
+    return os.remove(path)
+def file_exists(path: Path):
+    path = Path(path)
+    return path.exists()
--- a/GPT_SoVITS/VoiceSave/info_lib.py
+++ b/GPT_SoVITS/VoiceSave/info_lib.py
@ -0,0 +1,10 @@
+import json
+
+def load_info(info_path):
+    with open(info_path, 'r', encoding='utf-8') as f:
+        info = json.load(f)
+    return info
+
+def save_info(info, info_path):
+    with open(info_path, 'w', encoding='utf-8') as f:
+        json.dump(info, f, ensure_ascii=False, indent=4)
--- a/GPT_SoVITS/VoiceSave/time_lib.py
+++ b/GPT_SoVITS/VoiceSave/time_lib.py
@ -0,0 +1,38 @@
+import time
+#time styles
+STYLE_Y = "%Y"
+STYLE_M = "%m"
+STYLE_D = "%d"
+STYLE_H = "%H"
+STYLE_MIN = "%M"
+STYLE_S = "%S"
+STYLE_FULL = "%Y-%m-%d_%H.%M.%S"
+#quick calls
+def get_time_y(STYLE = STYLE_Y):
+    return time.strftime(STYLE, time.localtime())
+def get_time_m(STYLE = STYLE_M):
+    return time.strftime(STYLE, time.localtime())
+def get_time_d(STYLE = STYLE_D):
+    return time.strftime(STYLE, time.localtime())
+def get_time_h(STYLE = STYLE_H):
+    return time.strftime(STYLE, time.localtime())
+def get_time_min(STYLE = STYLE_MIN):
+    return time.strftime(STYLE, time.localtime())
+def get_time_s(STYLE = STYLE_S):
+    return time.strftime(STYLE, time.localtime())
+def get_time_full(STYLE = STYLE_FULL):
+    return time.strftime(STYLE, time.localtime())
+
+def s(t:float):
+    time.sleep(t)
+    return 
+###
+
+if __name__ == '__main__':
+    print(get_time_y())
+    print(get_time_m())
+    print(get_time_d())
+    print(get_time_h())
+    print(get_time_min())
+    print(get_time_s())
+    print(get_time_full())
--- a/GPT_SoVITS/config.json
+++ b/GPT_SoVITS/config.json
@ -0,0 +1,7 @@
+{
+    "running_on" : "local",
+    "Default":{
+        "GPT_Path": "不训练直接推v3底模！",
+        "SoVITS_Path": "不训练直接推v2ProPlus底模！"
+    }
+}
--- a/GPT_SoVITS/feature_extractor/cnhubert.py
+++ b/GPT_SoVITS/feature_extractor/cnhubert.py
@ -24,6 +24,7 @@ class CNHubert(nn.Module):
        super().__init__()
        if base_path is None:
            base_path = cnhubert_base_path
+        print(f"Loading CN-Hubert from \"{base_path}\"")
        if os.path.exists(base_path):
            ...
        else:
@ -69,6 +70,7 @@ class CNHubert(nn.Module):


 def get_model():
+    print("cnhubert_base_path:", cnhubert_base_path)
    model = CNHubert()
    model.eval()
    return model
--- a/GPT_SoVITS/inference_webui.py
+++ b/GPT_SoVITS/inference_webui.py
@ -8,6 +8,62 @@
 """
 import psutil
 import os
+import sys
+import json
+from pathlib import Path
+import uuid
+from scipy.io.wavfile import write
+
+
+
+def get_my_dir():
+    return os.path.dirname(os.path.abspath(__file__))
+
+def get_parent_dir(dir_path,depth=1):
+    parent_path = Path(dir_path)
+    for _ in range(depth):
+        parent_path = parent_path.parent
+    return parent_path
+
+def merge_dir_txt2(*TXT):
+    return Path(os.path.join(*TXT))
+
+with open(merge_dir_txt2(get_my_dir(), "config.json"), "r", encoding="utf-8") as f:
+    config_json = f.read()
+    config_json = json.loads(config_json)
+    running_on = config_json["running_on"]
+    Default = config_json["Default"]
+
+ROOT_DIR = str(get_parent_dir(get_my_dir()))
+sys.path.append(get_my_dir())
+import VoiceSave
+
+POOL:set = set() 
+def _get_unique_name(name,MySet:set=set()):
+    _id = 1
+    if name not in POOL and name not in MySet:
+        POOL.add(name)
+        return name
+    while name in POOL or name in MySet:
+        _id += 1
+        name = f'{name}_{_id}'
+    POOL.add(name)
+    return name
+
+def find_func(zf,il):
+    f = zf.get_file_path("voice.json")
+    info = il.load_info(f)
+    if info is None:
+        return None
+    list_names = info["access_list"]
+    ret = []
+    for name in list_names:
+        try:
+            a = zf.get_file_path(name)
+            ret.append(a)
+        except FileNotFoundError:
+            continue
+    return ret

 def set_high_priority():
    """把当前 Python 进程设为 HIGH_PRIORITY_CLASS"""
@ -70,6 +126,7 @@ with open("./weight.json", "r", encoding="utf-8") as file:
    if isinstance(sovits_path, list):
        sovits_path = sovits_path[0]

+
 # print(2333333)
 # print(os.environ["gpt_path"])
 # print(gpt_path)
@ -96,7 +153,7 @@ import numpy as np
 from feature_extractor import cnhubert
 from transformers import AutoModelForMaskedLM, AutoTokenizer

-cnhubert.cnhubert_base_path = cnhubert_base_path
+cnhubert.cnhubert_base_path = merge_dir_txt2(ROOT_DIR, cnhubert_base_path)

 import random

@ -130,6 +187,12 @@ language = os.environ.get("language", "Auto")
 language = sys.argv[-1] if sys.argv[-1] in scan_language_list() else language
 i18n = I18nAuto(language=language)

+
+if gpt_path in [None, "",]:
+    gpt_path = str(merge_dir_txt2(ROOT_DIR, name2gpt_path[i18n(Default["GPT_Path"])]))
+if sovits_path in [None, "",]:
+    sovits_path = str(merge_dir_txt2(ROOT_DIR, name2sovits_path[i18n(Default["SoVITS_Path"])]))
+
 # os.environ['PYTORCH_ENABLE_MPS_FALLBACK'] = '1'  # 确保直接启动推理UI时也能够设置。

 if torch.cuda.is_available():
@ -160,8 +223,8 @@ dict_language_v2 = {
 }
 dict_language = dict_language_v1 if version == "v1" else dict_language_v2

-tokenizer = AutoTokenizer.from_pretrained(bert_path)
-bert_model = AutoModelForMaskedLM.from_pretrained(bert_path)
+tokenizer = AutoTokenizer.from_pretrained(str(merge_dir_txt2(ROOT_DIR,bert_path)))
+bert_model = AutoModelForMaskedLM.from_pretrained(str(merge_dir_txt2(ROOT_DIR,bert_path)))
 if is_half == True:
    bert_model = bert_model.half().to(device)
 else:
@ -374,6 +437,7 @@ except:


 def change_gpt_weights(gpt_path):
+    print("gpt_path:", gpt_path)
    if "！" in gpt_path or "!" in gpt_path:
        gpt_path = name2gpt_path[gpt_path]
    global hz, max_sec, t2s_model, config
@ -765,6 +829,27 @@ def get_tts_wav(
    sample_steps=8,
    if_sr=False,
    pause_second=0.3,
+
+    SaveSvEmb=False,
+    SaveRefers=False,
+    SaveSvEmbName="sv_emb.voice",
+    SaveRefersName="refers.voice",
+
+    SaveGE=False,
+    SaveGEName="ge.voice",
+
+    InjectSvEmb=False,
+    InjectRefers=False,
+    InjectSvEmbName="sv_emb.voice",
+    InjectRefersName="refers.voice",
+
+    EnableAudioLoad=True,
+
+    SaveOutputAsUndecoded=False,
+    SaveOutputAsUndecodedName="output.voice",
+    AddRandomSaltToSaveOutputAsUndecodedName=False,
+
+    ReturnWay = "yield", # "yield" or "return"
 ):
    global cache
    if ref_wav_path:
@ -898,6 +983,9 @@ def get_tts_wav(
                sv_emb = []
                if sv_cn_model == None:
                    init_sv_cn()
+
+            try:
+                if EnableAudioLoad:
                    if inp_refs:
                        for path in inp_refs:
                            try:  #####这里加上提取sv的逻辑，要么一堆sv一堆refer，要么单个sv单个refer
@ -905,6 +993,7 @@ def get_tts_wav(
                                refers.append(refer)
                                if is_v2pro:
                                    sv_emb.append(sv_cn_model.compute_embedding3(audio_tensor))
+                                #print("refer:", refer.shape)
                            except:
                                traceback.print_exc()
                    if len(refers) == 0:
@ -912,6 +1001,128 @@ def get_tts_wav(
                        refers = [refers]
                        if is_v2pro:
                            sv_emb = [sv_cn_model.compute_embedding3(audio_tensor)]
+                else:
+                    refers = []
+                    sv_emb = []
+            except:
+                traceback.print_exc()
+
+            try:
+                if SaveSvEmb and is_v2pro:
+                    names = []
+                    for i in sv_emb:
+                        names.append(_get_unique_name(str(i.shape))+".npy")
+                    sv_path = merge_dir_txt2(ROOT_DIR,"output","sv_emb_opt")
+                    if not os.path.exists(sv_path):
+                        os.makedirs(sv_path,exist_ok=True)
+                    if not os.path.exists(SaveSvEmbName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","sv_emb_opt",SaveSvEmbName))
+                    else:
+                        _pth_ = SaveSvEmbName
+                    VoiceSave.save_tensor(_pth_,sv_emb,SaveSvEmbName,file_names=names,access_list=names)
+            except:
+                traceback.print_exc()
+
+            try:                
+                if SaveRefers:
+                    names = []
+                    for i in refers:
+                        names.append(_get_unique_name(str(i.shape))+".npy")
+                    refers_path = merge_dir_txt2(ROOT_DIR,"output","refers_opt")
+                    if not os.path.exists(refers_path):
+                        os.makedirs(refers_path,exist_ok=True)
+                    if not os.path.exists(SaveRefersName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","refers_opt",SaveRefersName))
+                    else:
+                        _pth_ = SaveRefersName
+                    VoiceSave.save_tensor(_pth_,refers,SaveRefersName,file_names=names,access_list=names)
+            except:
+                traceback.print_exc()
+            
+            #print("refers数量:", len(refers))
+            #print("sv_emb数量:", len(sv_emb) if is_v2pro else "无sv_emb")
+
+            try:
+                if InjectSvEmb and is_v2pro:
+                    if not os.path.exists(InjectSvEmbName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","sv_emb_opt",InjectSvEmbName))
+                    else:
+                        _pth_ = InjectSvEmbName
+                    _sv_emb = VoiceSave.load_tensor(_pth_,InjectSvEmbName,find_func)
+                    for i in range(len(_sv_emb)):
+                        sv_emb.append(_sv_emb[i].to(device))
+            except:
+                traceback.print_exc()
+
+            try:
+                if InjectRefers:
+                    if not os.path.exists(InjectRefersName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","refers_opt",InjectRefersName))
+                    else:
+                        _pth_ = InjectRefersName
+                    _refers = VoiceSave.load_tensor(_pth_,InjectRefersName,find_func)
+                    for i in range(len(_refers)):
+                        refers.append(_refers[i].to(device))
+            except:
+                traceback.print_exc()
+
+            #print("注入后refers数量:", len(refers))
+            #print("注入后sv_emb数量:", len(sv_emb) if is_v2pro else "无sv_emb")
+
+            try:
+                ges = []
+                for i in range(len(refers)):
+                    if is_v2pro:
+                        ge_ = vq_model.ge_(refers[i],sv_emb[i])
+                    else:
+                        ge_ = vq_model.ge_(refers[i])
+                    ges.append(ge_)
+                if SaveGE:
+                    names = []
+                    for i in ges:
+                        names.append(_get_unique_name(str(i.shape))+".npy")
+                    ge_path = merge_dir_txt2(ROOT_DIR,"output","ge_opt")
+                    if not os.path.exists(ge_path):
+                        os.makedirs(ge_path,exist_ok=True)
+                    if not os.path.exists(SaveGEName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","ge_opt",SaveGEName))
+                    else:
+                        _pth_ = SaveGEName
+                    VoiceSave.save_tensor(_pth_,ges,SaveGEName,file_names=names,access_list=names)
+            except:
+                traceback.print_exc()
+            
+            if AddRandomSaltToSaveOutputAsUndecodedName:
+                ranA = uuid.uuid4()
+                ranB = uuid.uuid4()
+                SaveOutputAsUndecodedName = f"{SaveOutputAsUndecodedName}_{ranA}_{ranB}.voice"
+            try:
+                if SaveOutputAsUndecoded:
+                    if is_v2pro:
+                        z_p,mask,ge = vq_model.decode2(
+                            pred_semantic, torch.LongTensor(phones2).to(device).unsqueeze(0),
+                            refers, speed=speed, sv_emb=sv_emb)
+                    else:
+                        z_p,mask,ge = vq_model.decode2(
+                            pred_semantic, torch.LongTensor(phones2).to(device).unsqueeze(0),
+                            refers, speed=speed)
+                    ret = [z_p.cpu().detach(), 
+                           mask.cpu().detach(),
+                           ge.cpu().detach()]
+                    names = [f"z_p_{str(ret[0].shape)}",
+                             f"mask_{str(ret[1].shape)}",
+                             f"ge_{str(ret[2].shape)}"]
+                    undecoded_path = merge_dir_txt2(ROOT_DIR,"output","undecoded_opt")
+                    if not os.path.exists(undecoded_path):
+                        os.makedirs(undecoded_path,exist_ok=True)
+                    if not os.path.exists(SaveOutputAsUndecodedName):
+                        _pth_ = str(merge_dir_txt2(ROOT_DIR,"output","undecoded_opt",SaveOutputAsUndecodedName))
+                    else:
+                        _pth_ = SaveOutputAsUndecodedName
+                    VoiceSave.save_tensor(_pth_,ret,SaveOutputAsUndecodedName,file_names=names,access_list=names)
+            except:
+                traceback.print_exc()
+
            if is_v2pro:
                audio = vq_model.decode(
                    pred_semantic, torch.LongTensor(phones2).to(device).unsqueeze(0), refers, speed=speed, sv_emb=sv_emb
@ -998,8 +1209,215 @@ def get_tts_wav(
            audio_opt /= max_audio
    else:
        audio_opt = audio_opt.cpu().detach().numpy()
-    yield opt_sr, (audio_opt * 32767).astype(np.int16)

+    if ReturnWay == "yield":
+        yield opt_sr, (audio_opt * 32767).astype(np.int16)
+    else:
+        return opt_sr, (audio_opt * 32767).astype(np.int16)
+
+def batched_tts_wav(
+    ref_wav_path,
+    prompt_text,
+    prompt_language,
+    texts,
+    text_language,
+    how_to_cut=i18n("不切"),
+    top_k=20,
+    top_p=0.6,
+    temperature=0.6,
+    ref_free=False,
+    speed=1,
+    if_freeze=False,
+    inp_refs=None,
+    sample_steps=8,
+    if_sr=False,
+    pause_second=0.3,
+
+    SaveSvEmb=False,
+    SaveRefers=False,
+    SaveSvEmbName="sv_emb.voice",
+    SaveRefersName="refers.voice",
+
+    SaveGE=False,
+    SaveGEName="ge.voice",
+
+    InjectSvEmb=False,
+    InjectRefers=False,
+    InjectSvEmbName="sv_emb.voice",
+    InjectRefersName="refers.voice",
+
+    EnableAudioLoad=True,
+
+    SaveOutputAsUndecoded=False,
+    SaveOutputAsUndecodedName="output.voice",
+    AddRandomSaltToSaveOutputAsUndecodedName=False,
+
+    ReturnWay = "yield", # "yield" or "return"
+):
+    count = 0
+    out = []
+    SaveDir = merge_dir_txt2(ROOT_DIR,"output","tts_output",f"batch_{uuid.uuid4()}")
+    if not os.path.exists(SaveDir):
+        os.makedirs(SaveDir,exist_ok=True)
+    for text in texts:
+        if text in [None, " ", ""]:
+            gr.Warning(i18n(f"输入文本第{count}行中有空行，已跳过"))
+            continue
+        else:
+            unparsed = get_tts_wav(
+                ref_wav_path,
+                prompt_text,
+                prompt_language,
+                text,
+                text_language,
+                how_to_cut,
+                top_k,
+                top_p,
+                temperature,
+                ref_free,
+                speed,
+                if_freeze,
+                inp_refs,
+                sample_steps,
+                if_sr,
+                pause_second,
+
+                SaveSvEmb,
+                SaveRefers,
+                SaveSvEmbName,
+                SaveRefersName,
+
+                SaveGE,
+                SaveGEName,
+
+                InjectSvEmb,
+                InjectRefers,
+                InjectSvEmbName,
+                InjectRefersName,
+
+                EnableAudioLoad,
+
+                SaveOutputAsUndecoded,
+                SaveOutputAsUndecodedName,
+                AddRandomSaltToSaveOutputAsUndecodedName,
+                "yield",
+            )
+            unparsed = list(unparsed)
+            print(unparsed)
+            a = text.strip().replace(' ','_').replace('\n','_')
+            wav_path = os.path.join(SaveDir,f"tts_output_{a}_{str(uuid.uuid4())}.wav")
+            write(wav_path, unparsed[0][0], unparsed[0][1])
+            out.append(wav_path)
+        count += 1
+    if ReturnWay == "yield":
+        yield SaveDir
+    else:
+        return SaveDir
+        
+def read_tts_batch_file(file_path):
+    ret = []
+    with open(file_path, 'r', encoding='utf-8') as f:
+        lines = f.readlines()
+    for l in lines:
+        if l.strip() in [None, " ", ""]:
+            continue
+        else:
+            ret.append(l)
+    return ret
+
+def batch_tts(
+    ref_wav_path,
+    prompt_text,
+    prompt_language,
+    text_paths,
+    text_language,
+    how_to_cut=i18n("不切"),
+    top_k=20,
+    top_p=0.6,
+    temperature=0.6,
+    ref_free=False,
+    speed=1,
+    if_freeze=False,
+    inp_refs=None,
+    sample_steps=8,
+    if_sr=False,
+    pause_second=0.3,
+
+    SaveSvEmb=False,
+    SaveRefers=False,
+    SaveSvEmbName="sv_emb.voice",
+    SaveRefersName="refers.voice",
+
+    SaveGE=False,
+    SaveGEName="ge.voice",
+
+    InjectSvEmb=False,
+    InjectRefers=False,
+    InjectSvEmbName="sv_emb.voice",
+    InjectRefersName="refers.voice",
+
+    EnableAudioLoad=True,
+
+    SaveOutputAsUndecoded=False,
+    SaveOutputAsUndecodedName="output.voice",
+    AddRandomSaltToSaveOutputAsUndecodedName=False,
+
+    ReturnWay = "yield", # "yield" or "return"
+):
+    print(text_paths)
+    text_list = []
+    for i in text_paths:
+        text_list.extend(read_tts_batch_file(i))
+    out = batched_tts_wav(
+        ref_wav_path,
+        prompt_text,
+        prompt_language,
+        text_list,
+        text_language,
+        how_to_cut,
+        top_k,
+        top_p,
+        temperature,
+        ref_free,
+        speed,
+        if_freeze,
+        inp_refs,
+        sample_steps,
+        if_sr,
+        pause_second,
+
+        SaveSvEmb,
+        SaveRefers,
+        SaveSvEmbName,
+        SaveRefersName,
+
+        SaveGE,
+        SaveGEName,
+
+        InjectSvEmb,
+        InjectRefers,
+        InjectSvEmbName,
+        InjectRefersName,
+
+        EnableAudioLoad,
+
+        SaveOutputAsUndecoded,
+        SaveOutputAsUndecodedName,
+        AddRandomSaltToSaveOutputAsUndecodedName,
+
+        "yield"
+    )
+    out = list(out)
+
+    if ReturnWay == "yield":
+        yield out
+    else:
+        return out
+def close_serv():
+    if running_on == "local":
+        sys.exit(0)
+    else:
+        gr.Warning(i18n("服务器环境下该功能不可用"))

 def split(todo_text):
    todo_text = todo_text.replace("……", "。").replace("——", "，")
@ -1178,6 +1596,112 @@ with gr.Blocks(title="GPT-SoVITS WebUI", analytics_enabled=False, js=js, css=css
                    )
                )
                prompt_text = gr.Textbox(label=i18n("参考音频的文本"), value="", lines=5, max_lines=5, scale=1)
+            
+
+                SaveSvEmb = gr.Checkbox(
+                    label=i18n("保存参考音频的语义向量"),
+                    interactive=True,
+                    show_label=True,
+                    value = False,
+                    visible=False if model_version not in {"v2Pro","v2ProPlus"} else True
+                )
+                SaveRefers = gr.Checkbox(
+                    label=i18n("保存参考音频的声纹特征"),
+                    interactive=True,
+                    show_label=True,
+                    value = False,
+                    visible=True
+
+                )
+                SaveSvEmbName = gr.Textbox(
+                    label=i18n("保存的语义向量文件名，默认保存在output/sv_emb_opt目录下"),
+                    value="sv_emb.voice",
+                    interactive=True,
+                    visible=True,
+                )
+                SaveRefersName = gr.Textbox(
+                    label=i18n("保存的声纹特征文件名，默认保存在output/refers_opt目录下"),
+                    value="refers.voice",
+                    interactive=True,
+                    visible=True,
+                )
+
+                InjectSvEmb = gr.Checkbox(
+                    label=i18n("注入参考音频的语义向量"),
+                    interactive=True,
+                    show_label=True,
+                    value = False,
+                    visible=False if model_version not in {"v2Pro","v2ProPlus"} else True
+                )
+                InjectRefers = gr.Checkbox(
+                    label=i18n("注入参考音频的声纹特征"),
+                    interactive=True,
+                    show_label=True,
+                    value = False,
+                    visible=True
+                )
+
+                InjectSvEmbName = gr.Textbox(
+                    label=i18n("注入的语义向量文件名，默认保存在output/sv_emb_opt目录下"),
+                    value="sv_emb.voice",
+                    interactive=True,
+                    visible=True,
+                )
+                InjectRefersName = gr.Textbox(
+                    label=i18n("注入的声纹特征文件名，默认保存在output/refers_opt目录下"),
+                    value="refers.voice",
+                    interactive=True,
+                    visible=True,
+                )
+
+                EnableAudioLoad = gr.Checkbox(
+                    label=i18n("启用音频加载。开启后会加载参考音频"),
+                    value=True,
+                    interactive=True,
+                    show_label=True,
+                    visible=True,
+                )
+
+                SaveGE = gr.Checkbox(
+                    label = i18n("保存GE"),
+                    value = True,
+                    interactive = True,
+                    show_label = True,
+                    visible = True,
+                )
+                     
+                SaveGEName = gr.Textbox(
+                    label = i18n("保存的GE文件名，默认保存在output/ge_opt目录下"),
+                    value = "ge.voice",
+                    interactive = True,
+                    show_label = True,
+                    visible = True,
+                )
+
+                SaveOutputAsUndecoded = gr.Checkbox(
+                    label = i18n("保存未解码的输出"),
+                    value = False,
+                    interactive = True,
+                    show_label = True,
+                    visible = True,
+                )
+
+                SaveOutputAsUndecodedName = gr.Textbox(
+                    label = i18n("保存的未解码输出文件名，默认保存在output/undecoded_opt目录下"),
+                    value = "output.voice",
+                    interactive = True,
+                    show_label = True,
+                    visible = True,
+                )
+
+                AddRandomSaltToSaveOutputAsUndecodedName = gr.Checkbox(
+                    label = i18n("给未解码输出文件名添加随机盐，防止覆盖"),
+                    value = False,
+                    interactive = True,
+                    show_label = True,
+                    visible = True,
+                )
+
            with gr.Column(scale=14):
                prompt_language = gr.Dropdown(
                    label=i18n("参考音频的语种"),
@ -1200,6 +1724,7 @@ with gr.Blocks(title="GPT-SoVITS WebUI", analytics_enabled=False, js=js, css=css
                        visible=False,
                    )
                )
+
                sample_steps = (
                    gr.Radio(
                        label=i18n("采样步数,如果觉得电,提高试试,如果觉得慢,降低试试"),
@ -1222,6 +1747,25 @@ with gr.Blocks(title="GPT-SoVITS WebUI", analytics_enabled=False, js=js, css=css
                    show_label=True,
                    visible=False if model_version != "v3" else True,
                )
+        with gr.Row():
+            gr.Markdown(html_center(i18n("批量语音合成参数"), "h3"))
+            with gr.Column(scale=13):
+                txt_paths = gr.File(label=i18n("批量语音合成文本文件，每行一个文本"),
+                                    file_types=[".txt"],
+                                    interactive=True, 
+                                    file_count="multiple",
+                                    scale=13)
+            with gr.Column(scale=7):
+                out = gr.File(label=i18n("批量合成输出的语音文件"),
+                              file_types=[".wav"],
+                              file_count="directory",)
+                start_batch_btn = gr.Button(i18n("开始批量合成"), 
+                                        variant="primary",
+                                        size="lg",
+                                        interactive=True,
+                                        scale=25)
+                
+
        gr.Markdown(html_center(i18n("*请填写需要合成的目标文本和语种模式"), "h3"))
        with gr.Row():
            with gr.Column(scale=13):
@ -1286,6 +1830,11 @@ with gr.Blocks(title="GPT-SoVITS WebUI", analytics_enabled=False, js=js, css=css
            inference_button = gr.Button(value=i18n("合成语音"), variant="primary", size="lg", scale=25)
            output = gr.Audio(label=i18n("输出的语音"), scale=14)

+        with gr.Row():
+            close_button = gr.Button(value=i18n("关闭服务器"), variant="danger", size="lg", scale=25)
+        
+        close_button.click(close_serv)
+
        inference_button.click(
            get_tts_wav,
            [
@ -1305,9 +1854,71 @@ with gr.Blocks(title="GPT-SoVITS WebUI", analytics_enabled=False, js=js, css=css
                sample_steps,
                if_sr_Checkbox,
                pause_second_slider,
+
+                SaveSvEmb,
+                SaveRefers,
+                SaveSvEmbName,
+                SaveRefersName,
+                SaveGE,
+                SaveGEName,
+                InjectSvEmb,
+                InjectRefers,
+                InjectSvEmbName,
+                InjectRefersName,
+                EnableAudioLoad,
+
+                SaveOutputAsUndecoded,
+                SaveOutputAsUndecodedName,
+                AddRandomSaltToSaveOutputAsUndecodedName,
+
            ],
            [output],
+
+            api_name="get_tts_wav",
        )
+
+        start_batch_btn.click(
+            batch_tts,
+            [
+                inp_ref,
+                prompt_text,
+                prompt_language,
+                txt_paths,
+                text_language,
+                how_to_cut,
+                top_k,
+                top_p,
+                temperature,
+                ref_text_free,
+                speed,
+                if_freeze,
+                inp_refs,
+                sample_steps,
+                if_sr_Checkbox,
+                pause_second_slider,
+
+                SaveSvEmb,
+                SaveRefers,
+                SaveSvEmbName,
+                SaveRefersName,
+                SaveGE,
+                SaveGEName,
+                InjectSvEmb,
+                InjectRefers,
+                InjectSvEmbName,
+                InjectRefersName,
+                EnableAudioLoad,
+
+                SaveOutputAsUndecoded,
+                SaveOutputAsUndecodedName,
+                AddRandomSaltToSaveOutputAsUndecodedName,
+
+            ],
+            [out],
+
+            api_name="batch_tts",
+        )
+        
        SoVITS_dropdown.change(
            change_sovits_weights,
            [SoVITS_dropdown, prompt_language, text_language],
--- a/GPT_SoVITS/module/VoiceChange.py
+++ b/GPT_SoVITS/module/VoiceChange.py
@ -0,0 +1,175 @@
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import numpy as np
+import torchaudio
+import math
+from torchaudio.transforms import Resample
+import VoiceSave
+import uuid
+
+def get_train_set(voice_file_path):
+    if type(voice_file_path) == str:
+        voice_file_path = [voice_file_path]
+    ret = []
+    for i in voice_file_path:
+        tensors_ = VoiceSave.load_tensor(i,
+                              f"get_{uuid.uuid4()}",
+                              find_func=VoiceSave.__find_func__,
+                              MySet=set())
+        ret.append(tensors_)
+    return ret
+
+class MelSpectrogram(nn.Module):
+    def __init__(self, hps):
+        super().__init__()
+        self.filter_length = hps.data.filter_length
+        self.hop_length = hps.data.hop_length
+        self.win_length = hps.data.win_length
+        self.sampling_rate = hps.data.sampling_rate
+        self.n_mel_channels = hps.data.n_mel_channels  
+        self.mel_fmin = hps.data.mel_fmin if hasattr(hps.data, 'mel_fmin') else 0
+        self.mel_fmax = hps.data.mel_fmax if hasattr(hps.data, 'mel_fmax') else None
+
+        # 构建梅尔频谱变换
+        self.mel_transform = torchaudio.transforms.MelSpectrogram(
+            sample_rate=self.sampling_rate,
+            n_fft=self.filter_length,
+            hop_length=self.hop_length,
+            win_length=self.win_length,
+            f_min=self.mel_fmin,
+            f_max=self.mel_fmax,
+            n_mels=192,  # self.n_mel_channels,
+            window_fn=torch.hann_window,
+            center=False,
+            power=1.0,
+        )
+
+    def forward(self, audio):
+        """
+        输入：audio [B, 1, T] 或 [1, T]（单声道音频）
+        输出：mel_spec [B, n_mel_channels, T']
+        """
+        if len(audio.shape) == 2:
+            audio = audio.unsqueeze(0)  # [1, T] → [1, 1, T]
+        
+        # 提取梅尔频谱
+        mel_spec = self.mel_transform(audio.squeeze(1))  # [B, n_mel, T']
+        
+        # 对数缩放（TTS标准操作）
+        mel_spec = torch.log(torch.clamp(mel_spec, min=1e-5))
+        
+        return mel_spec
+
+class PositionalEncoding(nn.Module):
+    def __init__(self, d_model, max_seq_length=5000):
+        super(PositionalEncoding, self).__init__()
+        self.pe = torch.zeros(max_seq_length, d_model)  # 初始化位置编码矩阵
+        position = torch.arange(0, max_seq_length, dtype=torch.float).unsqueeze(1)
+        div_term = torch.exp(torch.arange(0, d_model, 2).float() * -(math.log(10000.0) / d_model))
+        self.pe[:, 0::2] = torch.sin(position * div_term)  # 偶数位置使用正弦函数
+        self.pe[:, 1::2] = torch.cos(position * div_term)  # 奇数位置使用余弦函数
+        self.register_buffer('pe', self.pe.unsqueeze(0))  # 注册为缓冲区
+        
+    def forward(self, x):
+        # 将位置编码添加到输入中
+        return x + self.pe[:, :x.size(1)]
+    
+class Spliter(nn.Module):
+    '''output: z_p shape: torch.Size([1, 192, x]), y_mask shape: torch.Size([1, 1, x]), ge shape: torch.Size([1, 1024, 1])'''
+    def __init__(self,
+                 hps,
+                 ge,
+                 device):
+        super().__init__()
+        self.hps = hps
+
+        self.ge = ge
+        self.device = device
+        #TODO: 将mel_spec与ge输入Transformer模型
+        self.mel_dim = 192
+        self.ge_dim = 1024                
+        self.transformer_dim = 512
+        self.ge_proj = nn.Linear(self.ge_dim, self.transformer_dim).to(self.device)
+        self.mel_proj = nn.Linear(self.mel_dim, self.transformer_dim).to(self.device)
+        self.pos_encoder = PositionalEncoding(self.transformer_dim).to(self.device)
+        self.transformer = nn.TransformerEncoder(
+            nn.TransformerEncoderLayer(
+                d_model=self.transformer_dim,
+                nhead=hps.model.nhead,
+                dim_feedforward=hps.model.ffn_dim,
+                batch_first=False,
+                dropout=0.1
+            ),
+            num_layers=hps.model.num_layers
+        ).to(self.device)
+    
+        self.out_proj = nn.Linear(self.transformer_dim, self.mel_dim).to(self.device)
+
+    @torch.no_grad()
+    def mel_(self,audio_path, hps, device, dtype):
+        sr_target = int(hps.data.sampling_rate)
+        audio, sr_origin = torchaudio.load(audio_path)
+        if audio.shape[0] > 1:
+            audio = audio.mean(0, keepdim=True)
+        if sr_origin != sr_target:
+            resampler = Resample(sr_origin, sr_target).to(device)
+            audio = resampler(audio.to(device))
+        else:
+            audio = audio.to(device)
+        max_audio = audio.abs().max()
+        if max_audio > 1.0:
+            audio = audio / max_audio
+        mel_extractor = MelSpectrogram(hps).to(device)
+        mel_spec = mel_extractor(audio).to(dtype)
+        return mel_spec
+    
+    def forward(self, audio_path, ge,device,dtype):
+        # 输入：audio_path, ge
+        # 输出：z_p, y_mask, ge
+        ge_ = ge
+        mel = self.mel_(audio_path, self.hps, device, dtype)
+
+        mel = mel.permute(2, 0, 1)  
+        # 梅尔谱投影到Transformer维度：[T, 1, 512]
+        mel_feat = self.mel_proj(mel)  
+        
+        # 全局情感特征GE处理：[1,1024,1] → [1,1024] → [1,1,512]
+        ge = ge.to(device, dtype=dtype)
+        ge_squeeze = ge.squeeze(-1)  # [1, 1024]
+        ge_feat = self.ge_proj(ge_squeeze).unsqueeze(0)  # [1, 1, 512]
+        
+        # ===================== 3. 特征融合与Transformer输入 =====================
+        # 将GE特征拼接在梅尔谱序列开头：[T+1, 1, 512]
+        self.transformer_input = torch.cat([ge_feat, mel_feat], dim=0)
+        # 添加位置编码
+        self.transformer_input = self.pos_encoder(self.transformer_input)
+        
+        # ===================== 4. Transformer编码 =====================
+        transformer_out = self.transformer(self.transformer_input)  # [T+1, 1, 512]
+        
+        # ===================== 5. 输出特征重构 =====================
+        # 去除GE开头，提取梅尔谱对应的输出：[T, 1, 512]
+        mel_out = transformer_out[1:, :, :]
+        # 投影回原始梅尔维度：[T, 1, 192]
+        mel_out = self.out_proj(mel_out)
+        # 转换为目标格式：[1, 192, T] → z_p
+        z_p = mel_out.permute(1, 2, 0)
+        
+        # ===================== 6. 生成掩码 =====================
+        T = z_p.shape[-1]  # 梅尔谱时间步
+        y_mask = torch.ones(1, 1, T, device=device, dtype=dtype)  # [1,1,T] 全1掩码
+        
+        # ===================== 7. 输出（严格匹配注释格式） =====================
+        return z_p, y_mask, ge_
+
+class SpliterDataset(torch.utils.data.Dataset):
+    def __init__(self, voice_file_paths):
+        self.voice_file_paths = voice_file_paths
+        self.datas = get_train_set(voice_file_paths)
+
+    def __len__(self):
+        return len(self.datas)
+    
+    def __getitem__(self, idx):
+        return self.datas[idx]
--- a/GPT_SoVITS/module/models.py
+++ b/GPT_SoVITS/module/models.py
@ -25,6 +25,53 @@ import contextlib
 import random


+import torchaudio
+from torchaudio.transforms import Resample
+import os
+from pathlib import Path
+def merge_dir_txt2(*TXT):
+    return Path(os.path.join(*TXT))
+
+def get_my_dir():
+    return os.path.dirname(os.path.abspath(__file__))
+
+def get_parent_dir(dir_path,depth=1):
+    parent_path = Path(dir_path)
+    for _ in range(depth):
+        parent_path = parent_path.parent
+    return parent_path
+
+POOL:set = set() 
+def _get_unique_name(name,MySet:set=set()):
+    _id = 1
+    if name not in POOL and name not in MySet:
+        POOL.add(name)
+        return name
+    while name in POOL or name in MySet:
+        _id += 1
+        name = f'{name}_{_id}'
+    POOL.add(name)
+    return name
+
+def find_func(zf,il):
+    f = zf.get_file_path("voice.json")
+    info = il.load_info(f)
+    if info is None:
+        return None
+    list_names = info["access_list"]
+    global POOL
+    POOL.update(list_names)
+    ret = []
+    for name in list_names:
+        try:
+            a = zf.get_file_path(name)
+            ret.append(a)
+        except FileNotFoundError:
+            continue
+    return ret
+
+ROOT_DIR = str(get_parent_dir(get_my_dir()))
+
 class StochasticDurationPredictor(nn.Module):
    def __init__(
        self,
@ -989,10 +1036,8 @@ class SynthesizerTrn(nn.Module):

        o = self.dec((z * y_mask)[:, :, :], g=ge)
        return o, y_mask, (z, z_p, m_p, logs_p)
-
-
    @torch.no_grad()
-    def decode(self, codes, text, refer, noise_scale=0.5, speed=1, sv_emb=None):
+    def ge_(self, refer, sv_emb=None, InjectGE=False, GE=None, LoadGE=True):
        def get_ge(refer, sv_emb):
            ge = None
            if refer is not None:
@ -1006,8 +1051,10 @@ class SynthesizerTrn(nn.Module):
                    sv_emb = self.sv_emb(sv_emb)  # B*20480->B*512
                    ge += sv_emb.unsqueeze(-1)
                    ge = self.prelu(ge)
+            print(f"ge.shape : {ge.shape}")
            return ge
        
+        if LoadGE:
            if type(refer) == list:
                ges = []
                for idx, _refer in enumerate(refer):
@ -1016,6 +1063,24 @@ class SynthesizerTrn(nn.Module):
                ge = torch.stack(ges, 0).mean(0)
            else:
                ge = get_ge(refer, sv_emb)
+        else:
+            if InjectGE:
+                if type(GE) == list:
+                    GE = torch.stack(GE, 0).mean(0)
+                ge = GE
+            else:
+                raise ValueError("No GE stream provided!")
+        return ge
+
+    @torch.no_grad()
+    def decode(self, codes, text, refer, noise_scale=0.5, speed=1, sv_emb=None,
+                InjectGE=False,GE=None,LoadGE=True,
+                InjectZP=False,ZP=None,LoadZP=True,
+                OverWrite_Mask=False,Mask=None,
+                SaveGE=False,SaveZP=False,SaveMask=False,
+                GE_Name=None, ZP_Name=None, Mask_Name=None,
+                VoiceSave=None):
+        ge = self.ge_(refer, sv_emb, InjectGE, GE, LoadGE)

        y_lengths = torch.LongTensor([codes.size(2) * 2]).to(codes.device)
        text_lengths = torch.LongTensor([text.size(-1)]).to(text.device)
@ -1031,14 +1096,75 @@ class SynthesizerTrn(nn.Module):
            self.ge_to512(ge.transpose(2, 1)).transpose(2, 1) if self.is_v2pro else ge,
            speed,
        )
-        z_p = m_p + torch.randn_like(m_p) * torch.exp(logs_p) * noise_scale

+        if InjectZP:
+            if type(ZP) == list:
+                ZP = torch.stack(ZP, 0).mean(0)
+            else:
+                ZP = ZP
+            z_p = ZP
+        else:
+            if LoadZP:
+                z_p = m_p + torch.randn_like(m_p) * torch.exp(logs_p) * noise_scale
+            else:
+                raise ValueError("No z_p stream provided!")
+            
+        if OverWrite_Mask:
+            if type(Mask) == list:
+                Mask = torch.stack(Mask, 0).mean(0)
+            if Mask is None:
+                raise ValueError("No mask stream provided!")
+            y_mask = Mask
+        print(f"z_p shape: {z_p.shape}, y_mask shape: {y_mask.shape}, ge shape: {ge.shape}")
        z = self.flow(z_p, y_mask, g=ge, reverse=True)

        o = self.dec((z * y_mask)[:, :, :], g=ge)
        return o


+    @torch.no_grad()
+    def decode2(self, codes, text, refer, noise_scale=0.5, speed=1, sv_emb=None,
+                InjectGE=False,GE=None,LoadGE=True,
+                InjectZP=False,ZP=None,LoadZP=True,
+                OverWrite_Mask=False,Mask=None,):
+        ge = self.ge_(refer, sv_emb, InjectGE, GE, LoadGE)
+
+        y_lengths = torch.LongTensor([codes.size(2) * 2]).to(codes.device)
+        text_lengths = torch.LongTensor([text.size(-1)]).to(text.device)
+
+        quantized = self.quantizer.decode(codes)
+        if self.semantic_frame_rate == "25hz":
+            quantized = F.interpolate(quantized, size=int(quantized.shape[-1] * 2), mode="nearest")
+        x, m_p, logs_p, y_mask, _, _ = self.enc_p(
+            quantized,
+            y_lengths,
+            text,
+            text_lengths,
+            self.ge_to512(ge.transpose(2, 1)).transpose(2, 1) if self.is_v2pro else ge,
+            speed,
+        )
+
+        if InjectZP:
+            if type(ZP) == list:
+                ZP = torch.stack(ZP, 0).mean(0)
+            else:
+                ZP = ZP
+            z_p = ZP
+        else:
+            if LoadZP:
+                z_p = m_p + torch.randn_like(m_p) * torch.exp(logs_p) * noise_scale
+            else:
+                raise ValueError("No z_p stream provided!")
+            
+        if OverWrite_Mask:
+            if type(Mask) == list:
+                Mask = torch.stack(Mask, 0).mean(0)
+            if Mask is None:
+                raise ValueError("No mask stream provided!")
+            y_mask = Mask
+        print(f"z_p shape: {z_p.shape}, y_mask shape: {y_mask.shape}, ge shape: {ge.shape}")
+        return z_p, y_mask, ge
+
    @torch.no_grad()
    def decode_streaming(self, codes, text, refer, noise_scale=0.5, speed=1, sv_emb=None, result_length:int=None, overlap_frames:torch.Tensor=None, padding_length:int=None):
        def get_ge(refer, sv_emb):
--- a/GPT_SoVITS/module/modules.py
+++ b/GPT_SoVITS/module/modules.py
@ -432,6 +432,8 @@ class ResidualCouplingLayer(nn.Module):
        self.post.bias.data.zero_()

    def forward(self, x, x_mask, g=None, reverse=False):
+
+        print(f"x.shape: {x.shape}, x_mask.shape: {x_mask.shape}")
        x0, x1 = torch.split(x, [self.half_channels] * 2, 1)
        h = self.pre(x0) * x_mask
        h = self.enc(h, x_mask, g=g)
--- a/GPT_SoVITS/sv.py
+++ b/GPT_SoVITS/sv.py
@ -1,9 +1,10 @@
 import sys
 import os
 import torch
+from pathlib import Path

-sys.path.append(f"{os.getcwd()}/GPT_SoVITS/eres2net")
-sv_path = "GPT_SoVITS/pretrained_models/sv/pretrained_eres2netv2w24s4ep4.ckpt"
+sys.path.append(f"{str(Path(os.path.dirname(os.path.abspath(__file__))).parent)}/GPT_SoVITS/eres2net")
+sv_path = f"{str(Path(os.path.dirname(os.path.abspath(__file__))).parent)}/GPT_SoVITS/pretrained_models/sv/pretrained_eres2netv2w24s4ep4.ckpt"
 from ERes2NetV2 import ERes2NetV2
 import kaldi as Kaldi

--- a/README.md
+++ b/README.md
@ -48,6 +48,8 @@ https://github.com/RVC-Boss/GPT-SoVITS/assets/129054828/05bee1fa-bdd8-4d85-9350-

 请不要尬黑GPT-SoVITS推理速度慢，谢谢！

+CPU-Optimized Inference Version：https://github.com/baicai-1145/GPT-SoVITS-CPUFast
+
 **User guide: [简体中文](https://www.yuque.com/baicaigongchang1145haoyuangong/ib3g1e) | [English](https://rentry.co/GPT-SoVITS-guide#/)**

 ## Installation
@ -80,6 +82,15 @@ conda activate GPTSoVits
 pwsh -F install.ps1 --Device <CU126|CU128|CPU> --Source <HF|HF-Mirror|ModelScope> [--DownloadUVR5]
 ```

+If install.ps1 fails, you can try again or run the following commands:
+
+```pwsh
+conda create -n GPTSoVits python=3.10
+conda activate GPTSoVits
+inst.bat
+pwsh -F inst2.ps1 --Device <CU126|CU128|CPU> --Source <HF|HF-Mirror|ModelScope> [--DownloadUVR5]
+```
+
 ### Linux

 ```bash
--- a/conda-go-webui.bat
+++ b/conda-go-webui.bat
@ -0,0 +1,3 @@
+chcp 65001
+cd /d %~dp0
+conda activate %1 | python -I webui.py zh_CN
--- a/config.json
+++ b/config.json
@ -0,0 +1,5 @@
+{
+    "GPU_CHECK":{
+        "DisableGPUMemCheck":false
+    }
+}
--- a/config.py
+++ b/config.py
@ -1,11 +1,20 @@
 import os
 import re
 import sys
+import json
+from pathlib import Path

 import torch

 from tools.i18n.i18n import I18nAuto

+current_dir = str(Path(__file__).parent)
+def merge_dir_txt2(*TXT):
+    return Path(os.path.join(*TXT))
+config_json_location = merge_dir_txt2(current_dir,"config.json")
+with open(str(config_json_location),"r") as f:
+    __info__ = f.read()
+__info__ = json.loads(__info__)
 i18n = I18nAuto(language=os.environ.get("language", "Auto"))


@ -159,6 +168,7 @@ def get_device_dtype_sm(idx: int) -> tuple[torch.device, torch.dtype, float, flo
    major, minor = capability
    sm_version = major + minor / 10.0
    is_16_series = bool(re.search(r"16\d{2}", name)) and sm_version == 7.5
+    if not __info__["GPU_CHECK"]["DisableGPUMemCheck"]:
        if mem_gb < 4 or sm_version < 5.3:
            return cpu, torch.float32, 0.0, 0.0
    if sm_version == 6.1 or is_16_series == True:
--- a/docs/cn/Changelog_CN.md
+++ b/docs/cn/Changelog_CN.md
@ -594,11 +594,11 @@
  - 内容: 修复实验名结尾出现空格在win中路径不正确的问题
  - 类型: 修复
  - 提交: RVC-Boss
- 2025.06.10 [Commit#746cb536](https://github.com/RVC-Boss/GPT-SoVITS/commit/746cb536c68b1fe6ce3ca7e882235375b8a8dd89)
+- 2025.06.10 [PR#2449](https://github.com/RVC-Boss/GPT-SoVITS/pull/2449)
  - 内容: 语种分割优化
  - 类型: 优化
  - 提交: KamioRinn
- 2025.06.11 [Commit#dd2b9253](https://github.com/RVC-Boss/GPT-SoVITS/commit/dd2b9253aabb09db32db7a3344570ed9df043351)
+- 2025.06.11 [PR#2450](https://github.com/RVC-Boss/GPT-SoVITS/pull/2450)
  - 内容: 修复并行推理对v2pro支持bug
  - 类型: 修复
  - 提交: YYuX-1145
@ -606,21 +606,132 @@
  - 内容: v2pro对ge提取时会出现数值溢出的问题修复
  - 类型: 修复
  - 提交: RVC-Boss
- 2025.06.11 [Commit#37f5abfc](https://github.com/RVC-Boss/GPT-SoVITS/commit/6fdc67ca83418306f11e90b9139278313ac5c3e9)[Commit#6fdc67ca](https://github.com/RVC-Boss/GPT-SoVITS/commit/37f5abfcb4a6553652235909db2e124b6f8ff3a5)
+- 2025.06.17 [PR#2464](https://github.com/RVC-Boss/GPT-SoVITS/pull/2464) [PR#2482](https://github.com/RVC-Boss/GPT-SoVITS/pull/2482)
  - 内容: install.sh逻辑优化
  - 类型: 优化
  - 提交: XXXXRT666
- 2025.06.27 [Commit#90ebefa7](https://github.com/RVC-Boss/GPT-SoVITS/commit/90ebefa78fd544da36eebe0b2003620879c921b0)
+- 2025.06.27 [PR#2489](https://github.com/RVC-Boss/GPT-SoVITS/pull/2489)
  - 内容: onnxruntime加载逻辑优化（对gpu/cpu的判断）
  - 类型: 优化
  - 提交: KamioRinn
- 2025.06.27 [Commit#6df61f58](https://github.com/RVC-Boss/GPT-SoVITS/commit/6df61f58e4d18d4c2ad9d1eddd6a1bd690034c23)
+- 2025.06.27 [PR#2488](https://github.com/RVC-Boss/GPT-SoVITS/pull/2488)
  - 内容: 语言分割及格式化优化
  - 类型: 优化
  - 提交: KamioRinn
+
+## 202507
+
 - 2025.07.10 [Commit#426e1a2bb](https://github.com/RVC-Boss/GPT-SoVITS/commit/426e1a2bb43614af2479b877c37acfb0591e952f)
  - 内容: 提升推理进程优先级（修复win11下可能GPU利用率受限的问题）
-  - 类型: 修复
+  - 类型: 优化
  - 提交: XianYue0125
+- 2025.07.16 [PR#2490](https://github.com/RVC-Boss/GPT-SoVITS/pull/2490)
+  - 内容: 解决 TTS.py 无法识别真正支持版本 v2Pro、v2ProPlus 的问题, 同时更新一版默认配置。
+  - 类型: 修复
+  - 提交: jiangsier-xyz
+- 2025.07.16 [Commit#4d8ebf85](https://github.com/RVC-Boss/GPT-SoVITS/commit/4d8ebf85233d4f1166d7cc02fdc595602975ca8f)
+  - 内容: 修复并行推理模式下v2pro模型识别问题
+  - 类型: 修复
+  - 提交: RVC-Boss
+- 2025.07.17 [PR#2531](https://github.com/RVC-Boss/GPT-SoVITS/pull/2531)
+  - 内容: whisper asr支持性价比更高的distill模型
+  - 类型: 优化
+  - 提交: XXXXRT666
+- 2025.07.18 [PR#2536](https://github.com/RVC-Boss/GPT-SoVITS/pull/2536)
+  - 内容: 优化TTS_Config的代码逻辑
+  - 类型: 优化
+  - 提交: ChasonJiang
+- 2025.07.18 [PR#2537](https://github.com/RVC-Boss/GPT-SoVITS/pull/2537)
+  - 内容: 修复gpt的loss计算问题
+  - 类型: 修复
+  - 提交: ChasonJiang

+## 202508

+- 2025.08.02 [PR#2561](https://github.com/RVC-Boss/GPT-SoVITS/pull/2561)
+  - 内容: WSL Rocm
+  - 类型: 修复
+  - 提交: XXXXRT666
+
+## 202509
+
+- 2025.09.10 [Commit#11aa78bd](https://github.com/RVC-Boss/GPT-SoVITS/commit/11aa78bd9bda8b53047cfcae03abf7ca94d27391)
+  - 内容: 修复环境变量可能不为str的问题
+  - 类型: 修复
+  - 提交: RVC-Boss
+
+## 202511
+
+- 2025.11.28 [PR#2671](https://github.com/RVC-Boss/GPT-SoVITS/pull/2671) [PR#2678](https://github.com/RVC-Boss/GPT-SoVITS/pull/2678)
+  - 内容: 流式推理
+  - 类型: 新功能
+  - 提交: ChasonJiang
+- 2025.11.28 [PR#2636](https://github.com/RVC-Boss/GPT-SoVITS/pull/2636)
+  - 内容: 数学计算文本前端逻辑优化
+  - 类型: 优化
+  - 提交: KamioRinn
+- 2025.11.28 [PR#2469](https://github.com/RVC-Boss/GPT-SoVITS/pull/2469)
+  - 内容: 流式推理
+  - 类型: 新功能
+  - 提交: L-jasmine
+- 2025.11.28 [PR#2577](https://github.com/RVC-Boss/GPT-SoVITS/pull/2577)
+  - 内容: 支持vq分布式训练
+  - 类型: 优化
+  - 提交: wzy3650
+- 2025.11.28 [PR#2627](https://github.com/RVC-Boss/GPT-SoVITS/pull/2627) [PR#2679](https://github.com/RVC-Boss/GPT-SoVITS/pull/2679)
+  - 内容: ASR模型下载逻辑优化
+  - 类型: 优化
+  - 提交: XXXXRT666
+- 2025.11.28 [PR#2662](https://github.com/RVC-Boss/GPT-SoVITS/pull/2662)
+  - 内容: default batch size bug 修复
+  - 类型: 修复
+  - 提交: Spr-Aachen
+
+## 202512
+
+- 2025.12.30 [PR#2703](https://github.com/RVC-Boss/GPT-SoVITS/pull/2703) [PR#2704](https://github.com/RVC-Boss/GPT-SoVITS/pull/2704)
+  - 内容: 修复采样错误
+  - 类型: 修复
+  - 提交: ChasonJiang
+
+## 202602
+
+- 2026.02.08 [PR#2727](https://github.com/RVC-Boss/GPT-SoVITS/pull/2727)
+  - 内容: 修复 Conda 条款未同意导致的构建失败
+  - 类型: 修复
+  - 提交: Oarora
+- 2026.02.09 [PR#2732](https://github.com/RVC-Boss/GPT-SoVITS/pull/2732)
+  - 内容: 环境自动构建优化
+  - 类型: 优化
+  - 提交: XXXXRT666
+
+## 202604
+
+- 2026.04.18 [PR#2763](https://github.com/RVC-Boss/GPT-SoVITS/pull/2763)
+  - 内容: 优化 G2PW 的推理输入构造与多音字处理流程，减少重复计算，降低长句场景下的推理开销
+  - 类型: 优化
+  - 提交: baicai-1145
+- 2026.04.18 [PR#2767](https://github.com/RVC-Boss/GPT-SoVITS/pull/2767)
+  - 内容: 改进 Windows 单卡 v3 LoRA 训练流程
+  - 类型: 优化
+  - 提交: 2409324124
+- 2026.04.18 [PR#2755](https://github.com/RVC-Boss/GPT-SoVITS/pull/2755)
+  - 内容: 修复多个模块中的独立 bug
+  - 类型: 修复
+  - 提交: wishhyt
+- 2026.04.18 [PR#2758](https://github.com/RVC-Boss/GPT-SoVITS/pull/2758)
+  - 内容: 添加数据集的错误处理提示
+  - 类型: 优化
+  - 提交: mushroomcowisheggs
+- 2026.04.18 [PR#2753](https://github.com/RVC-Boss/GPT-SoVITS/pull/2753)
+  - 内容: 并行推理部分bug修复
+  - 类型: 修复
+  - 提交: wishhyt
+- 2026.04.18 [PR#2733](https://github.com/RVC-Boss/GPT-SoVITS/pull/2733)
+  - 内容: bug修复：DPO 训练不支持漏字模拟
+  - 类型: 修复
+  - 提交: Mr-Neutr0n
+- 2026.04.18 [Commit#02425ea](https://github.com/RVC-Boss/GPT-SoVITS/commit/02425ea25680c26c700be0bc158756c69103d827)
+  - 内容: 修复onnx脚本未导入Optional等的问题
+  - 类型: 修复
+  - 提交: RVC-Boss
--- a/docs/en/Changelog_EN.md
+++ b/docs/en/Changelog_EN.md
@ -578,3 +578,160 @@
  - Content: Optimized automatic precision detection logic; added collapsible functionality to WebUI frontend modules.
  - Type: New Feature
  - Contributors: XXXXRT666, RVC-Boss
+- 2025.06.06 [PR#2427](https://github.com/RVC-Boss/GPT-SoVITS/pull/2427)
+  - Content: Fix polyphone detection for "X一X" pattern
+  - Type: Fix
+  - Contributor: wzy3650
+- 2025.06.05 [PR#2439](https://github.com/RVC-Boss/GPT-SoVITS/pull/2439)
+  - Content: Config fix; fix SoVITS model loading
+  - Type: Fix
+  - Contributor: wzy3650
+- 2025.06.09 [Commit#8056efe4](https://github.com/RVC-Boss/GPT-SoVITS/commit/8056efe4ab7bbc3610c72ae356a6f37518441f7d)
+  - Content: Fix possible numerical explosion of `ge.sum` causing silent inference
+  - Type: Fix
+  - Contributor: RVC-Boss
+- 2025.06.10 [Commit#2c0436b9](https://github.com/RVC-Boss/GPT-SoVITS/commit/2c0436b9ce397424ae03476c836fb64c6e5ebcc6)
+  - Content: Fix incorrect Windows path when experiment name ends with a space
+  - Type: Fix
+  - Contributor: RVC-Boss
+- 2025.06.10 [PR#2449](https://github.com/RVC-Boss/GPT-SoVITS/pull/2449)
+  - Content: Optimize language segmentation
+  - Type: Optimization
+  - Contributor: KamioRinn
+- 2025.06.11 [PR#2450](https://github.com/RVC-Boss/GPT-SoVITS/pull/2450)
+  - Content: Fix bug in parallel inference support for v2pro
+  - Type: Fix
+  - Contributor: YYuX-1145
+- 2025.06.11 [Commit#ed89a023](https://github.com/RVC-Boss/GPT-SoVITS/commit/ed89a023378dabba9d4b6580235bb9742245816d)
+  - Content: Fix numerical overflow issue when extracting `ge` for v2pro
+  - Type: Fix
+  - Contributor: RVC-Boss
+- 2025.06.17 [PR#2464](https://github.com/RVC-Boss/GPT-SoVITS/pull/2464) [PR#2482](https://github.com/RVC-Boss/GPT-SoVITS/pull/2482)
+  - Content: Optimize `install.sh` logic
+  - Type: Optimization
+  - Contributor: XXXXRT666
+- 2025.06.27 [PR#2489](https://github.com/RVC-Boss/GPT-SoVITS/pull/2489)
+  - Content: Optimize onnxruntime loading logic (GPU/CPU detection)
+  - Type: Optimization
+  - Contributor: KamioRinn
+- 2025.06.27 [PR#2488](https://github.com/RVC-Boss/GPT-SoVITS/pull/2488)
+  - Content: Optimize language segmentation and formatting
+  - Type: Optimization
+  - Contributor: KamioRinn
+
+## 202507
+
+- 2025.07.10 [Commit#426e1a2bb](https://github.com/RVC-Boss/GPT-SoVITS/commit/426e1a2bb43614af2479b877c37acfb0591e952f)
+  - Content: Increase inference process priority (fix possible GPU utilization limitation on Win11)
+  - Type: Optimization
+  - Contributor: XianYue0125
+- 2025.07.16 [PR#2490](https://github.com/RVC-Boss/GPT-SoVITS/pull/2490)
+  - Content: Fix TTS.py not recognizing actually supported versions v2Pro and v2ProPlus, and update default configuration
+  - Type: Fix
+  - Contributor: jiangsier-xyz
+- 2025.07.16 [Commit#4d8ebf85](https://github.com/RVC-Boss/GPT-SoVITS/commit/4d8ebf85233d4f1166d7cc02fdc595602975ca8f)
+  - Content: Fix v2pro model recognition issue in parallel inference mode
+  - Type: Fix
+  - Contributor: RVC-Boss
+- 2025.07.17 [PR#2531](https://github.com/RVC-Boss/GPT-SoVITS/pull/2531)
+  - Content: Whisper ASR supports more cost-effective distill models
+  - Type: Optimization
+  - Contributor: XXXXRT666
+- 2025.07.18 [PR#2536](https://github.com/RVC-Boss/GPT-SoVITS/pull/2536)
+  - Content: Optimize `TTS_Config` code logic
+  - Type: Optimization
+  - Contributor: ChasonJiang
+- 2025.07.18 [PR#2537](https://github.com/RVC-Boss/GPT-SoVITS/pull/2537)
+  - Content: Fix GPT loss calculation issue
+  - Type: Fix
+  - Contributor: ChasonJiang
+
+## 202508
+
+- 2025.08.02 [PR#2561](https://github.com/RVC-Boss/GPT-SoVITS/pull/2561)
+  - Content: WSL Rocm
+  - Type: Fix
+  - Contributor: XXXXRT666
+
+## 202509
+
+- 2025.09.10 [Commit#11aa78bd](https://github.com/RVC-Boss/GPT-SoVITS/commit/11aa78bd9bda8b53047cfcae03abf7ca94d27391)
+  - Content: Fix issue where environment variable may not be a string
+  - Type: Fix
+  - Contributor: RVC-Boss
+
+## 202511
+
+- 2025.11.28 [PR#2671](https://github.com/RVC-Boss/GPT-SoVITS/pull/2671) [PR#2678](https://github.com/RVC-Boss/GPT-SoVITS/pull/2678)
+  - Content: Streaming inference
+  - Type: New Feature
+  - Contributor: ChasonJiang
+- 2025.11.28 [PR#2636](https://github.com/RVC-Boss/GPT-SoVITS/pull/2636)
+  - Content: Optimize text frontend logic for mathematical expression text
+  - Type: Optimization
+  - Contributor: KamioRinn
+- 2025.11.28 [PR#2469](https://github.com/RVC-Boss/GPT-SoVITS/pull/2469)
+  - Content: Streaming inference
+  - Type: New Feature
+  - Contributor: L-jasmine
+- 2025.11.28 [PR#2577](https://github.com/RVC-Boss/GPT-SoVITS/pull/2577)
+  - Content: Support VQ distributed training
+  - Type: Optimization
+  - Contributor: wzy3650
+- 2025.11.28 [PR#2627](https://github.com/RVC-Boss/GPT-SoVITS/pull/2627) [PR#2679](https://github.com/RVC-Boss/GPT-SoVITS/pull/2679)
+  - Content: Optimize ASR model download logic
+  - Type: Optimization
+  - Contributor: XXXXRT666
+- 2025.11.28 [PR#2662](https://github.com/RVC-Boss/GPT-SoVITS/pull/2662)
+  - Content: Fix default batch size bug
+  - Type: Fix
+  - Contributor: Spr-Aachen
+
+## 202512
+
+- 2025.12.30 [PR#2703](https://github.com/RVC-Boss/GPT-SoVITS/pull/2703) [PR#2704](https://github.com/RVC-Boss/GPT-SoVITS/pull/2704)
+  - Content: Fix sampling error
+  - Type: Fix
+  - Contributor: ChasonJiang
+
+## 202602
+
+- 2026.02.08 [PR#2727](https://github.com/RVC-Boss/GPT-SoVITS/pull/2727)
+  - Content: Fix build failure caused by unaccepted Conda terms
+  - Type: Fix
+  - Contributor: Oarora
+- 2026.02.09 [PR#2732](https://github.com/RVC-Boss/GPT-SoVITS/pull/2732)
+  - Content: Optimize automatic environment setup
+  - Type: Optimization
+  - Contributor: XXXXRT666
+
+## 202604
+
+- 2026.04.18 [PR#2763](https://github.com/RVC-Boss/GPT-SoVITS/pull/2763)
+  - Content: Optimize G2PW inference input construction and polyphone handling to reduce redundant computation and inference overhead for long sentences
+  - Type: Optimization
+  - Contributor: baicai-1145
+- 2026.04.18 [PR#2767](https://github.com/RVC-Boss/GPT-SoVITS/pull/2767)
+  - Content: Improve the LoRA training flow for GPT-SoVITS v3 on a single card under Windows
+  - Type: Optimization
+  - Contributor: 2409324124
+- 2026.04.18 [PR#2755](https://github.com/RVC-Boss/GPT-SoVITS/pull/2755)
+  - Content: Fix miscellaneous bugs in multiple modules
+  - Type: Fix
+  - Contributor: wishhyt
+- 2026.04.18 [PR#2758](https://github.com/RVC-Boss/GPT-SoVITS/pull/2758)
+  - Content: Add error handling hints for dataset processing
+  - Type: Optimization
+  - Contributor: mushroomcowisheggs
+- 2026.04.18 [PR#2753](https://github.com/RVC-Boss/GPT-SoVITS/pull/2753)
+  - Content: Fix some bugs in parallel inference
+  - Type: Fix
+  - Contributor: wishhyt
+- 2026.04.18 [PR#2733](https://github.com/RVC-Boss/GPT-SoVITS/pull/2733)
+  - Content: Fix bug where DPO training does not support missing word simulation
+  - Type: Fix
+  - Contributor: Mr-Neutr0n
+- 2026.04.18 [Commit#02425ea](https://github.com/RVC-Boss/GPT-SoVITS/commit/02425ea25680c26c700be0bc158756c69103d827)
+  - Content: Fix missing imports (e.g., Optional) in ONNX script
+  - Type: Fix
+  - Contributor: RVC-Boss
--- a/docs/ja/Changelog_JA.md
+++ b/docs/ja/Changelog_JA.md
@ -578,3 +578,160 @@
  - 内容: 自動精度検出ロジックを最適化し、WebUI フロントエンドモジュールに折り畳み（Collapsible）機能を追加
  - タイプ: 新機能
  - 貢献者: XXXXRT666, RVC-Boss
+- 2025.06.06 [PR#2427](https://github.com/RVC-Boss/GPT-SoVITS/pull/2427)
+  - 内容: 「X一X」パターンの多音字検出を修正
+  - タイプ: 修正
+  - 貢献者: wzy3650
+- 2025.06.05 [PR#2439](https://github.com/RVC-Boss/GPT-SoVITS/pull/2439)
+  - 内容: 設定の修正；SoVITSモデル読み込みの修正
+  - タイプ: 修正
+  - 貢献者: wzy3650
+- 2025.06.09 [Commit#8056efe4](https://github.com/RVC-Boss/GPT-SoVITS/commit/8056efe4ab7bbc3610c72ae356a6f37518441f7d)
+  - 内容: `ge.sum`の数値爆発による推論の無音化を修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
+- 2025.06.10 [Commit#2c0436b9](https://github.com/RVC-Boss/GPT-SoVITS/commit/2c0436b9ce397424ae03476c836fb64c6e5ebcc6)
+  - 内容: 実験名がスペースで終わる場合のWindowsパスの誤りを修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
+- 2025.06.10 [PR#2449](https://github.com/RVC-Boss/GPT-SoVITS/pull/2449)
+  - 内容: 言語分割の最適化
+  - タイプ: 最適化
+  - 貢献者: KamioRinn
+- 2025.06.11 [PR#2450](https://github.com/RVC-Boss/GPT-SoVITS/pull/2450)
+  - 内容: v2proの並列推論対応におけるバグを修正
+  - タイプ: 修正
+  - 貢献者: YYuX-1145
+- 2025.06.11 [Commit#ed89a023](https://github.com/RVC-Boss/GPT-SoVITS/commit/ed89a023378dabba9d4b6580235bb9742245816d)
+  - 内容: v2proの`ge`抽出時の数値オーバーフロー問題を修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
+- 2025.06.17 [PR#2464](https://github.com/RVC-Boss/GPT-SoVITS/pull/2464) [PR#2482](https://github.com/RVC-Boss/GPT-SoVITS/pull/2482)
+  - 内容: `install.sh`のロジックを最適化
+  - タイプ: 最適化
+  - 貢献者: XXXXRT666
+- 2025.06.27 [PR#2489](https://github.com/RVC-Boss/GPT-SoVITS/pull/2489)
+  - 内容: onnxruntime読み込みロジックを最適化（GPU/CPU検出）
+  - タイプ: 最適化
+  - 貢献者: KamioRinn
+- 2025.06.27 [PR#2488](https://github.com/RVC-Boss/GPT-SoVITS/pull/2488)
+  - 内容: 言語分割と書式を最適化
+  - タイプ: 最適化
+  - 貢献者: KamioRinn
+
+## 202507
+
+- 2025.07.10 [Commit#426e1a2bb](https://github.com/RVC-Boss/GPT-SoVITS/commit/426e1a2bb43614af2479b877c37acfb0591e952f)
+  - 内容: 推論プロセスの優先度を上げる（Win11でのGPU利用制限の可能性を修正）
+  - タイプ: 最適化
+  - 貢献者: XianYue0125
+- 2025.07.16 [PR#2490](https://github.com/RVC-Boss/GPT-SoVITS/pull/2490)
+  - 内容: TTS.pyが実際にサポートされているバージョンv2Proおよびv2ProPlusを認識しない問題を修正し、デフォルト設定を更新
+  - タイプ: 修正
+  - 貢献者: jiangsier-xyz
+- 2025.07.16 [Commit#4d8ebf85](https://github.com/RVC-Boss/GPT-SoVITS/commit/4d8ebf85233d4f1166d7cc02fdc595602975ca8f)
+  - 内容: 並列推論モードでのv2proモデル認識問題を修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
+- 2025.07.17 [PR#2531](https://github.com/RVC-Boss/GPT-SoVITS/pull/2531)
+  - 内容: Whisper ASRがよりコスト効率の高い蒸留モデルをサポート
+  - タイプ: 最適化
+  - 貢献者: XXXXRT666
+- 2025.07.18 [PR#2536](https://github.com/RVC-Boss/GPT-SoVITS/pull/2536)
+  - 内容: `TTS_Config`のコードロジックを最適化
+  - タイプ: 最適化
+  - 貢献者: ChasonJiang
+- 2025.07.18 [PR#2537](https://github.com/RVC-Boss/GPT-SoVITS/pull/2537)
+  - 内容: GPT損失計算の問題を修正
+  - タイプ: 修正
+  - 貢献者: ChasonJiang
+
+## 202508
+
+- 2025.08.02 [PR#2561](https://github.com/RVC-Boss/GPT-SoVITS/pull/2561)
+  - 内容: WSL Rocm対応
+  - タイプ: 修正
+  - 貢献者: XXXXRT666
+
+## 202509
+
+- 2025.09.10 [Commit#11aa78bd](https://github.com/RVC-Boss/GPT-SoVITS/commit/11aa78bd9bda8b53047cfcae03abf7ca94d27391)
+  - 内容: 環境変数が文字列でない可能性がある問題を修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
+
+## 202511
+
+- 2025.11.28 [PR#2671](https://github.com/RVC-Boss/GPT-SoVITS/pull/2671) [PR#2678](https://github.com/RVC-Boss/GPT-SoVITS/pull/2678)
+  - 内容: ストリーミング推論
+  - タイプ: 新機能
+  - 貢献者: ChasonJiang
+- 2025.11.28 [PR#2636](https://github.com/RVC-Boss/GPT-SoVITS/pull/2636)
+  - 内容: 数式テキストに対するテキスト前処理ロジックを最適化
+  - タイプ: 最適化
+  - 貢献者: KamioRinn
+- 2025.11.28 [PR#2469](https://github.com/RVC-Boss/GPT-SoVITS/pull/2469)
+  - 内容: ストリーミング推論
+  - タイプ: 新機能
+  - 貢献者: L-jasmine
+- 2025.11.28 [PR#2577](https://github.com/RVC-Boss/GPT-SoVITS/pull/2577)
+  - 内容: VQ分散学習をサポート
+  - タイプ: 最適化
+  - 貢献者: wzy3650
+- 2025.11.28 [PR#2627](https://github.com/RVC-Boss/GPT-SoVITS/pull/2627) [PR#2679](https://github.com/RVC-Boss/GPT-SoVITS/pull/2679)
+  - 内容: ASRモデルダウンロードロジックを最適化
+  - タイプ: 最適化
+  - 貢献者: XXXXRT666
+- 2025.11.28 [PR#2662](https://github.com/RVC-Boss/GPT-SoVITS/pull/2662)
+  - 内容: デフォルトのバッチサイズのバグを修正
+  - タイプ: 修正
+  - 貢献者: Spr-Aachen
+
+## 202512
+
+- 2025.12.30 [PR#2703](https://github.com/RVC-Boss/GPT-SoVITS/pull/2703) [PR#2704](https://github.com/RVC-Boss/GPT-SoVITS/pull/2704)
+  - 内容: サンプリングエラーを修正
+  - タイプ: 修正
+  - 貢献者: ChasonJiang
+
+## 202602
+
+- 2026.02.08 [PR#2727](https://github.com/RVC-Boss/GPT-SoVITS/pull/2727)
+  - 内容: 受け入れられなかったConda利用規約によるビルド失敗を修正
+  - タイプ: 修正
+  - 貢献者: Oarora
+- 2026.02.09 [PR#2732](https://github.com/RVC-Boss/GPT-SoVITS/pull/2732)
+  - 内容: 自動環境セットアップを最適化
+  - タイプ: 最適化
+  - 貢献者: XXXXRT666
+
+## 202604
+
+- 2026.04.18 [PR#2763](https://github.com/RVC-Boss/GPT-SoVITS/pull/2763)
+  - 内容: G2PW推論入力の構築と多音字処理を最適化し、長文における冗長な計算と推論オーバーヘッドを削減
+  - タイプ: 最適化
+  - 貢献者: baicai-1145
+- 2026.04.18 [PR#2767](https://github.com/RVC-Boss/GPT-SoVITS/pull/2767)
+  - 内容: WindowsでのシングルカードにおけるGPT-SoVITS v3のLoRAトレーニングフローを改善
+  - タイプ: 最適化
+  - 貢献者: 2409324124
+- 2026.04.18 [PR#2755](https://github.com/RVC-Boss/GPT-SoVITS/pull/2755)
+  - 内容: 複数モジュールの雑多なバグを修正
+  - タイプ: 修正
+  - 貢献者: wishhyt
+- 2026.04.18 [PR#2758](https://github.com/RVC-Boss/GPT-SoVITS/pull/2758)
+  - 内容: データセット処理時のエラーハンドリングヒントを追加
+  - タイプ: 最適化
+  - 貢献者: mushroomcowisheggs
+- 2026.04.18 [PR#2753](https://github.com/RVC-Boss/GPT-SoVITS/pull/2753)
+  - 内容: 並列推論の一部バグを修正
+  - タイプ: 修正
+  - 貢献者: wishhyt
+- 2026.04.18 [PR#2733](https://github.com/RVC-Boss/GPT-SoVITS/pull/2733)
+  - 内容: DPOトレーニングが欠落単語シミュレーションをサポートしないバグを修正
+  - タイプ: 修正
+  - 貢献者: Mr-Neutr0n
+- 2026.04.18 [Commit#02425ea](https://github.com/RVC-Boss/GPT-SoVITS/commit/02425ea25680c26c700be0bc158756c69103d827)
+  - 内容: ONNXスクリプトでの（Optionalなどの）不足インポートを修正
+  - タイプ: 修正
+  - 貢献者: RVC-Boss
--- a/docs/ko/Changelog_KO.md
+++ b/docs/ko/Changelog_KO.md
@ -578,3 +578,160 @@
  - 내용: 자동 정밀도 감지 로직 최적화; WebUI 프론트엔드 모듈에 접기 기능 추가
  - 유형: 신규 기능
  - 기여자: XXXXRT666, RVC-Boss
+- 2025.06.06 [PR#2427](https://github.com/RVC-Boss/GPT-SoVITS/pull/2427)
+  - 내용: "X一X" 패턴의 다중 발음 감지 오류 수정
+  - 유형: 수정
+  - 기여자: wzy3650
+- 2025.06.05 [PR#2439](https://github.com/RVC-Boss/GPT-SoVITS/pull/2439)
+  - 내용: 설정 오류 수정; SoVITS 모델 로딩 오류 수정
+  - 유형: 수정
+  - 기여자: wzy3650
+- 2025.06.09 [Commit#8056efe4](https://github.com/RVC-Boss/GPT-SoVITS/commit/8056efe4ab7bbc3610c72ae356a6f37518441f7d)
+  - 내용: `ge.sum`의 수치 폭발 가능성으로 인한 추론 무음 현상 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
+- 2025.06.10 [Commit#2c0436b9](https://github.com/RVC-Boss/GPT-SoVITS/commit/2c0436b9ce397424ae03476c836fb64c6e5ebcc6)
+  - 내용: 실험 이름이 공백으로 끝날 때 발생하는 잘못된 Windows 경로 문제 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
+- 2025.06.10 [PR#2449](https://github.com/RVC-Boss/GPT-SoVITS/pull/2449)
+  - 내용: 언어 분할 최적화
+  - 유형: 최적화
+  - 기여자: KamioRinn
+- 2025.06.11 [PR#2450](https://github.com/RVC-Boss/GPT-SoVITS/pull/2450)
+  - 내용: v2pro 병렬 추론 지원 버그 수정
+  - 유형: 수정
+  - 기여자: YYuX-1145
+- 2025.06.11 [Commit#ed89a023](https://github.com/RVC-Boss/GPT-SoVITS/commit/ed89a023378dabba9d4b6580235bb9742245816d)
+  - 내용: v2pro의 `ge` 추출 시 수치 오버플로우 문제 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
+- 2025.06.17 [PR#2464](https://github.com/RVC-Boss/GPT-SoVITS/pull/2464) [PR#2482](https://github.com/RVC-Boss/GPT-SoVITS/pull/2482)
+  - 내용: `install.sh` 로직 최적화
+  - 유형: 최적화
+  - 기여자: XXXXRT666
+- 2025.06.27 [PR#2489](https://github.com/RVC-Boss/GPT-SoVITS/pull/2489)
+  - 내용: onnxruntime 로딩 로직 최적화 (GPU/CPU 감지)
+  - 유형: 최적화
+  - 기여자: KamioRinn
+- 2025.06.27 [PR#2488](https://github.com/RVC-Boss/GPT-SoVITS/pull/2488)
+  - 내용: 언어 분할 및 형식 최적화
+  - 유형: 최적화
+  - 기여자: KamioRinn
+
+## 202507
+
+- 2025.07.10 [Commit#426e1a2bb](https://github.com/RVC-Boss/GPT-SoVITS/commit/426e1a2bb43614af2479b877c37acfb0591e952f)
+  - 내용: 추론 프로세스 우선순위 증가 (Win11에서 GPU 활용 제한 가능성 수정)
+  - 유형: 최적화
+  - 기여자: XianYue0125
+- 2025.07.16 [PR#2490](https://github.com/RVC-Boss/GPT-SoVITS/pull/2490)
+  - 내용: TTS.py가 실제 지원되는 버전 v2Pro 및 v2ProPlus를 인식하지 못하는 문제 수정 및 기본 설정 업데이트
+  - 유형: 수정
+  - 기여자: jiangsier-xyz
+- 2025.07.16 [Commit#4d8ebf85](https://github.com/RVC-Boss/GPT-SoVITS/commit/4d8ebf85233d4f1166d7cc02fdc595602975ca8f)
+  - 내용: 병렬 추론 모드에서 v2pro 모델 인식 문제 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
+- 2025.07.17 [PR#2531](https://github.com/RVC-Boss/GPT-SoVITS/pull/2531)
+  - 내용: Whisper ASR이 더 비용 효율적인 distill 모델 지원
+  - 유형: 최적화
+  - 기여자: XXXXRT666
+- 2025.07.18 [PR#2536](https://github.com/RVC-Boss/GPT-SoVITS/pull/2536)
+  - 내용: `TTS_Config` 코드 로직 최적화
+  - 유형: 최적화
+  - 기여자: ChasonJiang
+- 2025.07.18 [PR#2537](https://github.com/RVC-Boss/GPT-SoVITS/pull/2537)
+  - 내용: GPT 손실(loss) 계산 문제 수정
+  - 유형: 수정
+  - 기여자: ChasonJiang
+
+## 202508
+
+- 2025.08.02 [PR#2561](https://github.com/RVC-Boss/GPT-SoVITS/pull/2561)
+  - 내용: WSL Rocm
+  - 유형: 수정
+  - 기여자: XXXXRT666
+
+## 202509
+
+- 2025.09.10 [Commit#11aa78bd](https://github.com/RVC-Boss/GPT-SoVITS/commit/11aa78bd9bda8b53047cfcae03abf7ca94d27391)
+  - 내용: 환경 변수가 문자열이 아닐 수 있는 문제 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
+
+## 202511
+
+- 2025.11.28 [PR#2671](https://github.com/RVC-Boss/GPT-SoVITS/pull/2671) [PR#2678](https://github.com/RVC-Boss/GPT-SoVITS/pull/2678)
+  - 내용: 스트리밍 추론
+  - 유형: 새 기능
+  - 기여자: ChasonJiang
+- 2025.11.28 [PR#2636](https://github.com/RVC-Boss/GPT-SoVITS/pull/2636)
+  - 내용: 수학 표현식 텍스트에 대한 텍스트 전처리 로직 최적화
+  - 유형: 최적화
+  - 기여자: KamioRinn
+- 2025.11.28 [PR#2469](https://github.com/RVC-Boss/GPT-SoVITS/pull/2469)
+  - 내용: 스트리밍 추론
+  - 유형: 새 기능
+  - 기여자: L-jasmine
+- 2025.11.28 [PR#2577](https://github.com/RVC-Boss/GPT-SoVITS/pull/2577)
+  - 내용: VQ 분산 학습 지원
+  - 유형: 최적화
+  - 기여자: wzy3650
+- 2025.11.28 [PR#2627](https://github.com/RVC-Boss/GPT-SoVITS/pull/2627) [PR#2679](https://github.com/RVC-Boss/GPT-SoVITS/pull/2679)
+  - 내용: ASR 모델 다운로드 로직 최적화
+  - 유형: 최적화
+  - 기여자: XXXXRT666
+- 2025.11.28 [PR#2662](https://github.com/RVC-Boss/GPT-SoVITS/pull/2662)
+  - 내용: 기본 배치 크기 버그 수정
+  - 유형: 수정
+  - 기여자: Spr-Aachen
+
+## 202512
+
+- 2025.12.30 [PR#2703](https://github.com/RVC-Boss/GPT-SoVITS/pull/2703) [PR#2704](https://github.com/RVC-Boss/GPT-SoVITS/pull/2704)
+  - 내용: 샘플링 오류 수정
+  - 유형: 수정
+  - 기여자: ChasonJiang
+
+## 202602
+
+- 2026.02.08 [PR#2727](https://github.com/RVC-Boss/GPT-SoVITS/pull/2727)
+  - 내용: Conda 약관 미동의로 인한 빌드 실패 수정
+  - 유형: 수정
+  - 기여자: Oarora
+- 2026.02.09 [PR#2732](https://github.com/RVC-Boss/GPT-SoVITS/pull/2732)
+  - 내용: 자동 환경 설정 최적화
+  - 유형: 최적화
+  - 기여자: XXXXRT666
+
+## 202604
+
+- 2026.04.18 [PR#2763](https://github.com/RVC-Boss/GPT-SoVITS/pull/2763)
+  - 내용: G2PW 추론 입력 구성 및 다중 발음 처리를 최적화하여 긴 문장에 대한 중복 계산 및 추론 오버헤드 감소
+  - 유형: 최적화
+  - 기여자: baicai-1145
+- 2026.04.18 [PR#2767](https://github.com/RVC-Boss/GPT-SoVITS/pull/2767)
+  - 내용: Windows 환경 단일 GPU에서 GPT-SoVITS v3의 LoRA 학습 흐름 개선
+  - 유형: 최적화
+  - 기여자: 2409324124
+- 2026.04.18 [PR#2755](https://github.com/RVC-Boss/GPT-SoVITS/pull/2755)
+  - 내용: 여러 모듈의 잡다한 버그 수정
+  - 유형: 수정
+  - 기여자: wishhyt
+- 2026.04.18 [PR#2758](https://github.com/RVC-Boss/GPT-SoVITS/pull/2758)
+  - 내용: 데이터셋 처리를 위한 오류 처리 힌트 추가
+  - 유형: 최적화
+  - 기여자: mushroomcowisheggs
+- 2026.04.18 [PR#2753](https://github.com/RVC-Boss/GPT-SoVITS/pull/2753)
+  - 내용: 병렬 추론의 일부 버그 수정
+  - 유형: 수정
+  - 기여자: wishhyt
+- 2026.04.18 [PR#2733](https://github.com/RVC-Boss/GPT-SoVITS/pull/2733)
+  - 내용: DPO 학습이 누락 단어 시뮬레이션을 지원하지 않는 버그 수정
+  - 유형: 수정
+  - 기여자: Mr-Neutr0n
+- 2026.04.18 [Commit#02425ea](https://github.com/RVC-Boss/GPT-SoVITS/commit/02425ea25680c26c700be0bc158756c69103d827)
+  - 내용: ONNX 스크립트에서 Optional 등 누락된 임포트 문제 수정
+  - 유형: 수정
+  - 기여자: RVC-Boss
--- a/docs/tr/Changelog_TR.md
+++ b/docs/tr/Changelog_TR.md
@ -2,8 +2,6 @@

 ## 202401

-## 202401
-
 - 2024.01.21 [PR#108](https://github.com/RVC-Boss/GPT-SoVITS/pull/108)
  - İçerik: WebUI'ya İngilizce sistem çeviri desteği eklendi.
  - Tür: Dokümantasyon
@ -332,6 +330,8 @@
  - Tür: Optimizasyon
  - Katkıda Bulunan: RVC-Boss, GoHomeToMacDonal
  - İlgili: [PR#672](https://github.com/RVC-Boss/GPT-SoVITS/pull/672)
+- Gelecek güncellemeler, `fast_inference` dalındaki değişikliklerin tutarlılığını doğrulamaya devam edecek.
+
 - 2024.07.13 [PR#1294](https://github.com/RVC-Boss/GPT-SoVITS/pull/1294), [PR#1298](https://github.com/RVC-Boss/GPT-SoVITS/pull/1298)
  - İçerik: i18n taraması yeniden düzenlendi ve çok dilli yapılandırma dosyaları güncellendi
  - Tür: Dokümantasyon
@ -578,3 +578,160 @@
  - İçerik: Otomatik hassasiyet algılama mantığı optimize edildi; WebUI önyüz modüllerine katlanabilir özellik eklendi
  - Tür: Yeni Özellik
  - Katkıda Bulunanlar: XXXXRT666, RVC-Boss
+- 2025.06.06 [PR#2427](https://github.com/RVC-Boss/GPT-SoVITS/pull/2427)
+  - İçerik: "X一X" kalıbı için çok sesli harf tespitini düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: wzy3650
+- 2025.06.05 [PR#2439](https://github.com/RVC-Boss/GPT-SoVITS/pull/2439)
+  - İçerik: Yapılandırma düzeltmesi; SoVITS model yüklemesini düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: wzy3650
+- 2025.06.09 [Commit#8056efe4](https://github.com/RVC-Boss/GPT-SoVITS/commit/8056efe4ab7bbc3610c72ae356a6f37518441f7d)
+  - İçerik: `ge.sum` kaynaklı olası sayısal patlamayı (sessiz çıkarıma yol açan) düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
+- 2025.06.10 [Commit#2c0436b9](https://github.com/RVC-Boss/GPT-SoVITS/commit/2c0436b9ce397424ae03476c836fb64c6e5ebcc6)
+  - İçerik: Deney adı boşlukla bittiğinde oluşan hatalı Windows yolunu düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
+- 2025.06.10 [PR#2449](https://github.com/RVC-Boss/GPT-SoVITS/pull/2449)
+  - İçerik: Dil bölütlemeyi optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: KamioRinn
+- 2025.06.11 [PR#2450](https://github.com/RVC-Boss/GPT-SoVITS/pull/2450)
+  - İçerik: v2pro için paralel çıkarım desteğindeki hatayı düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: YYuX-1145
+- 2025.06.11 [Commit#ed89a023](https://github.com/RVC-Boss/GPT-SoVITS/commit/ed89a023378dabba9d4b6580235bb9742245816d)
+  - İçerik: v2pro için `ge` çıkarımındaki sayısal taşma sorununu düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
+- 2025.06.17 [PR#2464](https://github.com/RVC-Boss/GPT-SoVITS/pull/2464) [PR#2482](https://github.com/RVC-Boss/GPT-SoVITS/pull/2482)
+  - İçerik: `install.sh` mantığını optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: XXXXRT666
+- 2025.06.27 [PR#2489](https://github.com/RVC-Boss/GPT-SoVITS/pull/2489)
+  - İçerik: onnxruntime yükleme mantığını optimize et (GPU/CPU algılama)
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: KamioRinn
+- 2025.06.27 [PR#2488](https://github.com/RVC-Boss/GPT-SoVITS/pull/2488)
+  - İçerik: Dil bölütleme ve biçimlendirmeyi optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: KamioRinn
+
+## 202507
+
+- 2025.07.10 [Commit#426e1a2bb](https://github.com/RVC-Boss/GPT-SoVITS/commit/426e1a2bb43614af2479b877c37acfb0591e952f)
+  - İçerik: Çıkarım işlem önceliğini artır (Win11'de olası GPU kullanım sınırlamasını düzelt)
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: XianYue0125
+- 2025.07.16 [PR#2490](https://github.com/RVC-Boss/GPT-SoVITS/pull/2490)
+  - İçerik: TTS.py'nin gerçekte desteklenen sürümler olan v2Pro ve v2ProPlus'ı tanımaması sorununu düzelt ve varsayılan yapılandırmayı güncelle
+  - Tür: Düzeltme
+  - Katkıda Bulunan: jiangsier-xyz
+- 2025.07.16 [Commit#4d8ebf85](https://github.com/RVC-Boss/GPT-SoVITS/commit/4d8ebf85233d4f1166d7cc02fdc595602975ca8f)
+  - İçerik: Paralel çıkarım modunda v2pro model tanıma sorununu düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
+- 2025.07.17 [PR#2531](https://github.com/RVC-Boss/GPT-SoVITS/pull/2531)
+  - İçerik: Whisper ASR daha uygun maliyetli distill modellerini destekler
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: XXXXRT666
+- 2025.07.18 [PR#2536](https://github.com/RVC-Boss/GPT-SoVITS/pull/2536)
+  - İçerik: `TTS_Config` kod mantığını optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: ChasonJiang
+- 2025.07.18 [PR#2537](https://github.com/RVC-Boss/GPT-SoVITS/pull/2537)
+  - İçerik: GPT kayıp (loss) hesaplama sorununu düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: ChasonJiang
+
+## 202508
+
+- 2025.08.02 [PR#2561](https://github.com/RVC-Boss/GPT-SoVITS/pull/2561)
+  - İçerik: WSL Rocm
+  - Tür: Düzeltme
+  - Katkıda Bulunan: XXXXRT666
+
+## 202509
+
+- 2025.09.10 [Commit#11aa78bd](https://github.com/RVC-Boss/GPT-SoVITS/commit/11aa78bd9bda8b53047cfcae03abf7ca94d27391)
+  - İçerik: Ortam değişkeninin dize (string) olmaması sorununu düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
+
+## 202511
+
+- 2025.11.28 [PR#2671](https://github.com/RVC-Boss/GPT-SoVITS/pull/2671) [PR#2678](https://github.com/RVC-Boss/GPT-SoVITS/pull/2678)
+  - İçerik: Akışlı çıkarım (streaming inference)
+  - Tür: Yeni Özellik
+  - Katkıda Bulunan: ChasonJiang
+- 2025.11.28 [PR#2636](https://github.com/RVC-Boss/GPT-SoVITS/pull/2636)
+  - İçerik: Matematiksel ifade metinleri için metin ön uç (frontend) mantığını optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: KamioRinn
+- 2025.11.28 [PR#2469](https://github.com/RVC-Boss/GPT-SoVITS/pull/2469)
+  - İçerik: Akışlı çıkarım (streaming inference)
+  - Tür: Yeni Özellik
+  - Katkıda Bulunan: L-jasmine
+- 2025.11.28 [PR#2577](https://github.com/RVC-Boss/GPT-SoVITS/pull/2577)
+  - İçerik: VQ dağıtılmış eğitimi destekle
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: wzy3650
+- 2025.11.28 [PR#2627](https://github.com/RVC-Boss/GPT-SoVITS/pull/2627) [PR#2679](https://github.com/RVC-Boss/GPT-SoVITS/pull/2679)
+  - İçerik: ASR model indirme mantığını optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: XXXXRT666
+- 2025.11.28 [PR#2662](https://github.com/RVC-Boss/GPT-SoVITS/pull/2662)
+  - İçerik: Varsayılan parti boyutu (batch size) hatasını düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: Spr-Aachen
+
+## 202512
+
+- 2025.12.30 [PR#2703](https://github.com/RVC-Boss/GPT-SoVITS/pull/2703) [PR#2704](https://github.com/RVC-Boss/GPT-SoVITS/pull/2704)
+  - İçerik: Örnekleme (sampling) hatasını düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: ChasonJiang
+
+## 202602
+
+- 2026.02.08 [PR#2727](https://github.com/RVC-Boss/GPT-SoVITS/pull/2727)
+  - İçerik: Kabul edilmeyen Conda koşullarının neden olduğu derleme hatasını düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: Oarora
+- 2026.02.09 [PR#2732](https://github.com/RVC-Boss/GPT-SoVITS/pull/2732)
+  - İçerik: Otomatik ortam kurulumunu optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: XXXXRT666
+
+# 202604
+
+- 2026.04.18 [PR#2763](https://github.com/RVC-Boss/GPT-SoVITS/pull/2763)
+  - İçerik: Uzun cümlelerde gereksiz hesaplama ve çıkarım yükünü azaltmak için G2PW çıkarım girdi oluşturmayı ve çok sesli harf işlemeyi optimize et
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: baicai-1145
+- 2026.04.18 [PR#2767](https://github.com/RVC-Boss/GPT-SoVITS/pull/2767)
+  - İçerik: Windows altında tek kartta GPT-SoVITS v3 için LoRA eğitim akışını iyileştir
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: 2409324124
+- 2026.04.18 [PR#2755](https://github.com/RVC-Boss/GPT-SoVITS/pull/2755)
+  - İçerik: Birden çok modüldeki çeşitli hataları düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: wishhyt
+- 2026.04.18 [PR#2758](https://github.com/RVC-Boss/GPT-SoVITS/pull/2758)
+  - İçerik: Veri kümesi işleme için hata işleme ipuçları ekle
+  - Tür: Optimizasyon
+  - Katkıda Bulunan: mushroomcowisheggs
+- 2026.04.18 [PR#2753](https://github.com/RVC-Boss/GPT-SoVITS/pull/2753)
+  - İçerik: Paralel çıkarımdaki bazı hataları düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: wishhyt
+- 2026.04.18 [PR#2733](https://github.com/RVC-Boss/GPT-SoVITS/pull/2733)
+  - İçerik: DPO eğitiminin eksik kelime simülasyonunu desteklememe hatasını düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: Mr-Neutr0n
+- 2026.04.18 [Commit#02425ea](https://github.com/RVC-Boss/GPT-SoVITS/commit/02425ea25680c26c700be0bc158756c69103d827)
+  - İçerik: ONNX betiğinde (Optional vb.) eksik içe aktarmaları düzelt
+  - Tür: Düzeltme
+  - Katkıda Bulunan: RVC-Boss
--- a/inst.bat
+++ b/inst.bat
@ -0,0 +1,3 @@
+chcp 65001
+conda install -y -c conda-forge ffmpeg
+conda install -y -c conda-forge cmake
--- a/inst2.ps1
+++ b/inst2.ps1
@ -0,0 +1,209 @@
+Param (
+    [Parameter(Mandatory=$true)][ValidateSet("CU126", "CU128", "CPU")][string]$Device,
+    [Parameter(Mandatory=$true)][ValidateSet("HF", "HF-Mirror", "ModelScope")][string]$Source,
+    [switch]$DownloadUVR5
+)
+
+$global:ErrorActionPreference = 'Stop'
+
+trap {
+    Write-ErrorLog $_
+}
+
+function Write-ErrorLog {
+    param (
+        [System.Management.Automation.ErrorRecord]$ErrorRecord
+    )
+
+    Write-Host "`n[ERROR] Command failed:" -ForegroundColor Red
+    if (-not $ErrorRecord.Exception.Message){
+    } else {
+        Write-Host "Message:" -ForegroundColor Red 
+        $ErrorRecord.Exception.Message -split "`n" | ForEach-Object {
+            Write-Host "    $_"
+        }
+    }
+
+    Write-Host "Command:" -ForegroundColor Red  -NoNewline
+    Write-Host " $($ErrorRecord.InvocationInfo.Line)".Replace("`r", "").Replace("`n", "")
+    Write-Host "Location:" -ForegroundColor Red -NoNewline
+    Write-Host " $($ErrorRecord.InvocationInfo.ScriptName):$($ErrorRecord.InvocationInfo.ScriptLineNumber)"
+    Write-Host "Call Stack:" -ForegroundColor DarkRed
+    $ErrorRecord.ScriptStackTrace -split "`n" | ForEach-Object {
+        Write-Host "    $_" -ForegroundColor DarkRed
+    }
+
+    exit 1
+}
+
+function Write-Info($msg) {
+    Write-Host "[INFO]:" -ForegroundColor Green -NoNewline
+    Write-Host " $msg"
+}
+function Write-Success($msg) {
+    Write-Host "[SUCCESS]:" -ForegroundColor Blue -NoNewline
+    Write-Host " $msg"
+}
+
+function Invoke-Pip {
+    param (
+        [Parameter(ValueFromRemainingArguments = $true)]
+        [string[]]$Args
+    )
+    
+    $output = & pip install @Args 2>&1
+    $exitCode = $LASTEXITCODE
+    
+    if ($exitCode -ne 0) {
+        $errorMessages = @()
+        Write-Host "Pip Install $Args Failed" -ForegroundColor Red
+        foreach ($item in $output) {
+            if ($item -is [System.Management.Automation.ErrorRecord]) {
+                $msg = $item.Exception.Message
+                Write-Host "$msg" -ForegroundColor Red
+                $errorMessages += $msg
+            }
+            else {
+                Write-Host $item
+                $errorMessages += $item
+            }
+        }
+        throw [System.Exception]::new(($errorMessages -join "`n"))
+    }
+}
+
+function Invoke-Download {
+    param (
+        [Parameter(Mandatory = $true)]
+        [string]$Uri,
+
+        [Parameter()]
+        [string]$OutFile
+    )
+
+    try {
+        $params = @{
+            Uri = $Uri
+        }
+
+        if ($OutFile) {
+            $params["OutFile"] = $OutFile
+        }
+
+        $null = Invoke-WebRequest @params -ErrorAction Stop
+
+    } catch {
+        Write-Host "Failed to download:" -ForegroundColor Red
+        Write-Host "  $Uri"
+        throw
+    }
+}
+
+function Invoke-Unzip {
+    param($ZipPath, $DestPath)
+    Expand-Archive -Path $ZipPath -DestinationPath $DestPath -Force
+    Remove-Item $ZipPath -Force
+}
+
+chcp 65001
+Set-Location $PSScriptRoot
+
+$PretrainedURL  = ""
+$G2PWURL        = ""
+$UVR5URL        = ""
+$NLTKURL        = ""
+$OpenJTalkURL   = ""
+
+switch ($Source) {
+    "HF" {
+        Write-Info "Download Model From HuggingFace"
+        $PretrainedURL = "https://huggingface.co/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/pretrained_models.zip"
+        $G2PWURL       = "https://huggingface.co/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/G2PWModel.zip"
+        $UVR5URL       = "https://huggingface.co/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/uvr5_weights.zip"
+        $NLTKURL       = "https://huggingface.co/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/nltk_data.zip"
+        $OpenJTalkURL  = "https://huggingface.co/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/open_jtalk_dic_utf_8-1.11.tar.gz"
+    }
+    "HF-Mirror" {
+        Write-Info "Download Model From HuggingFace-Mirror"
+        $PretrainedURL = "https://hf-mirror.com/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/pretrained_models.zip"
+        $G2PWURL       = "https://hf-mirror.com/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/G2PWModel.zip"
+        $UVR5URL       = "https://hf-mirror.com/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/uvr5_weights.zip"
+        $NLTKURL       = "https://hf-mirror.com/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/nltk_data.zip"
+        $OpenJTalkURL  = "https://hf-mirror.com/XXXXRT/GPT-SoVITS-Pretrained/resolve/main/open_jtalk_dic_utf_8-1.11.tar.gz"
+    }
+    "ModelScope" {
+        Write-Info "Download Model From ModelScope"
+        $PretrainedURL = "https://www.modelscope.cn/models/XXXXRT/GPT-SoVITS-Pretrained/resolve/master/pretrained_models.zip"
+        $G2PWURL       = "https://www.modelscope.cn/models/XXXXRT/GPT-SoVITS-Pretrained/resolve/master/G2PWModel.zip"
+        $UVR5URL       = "https://www.modelscope.cn/models/XXXXRT/GPT-SoVITS-Pretrained/resolve/master/uvr5_weights.zip"
+        $NLTKURL       = "https://www.modelscope.cn/models/XXXXRT/GPT-SoVITS-Pretrained/resolve/master/nltk_data.zip"
+        $OpenJTalkURL  = "https://www.modelscope.cn/models/XXXXRT/GPT-SoVITS-Pretrained/resolve/master/open_jtalk_dic_utf_8-1.11.tar.gz"
+    }
+}
+
+if (-not (Test-Path "GPT_SoVITS/pretrained_models/sv")) {
+    Write-Info "Downloading Pretrained Models..."
+    Invoke-Download -Uri $PretrainedURL -OutFile "pretrained_models.zip"
+    Invoke-Unzip "pretrained_models.zip" "GPT_SoVITS"
+    Write-Success "Pretrained Models Downloaded"
+} else {
+    Write-Info "Pretrained Model Exists"
+    Write-Info "Skip Downloading Pretrained Models"
+}
+
+
+if (-not (Test-Path "GPT_SoVITS/text/G2PWModel")) {
+    Write-Info "Downloading G2PWModel..."
+    Invoke-Download -Uri $G2PWURL -OutFile "G2PWModel.zip"
+    Invoke-Unzip "G2PWModel.zip" "GPT_SoVITS/text"
+    Write-Success "G2PWModel Downloaded"
+} else {
+    Write-Info "G2PWModel Exists"
+    Write-Info "Skip Downloading G2PWModel"
+}
+
+if ($DownloadUVR5) {
+    if (-not (Test-Path "tools/uvr5/uvr5_weights")) {
+        Write-Info "Downloading UVR5 Models..."
+        Invoke-Download -Uri $UVR5URL -OutFile "uvr5_weights.zip"
+        Invoke-Unzip "uvr5_weights.zip" "tools/uvr5"
+        Write-Success "UVR5 Models Downloaded"
+    } else {
+        Write-Info "UVR5 Models Exists"
+        Write-Info "Skip Downloading UVR5 Models"
+    }
+}
+
+switch ($Device) {
+    "CU128" {
+        Write-Info "Installing PyTorch For CUDA 12.8..."
+        Invoke-Pip torch --index-url "https://download.pytorch.org/whl/cu128"
+    }
+    "CU126" {
+        Write-Info "Installing PyTorch For CUDA 12.6..."
+        Invoke-Pip torch --index-url "https://download.pytorch.org/whl/cu126"
+    }
+    "CPU" {
+        Write-Info "Installing PyTorch For CPU..."
+        Invoke-Pip torch --index-url "https://download.pytorch.org/whl/cpu"
+    }
+}
+Write-Success "PyTorch Installed"
+
+Write-Info "Installing Python Dependencies From requirements.txt..."
+Invoke-Pip -r extra-req.txt --no-deps
+Invoke-Pip -r requirements.txt
+Write-Success "Python Dependencies Installed"
+
+Write-Info "Downloading NLTK Data..."
+Invoke-Download -Uri $NLTKURL -OutFile "nltk_data.zip"
+Invoke-Unzip "nltk_data.zip" (python -c "import sys; print(sys.prefix)").Trim()
+
+Write-Info "Downloading Open JTalk Dict..."
+Invoke-Download -Uri $OpenJTalkURL -OutFile "open_jtalk_dic_utf_8-1.11.tar.gz"
+$target = (python -c "import os, pyopenjtalk; print(os.path.dirname(pyopenjtalk.__file__))").Trim()
+tar -xzf open_jtalk_dic_utf_8-1.11.tar.gz -C $target
+Remove-Item "open_jtalk_dic_utf_8-1.11.tar.gz" -Force
+Write-Success "Open JTalk Dic Downloaded"
+
+Write-Success "Installation Completed"
--- a/install.ps1
+++ b/install.ps1
@ -52,7 +52,7 @@ function Invoke-Conda {
        [string[]]$Args
    )

-    $output = & conda install -y -q -c conda-forge @Args 2>&1
+    $output = & conda install -y -c conda-forge @Args 2>&1
    $exitCode = $LASTEXITCODE

    if ($exitCode -ne 0) {
Author	SHA1	Message	Date
__kaning123__	a94fd5a14a	Merge 60414d25a39f3786a392523297734c144d1c59a9 into ea2d2a81667239d37615697e8f0056e35bab2db6	2026-04-19 14:16:06 +01:00
RVC-Boss	ea2d2a8166	Update README.md	2026-04-19 21:02:57 +08:00
SapphireLab	d9f03dad3e	Update Documentation (#2768 ) * 调整日志格式 * docs: Update other languages' changelogs	2026-04-18 22:33:55 +08:00
RVC-Boss	647935357a	Update Changelog_CN.md	2026-04-18 19:01:11 +08:00
RVC-Boss	02425ea256	Fixed issues such as missing imports for types like `Optional`. Fixed issues such as missing imports for types like `Optional`.	2026-04-18 17:33:53 +08:00
Harikrishna KP	938f05fce8	fix: correct torch.randint upper bound to include both values (#2733 )	2026-04-18 17:19:55 +08:00
__kaning123__	60414d25a3	Merge pull request #2 from kaning123/Dev Dev	2026-04-06 13:32:49 +08:00
Kaning123	e6a67650ff	feat: 添加中间量导出功能	2026-04-06 13:01:32 +08:00
Kaning123	24d7290c11	feat: Added VoiceChange.py	2026-04-06 12:59:31 +08:00
Kaning123	fb50fc090f	feat:Added batch tts option	2026-04-06 12:58:00 +08:00
Kaning123	cb2b844f45	feat: Added ReturnWay option to get_tts_wav	2026-04-04 14:17:07 +08:00
Kaning123	5c03499fcf	feat:向 VoiceSave 模块中添加 find_func	2026-04-02 17:26:08 +08:00
Kaning123	46ae12bf17	feat:添加关闭tts webui 的入口与 ge 等中间量的保存入口用于分发及使用	2026-04-02 17:24:19 +08:00
Kaning123	47170fd555	feat: 添加了向张量组文件中追加张量的功能	2026-03-29 11:10:28 +08:00
Kaning123	f3a9603eb0	style: move new entries to the middle of the page	2026-03-21 13:19:48 +08:00
Kaning123	5450922d8d	feat:Added entry to get value "ge" of class SynthesizerTrn	2026-03-19 17:39:55 +08:00
Kaning123	86ac5555e1	feat: Added webUI entries	2026-03-14 15:28:50 +08:00
Kaning123	e49d396b18	fix: 添加了inst.bat 与 inst2.ps1 以应对 install.ps1 运行时可能出现的 “由于调用深度溢出，脚本失败。” 错误	2026-03-14 13:28:46 +08:00
Kaning123	eedb06b303	fix:Fixed config.json loader in config.py	2026-03-14 13:01:11 +08:00
Kaning123	6e3db0126c	fix: Fixed conda-go-webui.bat	2026-03-14 12:59:09 +08:00
Kaning123	0e83383544	feat:added bat file for launching webui with conda	2026-03-14 09:32:11 +08:00
Kaning123	99a2e356f2	feat:remove “-q“ option of conda installation	2026-03-13 21:35:24 +08:00
__kaning123__	53b17bd2d2	Merge pull request #1 from kaning123/Dev Added ability to use preprocessed data to speed up tts efficiency	2026-02-25 14:01:46 +08:00
__kaning123__	69f1c9c2dd	feat: Added path check	2026-02-25 13:56:47 +08:00
__kaning123__	012eb93ef8	feat:添加了是否启用参考音频的变量	2026-02-25 10:37:33 +08:00
__kaning123__	f6e8ec8a78	feat:Added .voice loader	2026-02-25 10:20:48 +08:00
__kaning123__	1c54a945cb	feat: Added entrys to save sv_emb and refers	2026-02-25 07:53:03 +08:00
__kaning123__	a6a53f7231	feat: Added entry to disable checks	2026-02-24 07:48:12 +08:00
__kaning123__	a06011d838	fix:fix import errors	2026-02-23 14:29:40 +08:00
__kaning123__	6ef7c0b70f	feat: Add lib allows tensor saving	2026-02-23 09:51:55 +08:00