mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-10-07 15:19:59 +08:00
make cut3 cut4 great again
This commit is contained in:
parent
989e2b1f24
commit
8d25353835
@ -399,58 +399,39 @@ def cut2(language_splits):
|
|||||||
# 按中文句号。切
|
# 按中文句号。切
|
||||||
def cut3(language_splits):
    """Split language-tagged text blocks into sentences at the Chinese full stop "。".

    Args:
        language_splits: Iterable of dicts, each providing a 'lang' key and a
            'text' key whose value is the string to split.

    Returns:
        A list of single-element lists. Each inner list holds one
        ``{'lang': ..., 'text': ...}`` dict describing one sentence. Sentences
        that were terminated by "。" are stripped of surrounding whitespace and
        keep the "。"; a trailing remainder without "。" is stripped and kept
        only if non-empty. A block containing no "。" at all is passed through
        with its text unchanged.
    """
    sentences_list = []

    for lang_block in language_splits:
        lang = lang_block['lang']
        text = lang_block['text']
        text_parts = text.split('。')

        if len(text_parts) <= 1:
            # No delimiter in this block: forward it untouched.
            sentences_list.append([{'lang': lang, 'text': text}])
            continue

        # Every part except the last one was followed by a delimiter.
        for part in text_parts[:-1]:
            part = part.strip()
            # Leading or consecutive delimiters produce empty parts; skip them
            # so that no sentence consists of the delimiter alone.
            if part:
                sentences_list.append([{'lang': lang, 'text': part + "。"}])

        # Text after the final delimiter has no terminator to re-attach.
        last_part = text_parts[-1].strip()
        if last_part:
            sentences_list.append([{'lang': lang, 'text': last_part}])

    return sentences_list
|
||||||
|
|
||||||
|
|
||||||
# cut4
|
# cut4
|
||||||
# 按英文句号.切
|
# 按英文句号.切
|
||||||
def cut4(language_splits):
    """Split language-tagged text blocks into sentences at the ASCII period ".".

    Args:
        language_splits: Iterable of dicts, each providing a 'lang' key and a
            'text' key whose value is the string to split.

    Returns:
        A list of single-element lists. Each inner list holds one
        ``{'lang': ..., 'text': ...}`` dict describing one sentence. Sentences
        that were terminated by "." are stripped of surrounding whitespace and
        keep the "."; a trailing remainder without "." is stripped and kept
        only if non-empty. A block containing no "." at all is passed through
        with its text unchanged.
    """
    sentences_list = []

    for lang_block in language_splits:
        lang = lang_block['lang']
        text = lang_block['text']
        # NOTE(review): a plain split treats every "." as a sentence end, so
        # decimals such as "3.14" are split as well - confirm whether callers
        # need numbers kept intact.
        text_parts = text.split('.')

        if len(text_parts) <= 1:
            # No delimiter in this block: forward it untouched.
            sentences_list.append([{'lang': lang, 'text': text}])
            continue

        # Every part except the last one was followed by a delimiter.
        for part in text_parts[:-1]:
            part = part.strip()
            # Leading or consecutive periods (e.g. an ellipsis "...") produce
            # empty parts; skip them so no sentence is a bare ".".
            if part:
                sentences_list.append([{'lang': lang, 'text': part + "."}])

        # Text after the final delimiter has no terminator to re-attach.
        last_part = text_parts[-1].strip()
        if last_part:
            sentences_list.append([{'lang': lang, 'text': last_part}])

    return sentences_list
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user