mirror of
https://github.com/RVC-Boss/GPT-SoVITS.git
synced 2025-04-05 19:41:56 +08:00
add LLM translated CMUDICT-KATAKANA dictionary (#1660)
This commit is contained in:
parent
5efb960898
commit
38cd881578
File diff suppressed because it is too large
Load Diff
@ -82,8 +82,9 @@ def post_replace_ph(ph):
|
|||||||
ph = rep_map[ph]
|
ph = rep_map[ph]
|
||||||
# if ph in symbols:
|
# if ph in symbols:
|
||||||
# return ph
|
# return ph
|
||||||
# if ph not in symbols:
|
if ph not in symbols:
|
||||||
# ph = "UNK"
|
ph = "UNK"
|
||||||
|
# UNK may be useful as a pause token as it was trained in the model
|
||||||
return ph
|
return ph
|
||||||
|
|
||||||
|
|
||||||
@ -103,6 +104,8 @@ def symbols_to_japanese(text):
|
|||||||
def preprocess_jap(text, with_prosody=False):
|
def preprocess_jap(text, with_prosody=False):
|
||||||
"""Reference https://r9y9.github.io/ttslearn/latest/notebooks/ch10_Recipe-Tacotron.html"""
|
"""Reference https://r9y9.github.io/ttslearn/latest/notebooks/ch10_Recipe-Tacotron.html"""
|
||||||
text = symbols_to_japanese(text)
|
text = symbols_to_japanese(text)
|
||||||
|
# English words to lower case, should have no influence on japanese words.
|
||||||
|
text = text.lower()
|
||||||
sentences = re.split(_japanese_marks, text)
|
sentences = re.split(_japanese_marks, text)
|
||||||
marks = re.findall(_japanese_marks, text)
|
marks = re.findall(_japanese_marks, text)
|
||||||
text = []
|
text = []
|
||||||
@ -219,5 +222,6 @@ def g2p(norm_text, with_prosody=True):
|
|||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
phones = g2p("こんにちは, hello, AKITOです,よろしくお願いしますね!")
|
from text.symbols2 import symbols
|
||||||
|
phones = g2p("Hello.こんにちは!今日もNiCe天気ですね!tokyotowerに行きましょう!")
|
||||||
print(phones)
|
print(phones)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user