Mirror of https://github.com/RVC-Boss/GPT-SoVITS.git (synced 2025-04-06 03:57:44 +08:00)
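Bug fix: inference without a prompt (the positional-encoding index for the next step now uses `y_len + idx` instead of `prompts.shape[1] + idx`)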
This commit is contained in:
parent: b65dae788d
commit: 13bb68c715
@ -235,7 +235,7 @@ class Text2SemanticDecoder(nn.Module):
|
|||||||
layer.linear2.weight,
|
layer.linear2.weight,
|
||||||
layer.linear2.bias
|
layer.linear2.bias
|
||||||
)
|
)
|
||||||
# (layer.self_attn.in_proj_weight, layer.self_attn.in_proj_bias)
|
|
||||||
block = T2SBlock(
|
block = T2SBlock(
|
||||||
self.num_head,
|
self.num_head,
|
||||||
self.model_dim,
|
self.model_dim,
|
||||||
@ -578,7 +578,7 @@ class Text2SemanticDecoder(nn.Module):
|
|||||||
|
|
||||||
####################### update next step ###################################
|
####################### update next step ###################################
|
||||||
y_emb = self.ar_audio_embedding(y[:, -1:])
|
y_emb = self.ar_audio_embedding(y[:, -1:])
|
||||||
xy_pos = y_emb * self.ar_audio_position.x_scale + self.ar_audio_position.alpha * self.ar_audio_position.pe[:, prompts.shape[1] + idx]
|
xy_pos = y_emb * self.ar_audio_position.x_scale + self.ar_audio_position.alpha * self.ar_audio_position.pe[:, y_len + idx]
|
||||||
|
|
||||||
if ref_free:
|
if ref_free:
|
||||||
return y[:, :-1], 0
|
return y[:, :-1], 0
|
||||||
|
Loading…
x
Reference in New Issue
Block a user