diff --git a/GPT_SoVITS/module/models.py b/GPT_SoVITS/module/models.py index 2dffac1..195a59f 100644 --- a/GPT_SoVITS/module/models.py +++ b/GPT_SoVITS/module/models.py @@ -242,7 +242,7 @@ class TextEncoder(nn.Module): y = self.mrte(y, y_mask, text, text_mask, ge) y = self.encoder2(y * y_mask, y_mask) if(speed!=1): - y = F.interpolate(y, size=int(y.shape[-1] * speed)+1, mode="linear") + y = F.interpolate(y, size=int(y.shape[-1] / speed)+1, mode="linear") y_mask = F.interpolate(y_mask, size=y.shape[-1], mode="nearest") stats = self.proj(y) * y_mask m, logs = torch.split(stats, self.out_channels, dim=1)