mirror of https://github.com/coqui-ai/TTS.git
fix #382
parent b6bac22243
commit 5c657715f2
@@ -181,8 +181,12 @@ class SpeedySpeech(nn.Module):
             x_lengths: [B]
             g: [B, C]
         """
+        # input sequence should be greater than the max convolution size
+        inference_padding = 5
+        if x.shape[1] < 13:
+            inference_padding += 13 - x.shape[1]
         # pad input to prevent dropping the last word
-        x = torch.nn.functional.pad(x, pad=(0, 5), mode='constant', value=0)
+        x = torch.nn.functional.pad(x, pad=(0, inference_padding), mode='constant', value=0)
         o_en, o_en_dp, x_mask, g = self._forward_encoder(x, x_lengths, g)
         # duration predictor pass
         o_dr_log = self.duration_predictor(o_en_dp.detach(), x_mask)
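The gist of the change, rewritten as a standalone sketch for illustration. The function name pad_for_inference and the example input are not part of the commit; the base padding of 5 and the length threshold of 13 are taken from the hunk above, where they are assumed to cover the receptive field of the convolution stack.

import torch

def pad_for_inference(x: torch.Tensor, base_padding: int = 5, min_len: int = 13) -> torch.Tensor:
    # x: [B, T] batch of token/phoneme IDs
    inference_padding = base_padding
    if x.shape[1] < min_len:
        # grow the padding so the padded sequence reaches the minimum length
        inference_padding += min_len - x.shape[1]
    # zero-pad on the right so the convolutions do not drop the last word
    return torch.nn.functional.pad(x, pad=(0, inference_padding), mode='constant', value=0)

short_input = torch.randint(1, 40, (1, 4))
print(pad_for_inference(short_input).shape)  # torch.Size([1, 18]): 4 + 5 + (13 - 4)

With the old fixed pad of 5, a 4-token input stayed below the 13-token threshold; the adaptive padding lengthens short inputs so the last word still reaches the encoder.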