mirror of https://github.com/coqui-ai/TTS.git
Merge pull request #520 from SanjaESC/patch-1
fix taco2 speaker-embeddings dimension during inference
pull/523/head
commit
ea31215087
|
@@ -255,6 +255,7 @@ class Tacotron2(TacotronAbstract):
|
|||
if self.num_speakers > 1:
|
||||
if not self.embeddings_per_sample:
|
||||
speaker_embeddings = self.speaker_embedding(speaker_ids)[:, None]
|
||||
speaker_embeddings = torch.unsqueeze(speaker_embeddings, 0).transpose(1, 2)
|
||||
encoder_outputs = self._concat_speaker_embedding(encoder_outputs, speaker_embeddings)
|
||||
|
||||
decoder_outputs, alignments, stop_tokens = self.decoder.inference(encoder_outputs)
|
||||
|
@@ -277,6 +278,7 @@ class Tacotron2(TacotronAbstract):
|
|||
if self.num_speakers > 1:
|
||||
if not self.embeddings_per_sample:
|
||||
speaker_embeddings = self.speaker_embedding(speaker_ids)[:, None]
|
||||
speaker_embeddings = torch.unsqueeze(speaker_embeddings, 0).transpose(1, 2)
|
||||
encoder_outputs = self._concat_speaker_embedding(encoder_outputs, speaker_embeddings)
|
||||
|
||||
mel_outputs, alignments, stop_tokens = self.decoder.inference_truncated(encoder_outputs)
|
||||
|
|
Loading…
Reference in New Issue