Merge branch 'main' of https://github.com/babysor/Realtime-Voice-Clone-Chinese

2024-03-22 13:11:31 +08:00 · 2021-11-09 21:08:33 +08:00 · 2021-11-09 21:08:33 +08:00 · 902e1eb537
commit 902e1eb537
parent 5c0e53a29a 4edebdfeba
1 changed file with 1 addition and 1 deletion
--- a/synthesizer/models/tacotron.py
+++ b/synthesizer/models/tacotron.py
@@ -60,7 +60,7 @@ class Encoder(nn.Module):
            idx = 1

        # Start by making a copy of each speaker embedding to match the input text length
-        # The output of this has size (batch_size, num_chars * tts_embed_dims)
+        # The output of this has size (batch_size, num_chars * speaker_embedding_size)
        speaker_embedding_size = speaker_embedding.size()[idx]
        e = speaker_embedding.repeat_interleave(num_chars, dim=idx)