Skip to content

Commit

Permalink
Merge pull request neonbjb#49 from faad3/main
Browse files (browse the repository at this point in the history)
Fix bug in load_voices in audio.py
  • Loading branch information
neonbjb authored May 17, 2022
2 parents 11e80b0 + dc3d7b1 commit b5fc8f1
Showing 1 changed file with 7 additions and 5 deletions.
12 changes: 7 additions & 5 deletions tortoise/utils/audio.py
Original file line number Diff line number Diff line change
Expand Up @@ -119,14 +119,16 @@ def load_voices(voices):
if latent is None:
assert len(latents) == 0, "Can only combine raw audio voices or latent voices, not both. Do it yourself if you want this."
clips.extend(clip)
-elif voice is None:
-assert len(voices) == 0, "Can only combine raw audio voices or latent voices, not both. Do it yourself if you want this."
+elif clip is None:
+assert len(clips) == 0, "Can only combine raw audio voices or latent voices, not both. Do it yourself if you want this."
latents.append(latent)
if len(latents) == 0:
return clips, None
else:
-latents = torch.stack(latents, dim=0)
-return None, latents.mean(dim=0)
+latents_0 = torch.stack([l[0] for l in latents], dim=0).mean(dim=0)
+latents_1 = torch.stack([l[1] for l in latents], dim=0).mean(dim=0)
+latents = (latents_0,latents_1)
+return None, latents


class TacotronSTFT(torch.nn.Module):
Expand Down Expand Up @@ -178,4 +180,4 @@ def wav_to_univnet_mel(wav, do_normalization=False):
mel = stft.mel_spectrogram(wav)
if do_normalization:
mel = normalize_tacotron_mel(mel)
-return mel
+return mel

0 comments on commit b5fc8f1

Please sign in to comment.