VAEDecodeAudio now does some normalization on the audio.

This commit is contained in:
comfyanonymous 2024-09-16 00:30:36 -04:00
parent e813abbb2c
commit 56e8f5e4fd
1 changed files with 3 additions and 0 deletions

View File

@ -58,6 +58,9 @@ class VAEDecodeAudio:
def decode(self, vae, samples):
audio = vae.decode(samples["samples"]).movedim(-1, 1)
std = torch.std(audio, dim=[1,2], keepdim=True) * 5.0
std[std < 1.0] = 1.0
audio /= std
return ({"waveform": audio, "sample_rate": 44100}, )