VAEDecodeAudio now does some normalization on the audio.

2024-09-16 00:30:36 -04:00 · 2024-09-16 00:30:36 -04:00 · 56e8f5e4fd
parent e813abbb2c
commit 56e8f5e4fd
1 changed file with 3 additions and 0 deletions
--- a/comfy_extras/nodes_audio.py
+++ b/comfy_extras/nodes_audio.py
@@ -58,6 +58,9 @@ class VAEDecodeAudio:

    def decode(self, vae, samples):
        # Decode the latent stored under samples["samples"] with the given VAE,
        # then move the decoder output's last dimension to position 1.
        # NOTE(review): presumably this yields (batch, channels, samples) -- confirm
        # against the VAE's decode() output layout.
        audio = vae.decode(samples["samples"]).movedim(-1, 1)
        # Normalization added by this commit: standard deviation taken jointly
        # over dims 1 and 2 (keepdim=True, so one value per entry along dim 0 that
        # broadcasts against `audio`), scaled by 5.0.
+        std = torch.std(audio, dim=[1,2], keepdim=True) * 5.0
        # Floor the divisor at 1.0 so the division below can only attenuate,
        # never amplify: entries with 5 * std <= 1.0 pass through unchanged.
+        std[std < 1.0] = 1.0
        # In-place division. Entries whose divisor exceeded 1.0 end up with a
        # standard deviation of 1 / 5.0 = 0.2.
+        audio /= std
        # Result is a 1-tuple wrapping the audio dict; the sample rate is
        # hard-coded to 44100 rather than read from the VAE or the inputs.
        return ({"waveform": audio, "sample_rate": 44100}, )