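VAEDecodeAudio now normalizes the decoded audio: each batch item is divided by 5x its standard deviation whenever that value exceeds 1.0, so quieter output is left unchanged.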

2025-07-07 07:47:09 +08:00 · 2024-09-16 00:30:36 -04:00 · 2024-09-16 00:30:36 -04:00 · 56e8f5e4fd
commit 56e8f5e4fd
parent e813abbb2c
1 changed files with 3 additions and 0 deletions
--- a/comfy_extras/nodes_audio.py
+++ b/comfy_extras/nodes_audio.py
@@ -58,6 +58,9 @@ class VAEDecodeAudio:
    def decode(self, vae, samples):
        """Decode latent samples into a waveform and rein in loud output.

        Args:
            vae: Object exposing ``decode(latent)`` that returns a tensor.
            samples: Mapping whose ``"samples"`` entry holds the latent to
                decode.

        Returns:
            A one-element tuple containing a dict with the normalized
            ``"waveform"`` tensor and a fixed ``"sample_rate"`` of 44100.
        """
        latent = samples["samples"]
        # Move the decoder's last dimension to index 1.
        # NOTE(review): presumably this yields (batch, channels, samples) --
        # confirm against the VAE implementation.
        waveform = vae.decode(latent).movedim(-1, 1)

        # One scale factor per batch item: five times the standard deviation
        # taken over dims 1 and 2, kept broadcastable via keepdim.
        scale = torch.std(waveform, dim=[1, 2], keepdim=True).mul(5.0)
        # Floor the factor at 1.0 so the division below can only attenuate;
        # items whose scaled deviation is under 1.0 pass through unchanged.
        scale.clamp_(min=1.0)

        # In-place divide: this also modifies the tensor returned by
        # vae.decode, because movedim returns a view of it.
        waveform.div_(scale)
        return ({"waveform": waveform, "sample_rate": 44100},)