Spaces:

naotokui
/

latentgranular

Running

Fix: prevent exponential growth of the audio buffer during augmentation

by KyungsuKim - opened Sep 9, 2025

←

Files changed (1) hide show

app.py CHANGED Viewed

@@ -41,16 +41,18 @@ class LatentGranularSynthesis:
                 y = librosa.util.normalize(y)
                 if aug_checkbox:
                     # Apply volume augmentation
                     for vol in self.vol_aug:
                         y_vol = y * vol
-                        y = np.hstack((y, y_vol))
                     # Apply pitch augmentation
                     for pitch in self.pitch_aug:
                         y_pitch = librosa.effects.pitch_shift(y, sr=sr, n_steps=pitch)
-                        y = np.hstack((y, y_pitch))
                 # Encode audio
                 latent = self.encdec.encode(y, max_waveform_length=44100*1).cpu()
                 self.codedb = torch.cat((self.codedb, latent), dim=-1)

                 y = librosa.util.normalize(y)
                 if aug_checkbox:
+                    y_augmented = y
                     # Apply volume augmentation
                     for vol in self.vol_aug:
                         y_vol = y * vol
+                        y_augmented = np.hstack((y_augmented, y_vol))
                     # Apply pitch augmentation
                     for pitch in self.pitch_aug:
                         y_pitch = librosa.effects.pitch_shift(y, sr=sr, n_steps=pitch)
+                        y_augmented = np.hstack((y_augmented, y_pitch))
+                    y = y_augmented
                 # Encode audio
                 latent = self.encdec.encode(y, max_waveform_length=44100*1).cpu()
                 self.codedb = torch.cat((self.codedb, latent), dim=-1)