L0SG committed on
Commit
8d0df17
1 Parent(s): d26e285
Files changed (2)
  1. README.md +2 -2
  2. bigvgan.py +34 -20
README.md CHANGED
@@ -59,10 +59,10 @@ from meldataset import get_mel_spectrogram
 
 # load wav file and compute mel spectrogram
 wav, sr = librosa.load('/path/to/your/audio.wav', sr=model.h.sampling_rate, mono=True) # wav is np.ndarray with shape [T_time] and values in [-1, 1]
-wav = torch.FloatTensor(wav).to(device).unsqueeze(0) # wav is FloatTensor with shape [B(1), T_time]
+wav = torch.FloatTensor(wav).unsqueeze(0) # wav is FloatTensor with shape [B(1), T_time]
 
 # compute mel spectrogram from the ground truth audio
-mel = get_mel_spectrogram(wav, model.h) # mel is FloatTensor with shape [B(1), C_mel, T_frame]
+mel = get_mel_spectrogram(wav, model.h).to(device) # mel is FloatTensor with shape [B(1), C_mel, T_frame]
 
 # generate waveform from mel
 with torch.inference_mode():
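For readers skimming the diff: the README change keeps the waveform tensor on CPU and moves only the computed mel spectrogram to the device. Below is a minimal end-to-end sketch of the updated usage; the model/device setup lines and the repo id are illustrative assumptions, not part of this commit.

```python
import torch
import librosa
from meldataset import get_mel_spectrogram

import bigvgan  # assumed: the bigvgan module from this repo is importable

# Assumed setup (not shown in this diff): load a pretrained generator and pick a device.
device = 'cuda' if torch.cuda.is_available() else 'cpu'
model = bigvgan.BigVGAN.from_pretrained('nvidia/bigvgan_v2_24khz_100band_256x')  # illustrative repo id
model = model.eval().to(device)

# load wav file; wav is np.ndarray with shape [T_time] and values in [-1, 1]
wav, sr = librosa.load('/path/to/your/audio.wav', sr=model.h.sampling_rate, mono=True)
wav = torch.FloatTensor(wav).unsqueeze(0)  # [B(1), T_time], kept on CPU

# compute the mel spectrogram on CPU, then move only the mel to the device
mel = get_mel_spectrogram(wav, model.h).to(device)  # [B(1), C_mel, T_frame]

# generate waveform from mel
with torch.inference_mode():
    wav_gen = model(mel)  # generated waveform, shape [B(1), 1, T_time]
```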
bigvgan.py CHANGED
@@ -257,14 +257,18 @@ class BigVGAN(
         return x
 
     def remove_weight_norm(self):
-        print('Removing weight norm...')
-        for l in self.ups:
-            for l_i in l:
-                remove_weight_norm(l_i)
-        for l in self.resblocks:
-            l.remove_weight_norm()
-        remove_weight_norm(self.conv_pre)
-        remove_weight_norm(self.conv_post)
+        try:
+            print('Removing weight norm...')
+            for l in self.ups:
+                for l_i in l:
+                    remove_weight_norm(l_i)
+            for l in self.resblocks:
+                l.remove_weight_norm()
+            remove_weight_norm(self.conv_pre)
+            remove_weight_norm(self.conv_post)
+        except ValueError:
+            print('[INFO] Model already removed weight norm. Skipping!')
+            pass
 
     ##################################################################
     # additional methods for huggingface_hub support
@@ -304,17 +308,21 @@ class BigVGAN(
         ##################################################################
         # download and load hyperparameters (h) used by BigVGAN
         ##################################################################
-        config_file = hf_hub_download(
-            repo_id=model_id,
-            filename='config.json',
-            revision=revision,
-            cache_dir=cache_dir,
-            force_download=force_download,
-            proxies=proxies,
-            resume_download=resume_download,
-            token=token,
-            local_files_only=local_files_only,
-        )
+        if os.path.isdir(model_id):
+            print("Loading config.json from local directory")
+            config_file = os.path.join(model_id, 'config.json')
+        else:
+            config_file = hf_hub_download(
+                repo_id=model_id,
+                filename='config.json',
+                revision=revision,
+                cache_dir=cache_dir,
+                force_download=force_download,
+                proxies=proxies,
+                resume_download=resume_download,
+                token=token,
+                local_files_only=local_files_only,
+            )
         h = load_hparams_from_json(config_file)
 
         ##################################################################
@@ -347,6 +355,12 @@ class BigVGAN(
         )
 
         checkpoint_dict = torch.load(model_file, map_location=map_location)
-        model.load_state_dict(checkpoint_dict['generator'])
+
+        try:
+            model.load_state_dict(checkpoint_dict['generator'])
+        except RuntimeError:
+            print(f"[INFO] the pretrained checkpoint does not contain weight norm. Loading the checkpoint after removing weight norm!")
+            model.remove_weight_norm()
+            model.load_state_dict(checkpoint_dict['generator'])
 
         return model
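Taken together, the bigvgan.py changes make checkpoint loading more forgiving: `config.json` can come from a local directory as well as the Hub, and a checkpoint saved without weight norm no longer breaks `load_state_dict`. A minimal sketch of the resulting behavior, assuming the class is exposed through the standard huggingface_hub `from_pretrained` entry point; the repo id and local path are placeholders, not part of this commit.

```python
from bigvgan import BigVGAN  # assumed: bigvgan.py is importable as a module

# Load from the Hugging Face Hub (illustrative repo id).
model_hub = BigVGAN.from_pretrained('nvidia/bigvgan_v2_24khz_100band_256x')

# Or load from a local directory containing config.json and the generator checkpoint
# (hypothetical path for illustration).
model_local = BigVGAN.from_pretrained('/path/to/local/bigvgan_checkpoint_dir')

# remove_weight_norm() is now safe to call more than once: a second call hits the
# ValueError branch and is skipped instead of raising.
model_local.remove_weight_norm()
model_local.remove_weight_norm()  # prints "[INFO] Model already removed weight norm. Skipping!"
```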