BoxOfColors committed on
Commit
d5b590c
·
1 Parent(s): e071ca4

fix: pre-download cvssp/audioldm2 at startup to avoid GPU budget drain

Browse files
Files changed (1) hide show
  1. app.py +8 -0
app.py CHANGED
@@ -80,6 +80,14 @@ print("Pre-downloading MMAudio CLIP model (apple/DFN5B-CLIP-ViT-H-14-384)…")
80
  snapshot_download(repo_id="apple/DFN5B-CLIP-ViT-H-14-384")
81
  print("MMAudio CLIP model pre-downloaded.")
82
 
 
 
 
 
 
 
 
 
83
  # ================================================================== #
84
  # SHARED CONSTANTS / HELPERS #
85
  # ================================================================== #
 
80
  snapshot_download(repo_id="apple/DFN5B-CLIP-ViT-H-14-384")
81
  print("MMAudio CLIP model pre-downloaded.")
82
 
83
+ # Pre-download TARO's AudioLDM2 VAE + vocoder (cvssp/audioldm2).
84
+ # AutoencoderKL.from_pretrained() and SpeechT5HifiGan.from_pretrained() fetch
85
+ # this repo inside the GPU window on every cold worker start, burning GPU budget
86
+ # before inference even begins. Pre-fetching here ensures the cache is warm.
87
+ print("Pre-downloading AudioLDM2 (cvssp/audioldm2)…")
88
+ snapshot_download(repo_id="cvssp/audioldm2")
89
+ print("AudioLDM2 pre-downloaded.")
90
+
91
  # ================================================================== #
92
  # SHARED CONSTANTS / HELPERS #
93
  # ================================================================== #