Spaces:

fffiloni
/

Image2SFX-comparison

Running

App Files Files Community

fffiloni committed on Jun 14

Commit

aa7631f

•

1 Parent(s): 8100a2d

Update app.py

Browse files

Files changed (1) hide show

app.py +73 -62

app.py CHANGED Viewed

@@ -77,94 +77,106 @@ def get_caption(image_in):
 def get_magnet(prompt):
     amended_prompt = f"{prompt}"
     print(amended_prompt)
-    client = Client("https://fffiloni-magnet.hf.space/")
-    result = client.predict(
-        "facebook/audio-magnet-medium",	# Literal['facebook/magnet-small-10secs', 'facebook/magnet-medium-10secs', 'facebook/magnet-small-30secs', 'facebook/magnet-medium-30secs', 'facebook/audio-magnet-small', 'facebook/audio-magnet-medium']  in 'Model' Radio component
-        "",	# str  in 'Model Path (custom models)' Textbox component
-        amended_prompt,	# str  in 'Input Text' Textbox component
-        3,	# float  in 'Temperature' Number component
-        0.9,	# float  in 'Top-p' Number component
-        10,	# float  in 'Max CFG coefficient' Number component
-        1,	# float  in 'Min CFG coefficient' Number component
-        20,	# float  in 'Decoding Steps (stage 1)' Number component
-        10,	# float  in 'Decoding Steps (stage 2)' Number component
-        10,	# float  in 'Decoding Steps (stage 3)' Number component
-        10,	# float  in 'Decoding Steps (stage 4)' Number component
-        "prod-stride1 (new!)",	# Literal['max-nonoverlap', 'prod-stride1 (new!)']  in 'Span Scoring' Radio component
-        api_name="/predict_full"
-    )
-    print(result)
-    return result[1]
 def get_audioldm(prompt):
-    client = Client("https://haoheliu-audioldm2-text2audio-text2music.hf.space/")
-    result = client.predict(
-        prompt,	# str in 'Input text' Textbox component
-        "Low quality. Music.",	# str in 'Negative prompt' Textbox component
-        10,	# int | float (numeric value between 5 and 15) in 'Duration (seconds)' Slider component
-        3.5,	# int | float (numeric value between 0 and 7) in 'Guidance scale' Slider component
-        45,	# int | float in 'Seed' Number component
-        3,	# int | float (numeric value between 1 and 5) in 'Number waveforms to generate' Slider component
-        fn_index=1
-    )
-    print(result)
-    audio_result = extract_audio(result)
-    return audio_result
 def get_audiogen(prompt):
-    client = Client("https://fffiloni-audiogen.hf.space/")
-    result = client.predict(
-        prompt,
-        10,
-        api_name="/infer"
-    )
-    return result
 def get_tango(prompt):
     try:
         client = Client("declare-lab/tango")
-    except:
-        raise gr.Error("Tango space API is not ready, please try again in few minutes ")
-    result = client.predict(
 				prompt,	# str representing string value in 'Prompt' Textbox component
 				100,	# int | float representing numeric value between 100 and 200 in 'Steps' Slider component
 				4,	# int | float representing numeric value between 1 and 10 in 'Guidance Scale' Slider component
 				api_name="/predict"
-    )
-    print(result)
-    return result
 def get_tango2(prompt):
     try:
         client = Client("declare-lab/tango2")
-    except:
-        raise gr.Error("Tango2 space API is not ready, please try again in few minutes ")
-    result = client.predict(
     		prompt,
     		100,
     		4,
     		api_name="/predict"
-    )
-    print(result)
-    return result
 def get_stable_audio_open(prompt):
     try:
         client = Client("fffiloni/Stable-Audio-Open-A10", hf_token=hf_token)
     except:
         raise gr.Error("Stable Audio Open space API is not ready, please try again in few minutes ")
-    result = client.predict(
-		prompt=prompt,
-		seconds_total=30,
-		steps=100,
-		cfg_scale=7,
-		api_name="/predict"
-    )
-    print(result)
-    return result
 def infer(image_in, chosen_model):
     caption = get_caption(image_in)
@@ -217,7 +229,6 @@ with gr.Blocks(css=css) as demo:
         fn=infer,
         inputs=[image_in, chosen_model],
         outputs=[audio_o],
-        concurrency_limit = 2
     )
 demo.queue(max_size=10).launch(debug=True, show_error=True)

 def get_magnet(prompt):
     amended_prompt = f"{prompt}"
     print(amended_prompt)
+    try:
+        client = Client("https://fffiloni-magnet.hf.space/")
+        result = client.predict(
+            "facebook/audio-magnet-medium",	# Literal['facebook/magnet-small-10secs', 'facebook/magnet-medium-10secs', 'facebook/magnet-small-30secs', 'facebook/magnet-medium-30secs', 'facebook/audio-magnet-small', 'facebook/audio-magnet-medium']  in 'Model' Radio component
+            "",	# str  in 'Model Path (custom models)' Textbox component
+            amended_prompt,	# str  in 'Input Text' Textbox component
+            3,	# float  in 'Temperature' Number component
+            0.9,	# float  in 'Top-p' Number component
+            10,	# float  in 'Max CFG coefficient' Number component
+            1,	# float  in 'Min CFG coefficient' Number component
+            20,	# float  in 'Decoding Steps (stage 1)' Number component
+            10,	# float  in 'Decoding Steps (stage 2)' Number component
+            10,	# float  in 'Decoding Steps (stage 3)' Number component
+            10,	# float  in 'Decoding Steps (stage 4)' Number component
+            "prod-stride1 (new!)",	# Literal['max-nonoverlap', 'prod-stride1 (new!)']  in 'Span Scoring' Radio component
+            api_name="/predict_full"
+        )
+        print(result)
+        return result[1]
+    except:
+        raise gr.Error("MAGNet space API is not ready, please try again in few minutes ")
 def get_audioldm(prompt):
+    try:
+        client = Client("https://haoheliu-audioldm2-text2audio-text2music.hf.space/")
+        result = client.predict(
+            prompt,	# str in 'Input text' Textbox component
+            "Low quality. Music.",	# str in 'Negative prompt' Textbox component
+            10,	# int | float (numeric value between 5 and 15) in 'Duration (seconds)' Slider component
+            3.5,	# int | float (numeric value between 0 and 7) in 'Guidance scale' Slider component
+            45,	# int | float in 'Seed' Number component
+            3,	# int | float (numeric value between 1 and 5) in 'Number waveforms to generate' Slider component
+            fn_index=1
+        )
+        print(result)
+        audio_result = extract_audio(result)
+        return audio_result
+    except:
+        raise gr.Error("AudioLDM space API is not ready, please try again in few minutes ")
 def get_audiogen(prompt):
+    try:
+        client = Client("https://fffiloni-audiogen.hf.space/")
+        result = client.predict(
+            prompt,
+            10,
+            api_name="/infer"
+        )
+        return result
+    except:
+        raise gr.Error("AudioGen space API is not ready, please try again in few minutes ")
 def get_tango(prompt):
     try:
         client = Client("declare-lab/tango")
+        result = client.predict(
 				prompt,	# str representing string value in 'Prompt' Textbox component
 				100,	# int | float representing numeric value between 100 and 200 in 'Steps' Slider component
 				4,	# int | float representing numeric value between 1 and 10 in 'Guidance Scale' Slider component
 				api_name="/predict"
+        )
+        print(result)
+        return result[0]
+    except:
+        raise gr.Error("Tango space API is not ready, please try again in few minutes ")
 def get_tango2(prompt):
     try:
         client = Client("declare-lab/tango2")
+        result = client.predict(
     		prompt,
     		100,
     		4,
     		api_name="/predict"
+        )
+        print(result)
+        return result
+    except:
+        raise gr.Error("Tango2 space API is not ready, please try again in few minutes ")
 def get_stable_audio_open(prompt):
     try:
         client = Client("fffiloni/Stable-Audio-Open-A10", hf_token=hf_token)
+        result = client.predict(
+    		prompt=prompt,
+    		seconds_total=30,
+    		steps=100,
+    		cfg_scale=7,
+    		api_name="/predict"
+        )
+        print(result)
+        return result
     except:
         raise gr.Error("Stable Audio Open space API is not ready, please try again in few minutes ")
 def infer(image_in, chosen_model):
     caption = get_caption(image_in)
         fn=infer,
         inputs=[image_in, chosen_model],
         outputs=[audio_o],
     )
 demo.queue(max_size=10).launch(debug=True, show_error=True)