Spaces:

mrcuddle
/

DARE-MERGE-SAFETENSORS

Running

App Files Files Community

mrcuddle committed on Nov 25, 2024

Commit

a26bb9f

verified ·

1 Parent(s): dbb2714

Update app.py

Browse files

Files changed (1) hide show

app.py +79 -35

app.py CHANGED Viewed

@@ -1,40 +1,84 @@
 import gradio as gr
 import subprocess
 import spaces
 @spaces.GPU
-def merge_models(base_model, model_to_merge, p, lambda_value, token, repo, commit_message, upload):
-    command = f"python model_merger.py {base_model} {model_to_merge} -p {p} -lambda {lambda_value} --repo {repo} --commit-message '{commit_message}'"
-    if upload:
-        command += f" --token {token} --upload"
-    result = subprocess.run(command, shell=True, capture_output=True, text=True)
-    return result.stdout
-iface = gr.Interface(
-    fn=merge_models,
-    inputs=[
-        gr.Textbox(label="Base Model"),
-        gr.Textbox(label="Model to Merge"),
-        gr.Slider(minimum=0, maximum=1, value=0.5, label="Dropout Probability"),
-        gr.Slider(minimum=0, maximum=10, value=3, label="Scaling Factor (Lambda)"),
-        gr.Textbox(label="HuggingFace Token (optional)"),
-        gr.Textbox(label="New Model Name (without your username) (optional)"),
-        gr.Textbox(label="Commit Message (optional)", value="Upload merged model"),
-        gr.Checkbox(label="Upload to HuggingFace Hub"),
-    ],
-    outputs="text",
-    title="Safetensors Model Merger",
-    description="""
-- Combine any two models using a Super Mario merge(DARE).
-- Based on: https://github.com/martyn/safetensors-merge-supermario.
-- Works with:
-- Stable Diffusion (1.5, XL/XL Turbo)
-- LLMs(Mistral, Llama, etc)
-- LoRas(must be same size)
-- Any two homologous models
-""",
-)
-iface.launch()

 import gradio as gr
 import subprocess
+import os
+import logging
+from pathlib import Path
 import spaces
 @spaces.GPU
+def merge_and_upload(base_model, model_to_merge, scaling_factor, weight_drop_prob, repo_name, token, commit_message):
+    """Run ``hf_merge.py`` on two models and report the outcome.
+
+    The script is invoked as a subprocess with an argument list (no shell),
+    always with the ``-U`` flag, and its stdout/stderr are captured.
+
+    Args:
+        base_model: Passed as the first positional argument of the script.
+        model_to_merge: Passed as the second positional argument.
+        scaling_factor: Forwarded as the ``-lambda`` option.
+        weight_drop_prob: Forwarded as the ``-p`` option.
+        repo_name: Forwarded as ``--repo`` and used to build the returned URL.
+        token: Forwarded as ``--token``.
+        commit_message: Forwarded as ``--commit-message``.
+
+    Returns:
+        A 3-tuple ``(repo_url, status_message, log_output)``. ``repo_url`` is
+        ``None`` whenever the merge did not succeed.
+    """
+    # Reject blank model fields up front instead of spawning a process that
+    # cannot succeed; surrounding whitespace from copy/paste is dropped.
+    base_model = (base_model or "").strip()
+    model_to_merge = (model_to_merge or "").strip()
+    if not base_model or not model_to_merge:
+        message = "Error in merging models: both a base model and a model to merge are required."
+        return None, message, message + "\n"
+    # NOTE(review): the token travels on the command line, where other local
+    # processes may be able to read it; confirm whether hf_merge.py can take it
+    # from the environment instead.
+    command = [
+        "python3", "hf_merge.py",
+        base_model,
+        model_to_merge,
+        "-p", str(weight_drop_prob),
+        "-lambda", str(scaling_factor),
+        "--token", token,
+        "--repo", repo_name,
+        "--commit-message", commit_message,
+        "-U",
+    ]
+    # basicConfig only configures the root logger on the first call.
+    logging.basicConfig(level=logging.INFO)
+    try:
+        result = subprocess.run(command, capture_output=True, text=True)
+    except OSError as err:
+        # Raised when the interpreter itself cannot be started; report it
+        # through the normal error tuple rather than crashing the handler.
+        logging.exception("Could not start hf_merge.py")
+        message = f"Error in merging models: {err}"
+        return None, message, message + "\n"
+    failed = result.returncode != 0
+    log_output = f"{result.stdout}\n{result.stderr}\n"
+    if result.stdout:
+        logging.info("%s", result.stdout)
+    if result.stderr:
+        # stderr output on a successful run is not treated as an error, so
+        # only escalate it when the script actually failed.
+        logging.log(logging.ERROR if failed else logging.INFO, "%s", result.stderr)
+    if failed:
+        return None, f"Error in merging models: {result.stderr}", log_output
+    # Assumes the script performed the upload to this repository — the URL is
+    # derived from repo_name, not read back from the script's output.
+    repo_url = f"https://huggingface.co/{repo_name}"
+    return repo_url, "Model merged and uploaded successfully!", log_output
+# Define the Gradio interface: static description, input fields, result
+# widgets, and the button that triggers the merge.
+with gr.Blocks(theme="Ytheme/Minecraft", fill_width=True, delete_cache=(60, 3600)) as demo:
+    gr.Markdown("# SuperMario Safetensors Merger")
+    gr.Markdown("Combine any two models using a Super Mario merge(DARE)")
+    gr.Markdown("Based on: https://github.com/martyn/safetensors-merge-supermario")
+    gr.Markdown("Works with:")
+    gr.Markdown("* Stable Diffusion (1.5, XL/XL Turbo)")
+    gr.Markdown("* LLMs (Mistral, Llama, etc)")
+    gr.Markdown("* LoRas (must be same size)")
+    gr.Markdown("* Any two homologous models")
+    with gr.Column():
+        with gr.Row():
+            token = gr.Textbox(label="Your HF write token", placeholder="hf_...", value="", max_lines=1)
+        with gr.Row():
+            base_model = gr.Textbox(label="Base Model", placeholder=".safetensors")
+        with gr.Row():
+            model_to_merge = gr.Textbox(label="Merge Model", placeholder=".bin/.safetensors")
+        with gr.Row():
+            repo_name = gr.Textbox(label="New Model", placeholder="SDXL-", info="If empty, auto-complete", value="", max_lines=1)
+        with gr.Row():
+            scaling_factor = gr.Slider(minimum=0, maximum=10, value=3.0, label="Scaling Factor")
+        with gr.Row():
+            weight_drop_prob = gr.Slider(minimum=0, maximum=1, value=0.3, label="Weight Drop Probability")
+        with gr.Row():
+            commit_message = gr.Textbox(label="Commit Message", value="Upload merged model", max_lines=1)
+        repo_url = gr.Markdown(label="Repository URL")
+        output = gr.Textbox(label="Output")
+        # merge_and_upload returns three values (URL, status message, combined
+        # stdout/stderr), so three output components are required; with only
+        # two, Gradio rejects the handler's return value on every click.
+        logs = gr.Textbox(label="Logs", lines=10)
+        gr.Button("Merge").click(
+            merge_and_upload,
+            inputs=[base_model, model_to_merge, scaling_factor, weight_drop_prob, repo_name, token, commit_message],
+            outputs=[repo_url, output, logs],
+        )
+demo.launch()