import gradio as gr import os from gradio_client import Client title="Prompt Converter" description="""

Prompt Converter

Stable Diffusion 2 uses OpenCLIP ViT-H model trained on LAION dataset so it knows different things than the OpenAI ViT-L we're all used to prompting.
This demo converts a v1.x stable diffusion prompt to a stable diffusion 2.x prompt,
by generating an image through RunwayML Stable Diffusion 1.5, then Interrogate the resulting image through CLIP Interrogator 2 to give you a Stable Diffusion 2 equivalent prompt.

""" stable_diffusion = Client("https://runwayml-stable-diffusion-v1-5.hf.space/") clip_interrogator_2 = Client("https://fffiloni-clip-interrogator-2.hf.space/") def get_images(prompt): print("Calling SD") gallery_dir = stable_diffusion.predict(prompt, fn_index=2) print(f"Gallery Directory: {gallery_dir}") img_results = [os.path.join(gallery_dir, img) for img in os.listdir(gallery_dir)] return img_results[0] def get_new_prompt(img, mode): interrogate = clip_interrogator_2.predict( img, # str (filepath or URL to image) in 'parameter_3' Image component mode, # str in 'Select mode' Radio component 12, # int | float (numeric value between 2 and 24) in 'best mode max flavors' Slider component api_name="/clipi2" ) #interrogate = clip_interrogator_2(img, mode, 12, api_name="clipi2") return interrogate def infer(prompt, mode): img = get_images(prompt) result = get_new_prompt(img, mode) #return result[0], img return img with gr.Blocks() as demo: gr.HTML(description) with gr.Row(): with gr.Column(): prompt_input = gr.Textbox(lines=4, label="Input v1.x Stable Diffusion prompt") mode_input = gr.Radio(['best', 'classic', 'fast'], label='mode', value='fast') submit_btn = gr.Button("Submit") with gr.Column(): sd_inter = gr.Image() prompt_output = gr.Textbox(lines=4, label="Converted v2.x Stable Diffusion prompt") submit_btn.click( fn=infer, inputs=[prompt_input,mode_input], outputs=[sd_inter] ) examples=[ ["girl with steampunk weapons and uniform, serious, finely detailed, made by wlop, boichi, ilya kuvshinov, full body portrait, illustration, grass, sunny, sky, anime, side view, perfect anime face, detailed face, zoomed out, smooth","fast"], ["a yellow cockatiel riding on the rings of saturn wearing a propeller hat, fantasy, intricate, elegant, highly detailed, digital painting, artstation, concept art, smooth, sharp focus, illustration, art by artgerm and greg rutkowski and alphonse mucha ","classic"], ["painting, view from inside edward hopper's painting nighthawks, of a group of werebears robbing a bank, foggy ","best"] ] gr.Examples( examples = examples, fn = infer, inputs=[prompt_input,mode_input], outputs=[sd_inter] ) #demo=gr.Interface(fn=infer, inputs=[prompt_input,mode_input], outputs=[prompt_output],title=title,description=description,examples=examples) demo.queue(max_size=10,concurrency_count=20) demo.launch(enable_queue=True)