hysts's picture
hysts HF staff
Support training text encoder
e755b70
raw
history blame
12.4 kB
#!/usr/bin/env python
"""Unofficial demo app for https://github.com/cloneofsimo/lora.
The code in this repo is partly adapted from the following repository:
https://huggingface.co/spaces/multimodalart/dreambooth-training/tree/a00184917aa273c6d8adab08d5deb9b39b997938
The license of the original code is MIT, which is specified in the README.md.
"""
from __future__ import annotations
import os
import pathlib
import gradio as gr
import torch
from inference import InferencePipeline
from trainer import Trainer
from uploader import upload
# Markdown heading rendered at the top of the page.
TITLE = '# LoRA + StableDiffusion Training UI'
# Markdown line rendered directly below the title.
DESCRIPTION = 'This is an unofficial demo for [https://github.com/cloneofsimo/lora](https://github.com/cloneofsimo/lora).'
# Markdown text rendered inside the collapsible "Usage" accordion.
USAGE_INFO = '''You can train and download models in the "Training" tab, and test them in the "Test" tab.
You can also test the pretrained models in the [original repo](https://github.com/cloneofsimo/lora).
Models with names starting with "lora/" are the pretrained models and the ones with names starting with "results/" are your trained models.
After training, you can press "Reload Weight List" button to load your trained model names.
Note that your trained models will be deleted when the second training is started.
'''
# Space identifier read from the SPACE_ID environment variable, with a
# fallback default; it is interpolated into the "Duplicate Space" link below.
SPACE_ID = os.getenv('SPACE_ID', 'hysts/LoRA-SD-training')
# Warning rendered when the IS_SHARED_UI environment variable is set.
SHARED_UI_WARNING = f'''# Attention - This Space doesn't work in this shared UI. You can duplicate and use it with a paid private T4 GPU.
<center><a class="duplicate-button" style="display:inline-block" target="_blank" href="https://huggingface.co/spaces/{SPACE_ID}?duplicate=true"><img src="https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=&logoWidth=14" alt="Duplicate Space"></a></center>
'''
# Warning rendered when torch.cuda.is_available() returns False.
CUDA_NOT_AVAILABLE_WARNING = '''# Attention - CUDA is not available in this environment.
You can assign a GPU from the Settings tab if you are running this on HF Spaces.
T4 small is sufficient to run this demo.
'''
def show_warning(warning_text: str) -> gr.Blocks:
    """Build a Blocks layout that shows a single warning message.

    Args:
        warning_text: Markdown source of the warning to display.

    Returns:
        The Blocks object wrapping one boxed Markdown component.
    """
    with gr.Blocks() as warning_ui, gr.Box():
        gr.Markdown(warning_text)
    return warning_ui
def update_output_files() -> dict:
    """Refresh the trained-weight file list from the ``results`` directory.

    Returns:
        A Gradio update whose value is the list of POSIX-style paths of the
        ``*.pt`` files directly inside ``results`` (in sorted path order),
        or ``None`` when no such file exists.
    """
    weight_paths = [
        weight.as_posix()
        for weight in sorted(pathlib.Path('results').glob('*.pt'))
    ]
    # An empty list is replaced by None, exactly as ``paths or None`` would.
    return gr.update(value=weight_paths if weight_paths else None)
def create_training_demo(trainer: Trainer,
                         pipe: InferencePipeline) -> gr.Blocks:
    """Build the "Training" tab UI and register its button callbacks.

    Args:
        trainer: Object whose ``run`` and ``check_if_running`` methods are
            registered as button callbacks.
        pipe: Inference pipeline; its ``clear`` method is also registered on
            the "Start Training" button.

    Returns:
        The Blocks object holding the training UI.
    """
    with gr.Blocks() as training_ui:
        # Hidden single-choice dropdowns: they only pass fixed values on to
        # ``trainer.run``.
        base_model = gr.Dropdown(
            choices=['stabilityai/stable-diffusion-2-1-base'],
            value='stabilityai/stable-diffusion-2-1-base',
            label='Base Model',
            visible=False,
        )
        resolution = gr.Dropdown(
            choices=['512'],
            value='512',
            label='Resolution',
            visible=False,
        )

        with gr.Row():
            with gr.Box():
                gr.Markdown('Training Data')
                concept_images = gr.Files(label='Images for your concept')
                concept_prompt = gr.Textbox(
                    label='Concept Prompt',
                    max_lines=1,
                )
                gr.Markdown('''
- Upload images of the style you are planning on training on.
- For a concept prompt, use a unique, made up word to avoid collisions.
''')
            with gr.Box():
                gr.Markdown('Training Parameters')
                num_training_steps = gr.Number(
                    label='Number of Training Steps',
                    value=1000,
                    precision=0,
                )
                learning_rate = gr.Number(label='Learning Rate', value=0.0001)
                train_text_encoder = gr.Checkbox(
                    label='Train Text Encoder',
                    value=False,
                )
                learning_rate_text = gr.Number(
                    label='Learning Rate for Text Encoder',
                    value=0.00005,
                )
                gradient_accumulation = gr.Number(
                    label='Number of Gradient Accumulation',
                    value=1,
                    precision=0,
                )
                fp16 = gr.Checkbox(label='FP16', value=True)
                use_8bit_adam = gr.Checkbox(label='Use 8bit Adam', value=True)
                gr.Markdown('''
- It will take about 8 minutes to train for 1000 steps with a T4 GPU.
- You may want to try a small number of steps first, like 1, to see if everything works fine in your environment.
''')

        start_button = gr.Button('Start Training')
        with gr.Box(), gr.Row():
            status_button = gr.Button('Check Training Status')
            with gr.Column():
                with gr.Box():
                    gr.Markdown('Message')
                    status_message = gr.Markdown()
                weight_files = gr.Files(label='Trained Weight Files')

        # Components passed to ``trainer.run``, in this order.
        run_inputs = [
            base_model,
            resolution,
            concept_images,
            concept_prompt,
            num_training_steps,
            learning_rate,
            train_text_encoder,
            learning_rate_text,
            gradient_accumulation,
            fp16,
            use_8bit_adam,
        ]

        # Two callbacks are registered on the same button: ``pipe.clear``
        # and ``trainer.run``.
        start_button.click(fn=pipe.clear)
        start_button.click(
            fn=trainer.run,
            inputs=run_inputs,
            outputs=[status_message, weight_files],
            queue=False,
        )

        # The status button updates both the message and the file list.
        status_button.click(
            fn=trainer.check_if_running,
            inputs=None,
            outputs=status_message,
            queue=False,
        )
        status_button.click(
            fn=update_output_files,
            inputs=None,
            outputs=weight_files,
            queue=False,
        )
    return training_ui
def find_weight_files() -> list[str]:
    """List the ``*.pt`` weight files located under this file's directory.

    Returns:
        POSIX-style paths, relative to the directory containing this file,
        of every ``*.pt`` file found recursively (in sorted path order).
        Files whose stem ends with ``.text_encoder`` are left out.
    """
    root = pathlib.Path(__file__).parent
    return [
        candidate.relative_to(root).as_posix()
        for candidate in sorted(root.rglob('*.pt'))
        if not candidate.stem.endswith('.text_encoder')
    ]
def reload_lora_weight_list() -> dict:
    """Rescan the weight files and return them as new dropdown choices.

    Returns:
        A Gradio update that sets ``choices`` to the current result of
        ``find_weight_files``.
    """
    available_weights = find_weight_files()
    return gr.update(choices=available_weights)
def create_inference_demo(pipe: InferencePipeline) -> gr.Blocks:
    """Build the "Test" tab UI and register image generation callbacks.

    Args:
        pipe: Inference pipeline whose ``run`` method is registered both on
            prompt submission and on the "Generate" button.

    Returns:
        The Blocks object holding the inference UI.
    """
    with gr.Blocks() as inference_ui:
        with gr.Row():
            with gr.Column():
                # Hidden single-choice dropdown: it only passes a fixed
                # value on to ``pipe.run``.
                base_model = gr.Dropdown(
                    choices=['stabilityai/stable-diffusion-2-1-base'],
                    value='stabilityai/stable-diffusion-2-1-base',
                    label='Base Model',
                    visible=False,
                )
                reload_button = gr.Button('Reload Weight List')
                lora_weight_name = gr.Dropdown(
                    choices=find_weight_files(),
                    value='lora/lora_disney.pt',
                    label='LoRA Weight File',
                )
                prompt = gr.Textbox(
                    label='Prompt',
                    max_lines=1,
                    placeholder='Example: "style of sks, baby lion"',
                )
                alpha = gr.Slider(
                    label='Alpha',
                    minimum=0,
                    maximum=2,
                    step=0.05,
                    value=1,
                )
                alpha_for_text = gr.Slider(
                    label='Alpha for Text Encoder',
                    minimum=0,
                    maximum=2,
                    step=0.05,
                    value=1,
                )
                seed = gr.Slider(
                    label='Seed',
                    minimum=0,
                    maximum=100000,
                    step=1,
                    value=1,
                )
                with gr.Accordion('Other Parameters', open=False):
                    num_steps = gr.Slider(
                        label='Number of Steps',
                        minimum=0,
                        maximum=100,
                        step=1,
                        value=50,
                    )
                    guidance_scale = gr.Slider(
                        label='CFG Scale',
                        minimum=0,
                        maximum=50,
                        step=0.1,
                        value=7,
                    )
                generate_button = gr.Button('Generate')
                gr.Markdown('''
- The pretrained models for "disney", "illust" and "pop" are trained with the concept prompt "style of sks".
- The pretrained model for "kiriko" is trained with the concept prompt "game character bnha". For this model, the text encoder is also trained.
''')
            with gr.Column():
                result = gr.Image(label='Result')

        reload_button.click(
            fn=reload_lora_weight_list,
            inputs=None,
            outputs=lora_weight_name,
        )

        # Components passed to ``pipe.run``, in this order.
        generation_inputs = [
            base_model,
            lora_weight_name,
            prompt,
            alpha,
            alpha_for_text,
            seed,
            num_steps,
            guidance_scale,
        ]
        # Submitting the prompt box and clicking "Generate" register the
        # same callback with the same inputs; each gets its own list copy.
        for register in (prompt.submit, generate_button.click):
            register(
                fn=pipe.run,
                inputs=list(generation_inputs),
                outputs=result,
                queue=False,
            )
    return inference_ui
def create_upload_demo() -> gr.Blocks:
    """Build the "Upload" tab UI and wire its button to ``upload``.

    The token field is created as a password input so that the Hugging Face
    write token is masked on screen instead of being shown in plain text.
    The value passed to ``upload`` is still the plain string typed by the
    user.

    Returns:
        The Blocks object holding the upload UI.
    """
    with gr.Blocks() as demo:
        model_name = gr.Textbox(label='Model Name')
        # A write token is a credential: mask it while it is being typed.
        hf_token = gr.Textbox(
            label='Hugging Face Token (with write permission)',
            type='password')
        upload_button = gr.Button('Upload')
        with gr.Box():
            gr.Markdown('Message')
            result = gr.Markdown()
        gr.Markdown('''
- You can upload your trained model to your private Model repo (i.e. https://huggingface.co/{your_username}/{model_name}).
- You can find your Hugging Face token [here](https://huggingface.co/settings/tokens).
''')

        # ``upload`` receives the model name and the token, and its return
        # value is rendered in the "Message" Markdown component.
        upload_button.click(fn=upload,
                            inputs=[model_name, hf_token],
                            outputs=result)
    return demo
# Objects shared by the callbacks of the tabs created below.
pipe = InferencePipeline()
trainer = Trainer()

# Assemble the whole page: optional warnings, title, the three tabs, usage.
with gr.Blocks(css='style.css') as demo:
    # Rendered only when the IS_SHARED_UI environment variable is set.
    if os.getenv('IS_SHARED_UI'):
        show_warning(SHARED_UI_WARNING)
    # Rendered only when PyTorch reports that CUDA is not available.
    if not torch.cuda.is_available():
        show_warning(CUDA_NOT_AVAILABLE_WARNING)

    gr.Markdown(TITLE)
    gr.Markdown(DESCRIPTION)

    with gr.Tabs():
        with gr.TabItem('Training'):
            # The training tab also receives ``pipe`` (it registers
            # ``pipe.clear`` on its start button).
            create_training_demo(trainer, pipe)
        with gr.TabItem('Test'):
            create_inference_demo(pipe)
        with gr.TabItem('Upload'):
            create_upload_demo()

    with gr.Accordion('Usage', open=False):
        gr.Markdown(USAGE_INFO)

# NOTE(review): ``default_enabled=False`` presumably keeps events off the
# queue unless they opt in -- confirm against the Gradio version in use.
demo.queue(default_enabled=False).launch(share=False)