yiff_toolkit / tp_bs8x6
k4d3's picture
aw
dc2fcd8
raw
history blame
2.25 kB
#!/usr/bin/env zsh
# Launches one SDXL network-training run:
#   1. change into the sd-scripts checkout,
#   2. run sdxl_train_network.py through `accelerate launch`,
#   3. change back to the home directory.
# The steps are chained with `&&`, so a failing step skips everything after
# it (the final `cd ~` only happens when the training command exits 0).
#
# All paths are absolute and machine-specific (/home/kade/...); adjust them
# before running this anywhere else.
#
# Disabled network arg, kept for reference:
#   "block_dims=1,1,1,1,1,1,1,1,1,1,1,1,8,8,8,8,8,8,8,8,8,8,8,8,8"
# Author's note: alpha=1 @ dim=16 is the same lr as alpha=4 @ dim=256
#
# NOTE(review): --output_name and --log_prefix below say "bs8x12", while the
# run uses --train_batch_size=8 with --gradient_accumulation_steps=6 -- confirm
# the naming is intended before comparing outputs/logs across runs.
cd ~/source/repos/sd-scripts &&
accelerate launch --num_cpu_threads_per_process=2 "./sdxl_train_network.py" \
--pretrained_model_name_or_path=/home/kade/ComfyUI/models/checkpoints/ponyDiffusionV6XL_v6StartWithThisOne.safetensors \
--train_data_dir=/home/kade/training_dir \
--resolution="1024,1024" \
--output_dir="/home/kade/output_dir" \
--output_name="chunie-v3-bs8x12" \
--enable_bucket \
--min_bucket_reso=256 \
--max_bucket_reso=2048 \
--network_alpha=4 \
--save_model_as="safetensors" \
--network_module="lycoris.kohya" \
--network_args \
"preset=full" \
"conv_dim=16" \
"conv_alpha=1" \
"rank_dropout=0" \
"module_dropout=0" \
"use_tucker=False" \
"use_scalar=False" \
"rank_dropout_scale=False" \
"algo=locon" \
"dora_wd=False" \
"train_norm=False" \
--network_dropout=0 \
--lr_scheduler="cosine" \
--lr_scheduler_args="num_cycles=0.375" \
--lr_warmup_steps=6 \
--learning_rate=0.0002 \
--unet_lr=0.0002 \
--text_encoder_lr=0.0001 \
--network_dim=8 \
--no_half_vae \
--flip_aug \
--save_every_n_steps=20 \
--mixed_precision="bf16" \
--save_precision="fp16" \
--cache_latents \
--cache_latents_to_disk \
--optimizer_type=ClybW \
--max_grad_norm=1 \
--max_data_loader_n_workers=8 \
--bucket_reso_steps=32 \
--multires_noise_iterations=12 \
--multires_noise_discount=0.4 \
--log_prefix=xl-locon-bs8x12 \
--log_with=tensorboard \
--logging_dir=/home/kade/output_dir/logs \
--gradient_accumulation_steps=6 \
--gradient_checkpointing \
--train_batch_size=8 \
--dataset_repeats=1 \
--shuffle_caption \
--max_train_steps=500 \
--sdpa \
--sample_prompts=/home/kade/training_dir/sample-prompts.txt \
--sample_sampler="euler_a" \
--sample_every_n_steps=20 \
--caption_extension=".txt" \
--seed=1728871242 &&
cd ~
# Disabled option, kept for reference (re-insert above the --seed line, with a
# trailing line-continuation backslash, to enable it): --scale_weight_norms=1