# Dump / 8ep_config /config_file.toml
# Alterneko's picture
# feat: upload cosdif-1-5-v1-epochs-2 checkpoint
# 60a6b18
# raw
# history blame
# 1.38 kB
[model_arguments]
# Base weights: a local .safetensors file under /content/pretrained_model.
pretrained_model_name_or_path = "/content/pretrained_model/Chillout-mix.safetensors"
# Both model-variant flags are switched off.
v2 = false
v_parameterization = false

[optimizer_arguments]
# Optimizer selection, step size and gradient-norm cap.
optimizer_type = "AdamW8bit"
learning_rate = 2e-6
max_grad_norm = 1.0
# Learning-rate schedule: "cosine_with_restarts", 3 cycles, 265 warmup steps.
lr_scheduler = "cosine_with_restarts"
lr_scheduler_num_cycles = 3
lr_warmup_steps = 265
# Remaining switches kept in this table.
min_snr_gamma = 5
train_text_encoder = true

[dataset_arguments]
# Inputs: image folder and metadata JSON, both under /content/fine_tune.
train_data_dir = "/content/fine_tune/train_data"
in_json = "/content/fine_tune/meta_lat.json"
# Comma-separated pair stored as a string, not as an array of integers.
resolution = "512,512"
dataset_repeats = 1
# Caption handling: shuffle_caption is on, keep_tokens is 0.
shuffle_caption = true
keep_tokens = 0
token_warmup_min = 1
token_warmup_step = 0
# Every caption-dropout setting is zero.
caption_dropout_rate = 0
caption_tag_dropout_rate = 0
caption_dropout_every_n_epochs = 0
# Both of these switches are off.
color_aug = false
debug_dataset = false

[training_arguments]
# Output location, naming and saved precision.
output_dir = "/content/fine_tune/output"
output_name = "cosdif-1-5-v1-epochs-2"
save_precision = "fp16"
save_state = true
# Same value as max_train_steps, so the interval only lines up with the
# final step -- presumably no intermediate saves; confirm with the trainer.
save_every_n_steps = 10000
# Run length and batching.
max_train_steps = 10000
train_batch_size = 1
gradient_accumulation_steps = 1
# Precision and attention/memory switches.
mixed_precision = "fp16"
xformers = true
mem_eff_attn = false
gradient_checkpointing = false
# Text-side limits.
max_token_length = 225
clip_skip = 2
# Data loader workers.
max_data_loader_n_workers = 8
persistent_data_loader_workers = true
# Logging directory; the prefix repeats the output_name string.
logging_dir = "/content/fine_tune/logs"
log_prefix = "cosdif-1-5-v1-epochs-2"

[sample_prompt_arguments]
# Sampler name and sampling interval; no prompt file is set in this table.
sample_sampler = "ddim"
sample_every_n_steps = 250

[saving_arguments]
# Output format is "ckpt". NOTE(review): the base model referenced by this
# config is a .safetensors file -- confirm that "ckpt" is intended here.
save_model_as = "ckpt"