hfpox committed on
Commit
5e8007f
·
verified ·
1 Parent(s): 5254320

Upload folder using huggingface_hub

Browse files
.job_config.json ADDED
@@ -0,0 +1,155 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "job": "extension",
3
+ "config": {
4
+ "name": "fp32prolookv2",
5
+ "process": [
6
+ {
7
+ "type": "diffusion_trainer",
8
+ "training_folder": "/app/ai-toolkit/output",
9
+ "sqlite_db_path": "/app/ai-toolkit/aitk_db.db",
10
+ "device": "cuda",
11
+ "trigger_word": null,
12
+ "performance_log_every": 10,
13
+ "network": {
14
+ "type": "lora",
15
+ "linear": 32,
16
+ "linear_alpha": 32,
17
+ "conv": 16,
18
+ "conv_alpha": 16,
19
+ "lokr_full_rank": true,
20
+ "lokr_factor": -1,
21
+ "network_kwargs": {
22
+ "ignore_if_contains": []
23
+ }
24
+ },
25
+ "save": {
26
+ "dtype": "fp32",
27
+ "save_every": 398,
28
+ "max_step_saves_to_keep": 100000,
29
+ "save_format": "diffusers",
30
+ "push_to_hub": false
31
+ },
32
+ "datasets": [
33
+ {
34
+ "folder_path": "/app/ai-toolkit/datasets/prolookv2",
35
+ "mask_path": null,
36
+ "mask_min_value": 0.1,
37
+ "default_caption": "",
38
+ "caption_ext": "txt",
39
+ "caption_dropout_rate": 0.05,
40
+ "cache_latents_to_disk": false,
41
+ "is_reg": false,
42
+ "network_weight": 1,
43
+ "resolution": [
44
+ 512,
45
+ 768,
46
+ 1024,
47
+ 1280,
48
+ 1536
49
+ ],
50
+ "controls": [],
51
+ "shrink_video_to_frames": true,
52
+ "num_frames": 1,
53
+ "do_i2v": true,
54
+ "flip_x": false,
55
+ "flip_y": false
56
+ }
57
+ ],
58
+ "train": {
59
+ "batch_size": 1,
60
+ "bypass_guidance_embedding": false,
61
+ "steps": 25000,
62
+ "gradient_accumulation": 1,
63
+ "train_unet": true,
64
+ "train_text_encoder": false,
65
+ "gradient_checkpointing": true,
66
+ "noise_scheduler": "flowmatch",
67
+ "optimizer": "adamw8bit",
68
+ "timestep_type": "weighted",
69
+ "content_or_style": "balanced",
70
+ "optimizer_params": {
71
+ "weight_decay": 0.0001
72
+ },
73
+ "unload_text_encoder": false,
74
+ "cache_text_embeddings": true,
75
+ "lr": 0.0001,
76
+ "ema_config": {
77
+ "use_ema": false,
78
+ "ema_decay": 0.99
79
+ },
80
+ "skip_first_sample": true,
81
+ "force_first_sample": false,
82
+ "disable_sampling": true,
83
+ "dtype": "bf16",
84
+ "diff_output_preservation": false,
85
+ "diff_output_preservation_multiplier": 1,
86
+ "diff_output_preservation_class": "person",
87
+ "switch_boundary_every": 1,
88
+ "loss_type": "mse"
89
+ },
90
+ "model": {
91
+ "name_or_path": "Qwen/Qwen-Image",
92
+ "quantize": true,
93
+ "qtype": "qfloat8",
94
+ "quantize_te": true,
95
+ "qtype_te": "qfloat8",
96
+ "arch": "qwen_image",
97
+ "low_vram": false,
98
+ "model_kwargs": {},
99
+ "layer_offloading": false,
100
+ "layer_offloading_text_encoder_percent": 1,
101
+ "layer_offloading_transformer_percent": 1
102
+ },
103
+ "sample": {
104
+ "sampler": "flowmatch",
105
+ "sample_every": 250,
106
+ "width": 1024,
107
+ "height": 1024,
108
+ "samples": [
109
+ {
110
+ "prompt": "woman with red hair, playing chess at the park, bomb going off in the background"
111
+ },
112
+ {
113
+ "prompt": "a woman holding a coffee cup, in a beanie, sitting at a cafe"
114
+ },
115
+ {
116
+ "prompt": "a horse is a DJ at a night club, fish eye lens, smoke machine, lazer lights, holding a martini"
117
+ },
118
+ {
119
+ "prompt": "a man showing off his cool new t shirt at the beach, a shark is jumping out of the water in the background"
120
+ },
121
+ {
122
+ "prompt": "a bear building a log cabin in the snow covered mountains"
123
+ },
124
+ {
125
+ "prompt": "woman playing the guitar, on stage, singing a song, laser lights, punk rocker"
126
+ },
127
+ {
128
+ "prompt": "hipster man with a beard, building a chair, in a wood shop"
129
+ },
130
+ {
131
+ "prompt": "photo of a man, white background, medium shot, modeling clothing, studio lighting, white backdrop"
132
+ },
133
+ {
134
+ "prompt": "a man holding a sign that says, 'this is a sign'"
135
+ },
136
+ {
137
+ "prompt": "a bulldog, in a post apocalyptic world, with a shotgun, in a leather jacket, in a desert, with a motorcycle"
138
+ }
139
+ ],
140
+ "neg": "",
141
+ "seed": 42,
142
+ "walk_seed": true,
143
+ "guidance_scale": 4,
144
+ "sample_steps": 25,
145
+ "num_frames": 1,
146
+ "fps": 1
147
+ }
148
+ }
149
+ ]
150
+ },
151
+ "meta": {
152
+ "name": "[name]",
153
+ "version": "1.0"
154
+ }
155
+ }
config.yaml ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ job: extension
2
+ config:
3
+ name: fp32prolookv2
4
+ process:
5
+ - type: diffusion_trainer
6
+ training_folder: /app/ai-toolkit/output
7
+ sqlite_db_path: /app/ai-toolkit/aitk_db.db
8
+ device: cuda
9
+ trigger_word: null
10
+ performance_log_every: 10
11
+ network:
12
+ type: lora
13
+ linear: 32
14
+ linear_alpha: 32
15
+ conv: 16
16
+ conv_alpha: 16
17
+ lokr_full_rank: true
18
+ lokr_factor: -1
19
+ network_kwargs:
20
+ ignore_if_contains: []
21
+ save:
22
+ dtype: fp32
23
+ save_every: 398
24
+ max_step_saves_to_keep: 100000
25
+ save_format: diffusers
26
+ push_to_hub: false
27
+ datasets:
28
+ - folder_path: /app/ai-toolkit/datasets/prolookv2
29
+ mask_path: null
30
+ mask_min_value: 0.1
31
+ default_caption: ''
32
+ caption_ext: txt
33
+ caption_dropout_rate: 0.05
34
+ cache_latents_to_disk: false
35
+ is_reg: false
36
+ network_weight: 1
37
+ resolution:
38
+ - 512
39
+ - 768
40
+ - 1024
41
+ - 1280
42
+ - 1536
43
+ controls: []
44
+ shrink_video_to_frames: true
45
+ num_frames: 1
46
+ do_i2v: true
47
+ flip_x: false
48
+ flip_y: false
49
+ train:
50
+ batch_size: 1
51
+ bypass_guidance_embedding: false
52
+ steps: 25000
53
+ gradient_accumulation: 1
54
+ train_unet: true
55
+ train_text_encoder: false
56
+ gradient_checkpointing: true
57
+ noise_scheduler: flowmatch
58
+ optimizer: adamw8bit
59
+ timestep_type: weighted
60
+ content_or_style: balanced
61
+ optimizer_params:
62
+ weight_decay: 0.0001
63
+ unload_text_encoder: false
64
+ cache_text_embeddings: true
65
+ lr: 0.0001
66
+ ema_config:
67
+ use_ema: false
68
+ ema_decay: 0.99
69
+ skip_first_sample: true
70
+ force_first_sample: false
71
+ disable_sampling: true
72
+ dtype: bf16
73
+ diff_output_preservation: false
74
+ diff_output_preservation_multiplier: 1
75
+ diff_output_preservation_class: person
76
+ switch_boundary_every: 1
77
+ loss_type: mse
78
+ model:
79
+ name_or_path: Qwen/Qwen-Image
80
+ quantize: true
81
+ qtype: qfloat8
82
+ quantize_te: true
83
+ qtype_te: qfloat8
84
+ arch: qwen_image
85
+ low_vram: false
86
+ model_kwargs: {}
87
+ layer_offloading: false
88
+ layer_offloading_text_encoder_percent: 1
89
+ layer_offloading_transformer_percent: 1
90
+ sample:
91
+ sampler: flowmatch
92
+ sample_every: 250
93
+ width: 1024
94
+ height: 1024
95
+ samples:
96
+ - prompt: woman with red hair, playing chess at the park, bomb going off in
97
+ the background
98
+ - prompt: a woman holding a coffee cup, in a beanie, sitting at a cafe
99
+ - prompt: a horse is a DJ at a night club, fish eye lens, smoke machine, lazer
100
+ lights, holding a martini
101
+ - prompt: a man showing off his cool new t shirt at the beach, a shark is jumping
102
+ out of the water in the background
103
+ - prompt: a bear building a log cabin in the snow covered mountains
104
+ - prompt: woman playing the guitar, on stage, singing a song, laser lights,
105
+ punk rocker
106
+ - prompt: hipster man with a beard, building a chair, in a wood shop
107
+ - prompt: photo of a man, white background, medium shot, modeling clothing,
108
+ studio lighting, white backdrop
109
+ - prompt: a man holding a sign that says, 'this is a sign'
110
+ - prompt: a bulldog, in a post apocalyptic world, with a shotgun, in a leather
111
+ jacket, in a desert, with a motorcycle
112
+ neg: ''
113
+ seed: 42
114
+ walk_seed: true
115
+ guidance_scale: 4
116
+ sample_steps: 25
117
+ num_frames: 1
118
+ fps: 1
119
+ meta:
120
+ name: fp32prolookv2
121
+ version: '1.0'
fp32prolookv2.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfd5c0188c26c524fe4869054f239214faf8e72ee1f4f71843c135378a0a9e47
3
+ size 1179881960
fp32prolookv2_000015124.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21214283813633d5837da43545cbe0cfc9c5902deb1fc48de04bd3fa4f2caa7d
3
+ size 1179881960
fp32prolookv2_000015522.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9616939a63e2c184ff5252bce102ce1217b54dabe24cc378d19206d8c62b356d
3
+ size 1179881960
fp32prolookv2_000015920.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e7a04b53262c6f6c9e0b21cf9d4348009a057f6ae48053a9c5c3fb4c8dcf050
3
+ size 1179881960
fp32prolookv2_000016318.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfb73bf82d95366cfbed3311e6f9674938c1c2439601c6fe27daa6ea9a153bb6
3
+ size 1179881960
fp32prolookv2_000016716.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:516e12d780743437daf51b0c23a60d88f7c6917299ec4d893ede1a3a75246b4f
3
+ size 1179881960
fp32prolookv2_000017114.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1490698d97d19b4e614fce84dee821efef6b1d53d82743456544b3ceeab360c5
3
+ size 1179881960
fp32prolookv2_000017512.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:620838b1042df2000c27bb3b57d45b867d00c68cff167a728558a73272ffa873
3
+ size 1179881960
fp32prolookv2_000017910.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de6733543314ab2c797951009ada206804eaaa11afeafdbd9937b3c653ad10d
3
+ size 1179881960
fp32prolookv2_000018308.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5892bbc4d563fdf29f62e37c45e42ca0e500b837e656a6ce89906cd46f01cc3
3
+ size 1179881960
fp32prolookv2_000018706.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff4d9d6b44d239f48a948050044872aee91370e4a91b2317cea0957b247c8db2
3
+ size 1179881960
fp32prolookv2_000019104.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6639617a4a858847d9b87d1734eacbfe2604cee30031b29920f3240b91c79ac
3
+ size 1179881960
fp32prolookv2_000019502.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0360347ce3153a04edeb7396c32b7b7d7980434965a3294ebfd83f1eabe27903
3
+ size 1179881960
fp32prolookv2_000019900.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e4441c094928889f729e714f39fedf78af6cb50018e6bd7eaeaa3455e84abc1
3
+ size 1179881960
fp32prolookv2_000020298.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2b37ea1eabc5f5f13107d07f4ac0ed131152eb74e6d5c5f831949caa122aa93
3
+ size 1179881960
fp32prolookv2_000020696.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:084de87769339e5dbed1b611a1839b818f5c05e3353238aad58ad736e868f914
3
+ size 1179881960
fp32prolookv2_000021094.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d58dc911ffb998dfb10a4fc9ddcdedcb94e4308631f89570a1ba96c920c5327
3
+ size 1179881960
fp32prolookv2_000021492.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9bdca38bc25173b71481c6b3a65f8a7c365e5bcf9a5b549a4a8ef2b79efa8a5
3
+ size 1179881960
fp32prolookv2_000021890.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49561654eaa5efe21a7ff74a666eca5309163f92fbed704d6832a661958e0f28
3
+ size 1179881960
fp32prolookv2_000022288.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b97ea43e457b6a73304b7ac1283347cbe542e938ff6c3c6cc9fbf42d25105b
3
+ size 1179881960
fp32prolookv2_000022686.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13c13a88fd0fccb427a913173e008eaf2181d3ada707b3923840eb93bf980067
3
+ size 1179881960
fp32prolookv2_000023084.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef838afc71088820b066474c9a5172dc601d47409fc491987a701905414da2bd
3
+ size 1179881960
fp32prolookv2_000023482.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e83df547903055494c73575768b888f3ec57f350b2f6f7bb19fb08d0e33bf30
3
+ size 1179881960
fp32prolookv2_000023880.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df6595cb8dab74d408a6899ece04478ad9da3cba868276c0446e38061076e67c
3
+ size 1179881960
fp32prolookv2_000024278.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48ca662f566a7a3b5edc01b0c1de3cf08d7724a1ed50a9dd143b19a9ef457a02
3
+ size 1179881960
fp32prolookv2_000024676.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db26b47113e002fff8f72d17e99bc04d4d1c093ebf8b0c46b7544553ce13019c
3
+ size 1179881960
log.txt ADDED
The diff for this file is too large to render. See raw diff
 
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04ae3efbaaeb009889365f1e818cc535b948e7ef39e036c778824f4ce634a5a
3
+ size 598613389
pid.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ 1493