Upload decoder/decoder_config.json with huggingface_hub
Browse files
decoder/decoder_config.json
CHANGED
@@ -15,7 +15,7 @@
|
|
15 |
"attn_dim_head": 64,
|
16 |
"sparse_attn": true,
|
17 |
"memory_efficient": true,
|
18 |
-
"resnet_weight_standardization":
|
19 |
"self_attn": [false, true, true, true]
|
20 |
}
|
21 |
],
|
@@ -33,7 +33,7 @@
|
|
33 |
"data": {
|
34 |
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
35 |
"num_workers": 6,
|
36 |
-
"batch_size":
|
37 |
"start_shard": 0,
|
38 |
"end_shard": 231349,
|
39 |
"shard_width": 6,
|
@@ -56,12 +56,12 @@
|
|
56 |
},
|
57 |
"train": {
|
58 |
"epochs": 1000,
|
59 |
-
"lr":
|
60 |
-
"wd": 0.
|
61 |
"max_grad_norm": 0.5,
|
62 |
"save_every_n_samples": 5000000,
|
63 |
"find_unused_parameters": false,
|
64 |
-
"warmup_steps":
|
65 |
"amp": true,
|
66 |
"n_sample_images": 10,
|
67 |
"device": "cuda:0",
|
|
|
15 |
"attn_dim_head": 64,
|
16 |
"sparse_attn": true,
|
17 |
"memory_efficient": true,
|
18 |
+
"resnet_weight_standardization": false,
|
19 |
"self_attn": [false, true, true, true]
|
20 |
}
|
21 |
],
|
|
|
33 |
"data": {
|
34 |
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
35 |
"num_workers": 6,
|
36 |
+
"batch_size": 21,
|
37 |
"start_shard": 0,
|
38 |
"end_shard": 231349,
|
39 |
"shard_width": 6,
|
|
|
56 |
},
|
57 |
"train": {
|
58 |
"epochs": 1000,
|
59 |
+
"lr": 1.2e-4,
|
60 |
+
"wd": 0.0,
|
61 |
"max_grad_norm": 0.5,
|
62 |
"save_every_n_samples": 5000000,
|
63 |
"find_unused_parameters": false,
|
64 |
+
"warmup_steps": 1000,
|
65 |
"amp": true,
|
66 |
"n_sample_images": 10,
|
67 |
"device": "cuda:0",
|