Aduc-sdr committed on
Commit
0326fdf
·
verified ·
1 Parent(s): 1d83a79

Upload main.yaml

Browse files
Files changed (1) hide show
  1. main.yaml +85 -0
main.yaml ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ __object__:
2
+ path: projects.video_diffusion_sr.train
3
+ name: VideoDiffusionTrainer
4
+
5
+ dit:
6
+ model:
7
+ __object__:
8
+ path: models.dit.nadit
9
+ name: NaDiT
10
+ args: as_params
11
+ vid_in_channels: 33
12
+ vid_out_channels: 16
13
+ vid_dim: 3072
14
+ txt_in_dim: 5120
15
+ txt_dim: ${.vid_dim}
16
+ emb_dim: ${eval:'6 * ${.vid_dim}'}
17
+ heads: 24
18
+ head_dim: 128 # llm-like
19
+ expand_ratio: 4
20
+ norm: fusedrms
21
+ norm_eps: 1e-5
22
+ ada: single
23
+ qk_bias: False
24
+ qk_rope: True
25
+ qk_norm: fusedrms
26
+ patch_size: [ 1,2,2 ]
27
+ num_layers: 36 # llm-like
28
+ shared_mlp: False
29
+ shared_qkv: False
30
+ mlp_type: normal
31
+ block_type: ${eval:'${.num_layers} * ["mmdit_sr"]'} # space-full
32
+ window: ${eval:'${.num_layers} * [(4,3,3)]'} # space-full
33
+ window_method: ${eval:'${.num_layers} // 2 * ["720pwin_by_size_bysize","720pswin_by_size_bysize"]'} # space-full
34
+ compile: False
35
+ gradient_checkpoint: True
36
+ fsdp:
37
+ sharding_strategy: _HYBRID_SHARD_ZERO2
38
+
39
+ ema:
40
+ decay: 0.9998
41
+
42
+ vae:
43
+ model:
44
+ __inherit__: models/video_vae_v3/s8_c16_t4_inflation_sd3.yaml
45
+ freeze_encoder: False
46
+ # gradient_checkpoint: True
47
+ slicing:
48
+ split_size: 4
49
+ memory_device: same
50
+ memory_limit:
51
+ conv_max_mem: 0.5
52
+ norm_max_mem: 0.5
53
+ checkpoint: ./ckpts/ema_vae.pth
54
+ scaling_factor: 0.9152
55
+ compile: False
56
+ grouping: False
57
+ dtype: bfloat16
58
+
59
+ diffusion:
60
+ schedule:
61
+ type: lerp
62
+ T: 1000.0
63
+ sampler:
64
+ type: euler
65
+ prediction_type: v_lerp
66
+ timesteps:
67
+ training:
68
+ type: logitnormal
69
+ loc: 0.0
70
+ scale: 1.0
71
+ sampling:
72
+ type: uniform_trailing
73
+ steps: 50
74
+ transform: True
75
+ loss:
76
+ type: v_lerp
77
+ cfg:
78
+ scale: 7.5
79
+ rescale: 0
80
+
81
+ condition:
82
+ i2v: 0.0
83
+ v2v: 0.0
84
+ sr: 1.0
85
+ noise_scale: 0.25