wlsaidhi committed on
Commit
f1a8a91
·
verified ·
1 Parent(s): cbd46ef

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer/tokenizer.json filter=lfs diff=lfs merge=lfs -text
model_index.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "MatrixGame3I2VPipeline",
3
+ "_diffusers_version": "0.33.1",
4
+ "scheduler": [
5
+ "diffusers",
6
+ "FlowUniPCMultistepScheduler"
7
+ ],
8
+ "transformer": [
9
+ "diffusers",
10
+ "MatrixGame3WanModel"
11
+ ],
12
+ "vae": [
13
+ "diffusers",
14
+ "AutoencoderKLWan"
15
+ ],
16
+ "text_encoder": [
17
+ "transformers",
18
+ "UMT5EncoderModel"
19
+ ],
20
+ "tokenizer": [
21
+ "transformers",
22
+ "T5TokenizerFast"
23
+ ],
24
+ "light_vae": [
25
+ "diffusers",
26
+ "AutoencoderKLWan"
27
+ ]
28
+ }
transformer/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "MatrixGame3WanModel",
3
+ "patch_size": [
4
+ 1,
5
+ 2,
6
+ 2
7
+ ],
8
+ "in_channels": 48,
9
+ "out_channels": 48,
10
+ "num_attention_heads": 24,
11
+ "attention_head_dim": 128,
12
+ "ffn_dim": 14336,
13
+ "num_layers": 30,
14
+ "freq_dim": 256,
15
+ "eps": 1e-06,
16
+ "qk_norm": "rms_norm_across_heads",
17
+ "cross_attn_norm": true,
18
+ "text_len": 512,
19
+ "text_dim": 4096,
20
+ "image_dim": 0,
21
+ "use_text_crossattn": true,
22
+ "use_memory": true,
23
+ "sigma_theta": 0.8,
24
+ "camera_embed_in_channels": 1536,
25
+ "action_config": {
26
+ "blocks": [
27
+ 0,
28
+ 1,
29
+ 2,
30
+ 3,
31
+ 4,
32
+ 5,
33
+ 6,
34
+ 7,
35
+ 8,
36
+ 9,
37
+ 10,
38
+ 11,
39
+ 12,
40
+ 13,
41
+ 14
42
+ ],
43
+ "enable_keyboard": true,
44
+ "enable_mouse": true,
45
+ "heads_num": 16,
46
+ "hidden_size": 128,
47
+ "img_hidden_size": 3072,
48
+ "keyboard_dim_in": 6,
49
+ "keyboard_hidden_dim": 1024,
50
+ "mouse_dim_in": 2,
51
+ "mouse_hidden_dim": 1024,
52
+ "mouse_qk_dim_list": [
53
+ 8,
54
+ 28,
55
+ 28
56
+ ],
57
+ "patch_size": [
58
+ 1,
59
+ 2,
60
+ 2
61
+ ],
62
+ "qk_norm": true,
63
+ "qkv_bias": false,
64
+ "rope_dim_list": [
65
+ 8,
66
+ 28,
67
+ 28
68
+ ],
69
+ "rope_theta": 256,
70
+ "vae_time_compression_ratio": 4,
71
+ "windows_size": 3
72
+ }
73
+ }
transformer/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ca38c750b5464253f8a5ee86ed78d2d9e5d7837c89bbaef1400019ae19f0d5
3
+ size 12939976240