| { | |
| "architecture": "IgorModel", | |
| "description": "", | |
| "version": 0, | |
| "config": { | |
| "resolution": 224, | |
| "patch_size": 14, | |
| "in_channels": 3, | |
| "d_t": 8, | |
| "augment_type": "resize_crop", | |
| "augment_level": "clip", | |
| "random_crop_scale": [ | |
| 0.8, | |
| 1.0 | |
| ], | |
| "random_crop_ratio": [ | |
| 0.9, | |
| 1.1 | |
| ], | |
| "mlp_ratio": 4.0, | |
| "use_xformers": null, | |
| "encoder_depth": 12, | |
| "encoder_embed_dim": 768, | |
| "encoder_n_heads": 12, | |
| "action_latent_dim": 32, | |
| "st_use_qk_norm": true, | |
| "num_learned_tokens": 2, | |
| "map_heads": 24, | |
| "decoder_depth": 12, | |
| "decoder_embed_dim": 768, | |
| "decoder_n_heads": 12, | |
| "use_qk_norm": true, | |
| "n_codes": 32, | |
| "grid_size": 16, | |
| "embed_tokens": 256 | |
| } | |
| } |