{
  "_class_name": "MaskGiTUViT",
  "_version": "0.0.1",
  "add_cross_attention": true,
  "attention_dropout": 0.0,
  "block_out_channels": [
    512,
    1024
  ],
  "codebook_size": 8192,
  "encoder_hidden_size": 768,
  "hidden_dropout": 0.0,
  "hidden_size": 1024,
  "in_channels": 384,
  "initializer_range": 0.02,
  "intermediate_size": 4096,
  "layer_norm_eps": 0.000001,
  "mask_token_id": 8255,
  "max_position_embeddings": 256,
  "norm_type": "rmsnorm",
  "num_attention_heads": 16,
  "num_classes": null,
  "num_hidden_layers": 22,
  "num_res_blocks": 3,
  "num_vq_tokens": 1024,
  "patch_size": 1,
  "project_encoder_hidden_states": false,
  "use_bias": false,
  "use_codebook_size_for_output": true,
  "use_encoder_layernorm": true,
  "use_normformer": false,
  "use_position_embeddings": false,
  "vocab_size": 8256
}