| { |
| "_attn_implementation_autoset": true, |
| "auto_map": { |
| "AutoModel": "huggingface_mae.MAEModel", |
| "AutoConfig": "huggingface_mae.MAEConfig" |
| }, |
| "apply_loss_unmasked": false, |
| "architectures": [ |
| "MAEModel" |
| ], |
| "crop_size": -1, |
| "decoder": { |
| "_target_": "mae_modules.CAMAEDecoder", |
| "depth": 8, |
| "embed_dim": 512, |
| "mlp_ratio": 4, |
| "norm_layer": { |
| "_partial_": true, |
| "_target_": "torch.nn.LayerNorm", |
| "eps": 1e-06 |
| }, |
| "num_heads": 16, |
| "num_modalities": 6, |
| "qkv_bias": true, |
| "tokens_per_modality": 256 |
| }, |
| "encoder": { |
| "_target_": "mae_modules.MAEEncoder", |
| "channel_agnostic": true, |
| "max_in_chans": 11, |
| "vit_backbone": { |
| "_target_": "vit.sincos_positional_encoding_vit", |
| "vit_backbone": { |
| "_target_": "vit.vit_small_patch16_256", |
| "global_pool": "avg" |
| } |
| } |
| }, |
| "fourier_loss": { |
| "_target_": "loss.FourierLoss", |
| "num_multimodal_modalities": 6 |
| }, |
| "fourier_loss_weight": 0.0, |
| "input_norm": { |
| "_args_": [ |
| { |
| "_target_": "normalizer.Normalizer" |
| }, |
| { |
| "_target_": "torch.nn.InstanceNorm2d", |
| "affine": false, |
| "num_features": null, |
| "track_running_stats": false |
| } |
| ], |
| "_target_": "torch.nn.Sequential" |
| }, |
| "layernorm_unfreeze": true, |
| "loss": { |
| "_target_": "torch.nn.MSELoss", |
| "reduction": "none" |
| }, |
| "lr_scheduler": { |
| "_partial_": true, |
| "_target_": "torch.optim.lr_scheduler.OneCycleLR", |
| "anneal_strategy": "cos", |
| "max_lr": 0.0001, |
| "pct_start": 0.1 |
| }, |
| "mask_fourier_loss": true, |
| "mask_ratio": 0.0, |
| "model_type": "MAE", |
| "norm_pix_loss": false, |
| "num_blocks_to_freeze": 0, |
| "optimizer": { |
| "_partial_": true, |
| "_target_": "timm.optim.lion.Lion", |
| "betas": [ |
| 0.9, |
| 0.95 |
| ], |
| "lr": 0.0001, |
| "weight_decay": 0.05 |
| }, |
| "torch_dtype": "float32", |
| "transformers_version": "4.46.1", |
| "trim_encoder_blocks": null, |
| "use_MAE_weight_init": false |
| } |
|
|