reza-alipour committed on
Commit
48f31c9
Parent: 3c12aea

Upload folder using huggingface_hub

Files changed (37)
  1. checkpoint-16000/ema_model/config.json +39 -0
  2. checkpoint-16000/ema_model/pytorch_model.bin +3 -0
  3. checkpoint-16000/metadata.json +1 -0
  4. checkpoint-16000/optimizer.bin +3 -0
  5. checkpoint-16000/pytorch_model.bin +3 -0
  6. checkpoint-16000/random_states_0.pkl +3 -0
  7. checkpoint-16000/scheduler.bin +3 -0
  8. checkpoint-16000/unwrapped_model/config.json +32 -0
  9. checkpoint-16000/unwrapped_model/pytorch_model.bin +3 -0
  10. checkpoint-17000/ema_model/config.json +39 -0
  11. checkpoint-17000/ema_model/pytorch_model.bin +3 -0
  12. checkpoint-17000/metadata.json +1 -0
  13. checkpoint-17000/optimizer.bin +3 -0
  14. checkpoint-17000/pytorch_model.bin +3 -0
  15. checkpoint-17000/random_states_0.pkl +3 -0
  16. checkpoint-17000/scheduler.bin +3 -0
  17. checkpoint-17000/unwrapped_model/config.json +32 -0
  18. checkpoint-17000/unwrapped_model/pytorch_model.bin +3 -0
  19. checkpoint-18000/ema_model/config.json +39 -0
  20. checkpoint-18000/ema_model/pytorch_model.bin +3 -0
  21. checkpoint-18000/metadata.json +1 -0
  22. checkpoint-18000/optimizer.bin +3 -0
  23. checkpoint-18000/pytorch_model.bin +3 -0
  24. checkpoint-18000/random_states_0.pkl +3 -0
  25. checkpoint-18000/scheduler.bin +3 -0
  26. checkpoint-18000/unwrapped_model/config.json +32 -0
  27. checkpoint-18000/unwrapped_model/pytorch_model.bin +3 -0
  28. checkpoint-19000/ema_model/config.json +39 -0
  29. checkpoint-19000/ema_model/pytorch_model.bin +3 -0
  30. checkpoint-19000/metadata.json +1 -0
  31. checkpoint-19000/optimizer.bin +3 -0
  32. checkpoint-19000/pytorch_model.bin +3 -0
  33. checkpoint-19000/random_states_0.pkl +3 -0
  34. checkpoint-19000/scheduler.bin +3 -0
  35. checkpoint-19000/unwrapped_model/config.json +32 -0
  36. checkpoint-19000/unwrapped_model/pytorch_model.bin +3 -0
  37. config.yaml +104 -0
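
These files can be mirrored locally with huggingface_hub, matching the commit message above. A minimal sketch; "<user>/<repo>" is a placeholder for this repository's actual id:

# Sketch: download one checkpoint folder plus the training config.
# repo_id is a placeholder -- substitute the real repository id.
from huggingface_hub import snapshot_download

local_dir = snapshot_download(
    repo_id="<user>/<repo>",
    allow_patterns=["checkpoint-19000/*", "config.yaml"],
)
print(local_dir)  # root of the downloaded snapshot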
checkpoint-16000/ema_model/config.json ADDED
@@ -0,0 +1,39 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "decay": 0.9999,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "inv_gamma": 1.0,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "min_decay": 0.0,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "optimization_step": 16000,
+ "power": 0.6666666666666666,
+ "update_after_step": 0,
+ "use_bias": false,
+ "use_ema_warmup": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
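
Relative to unwrapped_model/config.json below, this EMA config adds the averaging hyperparameters (decay, min_decay, inv_gamma, power, update_after_step, use_ema_warmup) and records the optimization_step reached. A minimal sketch of the effective decay these values imply, assuming the schedule follows the diffusers-style EMAModel.get_decay logic (an assumption, not confirmed by this commit):

# Sketch of the EMA decay schedule implied by the config above.
def effective_decay(optimization_step, decay=0.9999, min_decay=0.0,
                    inv_gamma=1.0, power=2 / 3,
                    update_after_step=0, use_ema_warmup=False):
    step = max(0, optimization_step - update_after_step - 1)
    if step <= 0:
        return 0.0  # no averaging before the first update
    if use_ema_warmup:
        value = 1 - (1 + step / inv_gamma) ** -power  # unused here (warmup off)
    else:
        value = (1 + step) / (10 + step)
    return max(min(value, decay), min_decay)

print(effective_decay(16000))  # ~0.99944, still below the 0.9999 cap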
checkpoint-16000/ema_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f9442c377fd7f403432cf274e442ebbf9cd5a9d77039ef1ad553b705fa7fb0d5
+ size 2433247453
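
This entry, like the other .bin/.pkl files in the commit, is a Git LFS pointer: the repository stores only the spec version, the sha256 oid, and the byte size, while the payload lives in LFS storage. A minimal integrity check of a downloaded file against its pointer:

# Sketch: verify a downloaded weight file against the pointer's sha256 oid.
import hashlib

def sha256_of(path, chunk_size=1 << 20):
    digest = hashlib.sha256()
    with open(path, "rb") as f:
        while block := f.read(chunk_size):
            digest.update(block)
    return digest.hexdigest()

expected = "f9442c377fd7f403432cf274e442ebbf9cd5a9d77039ef1ad553b705fa7fb0d5"
assert sha256_of("checkpoint-16000/ema_model/pytorch_model.bin") == expected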
checkpoint-16000/metadata.json ADDED
@@ -0,0 +1 @@
+ {"global_step": 16000}
checkpoint-16000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:fac61908bf95a9fbb0fce9a67f1651fc15bb7d6a882a21671405345db656b0e7
+ size 4866486533
checkpoint-16000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:824b778a4bfa117fcaeea2bbe95593d11853f871f7e0e398c8031c5483cc0715
+ size 2433254429
checkpoint-16000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ccae0f99cb4b7afd849d0f2cf73f7f72e68a7b0e26a839bdfbdaaec351fb1a6d
+ size 14663
checkpoint-16000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:61e7811b299e3751399e44fb63e5aa649eda39379a7c5656abcb05e077fa23de
+ size 627
checkpoint-16000/unwrapped_model/config.json ADDED
@@ -0,0 +1,32 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "use_bias": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
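
The unwrapped_model config drops the EMA bookkeeping keys and describes the raw transformer. A sketch of instantiating it, assuming the open-muse package exposes MaskGiTUViT_v2 with a diffusers-style from_pretrained (the import path is an assumption, not confirmed by this commit):

# Sketch: load the non-EMA transformer from this checkpoint folder.
# Assumes open-muse provides MaskGiTUViT_v2.from_pretrained.
from muse import MaskGiTUViT_v2

model = MaskGiTUViT_v2.from_pretrained("checkpoint-16000/unwrapped_model")
print(sum(p.numel() for p in model.parameters()))  # parameter count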
checkpoint-16000/unwrapped_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:824b778a4bfa117fcaeea2bbe95593d11853f871f7e0e398c8031c5483cc0715
+ size 2433254429
checkpoint-17000/ema_model/config.json ADDED
@@ -0,0 +1,39 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "decay": 0.9999,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "inv_gamma": 1.0,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "min_decay": 0.0,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "optimization_step": 17000,
+ "power": 0.6666666666666666,
+ "update_after_step": 0,
+ "use_bias": false,
+ "use_ema_warmup": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-17000/ema_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:c49970ad1419ceb322abcbf1a9c4a688f01fdf1c372b5dc2c45b83a1d7cd3907
+ size 2433247453
checkpoint-17000/metadata.json ADDED
@@ -0,0 +1 @@
+ {"global_step": 17000}
checkpoint-17000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:d06214b9da04bb3402f04a05ff7bf28e679ea568efc8840137895b6ae948f63e
+ size 4866486533
checkpoint-17000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0711d3091631d614ecd49ec7267fa3aecbcd63fa173ba630069d5e2114791f21
+ size 2433254429
checkpoint-17000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8429c96e11c465ee4ac12c19a4d6c2d5df410c4f011c47c22476bc5ea55555eb
+ size 14663
checkpoint-17000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:927cb1e3c51f59387f003f7128d398b83c764d5386962b2ff194e10e35375b8a
+ size 627
checkpoint-17000/unwrapped_model/config.json ADDED
@@ -0,0 +1,32 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "use_bias": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-17000/unwrapped_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0711d3091631d614ecd49ec7267fa3aecbcd63fa173ba630069d5e2114791f21
+ size 2433254429
checkpoint-18000/ema_model/config.json ADDED
@@ -0,0 +1,39 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "decay": 0.9999,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "inv_gamma": 1.0,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "min_decay": 0.0,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "optimization_step": 18000,
+ "power": 0.6666666666666666,
+ "update_after_step": 0,
+ "use_bias": false,
+ "use_ema_warmup": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-18000/ema_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:3dc543cf2ac968d4002802669098abb4a1c4e97505e61b99088fbf81ab9b477c
+ size 2433247453
checkpoint-18000/metadata.json ADDED
@@ -0,0 +1 @@
+ {"global_step": 18000}
checkpoint-18000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:cb5734aaeee42598b647908b68220386aa0c8a5ec66f343734919bc1ab127d13
+ size 4866486533
checkpoint-18000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8f8794e5fb15d54d66180b19be7dd4c6c9e93f738f37c250a3f414283ac62ae2
+ size 2433254429
checkpoint-18000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:da53af8ef43be89c1c05c1dbb3366f3db6e11d359c79936788812e16c618f801
+ size 14599
checkpoint-18000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:106c03c9203bf87eacbb68b21e440e6322338d101f1083b7c57a201947e76bcd
+ size 627
checkpoint-18000/unwrapped_model/config.json ADDED
@@ -0,0 +1,32 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "use_bias": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-18000/unwrapped_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:8f8794e5fb15d54d66180b19be7dd4c6c9e93f738f37c250a3f414283ac62ae2
+ size 2433254429
checkpoint-19000/ema_model/config.json ADDED
@@ -0,0 +1,39 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "decay": 0.9999,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "inv_gamma": 1.0,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "min_decay": 0.0,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "optimization_step": 19000,
+ "power": 0.6666666666666666,
+ "update_after_step": 0,
+ "use_bias": false,
+ "use_ema_warmup": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-19000/ema_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:fd1c2c51f3326fe29e5b1c6ff228b3953e7db3853b417ba72acc0ed21d0b70a4
+ size 2433247453
checkpoint-19000/metadata.json ADDED
@@ -0,0 +1 @@
+ {"global_step": 19000}
checkpoint-19000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ee1dd5b0fdb53b14c9e5fea404b8747d2b9be4834822e6fcf5c45de0837f3ae1
+ size 4866486533
checkpoint-19000/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:6fff2ba7f92d6ebfd7f8e9321c3a9c884cf37e634fc46e90f8ab42636d211bb4
+ size 2433254429
checkpoint-19000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:bc79935ca199f1c08e936bdcece8113d5133a45e7416fed4eb90961d2bf14a92
+ size 14663
checkpoint-19000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:01f80899eef09d4382fd001aa8e09cb281ec6d0a2f35143b7d598b51ceb1d5c5
+ size 627
checkpoint-19000/unwrapped_model/config.json ADDED
@@ -0,0 +1,32 @@
+ {
+ "_class_name": "MaskGiTUViT_v2",
+ "_version": "0.0.1",
+ "add_cond_embeds": true,
+ "add_micro_cond_embeds": true,
+ "attention_dropout": 0.0,
+ "block_num_heads": 12,
+ "block_out_channels": [
+ 768
+ ],
+ "codebook_size": 8192,
+ "cond_embed_dim": 768,
+ "encoder_hidden_size": 768,
+ "force_down_up_sample": true,
+ "hidden_dropout": 0.0,
+ "hidden_size": 1024,
+ "in_channels": 768,
+ "intermediate_size": 2816,
+ "layer_norm_eps": 1e-06,
+ "ln_elementwise_affine": true,
+ "mask_token_id": 8255,
+ "micro_cond_embed_dim": 1280,
+ "micro_cond_encode_dim": 256,
+ "norm_type": "rmsnorm",
+ "num_attention_heads": 16,
+ "num_hidden_layers": 22,
+ "num_res_blocks": 3,
+ "use_bias": false,
+ "use_fused_mlp": false,
+ "use_fused_residual_norm": false,
+ "vocab_size": 8256
+ }
checkpoint-19000/unwrapped_model/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:6fff2ba7f92d6ebfd7f8e9321c3a9c884cf37e634fc46e90f8ab42636d211bb4
+ size 2433254429
config.yaml ADDED
@@ -0,0 +1,104 @@
+ wandb:
+ entity: r-ap
+ run_id: xvom3pxa
+ experiment:
+ name: muse-multi
+ project: muse-prod
+ output_dir: output/
+ max_train_examples: 28500
+ max_eval_examples: 1000
+ save_every: 1000
+ eval_every: 700
+ generate_every: 200
+ log_every: 50
+ log_grad_norm_every: 100000000
+ resume_from_checkpoint: latest
+ resume_lr_scheduler: true
+ checkpoints_total_limit: 4
+ logging_dir: output/logs
+ model:
+ vq_model:
+ type: vqgan
+ text_encoder:
+ type: clip
+ pretrained: openMUSE/clip-vit-large-patch14-text-enc
+ transformer:
+ vocab_size: 8256
+ hidden_size: 1024
+ intermediate_size: 2816
+ num_hidden_layers: 22
+ num_attention_heads: 16
+ in_channels: 768
+ block_out_channels:
+ - 768
+ block_has_attention:
+ - true
+ block_num_heads: 12
+ num_res_blocks: 3
+ res_ffn_factor: 4
+ patch_size: 1
+ encoder_hidden_size: 768
+ add_cross_attention: true
+ project_encoder_hidden_states: true
+ codebook_size: 8192
+ num_vq_tokens: 256
+ initializer_range: 0.02
+ norm_type: rmsnorm
+ layer_norm_eps: 1.0e-06
+ ln_elementwise_affine: true
+ use_encoder_layernorm: false
+ use_bias: false
+ hidden_dropout: 0.0
+ attention_dropout: 0.0
+ use_codebook_size_for_output: true
+ use_empty_embeds_for_uncond: true
+ add_cond_embeds: true
+ cond_embed_dim: 768
+ add_micro_cond_embeds: true
+ micro_cond_encode_dim: 256
+ micro_cond_embed_dim: 1280
+ force_down_up_sample: true
+ architecture: uvit
+ enable_xformers_memory_efficient_attention: true
+ dataset:
+ preprocessing:
+ max_seq_length: 77
+ resolution: 256
+ optimizer:
+ name: adamw
+ params:
+ learning_rate: 0.0001
+ scale_lr: false
+ beta1: 0.9
+ beta2: 0.999
+ weight_decay: 0.01
+ epsilon: 1.0e-08
+ lr_scheduler:
+ scheduler: constant_with_warmup
+ params:
+ learning_rate: ${optimizer.params.learning_rate}
+ warmup_steps: 100
+ training:
+ gradient_accumulation_steps: 1
+ batch_size: 20
+ mixed_precision: 'no'
+ enable_tf32: true
+ use_ema: true
+ ema_decay: 0.9999
+ ema_update_after_step: 0
+ ema_update_every: 1
+ seed: 13399
+ max_train_steps: 20000
+ overfit_one_batch: false
+ cond_dropout_prob: 0.1
+ min_masking_rate: 0.0
+ label_smoothing: 0.1
+ max_grad_norm: null
+ guidance_scale: 8
+ generation_timesteps: 16
+ use_soft_code_target: false
+ use_stochastic_code: false
+ soft_code_temp: 1.0
+ mask_schedule: cosine
+ mask_contiguous_region_prob: 0.15
+ config: configs/segmentation.yaml
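
The ${optimizer.params.learning_rate} entry is OmegaConf interpolation syntax, so the file is most naturally loaded with OmegaConf, which resolves the reference on access. A minimal sketch:

# Sketch: load the training config and let OmegaConf resolve interpolations.
from omegaconf import OmegaConf

cfg = OmegaConf.load("config.yaml")
assert cfg.lr_scheduler.params.learning_rate == cfg.optimizer.params.learning_rate
print(cfg.training.batch_size, cfg.training.max_train_steps)  # 20 20000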