Timsty
/

cross13tasks

Model card | Files and versions

Timsty committed 11 days ago

Commit

f8880d9

·

verified ·

1 Parent(s): ce452c8

Delete config.yaml

Files changed (1) hide show

config.yaml +0 -104

config.yaml DELETED Viewed

@@ -1,104 +0,0 @@
-run_id: 0418_QwenLatent_13tasks_actionstate_30k
-run_root_dir: ./runs
-seed: 42
-trackers:
-- jsonl
-- wandb
-wandb_entity: timsty
-wandb_project: vla_jepa
-is_debug: false
-framework:
-  name: QwenLatent
-  qwenvl:
-    base_vlm: /mnt/data/fangyu/model/Qwen/Qwen3-VL-2B-Instruct
-    attn_implementation: flash_attention_2
-    vl_hidden_dim: 2048
-    num_data_tokens: 32
-  action_model:
-    ckpt_path: /mnt/data/fangyu/code/reward_new/runs/0418_Action_13tasks_actionstate_fixchunk15/final_model/pytorch_model.pt
-    action_size: 37
-    state_size: 74
-    use_state: ${datasets.vla_data.state_use_action_chunk}
-    hidden_size: 1024
-    intermediate_size: 3072
-    dataset_vocab_size: 256
-    num_data_tokens: 32
-    num_t_samples: 4
-    min_action_len: 5
-    num_encoder_layers: 28
-    num_decoder_layers: 28
-    num_attention_heads: 16
-    num_key_value_heads: 8
-    head_dim: 128
-    max_position_embeddings: 2048
-    max_action_chunk_size: 50
-    rms_norm_eps: 1.0e-06
-    attention_dropout: 0.0
-    use_vae_reparameterization: false
-    use_ema: false
-    chunk_size: ${datasets.vla_data.chunk_size}
-    loss_mode: full
-    qwen3_pretrained_name_or_path: /mnt/data/fangyu/model/Qwen/Qwen3-0.6B
-datasets:
-  vla_data:
-    dataset_py: lerobot_datasets
-    data_root_dir: /mnt/data/fangyu/dataset/IPEC-COMMUNITY
-    data_mix: cross_embodiedment_13tasks
-    CoT_prompt: 'Task: {instruction}. What are the next 15 actions to take?'
-    default_image_resolution:
-    - 3
-    - 224
-    - 224
-    per_device_batch_size: 32
-    load_all_data_for_training: true
-    obs:
-    - image_0
-    image_size:
-    - 224
-    - 224
-    video_backend: torchcodec
-    load_video: true
-    chunk_size: 15
-    state_use_action_chunk: true
-    num_history_steps: 0
-    include_state: ${datasets.vla_data.state_use_action_chunk}
-trainer:
-  epochs: 100
-  max_train_steps: 50000
-  num_warmup_steps: 5000
-  num_stable_steps: 0
-  mode: decay_aux_loss
-  loss_weights_decay_steps: 5000
-  save_interval: 5000
-  eval_interval: 50
-  max_checkpoints_to_keep: 20
-  learning_rate:
-    base: 2.5e-05
-    qwen_vl_interface: 2.5e-05
-    action_model: 2.5e-05
-  lr_scheduler_type: warmup_stable_cosine
-  scheduler_specific_kwargs:
-    min_lr_ratio: 0.001
-  freeze_modules: ''
-  loss_scale:
-    align_loss: 1.0
-    recon_loss: 1.0
-    predict_loss: 1.0
-  warmup_ratio: 0.1
-  weight_decay: 0.0
-  logging_frequency: 10
-  gradient_clipping: 5.0
-  gradient_accumulation_steps: 1
-  optimizer:
-    name: AdamW
-    betas:
-    - 0.9
-    - 0.95
-    eps: 1.0e-08
-    weight_decay: 1.0e-08
-  is_resume: false
-  resume_epoch: null
-  resume_step: null
-  enable_gradient_checkpointing: true
-  enable_mixed_precision_training: true
-output_dir: ./runs/0418_QwenLatent_13tasks_actionstate_30k