joon-stack commited on
Commit
bfceca3
·
verified ·
1 Parent(s): 107c5fb

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ wandb/run-20260325_200057-qudlwnz5/run-qudlwnz5.wandb filter=lfs diff=lfs merge=lfs -text
.hydra/config.yaml ADDED
@@ -0,0 +1,327 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ name: libero_cosmos_policy
3
+ type: mg
4
+ backend: robomimic
5
+ paths: []
6
+ task_suite_name: null
7
+ observations_keys:
8
+ - image
9
+ observation_source_keys:
10
+ image: agentview_rgb_jpeg
11
+ action_dim: 7
12
+ frame_stack: 1
13
+ horizon: 1
14
+ temporal_index_mode: clip
15
+ use_proprio: false
16
+ proprio_source: robot_states
17
+ image_chw:
18
+ - 3
19
+ - 224
20
+ - 224
21
+ image_value_range: zero_to_one
22
+ image_transport_dtype: uint8
23
+ duration_focus: null
24
+ hf:
25
+ repo_id: nvidia/LIBERO-Cosmos-Policy
26
+ repo_type: dataset
27
+ allow_patterns:
28
+ - success_only/*_regen/*.hdf5
29
+ local_files_only: false
30
+ train:
31
+ optimizer:
32
+ type: adamw
33
+ lr: 0.0001
34
+ weight_decay: 1.0e-06
35
+ batch_size: 256
36
+ num_workers: 4
37
+ prefetch_factor: null
38
+ log_interval: 100
39
+ total_steps: 5000
40
+ eval_interval: 500
41
+ use_aug: true
42
+ aug_mode: default
43
+ use_amp: true
44
+ device_transfer_non_blocking: true
45
+ seed: 42
46
+ scheduler:
47
+ type: cosine
48
+ warmup_steps: 500
49
+ num_cycles: 0.5
50
+ min_lr_scale: 0.0
51
+ decoder_dataloader:
52
+ enabled: false
53
+ batch_size: 64
54
+ num_workers: 4
55
+ prefetch_factor: null
56
+ shuffle: true
57
+ stages:
58
+ stage1: true
59
+ stage2: false
60
+ stage3: false
61
+ stage1:
62
+ batch_size: 256
63
+ num_workers: 16
64
+ prefetch_factor: 2
65
+ log_interval: 100
66
+ total_steps: 20000
67
+ eval_interval: 500
68
+ optimizer:
69
+ lr: 0.0001
70
+ weight_decay: 1.0e-06
71
+ stage2:
72
+ batch_size: 256
73
+ num_workers: 4
74
+ prefetch_factor: null
75
+ log_interval: 100
76
+ total_steps: 5000
77
+ eval_interval: 500
78
+ latent_target: auto
79
+ optimizer:
80
+ lr: 0.0001
81
+ weight_decay: 1.0e-06
82
+ action_probe:
83
+ enabled: true
84
+ stage3:
85
+ batch_size: 256
86
+ num_workers: 4
87
+ prefetch_factor: null
88
+ log_interval: 100
89
+ total_steps: 5000
90
+ eval_interval: 500
91
+ final_eval_num_episodes: 100
92
+ log_eval_video: false
93
+ optimizer:
94
+ lr: 0.0001
95
+ weight_decay: 1.0e-06
96
+ trainable_scope: all
97
+ non_decoder_lr_scale: 1.0
98
+ checkpoint:
99
+ enabled: true
100
+ base_dir: null
101
+ save_interval: 1000
102
+ save_last: true
103
+ latest_only: true
104
+ load:
105
+ stage1:
106
+ mode: none
107
+ path: null
108
+ stage2:
109
+ mode: handoff
110
+ path: null
111
+ teacher_path: null
112
+ stage3:
113
+ mode: handoff
114
+ path: null
115
+ model:
116
+ idm:
117
+ type: token_idm
118
+ action_dim: 128
119
+ token_dim: 768
120
+ model_dim: 512
121
+ latent_dim: 32
122
+ num_action_tokens: 4
123
+ num_blocks: 4
124
+ num_heads: 8
125
+ dropout: 0.0
126
+ fdm:
127
+ type: token_fdm_duration
128
+ action_dim: 128
129
+ token_dim: 768
130
+ model_dim: 512
131
+ num_action_tokens: 4
132
+ num_blocks: 4
133
+ num_heads: 8
134
+ dropout: 0.0
135
+ hyperbolic_latent:
136
+ enabled: false
137
+ backend: geoopt
138
+ manifold: poincare
139
+ curvature: 1.0
140
+ learnable_curvature: false
141
+ fdm_input_mode: logmap0
142
+ prelift_mode: none
143
+ prelift_scale: 1.0
144
+ lift_max_norm: 5.0
145
+ tangent_max_norm: 5.0
146
+ eps: 1.0e-06
147
+ encoders:
148
+ type: dino
149
+ image_key: image
150
+ model_id: facebook/dinov2-base
151
+ input_value_range: zero_to_one
152
+ freeze_backbone: true
153
+ drop_cls_token: true
154
+ output_dim: 768
155
+ mean:
156
+ - 0.485
157
+ - 0.456
158
+ - 0.406
159
+ std:
160
+ - 0.229
161
+ - 0.224
162
+ - 0.225
163
+ type: dino_lam
164
+ idm_input: future
165
+ fdm_target: future
166
+ pixel_decoders: null
167
+ latent_action_decoders: null
168
+ objective:
169
+ fdm_target: future
170
+ idm_input: future
171
+ stage_overrides: {}
172
+ multiscale:
173
+ enabled: true
174
+ consistency:
175
+ enabled: false
176
+ weight: 10.0
177
+ num_pairs: 4
178
+ sample_source: all_horizons
179
+ teacher_mode: direct_teacher
180
+ prediction_mode: direct_duration
181
+ allow_plain_fdm_oneshot: true
182
+ weight_mode: uniform
183
+ weights: {}
184
+ temporal:
185
+ max_offset: 20
186
+ anchor_mode: fixed
187
+ extra_random_count: 0
188
+ branch_order:
189
+ enabled: false
190
+ radial_weight: 0.0
191
+ local_radial_margin_weight: 0.0
192
+ local_radial_margin_alpha: 0.05
193
+ branch_weight: 0.0
194
+ z0_origin_weight: 0.0
195
+ prefix_weight: 0.0
196
+ radius_progress_weight: 1.0
197
+ radius_progress_mode: offset_margin
198
+ radius_progress_alpha: 0.02
199
+ branch_margin_deg: 10.0
200
+ eps: 1.0e-06
201
+ latent_plan:
202
+ enabled: false
203
+ total_horizon: 20
204
+ eval:
205
+ type: robomimic
206
+ data_path: ${data.paths}
207
+ reset_mode: env_reset
208
+ num_eval_episodes: 20
209
+ max_steps: 500
210
+ record_video: true
211
+ checkpoint_path: null
212
+ checkpoint_strict: true
213
+ use_checkpoint_cfg: true
214
+ video_output_path: null
215
+ obs_keys: null
216
+ use_proprio: null
217
+ use_object: false
218
+ resize_hw: null
219
+ image_value_range: null
220
+ seed: 0
221
+ agent:
222
+ encoders:
223
+ image:
224
+ in_channels: 3
225
+ output_dim: 512
226
+ output_mode: global
227
+ type: resnet18
228
+ pretrained: false
229
+ proprio:
230
+ input_dim: 9
231
+ hidden_dim: 128
232
+ output_dim: 64
233
+ type: group
234
+ modalities:
235
+ - agentview_image
236
+ - robot0_eye_in_hand_image
237
+ proj_dim: 128
238
+ policies:
239
+ decoder:
240
+ type: mlp
241
+ hidden_dims:
242
+ - 256
243
+ - 256
244
+ hidden_dims:
245
+ - 512
246
+ - 512
247
+ - 256
248
+ - 64
249
+ action_dim: 256
250
+ emb_dim: 384
251
+ gt_action_dim: 7
252
+ type: latent_action
253
+ probes:
254
+ enabled: true
255
+ every: 10
256
+ steps_per_call: 1
257
+ sequence:
258
+ enabled: true
259
+ horizons:
260
+ - 20
261
+ target_key: gt_action_seq_max
262
+ list:
263
+ z_to_s_t:
264
+ name: z_to_s_t
265
+ enabled: false
266
+ shuffle: true
267
+ type: regression
268
+ input: z_t
269
+ target: s_t
270
+ loss: mse
271
+ lr: 0.001
272
+ every: 10
273
+ mlp:
274
+ hidden_dims:
275
+ - 128
276
+ - 64
277
+ z_to_s_tp:
278
+ name: z_to_s_tp
279
+ enabled: false
280
+ shuffle: true
281
+ type: regression
282
+ input: z_t
283
+ target: s_tp
284
+ loss: mse
285
+ lr: 0.001
286
+ every: 10
287
+ mlp:
288
+ hidden_dims:
289
+ - 128
290
+ - 64
291
+ z_to_action_t:
292
+ name: z_to_action_t
293
+ probe_type: z_to_action
294
+ enabled: true
295
+ shuffle: true
296
+ type: regression
297
+ input: z_t
298
+ target: gt_action
299
+ loss: mse
300
+ lr: 0.001
301
+ every: 1
302
+ mlp:
303
+ hidden_dims:
304
+ - 128
305
+ - 64
306
+ z_to_action_seq_h20:
307
+ name: z_to_action_seq_h20
308
+ probe_type: z_to_action_sequence
309
+ enabled: true
310
+ shuffle: true
311
+ type: regression
312
+ input: z_t
313
+ target: gt_action_seq_max
314
+ sequence_horizon: 20
315
+ loss: mse
316
+ lr: 0.001
317
+ every: 10
318
+ mlp:
319
+ hidden_dims:
320
+ - 128
321
+ - 64
322
+ logger:
323
+ project: latent_action
324
+ run_name: latent_action_training
325
+ tags:
326
+ - debug
327
+ output_root: outputs/token_fdm_duration/dino_suite_all_k20_extra0
.hydra/hydra.yaml ADDED
@@ -0,0 +1,192 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ hydra:
2
+ run:
3
+ dir: ${output_root}/${data.name}/${now:%Y-%m-%d}/${now:%H-%M-%S}
4
+ sweep:
5
+ dir: ${output_root}/multirun/${data.name}/${now:%Y-%m-%d}/${now:%H-%M-%S}
6
+ subdir: ${hydra.job.num}
7
+ launcher:
8
+ _target_: hydra._internal.core_plugins.basic_launcher.BasicLauncher
9
+ sweeper:
10
+ _target_: hydra._internal.core_plugins.basic_sweeper.BasicSweeper
11
+ max_batch_size: null
12
+ params: null
13
+ help:
14
+ app_name: ${hydra.job.name}
15
+ header: '${hydra.help.app_name} is powered by Hydra.
16
+
17
+ '
18
+ footer: 'Powered by Hydra (https://hydra.cc)
19
+
20
+ Use --hydra-help to view Hydra specific help
21
+
22
+ '
23
+ template: '${hydra.help.header}
24
+
25
+ == Configuration groups ==
26
+
27
+ Compose your configuration from those groups (group=option)
28
+
29
+
30
+ $APP_CONFIG_GROUPS
31
+
32
+
33
+ == Config ==
34
+
35
+ Override anything in the config (foo.bar=value)
36
+
37
+
38
+ $CONFIG
39
+
40
+
41
+ ${hydra.help.footer}
42
+
43
+ '
44
+ hydra_help:
45
+ template: 'Hydra (${hydra.runtime.version})
46
+
47
+ See https://hydra.cc for more info.
48
+
49
+
50
+ == Flags ==
51
+
52
+ $FLAGS_HELP
53
+
54
+
55
+ == Configuration groups ==
56
+
57
+ Compose your configuration from those groups (For example, append hydra/job_logging=disabled
58
+ to command line)
59
+
60
+
61
+ $HYDRA_CONFIG_GROUPS
62
+
63
+
64
+ Use ''--cfg hydra'' to Show the Hydra config.
65
+
66
+ '
67
+ hydra_help: ???
68
+ hydra_logging:
69
+ version: 1
70
+ formatters:
71
+ simple:
72
+ format: '[%(asctime)s][HYDRA] %(message)s'
73
+ handlers:
74
+ console:
75
+ class: logging.StreamHandler
76
+ formatter: simple
77
+ stream: ext://sys.stdout
78
+ root:
79
+ level: INFO
80
+ handlers:
81
+ - console
82
+ loggers:
83
+ logging_example:
84
+ level: DEBUG
85
+ disable_existing_loggers: false
86
+ job_logging:
87
+ version: 1
88
+ formatters:
89
+ simple:
90
+ format: '[%(asctime)s][%(name)s][%(levelname)s] - %(message)s'
91
+ handlers:
92
+ console:
93
+ class: logging.StreamHandler
94
+ formatter: simple
95
+ stream: ext://sys.stdout
96
+ file:
97
+ class: logging.FileHandler
98
+ formatter: simple
99
+ filename: ${hydra.runtime.output_dir}/${hydra.job.name}.log
100
+ root:
101
+ level: INFO
102
+ handlers:
103
+ - console
104
+ - file
105
+ disable_existing_loggers: false
106
+ env: {}
107
+ mode: RUN
108
+ searchpath: []
109
+ callbacks: {}
110
+ output_subdir: .hydra
111
+ overrides:
112
+ hydra:
113
+ - hydra.mode=RUN
114
+ task:
115
+ - data=libero_cosmos_policy
116
+ - data.task_suite_name=null
117
+ - data.hf.allow_patterns=[success_only/*_regen/*.hdf5]
118
+ - data.image_chw=[3,224,224]
119
+ - data.temporal_index_mode=clip
120
+ - model.fdm.type=token_fdm_duration
121
+ - objective.idm_input=future
122
+ - objective.temporal.max_offset=20
123
+ - objective.temporal.anchor_mode=fixed
124
+ - objective.temporal.extra_random_count=0
125
+ - train.use_aug=true
126
+ - train.use_amp=true
127
+ - train.stage1.batch_size=256
128
+ - train.stage1.num_workers=16
129
+ - train.stage1.prefetch_factor=2
130
+ - train.stage1.total_steps=20000
131
+ - train.stage1.log_interval=100
132
+ - train.checkpoint.enabled=true
133
+ - train.checkpoint.save_interval=1000
134
+ - train.checkpoint.save_last=true
135
+ - train.checkpoint.latest_only=true
136
+ - output_root=outputs/token_fdm_duration/dino_suite_all_k20_extra0
137
+ job:
138
+ name: run
139
+ chdir: null
140
+ override_dirname: data.hf.allow_patterns=[success_only/*_regen/*.hdf5],data.image_chw=[3,224,224],data.task_suite_name=null,data.temporal_index_mode=clip,data=libero_cosmos_policy,model.fdm.type=token_fdm_duration,objective.idm_input=future,objective.temporal.anchor_mode=fixed,objective.temporal.extra_random_count=0,objective.temporal.max_offset=20,output_root=outputs/token_fdm_duration/dino_suite_all_k20_extra0,train.checkpoint.enabled=true,train.checkpoint.latest_only=true,train.checkpoint.save_interval=1000,train.checkpoint.save_last=true,train.stage1.batch_size=256,train.stage1.log_interval=100,train.stage1.num_workers=16,train.stage1.prefetch_factor=2,train.stage1.total_steps=20000,train.use_amp=true,train.use_aug=true
141
+ id: ???
142
+ num: ???
143
+ config_name: dino_lam
144
+ env_set: {}
145
+ env_copy: []
146
+ config:
147
+ override_dirname:
148
+ kv_sep: '='
149
+ item_sep: ','
150
+ exclude_keys: []
151
+ runtime:
152
+ version: 1.3.2
153
+ version_base: '1.1'
154
+ cwd: /home/jovyan/youngjoonjeong/latent_action
155
+ config_sources:
156
+ - path: hydra.conf
157
+ schema: pkg
158
+ provider: hydra
159
+ - path: /home/jovyan/youngjoonjeong/latent_action/configs
160
+ schema: file
161
+ provider: main
162
+ - path: ''
163
+ schema: structured
164
+ provider: schema
165
+ output_dir: /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52
166
+ choices:
167
+ logger: wandb
168
+ probes: action_t
169
+ agent: latent_action_agent
170
+ model/policies@agent.policies: latent_action
171
+ model/policies/decoder@agent.policies.decoder: mlp
172
+ model/encoders@agent.encoders: group_encoder
173
+ model/encoders/proprio@agent.encoders.proprio: mlp
174
+ model/encoders/image@agent.encoders.image: resnet18
175
+ eval: robomimic_eval
176
+ objective: multiscale
177
+ model: dino_lam
178
+ model/encoders: dino_encoder
179
+ model/hyperbolic_latent: base
180
+ train: latent_action_trainer
181
+ train/optimizer: adamw
182
+ data: libero_cosmos_policy
183
+ hydra/env: default
184
+ hydra/callbacks: null
185
+ hydra/job_logging: default
186
+ hydra/hydra_logging: default
187
+ hydra/hydra_help: default
188
+ hydra/help: default
189
+ hydra/sweeper: basic
190
+ hydra/launcher: basic
191
+ hydra/output: default
192
+ verbose: false
.hydra/overrides.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ - data=libero_cosmos_policy
2
+ - data.task_suite_name=null
3
+ - data.hf.allow_patterns=[success_only/*_regen/*.hdf5]
4
+ - data.image_chw=[3,224,224]
5
+ - data.temporal_index_mode=clip
6
+ - model.fdm.type=token_fdm_duration
7
+ - objective.idm_input=future
8
+ - objective.temporal.max_offset=20
9
+ - objective.temporal.anchor_mode=fixed
10
+ - objective.temporal.extra_random_count=0
11
+ - train.use_aug=true
12
+ - train.use_amp=true
13
+ - train.stage1.batch_size=256
14
+ - train.stage1.num_workers=16
15
+ - train.stage1.prefetch_factor=2
16
+ - train.stage1.total_steps=20000
17
+ - train.stage1.log_interval=100
18
+ - train.checkpoint.enabled=true
19
+ - train.checkpoint.save_interval=1000
20
+ - train.checkpoint.save_last=true
21
+ - train.checkpoint.latest_only=true
22
+ - output_root=outputs/token_fdm_duration/dino_suite_all_k20_extra0
config_resolved.yaml ADDED
@@ -0,0 +1,333 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ name: libero_cosmos_policy
3
+ type: mg
4
+ backend: robomimic
5
+ paths: []
6
+ task_suite_name: null
7
+ observations_keys:
8
+ - image
9
+ observation_source_keys:
10
+ image: agentview_rgb_jpeg
11
+ action_dim: 7
12
+ frame_stack: 1
13
+ horizon: 1
14
+ temporal_index_mode: clip
15
+ use_proprio: false
16
+ proprio_source: robot_states
17
+ image_chw:
18
+ - 3
19
+ - 224
20
+ - 224
21
+ image_value_range: zero_to_one
22
+ image_transport_dtype: uint8
23
+ duration_focus: null
24
+ hf:
25
+ repo_id: nvidia/LIBERO-Cosmos-Policy
26
+ repo_type: dataset
27
+ allow_patterns:
28
+ - success_only/*_regen/*.hdf5
29
+ local_files_only: false
30
+ action_sequence_targets:
31
+ enabled: true
32
+ horizons:
33
+ - 20
34
+ target_key: gt_action_seq_max
35
+ train:
36
+ optimizer:
37
+ type: adamw
38
+ lr: 0.0001
39
+ weight_decay: 1.0e-06
40
+ batch_size: 256
41
+ num_workers: 4
42
+ prefetch_factor: null
43
+ log_interval: 100
44
+ total_steps: 5000
45
+ eval_interval: 500
46
+ use_aug: true
47
+ aug_mode: default
48
+ use_amp: true
49
+ device_transfer_non_blocking: true
50
+ seed: 42
51
+ scheduler:
52
+ type: cosine
53
+ warmup_steps: 500
54
+ num_cycles: 0.5
55
+ min_lr_scale: 0.0
56
+ decoder_dataloader:
57
+ enabled: false
58
+ batch_size: 64
59
+ num_workers: 4
60
+ prefetch_factor: null
61
+ shuffle: true
62
+ stages:
63
+ stage1: true
64
+ stage2: false
65
+ stage3: false
66
+ stage1:
67
+ batch_size: 256
68
+ num_workers: 16
69
+ prefetch_factor: 2
70
+ log_interval: 100
71
+ total_steps: 20000
72
+ eval_interval: 500
73
+ optimizer:
74
+ lr: 0.0001
75
+ weight_decay: 1.0e-06
76
+ stage2:
77
+ batch_size: 256
78
+ num_workers: 4
79
+ prefetch_factor: null
80
+ log_interval: 100
81
+ total_steps: 5000
82
+ eval_interval: 500
83
+ latent_target: auto
84
+ optimizer:
85
+ lr: 0.0001
86
+ weight_decay: 1.0e-06
87
+ action_probe:
88
+ enabled: true
89
+ stage3:
90
+ batch_size: 256
91
+ num_workers: 4
92
+ prefetch_factor: null
93
+ log_interval: 100
94
+ total_steps: 5000
95
+ eval_interval: 500
96
+ final_eval_num_episodes: 100
97
+ log_eval_video: false
98
+ optimizer:
99
+ lr: 0.0001
100
+ weight_decay: 1.0e-06
101
+ trainable_scope: all
102
+ non_decoder_lr_scale: 1.0
103
+ checkpoint:
104
+ enabled: true
105
+ base_dir: null
106
+ save_interval: 1000
107
+ save_last: true
108
+ latest_only: true
109
+ load:
110
+ stage1:
111
+ mode: none
112
+ path: null
113
+ stage2:
114
+ mode: handoff
115
+ path: null
116
+ teacher_path: null
117
+ stage3:
118
+ mode: handoff
119
+ path: null
120
+ model:
121
+ idm:
122
+ type: token_idm
123
+ action_dim: 128
124
+ token_dim: 768
125
+ model_dim: 512
126
+ latent_dim: 32
127
+ num_action_tokens: 4
128
+ num_blocks: 4
129
+ num_heads: 8
130
+ dropout: 0.0
131
+ fdm:
132
+ type: token_fdm_duration
133
+ action_dim: 128
134
+ token_dim: 768
135
+ model_dim: 512
136
+ num_action_tokens: 4
137
+ num_blocks: 4
138
+ num_heads: 8
139
+ dropout: 0.0
140
+ hyperbolic_latent:
141
+ enabled: false
142
+ backend: geoopt
143
+ manifold: poincare
144
+ curvature: 1.0
145
+ learnable_curvature: false
146
+ fdm_input_mode: logmap0
147
+ prelift_mode: none
148
+ prelift_scale: 1.0
149
+ lift_max_norm: 5.0
150
+ tangent_max_norm: 5.0
151
+ eps: 1.0e-06
152
+ encoders:
153
+ type: dino
154
+ image_key: image
155
+ model_id: facebook/dinov2-base
156
+ input_value_range: zero_to_one
157
+ freeze_backbone: true
158
+ drop_cls_token: true
159
+ output_dim: 768
160
+ mean:
161
+ - 0.485
162
+ - 0.456
163
+ - 0.406
164
+ std:
165
+ - 0.229
166
+ - 0.224
167
+ - 0.225
168
+ type: dino_lam
169
+ idm_input: future
170
+ fdm_target: future
171
+ pixel_decoders: null
172
+ latent_action_decoders: null
173
+ objective:
174
+ fdm_target: future
175
+ idm_input: future
176
+ stage_overrides: {}
177
+ multiscale:
178
+ enabled: true
179
+ consistency:
180
+ enabled: false
181
+ weight: 10.0
182
+ num_pairs: 4
183
+ sample_source: all_horizons
184
+ teacher_mode: direct_teacher
185
+ prediction_mode: direct_duration
186
+ allow_plain_fdm_oneshot: true
187
+ weight_mode: uniform
188
+ weights: {}
189
+ temporal:
190
+ max_offset: 20
191
+ anchor_mode: fixed
192
+ extra_random_count: 0
193
+ branch_order:
194
+ enabled: false
195
+ radial_weight: 0.0
196
+ local_radial_margin_weight: 0.0
197
+ local_radial_margin_alpha: 0.05
198
+ branch_weight: 0.0
199
+ z0_origin_weight: 0.0
200
+ prefix_weight: 0.0
201
+ radius_progress_weight: 1.0
202
+ radius_progress_mode: offset_margin
203
+ radius_progress_alpha: 0.02
204
+ branch_margin_deg: 10.0
205
+ eps: 1.0e-06
206
+ latent_plan:
207
+ enabled: false
208
+ total_horizon: 20
209
+ eval:
210
+ type: robomimic
211
+ data_path: []
212
+ reset_mode: env_reset
213
+ num_eval_episodes: 20
214
+ max_steps: 500
215
+ record_video: true
216
+ checkpoint_path: null
217
+ checkpoint_strict: true
218
+ use_checkpoint_cfg: true
219
+ video_output_path: null
220
+ obs_keys: null
221
+ use_proprio: null
222
+ use_object: false
223
+ resize_hw: null
224
+ image_value_range: null
225
+ seed: 0
226
+ agent:
227
+ encoders:
228
+ image:
229
+ in_channels: 3
230
+ output_dim: 512
231
+ output_mode: global
232
+ type: resnet18
233
+ pretrained: false
234
+ proprio:
235
+ input_dim: 9
236
+ hidden_dim: 128
237
+ output_dim: 64
238
+ type: group
239
+ modalities:
240
+ - agentview_image
241
+ - robot0_eye_in_hand_image
242
+ proj_dim: 128
243
+ policies:
244
+ decoder:
245
+ type: mlp
246
+ hidden_dims:
247
+ - 256
248
+ - 256
249
+ hidden_dims:
250
+ - 512
251
+ - 512
252
+ - 256
253
+ - 64
254
+ action_dim: 256
255
+ emb_dim: 384
256
+ gt_action_dim: 7
257
+ type: latent_action
258
+ probes:
259
+ enabled: true
260
+ every: 10
261
+ steps_per_call: 1
262
+ sequence:
263
+ enabled: true
264
+ horizons:
265
+ - 20
266
+ target_key: gt_action_seq_max
267
+ list:
268
+ z_to_s_t:
269
+ name: z_to_s_t
270
+ enabled: false
271
+ shuffle: true
272
+ type: regression
273
+ input: z_t
274
+ target: s_t
275
+ loss: mse
276
+ lr: 0.001
277
+ every: 10
278
+ mlp:
279
+ hidden_dims:
280
+ - 128
281
+ - 64
282
+ z_to_s_tp:
283
+ name: z_to_s_tp
284
+ enabled: false
285
+ shuffle: true
286
+ type: regression
287
+ input: z_t
288
+ target: s_tp
289
+ loss: mse
290
+ lr: 0.001
291
+ every: 10
292
+ mlp:
293
+ hidden_dims:
294
+ - 128
295
+ - 64
296
+ z_to_action_t:
297
+ name: z_to_action_t
298
+ probe_type: z_to_action
299
+ enabled: true
300
+ shuffle: true
301
+ type: regression
302
+ input: z_t
303
+ target: gt_action
304
+ loss: mse
305
+ lr: 0.001
306
+ every: 1
307
+ mlp:
308
+ hidden_dims:
309
+ - 128
310
+ - 64
311
+ z_to_action_seq_h20:
312
+ name: z_to_action_seq_h20
313
+ probe_type: z_to_action_sequence
314
+ enabled: true
315
+ shuffle: true
316
+ type: regression
317
+ input: z_t
318
+ target: gt_action_seq_max
319
+ sequence_horizon: 20
320
+ loss: mse
321
+ lr: 0.001
322
+ every: 10
323
+ mlp:
324
+ hidden_dims:
325
+ - 128
326
+ - 64
327
+ output_dim: 140
328
+ logger:
329
+ project: latent_action
330
+ run_name: latent_action_training
331
+ tags:
332
+ - debug
333
+ output_root: outputs/token_fdm_duration/dino_suite_all_k20_extra0
git.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "branch": "integration/master-hyperbolic",
3
+ "captured_at": "2026-03-25T20:00:54.494786+00:00",
4
+ "commit": "84bdcca892435da456b8a676dae358493a0a6e59",
5
+ "dirty": false,
6
+ "repo_root": "/home/jovyan/youngjoonjeong/latent_action",
7
+ "short_commit": "84bdcca",
8
+ "status": []
9
+ }
hydra_resolved.yaml ADDED
@@ -0,0 +1,333 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ name: libero_cosmos_policy
3
+ type: mg
4
+ backend: robomimic
5
+ paths: []
6
+ task_suite_name: null
7
+ observations_keys:
8
+ - image
9
+ observation_source_keys:
10
+ image: agentview_rgb_jpeg
11
+ action_dim: 7
12
+ frame_stack: 1
13
+ horizon: 1
14
+ temporal_index_mode: clip
15
+ use_proprio: false
16
+ proprio_source: robot_states
17
+ image_chw:
18
+ - 3
19
+ - 224
20
+ - 224
21
+ image_value_range: zero_to_one
22
+ image_transport_dtype: uint8
23
+ duration_focus: null
24
+ hf:
25
+ repo_id: nvidia/LIBERO-Cosmos-Policy
26
+ repo_type: dataset
27
+ allow_patterns:
28
+ - success_only/*_regen/*.hdf5
29
+ local_files_only: false
30
+ action_sequence_targets:
31
+ enabled: true
32
+ horizons:
33
+ - 20
34
+ target_key: gt_action_seq_max
35
+ train:
36
+ optimizer:
37
+ type: adamw
38
+ lr: 0.0001
39
+ weight_decay: 1.0e-06
40
+ batch_size: 256
41
+ num_workers: 4
42
+ prefetch_factor: null
43
+ log_interval: 100
44
+ total_steps: 5000
45
+ eval_interval: 500
46
+ use_aug: true
47
+ aug_mode: default
48
+ use_amp: true
49
+ device_transfer_non_blocking: true
50
+ seed: 42
51
+ scheduler:
52
+ type: cosine
53
+ warmup_steps: 500
54
+ num_cycles: 0.5
55
+ min_lr_scale: 0.0
56
+ decoder_dataloader:
57
+ enabled: false
58
+ batch_size: 64
59
+ num_workers: 4
60
+ prefetch_factor: null
61
+ shuffle: true
62
+ stages:
63
+ stage1: true
64
+ stage2: false
65
+ stage3: false
66
+ stage1:
67
+ batch_size: 256
68
+ num_workers: 16
69
+ prefetch_factor: 2
70
+ log_interval: 100
71
+ total_steps: 20000
72
+ eval_interval: 500
73
+ optimizer:
74
+ lr: 0.0001
75
+ weight_decay: 1.0e-06
76
+ stage2:
77
+ batch_size: 256
78
+ num_workers: 4
79
+ prefetch_factor: null
80
+ log_interval: 100
81
+ total_steps: 5000
82
+ eval_interval: 500
83
+ latent_target: auto
84
+ optimizer:
85
+ lr: 0.0001
86
+ weight_decay: 1.0e-06
87
+ action_probe:
88
+ enabled: true
89
+ stage3:
90
+ batch_size: 256
91
+ num_workers: 4
92
+ prefetch_factor: null
93
+ log_interval: 100
94
+ total_steps: 5000
95
+ eval_interval: 500
96
+ final_eval_num_episodes: 100
97
+ log_eval_video: false
98
+ optimizer:
99
+ lr: 0.0001
100
+ weight_decay: 1.0e-06
101
+ trainable_scope: all
102
+ non_decoder_lr_scale: 1.0
103
+ checkpoint:
104
+ enabled: true
105
+ base_dir: null
106
+ save_interval: 1000
107
+ save_last: true
108
+ latest_only: true
109
+ load:
110
+ stage1:
111
+ mode: none
112
+ path: null
113
+ stage2:
114
+ mode: handoff
115
+ path: null
116
+ teacher_path: null
117
+ stage3:
118
+ mode: handoff
119
+ path: null
120
+ model:
121
+ idm:
122
+ type: token_idm
123
+ action_dim: 128
124
+ token_dim: 768
125
+ model_dim: 512
126
+ latent_dim: 32
127
+ num_action_tokens: 4
128
+ num_blocks: 4
129
+ num_heads: 8
130
+ dropout: 0.0
131
+ fdm:
132
+ type: token_fdm_duration
133
+ action_dim: 128
134
+ token_dim: 768
135
+ model_dim: 512
136
+ num_action_tokens: 4
137
+ num_blocks: 4
138
+ num_heads: 8
139
+ dropout: 0.0
140
+ hyperbolic_latent:
141
+ enabled: false
142
+ backend: geoopt
143
+ manifold: poincare
144
+ curvature: 1.0
145
+ learnable_curvature: false
146
+ fdm_input_mode: logmap0
147
+ prelift_mode: none
148
+ prelift_scale: 1.0
149
+ lift_max_norm: 5.0
150
+ tangent_max_norm: 5.0
151
+ eps: 1.0e-06
152
+ encoders:
153
+ type: dino
154
+ image_key: image
155
+ model_id: facebook/dinov2-base
156
+ input_value_range: zero_to_one
157
+ freeze_backbone: true
158
+ drop_cls_token: true
159
+ output_dim: 768
160
+ mean:
161
+ - 0.485
162
+ - 0.456
163
+ - 0.406
164
+ std:
165
+ - 0.229
166
+ - 0.224
167
+ - 0.225
168
+ type: dino_lam
169
+ idm_input: future
170
+ fdm_target: future
171
+ pixel_decoders: null
172
+ latent_action_decoders: null
173
+ objective:
174
+ fdm_target: future
175
+ idm_input: future
176
+ stage_overrides: {}
177
+ multiscale:
178
+ enabled: true
179
+ consistency:
180
+ enabled: false
181
+ weight: 10.0
182
+ num_pairs: 4
183
+ sample_source: all_horizons
184
+ teacher_mode: direct_teacher
185
+ prediction_mode: direct_duration
186
+ allow_plain_fdm_oneshot: true
187
+ weight_mode: uniform
188
+ weights: {}
189
+ temporal:
190
+ max_offset: 20
191
+ anchor_mode: fixed
192
+ extra_random_count: 0
193
+ branch_order:
194
+ enabled: false
195
+ radial_weight: 0.0
196
+ local_radial_margin_weight: 0.0
197
+ local_radial_margin_alpha: 0.05
198
+ branch_weight: 0.0
199
+ z0_origin_weight: 0.0
200
+ prefix_weight: 0.0
201
+ radius_progress_weight: 1.0
202
+ radius_progress_mode: offset_margin
203
+ radius_progress_alpha: 0.02
204
+ branch_margin_deg: 10.0
205
+ eps: 1.0e-06
206
+ latent_plan:
207
+ enabled: false
208
+ total_horizon: 20
209
+ eval:
210
+ type: robomimic
211
+ data_path: []
212
+ reset_mode: env_reset
213
+ num_eval_episodes: 20
214
+ max_steps: 500
215
+ record_video: true
216
+ checkpoint_path: null
217
+ checkpoint_strict: true
218
+ use_checkpoint_cfg: true
219
+ video_output_path: null
220
+ obs_keys: null
221
+ use_proprio: null
222
+ use_object: false
223
+ resize_hw: null
224
+ image_value_range: null
225
+ seed: 0
226
+ agent:
227
+ encoders:
228
+ image:
229
+ in_channels: 3
230
+ output_dim: 512
231
+ output_mode: global
232
+ type: resnet18
233
+ pretrained: false
234
+ proprio:
235
+ input_dim: 9
236
+ hidden_dim: 128
237
+ output_dim: 64
238
+ type: group
239
+ modalities:
240
+ - agentview_image
241
+ - robot0_eye_in_hand_image
242
+ proj_dim: 128
243
+ policies:
244
+ decoder:
245
+ type: mlp
246
+ hidden_dims:
247
+ - 256
248
+ - 256
249
+ hidden_dims:
250
+ - 512
251
+ - 512
252
+ - 256
253
+ - 64
254
+ action_dim: 256
255
+ emb_dim: 384
256
+ gt_action_dim: 7
257
+ type: latent_action
258
+ probes:
259
+ enabled: true
260
+ every: 10
261
+ steps_per_call: 1
262
+ sequence:
263
+ enabled: true
264
+ horizons:
265
+ - 20
266
+ target_key: gt_action_seq_max
267
+ list:
268
+ z_to_s_t:
269
+ name: z_to_s_t
270
+ enabled: false
271
+ shuffle: true
272
+ type: regression
273
+ input: z_t
274
+ target: s_t
275
+ loss: mse
276
+ lr: 0.001
277
+ every: 10
278
+ mlp:
279
+ hidden_dims:
280
+ - 128
281
+ - 64
282
+ z_to_s_tp:
283
+ name: z_to_s_tp
284
+ enabled: false
285
+ shuffle: true
286
+ type: regression
287
+ input: z_t
288
+ target: s_tp
289
+ loss: mse
290
+ lr: 0.001
291
+ every: 10
292
+ mlp:
293
+ hidden_dims:
294
+ - 128
295
+ - 64
296
+ z_to_action_t:
297
+ name: z_to_action_t
298
+ probe_type: z_to_action
299
+ enabled: true
300
+ shuffle: true
301
+ type: regression
302
+ input: z_t
303
+ target: gt_action
304
+ loss: mse
305
+ lr: 0.001
306
+ every: 1
307
+ mlp:
308
+ hidden_dims:
309
+ - 128
310
+ - 64
311
+ z_to_action_seq_h20:
312
+ name: z_to_action_seq_h20
313
+ probe_type: z_to_action_sequence
314
+ enabled: true
315
+ shuffle: true
316
+ type: regression
317
+ input: z_t
318
+ target: gt_action_seq_max
319
+ sequence_horizon: 20
320
+ loss: mse
321
+ lr: 0.001
322
+ every: 10
323
+ mlp:
324
+ hidden_dims:
325
+ - 128
326
+ - 64
327
+ output_dim: 140
328
+ logger:
329
+ project: latent_action
330
+ run_name: latent_action_training
331
+ tags:
332
+ - debug
333
+ output_root: outputs/token_fdm_duration/dino_suite_all_k20_extra0
intent.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Intent
2
+
3
+ Hypothesis:
4
+ -
5
+
6
+ Primary comparison:
7
+ -
8
+
9
+ Success criterion:
10
+ -
11
+
12
+ Failure modes to watch:
13
+ -
notes.md ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ # Notes
2
+
3
+ Result summary:
4
+ -
5
+
6
+ Interpretation:
7
+ -
8
+
9
+ Next action:
10
+ -
outputs/token_fdm_duration/dino_suite_all_k20_extra0/registry.jsonl ADDED
@@ -0,0 +1 @@
 
 
1
+ {"base_run_name": "latent_action_training", "config_resolved_yaml": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/config_resolved.yaml", "created_at": "2026-03-25T20:00:54.495122+00:00", "data_name": "libero_cosmos_policy", "enabled_stages": {"stage1": true, "stage2": false, "stage3": false}, "git_json": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/git.json", "intent_md": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/intent.md", "notes_md": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/notes.md", "run_dir": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52"}
registry_entry.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "base_run_name": "latent_action_training",
3
+ "config_resolved_yaml": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/config_resolved.yaml",
4
+ "created_at": "2026-03-25T20:00:54.495122+00:00",
5
+ "data_name": "libero_cosmos_policy",
6
+ "enabled_stages": {
7
+ "stage1": true,
8
+ "stage2": false,
9
+ "stage3": false
10
+ },
11
+ "git_json": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/git.json",
12
+ "intent_md": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/intent.md",
13
+ "notes_md": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/notes.md",
14
+ "run_dir": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52"
15
+ }
run.log ADDED
File without changes
stages/stage1/artifacts/probe_history.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
stages/stage1/checkpoint_latest.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3987875cf73ed546f1d6d4568bacc54c695ab49ade5a4735caf5528195989f8c
3
+ size 671070930
stages/stage1/hydra_resolved.yaml ADDED
@@ -0,0 +1,423 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ data:
2
+ name: libero_cosmos_policy
3
+ type: mg
4
+ backend: robomimic
5
+ paths:
6
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE3_turn_on_the_stove_and_put_the_moka_pot_on_it_demo.hdf5
7
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE4_put_the_black_bowl_in_the_bottom_drawer_of_the_cabinet_and_close_it_demo.hdf5
8
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE6_put_the_yellow_and_white_mug_in_the_microwave_and_close_it_demo.hdf5
9
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE8_put_both_moka_pots_on_the_stove_demo.hdf5
10
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE1_put_both_the_alphabet_soup_and_the_cream_cheese_box_in_the_basket_demo.hdf5
11
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_alphabet_soup_and_the_tomato_sauce_in_the_basket_demo.hdf5
12
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_cream_cheese_box_and_the_butter_in_the_basket_demo.hdf5
13
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE5_put_the_white_mug_on_the_left_plate_and_put_the_yellow_and_white_mug_on_the_right_plate_demo.hdf5
14
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE6_put_the_white_mug_on_the_plate_and_put_the_chocolate_pudding_to_the_right_of_the_plate_demo.hdf5
15
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/STUDY_SCENE1_pick_up_the_book_and_place_it_in_the_back_compartment_of_the_caddy_demo.hdf5
16
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_middle_drawer_of_the_cabinet_demo.hdf5
17
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_top_drawer_and_put_the_bowl_inside_demo.hdf5
18
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/push_the_plate_to_the_front_of_the_stove_demo.hdf5
19
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_plate_demo.hdf5
20
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_stove_demo.hdf5
21
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_top_of_the_cabinet_demo.hdf5
22
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_cream_cheese_in_the_bowl_demo.hdf5
23
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_the_rack_demo.hdf5
24
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_top_of_the_cabinet_demo.hdf5
25
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/turn_on_the_stove_demo.hdf5
26
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_alphabet_soup_and_place_it_in_the_basket_demo.hdf5
27
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_bbq_sauce_and_place_it_in_the_basket_demo.hdf5
28
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_butter_and_place_it_in_the_basket_demo.hdf5
29
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_chocolate_pudding_and_place_it_in_the_basket_demo.hdf5
30
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_cream_cheese_and_place_it_in_the_basket_demo.hdf5
31
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_ketchup_and_place_it_in_the_basket_demo.hdf5
32
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_milk_and_place_it_in_the_basket_demo.hdf5
33
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_orange_juice_and_place_it_in_the_basket_demo.hdf5
34
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_salad_dressing_and_place_it_in_the_basket_demo.hdf5
35
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_tomato_sauce_and_place_it_in_the_basket_demo.hdf5
36
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_between_the_plate_and_the_ramekin_and_place_it_on_the_plate_demo.hdf5
37
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_from_table_center_and_place_it_on_the_plate_demo.hdf5
38
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_in_the_top_drawer_of_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5
39
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_cookie_box_and_place_it_on_the_plate_demo.hdf5
40
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_plate_and_place_it_on_the_plate_demo.hdf5
41
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_ramekin_and_place_it_on_the_plate_demo.hdf5
42
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_cookie_box_and_place_it_on_the_plate_demo.hdf5
43
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_ramekin_and_place_it_on_the_plate_demo.hdf5
44
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_stove_and_place_it_on_the_plate_demo.hdf5
45
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5
46
+ task_suite_name: null
47
+ observations_keys:
48
+ - image
49
+ observation_source_keys:
50
+ image: agentview_rgb_jpeg
51
+ action_dim: 7
52
+ frame_stack: 1
53
+ horizon: 1
54
+ temporal_index_mode: clip
55
+ use_proprio: false
56
+ proprio_source: robot_states
57
+ image_chw:
58
+ - 3
59
+ - 224
60
+ - 224
61
+ image_value_range: zero_to_one
62
+ image_transport_dtype: uint8
63
+ duration_focus: null
64
+ hf:
65
+ repo_id: nvidia/LIBERO-Cosmos-Policy
66
+ repo_type: dataset
67
+ allow_patterns:
68
+ - success_only/*_regen/*.hdf5
69
+ local_files_only: false
70
+ action_sequence_targets:
71
+ enabled: true
72
+ horizons:
73
+ - 20
74
+ target_key: gt_action_seq_max
75
+ temporal:
76
+ max_offset: 20
77
+ anchor_mode: fixed
78
+ extra_random_count: 0
79
+ load_full_context: false
80
+ multiscale:
81
+ enabled: true
82
+ use_aug: false
83
+ emit_states: false
84
+ emit_duration_label: false
85
+ emit_future_offset_fields: false
86
+ sample_transform:
87
+ weak_augmentation:
88
+ enabled: false
89
+ train:
90
+ optimizer:
91
+ type: adamw
92
+ lr: 0.0001
93
+ weight_decay: 1.0e-06
94
+ batch_size: 256
95
+ num_workers: 4
96
+ prefetch_factor: null
97
+ log_interval: 100
98
+ total_steps: 5000
99
+ eval_interval: 500
100
+ use_aug: true
101
+ aug_mode: default
102
+ use_amp: true
103
+ device_transfer_non_blocking: true
104
+ seed: 42
105
+ scheduler:
106
+ type: cosine
107
+ warmup_steps: 500
108
+ num_cycles: 0.5
109
+ min_lr_scale: 0.0
110
+ decoder_dataloader:
111
+ enabled: false
112
+ batch_size: 64
113
+ num_workers: 4
114
+ prefetch_factor: null
115
+ shuffle: true
116
+ stages:
117
+ stage1: true
118
+ stage2: false
119
+ stage3: false
120
+ stage1:
121
+ batch_size: 256
122
+ num_workers: 16
123
+ prefetch_factor: 2
124
+ log_interval: 100
125
+ total_steps: 20000
126
+ eval_interval: 500
127
+ optimizer:
128
+ lr: 0.0001
129
+ weight_decay: 1.0e-06
130
+ stage2:
131
+ batch_size: 256
132
+ num_workers: 4
133
+ prefetch_factor: null
134
+ log_interval: 100
135
+ total_steps: 5000
136
+ eval_interval: 500
137
+ latent_target: auto
138
+ optimizer:
139
+ lr: 0.0001
140
+ weight_decay: 1.0e-06
141
+ action_probe:
142
+ enabled: true
143
+ stage3:
144
+ batch_size: 256
145
+ num_workers: 4
146
+ prefetch_factor: null
147
+ log_interval: 100
148
+ total_steps: 5000
149
+ eval_interval: 500
150
+ final_eval_num_episodes: 100
151
+ log_eval_video: false
152
+ optimizer:
153
+ lr: 0.0001
154
+ weight_decay: 1.0e-06
155
+ trainable_scope: all
156
+ non_decoder_lr_scale: 1.0
157
+ checkpoint:
158
+ enabled: true
159
+ base_dir: null
160
+ save_interval: 1000
161
+ save_last: true
162
+ latest_only: true
163
+ load:
164
+ stage1:
165
+ mode: none
166
+ path: null
167
+ stage2:
168
+ mode: handoff
169
+ path: null
170
+ teacher_path: null
171
+ stage3:
172
+ mode: handoff
173
+ path: null
174
+ model:
175
+ idm:
176
+ type: token_idm
177
+ action_dim: 128
178
+ token_dim: 768
179
+ model_dim: 512
180
+ latent_dim: 32
181
+ num_action_tokens: 4
182
+ num_blocks: 4
183
+ num_heads: 8
184
+ dropout: 0.0
185
+ fdm:
186
+ type: token_fdm_duration
187
+ action_dim: 128
188
+ token_dim: 768
189
+ model_dim: 512
190
+ num_action_tokens: 4
191
+ num_blocks: 4
192
+ num_heads: 8
193
+ dropout: 0.0
194
+ prediction_mode: direct
195
+ hyperbolic_latent:
196
+ enabled: false
197
+ backend: geoopt
198
+ manifold: poincare
199
+ curvature: 1.0
200
+ learnable_curvature: false
201
+ fdm_input_mode: logmap0
202
+ prelift_mode: none
203
+ prelift_scale: 1.0
204
+ lift_max_norm: 5.0
205
+ tangent_max_norm: 5.0
206
+ eps: 1.0e-06
207
+ encoders:
208
+ type: dino
209
+ image_key: image
210
+ model_id: facebook/dinov2-base
211
+ input_value_range: zero_to_one
212
+ freeze_backbone: true
213
+ drop_cls_token: true
214
+ output_dim: 768
215
+ mean:
216
+ - 0.485
217
+ - 0.456
218
+ - 0.406
219
+ std:
220
+ - 0.229
221
+ - 0.224
222
+ - 0.225
223
+ type: dino_lam
224
+ idm_input: future
225
+ fdm_target: future
226
+ pixel_decoders: null
227
+ latent_action_decoders: null
228
+ temporal:
229
+ max_offset: 20
230
+ anchor_mode: fixed
231
+ extra_random_count: 0
232
+ load_full_context: false
233
+ multiscale_loss:
234
+ enabled: true
235
+ prediction_mode: direct_duration
236
+ weight_mode: uniform
237
+ weights: {}
238
+ allow_plain_fdm_oneshot: true
239
+ direct_duration_backend: duration_aware
240
+ consistency:
241
+ enabled: false
242
+ weight: 10.0
243
+ num_pairs: 4
244
+ sample_source: all_horizons
245
+ teacher_mode: direct_teacher
246
+ branch_order:
247
+ enabled: false
248
+ radial_weight: 0.0
249
+ local_radial_margin_weight: 0.0
250
+ local_radial_margin_alpha: 0.05
251
+ branch_weight: 0.0
252
+ z0_origin_weight: 0.0
253
+ prefix_weight: 0.0
254
+ radius_progress_weight: 1.0
255
+ radius_progress_mode: offset_margin
256
+ radius_progress_alpha: 0.02
257
+ branch_margin_deg: 10.0
258
+ branch_margin_rad: 0.17453292519943295
259
+ eps: 1.0e-06
260
+ objective:
261
+ fdm_target: future
262
+ idm_input: future
263
+ multiscale:
264
+ enabled: true
265
+ consistency:
266
+ enabled: false
267
+ weight: 10.0
268
+ num_pairs: 4
269
+ sample_source: all_horizons
270
+ teacher_mode: direct_teacher
271
+ prediction_mode: direct_duration
272
+ allow_plain_fdm_oneshot: true
273
+ weight_mode: uniform
274
+ weights: {}
275
+ temporal:
276
+ max_offset: 20
277
+ anchor_mode: fixed
278
+ extra_random_count: 0
279
+ load_full_context: false
280
+ branch_order:
281
+ enabled: false
282
+ radial_weight: 0.0
283
+ local_radial_margin_weight: 0.0
284
+ local_radial_margin_alpha: 0.05
285
+ branch_weight: 0.0
286
+ z0_origin_weight: 0.0
287
+ prefix_weight: 0.0
288
+ radius_progress_weight: 1.0
289
+ radius_progress_mode: offset_margin
290
+ radius_progress_alpha: 0.02
291
+ branch_margin_deg: 10.0
292
+ eps: 1.0e-06
293
+ latent_plan:
294
+ enabled: false
295
+ total_horizon: 20
296
+ num_chunks: 1
297
+ chunk_dim: 128
298
+ plan_dim: 128
299
+ eval:
300
+ type: robomimic
301
+ data_path: []
302
+ reset_mode: env_reset
303
+ num_eval_episodes: 20
304
+ max_steps: 500
305
+ record_video: true
306
+ checkpoint_path: null
307
+ checkpoint_strict: true
308
+ use_checkpoint_cfg: true
309
+ video_output_path: null
310
+ obs_keys: null
311
+ use_proprio: null
312
+ use_object: false
313
+ resize_hw: null
314
+ image_value_range: null
315
+ seed: 0
316
+ agent:
317
+ encoders:
318
+ image:
319
+ in_channels: 3
320
+ output_dim: 512
321
+ output_mode: global
322
+ type: resnet18
323
+ pretrained: false
324
+ proprio:
325
+ input_dim: 9
326
+ hidden_dim: 128
327
+ output_dim: 64
328
+ type: group
329
+ modalities:
330
+ - agentview_image
331
+ - robot0_eye_in_hand_image
332
+ proj_dim: 128
333
+ policies:
334
+ decoder:
335
+ type: mlp
336
+ hidden_dims:
337
+ - 256
338
+ - 256
339
+ hidden_dims:
340
+ - 512
341
+ - 512
342
+ - 256
343
+ - 64
344
+ action_dim: 256
345
+ emb_dim: 384
346
+ gt_action_dim: 7
347
+ type: latent_action
348
+ probes:
349
+ enabled: true
350
+ every: 10
351
+ steps_per_call: 1
352
+ sequence:
353
+ enabled: true
354
+ horizons:
355
+ - 20
356
+ target_key: gt_action_seq_max
357
+ list:
358
+ z_to_s_t:
359
+ name: z_to_s_t
360
+ enabled: false
361
+ shuffle: true
362
+ type: regression
363
+ input: z_t
364
+ target: s_t
365
+ loss: mse
366
+ lr: 0.001
367
+ every: 10
368
+ mlp:
369
+ hidden_dims:
370
+ - 128
371
+ - 64
372
+ z_to_s_tp:
373
+ name: z_to_s_tp
374
+ enabled: false
375
+ shuffle: true
376
+ type: regression
377
+ input: z_t
378
+ target: s_tp
379
+ loss: mse
380
+ lr: 0.001
381
+ every: 10
382
+ mlp:
383
+ hidden_dims:
384
+ - 128
385
+ - 64
386
+ z_to_action_t:
387
+ name: z_to_action_t
388
+ probe_type: z_to_action
389
+ enabled: true
390
+ shuffle: true
391
+ type: regression
392
+ input: z_t
393
+ target: gt_action
394
+ loss: mse
395
+ lr: 0.001
396
+ every: 1
397
+ mlp:
398
+ hidden_dims:
399
+ - 128
400
+ - 64
401
+ z_to_action_seq_h20:
402
+ name: z_to_action_seq_h20
403
+ probe_type: z_to_action_sequence
404
+ enabled: true
405
+ shuffle: true
406
+ type: regression
407
+ input: z_t
408
+ target: gt_action_seq_max
409
+ sequence_horizon: 20
410
+ loss: mse
411
+ lr: 0.001
412
+ every: 10
413
+ mlp:
414
+ hidden_dims:
415
+ - 128
416
+ - 64
417
+ output_dim: 140
418
+ logger:
419
+ project: latent_action
420
+ run_name: latent_action_training
421
+ tags:
422
+ - debug
423
+ output_root: outputs/token_fdm_duration/dino_suite_all_k20_extra0
stages/stage1/metrics.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
stages/stage1/parent_run.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "explicit_path": null,
3
+ "mode": "none",
4
+ "slurm_job_id": null,
5
+ "source_stage": null,
6
+ "stage": "stage1"
7
+ }
stages/stage1/summary.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metrics": {
3
+ "loss/fdm_fit_loss": 0.2659306824207306,
4
+ "loss/fdm_h20": 0.2659306824207306,
5
+ "loss/total_loss": 0.2659306824207306,
6
+ "probe/z_to_action_seq_h20/l2": 0.03165977820754051,
7
+ "probe/z_to_action_seq_h20/valid_ratio": 0.979296863079071,
8
+ "probe/z_to_action_seq_h20_shuffled/l2": 0.20211628079414368,
9
+ "probe/z_to_action_seq_h20_shuffled/valid_ratio": 0.979296863079071,
10
+ "probe/z_to_action_t/l2": 0.018910784274339676,
11
+ "probe/z_to_action_t_shuffled/l2": 0.19590125977993011,
12
+ "time/data_wait_s": 3.6241065219510347,
13
+ "time/iter_s": 7.669815575005487,
14
+ "time/step_s": 4.045709053054452
15
+ },
16
+ "best_steps": {
17
+ "loss/fdm_fit_loss": 17800,
18
+ "loss/fdm_h20": 17800,
19
+ "loss/total_loss": 17800,
20
+ "probe/z_to_action_seq_h20/l2": 19770,
21
+ "probe/z_to_action_seq_h20/valid_ratio": 2800,
22
+ "probe/z_to_action_seq_h20_shuffled/l2": 18950,
23
+ "probe/z_to_action_seq_h20_shuffled/valid_ratio": 2800,
24
+ "probe/z_to_action_t/l2": 18330,
25
+ "probe/z_to_action_t_shuffled/l2": 15545,
26
+ "time/data_wait_s": 0,
27
+ "time/iter_s": 0,
28
+ "time/step_s": 0
29
+ },
30
+ "flush_count": 20000,
31
+ "last_metrics": {
32
+ "loss/fdm_fit_loss": 0.27370309829711914,
33
+ "loss/fdm_h20": 0.27370309829711914,
34
+ "loss/total_loss": 0.27370309829711914,
35
+ "probe/z_to_action_seq_h20/l2": 0.03549542278051376,
36
+ "probe/z_to_action_seq_h20/valid_ratio": 0.944140613079071,
37
+ "probe/z_to_action_seq_h20_shuffled/l2": 0.21182116866111755,
38
+ "probe/z_to_action_seq_h20_shuffled/valid_ratio": 0.944140613079071,
39
+ "probe/z_to_action_t/l2": 0.027867570519447327,
40
+ "probe/z_to_action_t_shuffled/l2": 0.2077900469303131,
41
+ "time/data_wait_s": 0.0005364101380109787,
42
+ "time/iter_s": 0.4869440640322864,
43
+ "time/step_s": 0.4864076538942754
44
+ },
45
+ "last_step": 19999,
46
+ "paths": {
47
+ "artifacts_dir": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1/artifacts",
48
+ "metrics_jsonl": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1/metrics.jsonl",
49
+ "parent_run_json": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1/parent_run.json"
50
+ },
51
+ "stage": "stage1",
52
+ "stage_metadata": {
53
+ "checkpoint_path": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1",
54
+ "run_name": "latent_action_training_stage1_latent_action",
55
+ "status": "completed",
56
+ "tags": [
57
+ "debug"
58
+ ],
59
+ "wandb_project": "latent_action_stage1",
60
+ "wandb_run_id": "qudlwnz5",
61
+ "wandb_run_url": "https://wandb.ai/joonstack/latent_action_stage1/runs/qudlwnz5"
62
+ },
63
+ "status": "completed",
64
+ "updated_at": "2026-03-25T22:44:40.659757+00:00"
65
+ }
wandb/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Current SDK version is 0.25.1
2
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Configure stats pid to 3245764
3
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Loading settings from environment variables
4
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/wandb/run-20260325_200057-qudlwnz5/logs/debug.log
5
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/wandb/run-20260325_200057-qudlwnz5/logs/debug-internal.log
6
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:init():844] calling init triggers
7
+ 2026-03-25 20:00:57,305 INFO MainThread:3245764 [wandb_init.py:init():849] wandb.init called with sweep_config: {}
8
+ config: {'data': {'name': 'libero_cosmos_policy', 'type': 'mg', 'backend': 'robomimic', 'paths': ['/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE3_turn_on_the_stove_and_put_the_moka_pot_on_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE4_put_the_black_bowl_in_the_bottom_drawer_of_the_cabinet_and_close_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE6_put_the_yellow_and_white_mug_in_the_microwave_and_close_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE8_put_both_moka_pots_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE1_put_both_the_alphabet_soup_and_the_cream_cheese_box_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_alphabet_soup_and_the_tomato_sauce_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_cream_cheese_box_and_the_butter_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE5_put_the_white_mug_on_the_left_plate_and_put_the_yellow_and_white_mug_on_the_right_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE6_put_the_white_mug_on_the_plate_and_put_the_chocolate_pudding_to_the_right_of_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/STUDY_SCENE1_pick_up_the_book_and_place_it_in_the_back_compartment_of_the_caddy_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_middle_drawer_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_top_drawer_and_put_the_bowl_inside_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/push_the_plate_to_the_front_of_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_top_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_cream_cheese_in_the_bowl_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_the_rack_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_top_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/turn_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_alphabet_soup_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_bbq_sauce_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_butter_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_chocolate_pudding_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_cream_cheese_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_ketchup_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_milk_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_orange_juice_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_salad_dressing_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_tomato_sauce_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_between_the_plate_and_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_from_table_center_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_in_the_top_drawer_of_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_cookie_box_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_plate_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_cookie_box_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_stove_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5'], 'task_suite_name': None, 'observations_keys': ['image'], 'observation_source_keys': {'image': 'agentview_rgb_jpeg'}, 'action_dim': 7, 'frame_stack': 1, 'horizon': 1, 'temporal_index_mode': 'clip', 'use_proprio': False, 'proprio_source': 'robot_states', 'image_chw': [3, 224, 224], 'image_value_range': 'zero_to_one', 'image_transport_dtype': 'uint8', 'duration_focus': None, 'hf': {'repo_id': 'nvidia/LIBERO-Cosmos-Policy', 'repo_type': 'dataset', 'allow_patterns': ['success_only/*_regen/*.hdf5'], 'local_files_only': False}, 'action_sequence_targets': {'enabled': True, 'horizons': [20], 'target_key': 'gt_action_seq_max'}, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'multiscale': {'enabled': True}, 'use_aug': False, 'emit_states': False, 'emit_duration_label': False, 'emit_future_offset_fields': False, 'sample_transform': {'weak_augmentation': {'enabled': False}}}, 'train': {'optimizer': {'type': 'adamw', 'lr': 0.0001, 'weight_decay': 1e-06}, 'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'use_aug': True, 'aug_mode': 'default', 'use_amp': True, 'device_transfer_non_blocking': True, 'seed': 42, 'scheduler': {'type': 'cosine', 'warmup_steps': 500, 'num_cycles': 0.5, 'min_lr_scale': 0.0}, 'decoder_dataloader': {'enabled': False, 'batch_size': 64, 'num_workers': 4, 'prefetch_factor': None, 'shuffle': True}, 'stages': {'stage1': True, 'stage2': False, 'stage3': False}, 'stage1': {'batch_size': 256, 'num_workers': 16, 'prefetch_factor': 2, 'log_interval': 100, 'total_steps': 20000, 'eval_interval': 500, 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}}, 'stage2': {'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'latent_target': 'auto', 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}, 'action_probe': {'enabled': True}}, 'stage3': {'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'final_eval_num_episodes': 100, 'log_eval_video': False, 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}, 'trainable_scope': 'all', 'non_decoder_lr_scale': 1.0}, 'checkpoint': {'enabled': True, 'base_dir': None, 'save_interval': 1000, 'save_last': True, 'latest_only': True, 'load': {'stage1': {'mode': 'none', 'path': None}, 'stage2': {'mode': 'handoff', 'path': None, 'teacher_path': None}, 'stage3': {'mode': 'handoff', 'path': None}}}}, 'model': {'idm': {'type': 'token_idm', 'action_dim': 128, 'token_dim': 768, 'model_dim': 512, 'latent_dim': 32, 'num_action_tokens': 4, 'num_blocks': 4, 'num_heads': 8, 'dropout': 0.0}, 'fdm': {'type': 'token_fdm_duration', 'action_dim': 128, 'token_dim': 768, 'model_dim': 512, 'num_action_tokens': 4, 'num_blocks': 4, 'num_heads': 8, 'dropout': 0.0, 'prediction_mode': 'direct'}, 'hyperbolic_latent': {'enabled': False, 'backend': 'geoopt', 'manifold': 'poincare', 'curvature': 1.0, 'learnable_curvature': False, 'fdm_input_mode': 'logmap0', 'prelift_mode': 'none', 'prelift_scale': 1.0, 'lift_max_norm': 5.0, 'tangent_max_norm': 5.0, 'eps': 1e-06}, 'encoders': {'type': 'dino', 'image_key': 'image', 'model_id': 'facebook/dinov2-base', 'input_value_range': 'zero_to_one', 'freeze_backbone': True, 'drop_cls_token': True, 'output_dim': 768, 'mean': [0.485, 0.456, 0.406], 'std': [0.229, 0.224, 0.225]}, 'type': 'dino_lam', 'idm_input': 'future', 'fdm_target': 'future', 'pixel_decoders': None, 'latent_action_decoders': None, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'multiscale_loss': {'enabled': True, 'prediction_mode': 'direct_duration', 'weight_mode': 'uniform', 'weights': {}, 'allow_plain_fdm_oneshot': True, 'direct_duration_backend': 'duration_aware', 'consistency': {'enabled': False, 'weight': 10.0, 'num_pairs': 4, 'sample_source': 'all_horizons', 'teacher_mode': 'direct_teacher'}}, 'branch_order': {'enabled': False, 'radial_weight': 0.0, 'local_radial_margin_weight': 0.0, 'local_radial_margin_alpha': 0.05, 'branch_weight': 0.0, 'z0_origin_weight': 0.0, 'prefix_weight': 0.0, 'radius_progress_weight': 1.0, 'radius_progress_mode': 'offset_margin', 'radius_progress_alpha': 0.02, 'branch_margin_deg': 10.0, 'branch_margin_rad': 0.17453292519943295, 'eps': 1e-06}}, 'objective': {'fdm_target': 'future', 'idm_input': 'future', 'multiscale': {'enabled': True, 'consistency': {'enabled': False, 'weight': 10.0, 'num_pairs': 4, 'sample_source': 'all_horizons', 'teacher_mode': 'direct_teacher'}, 'prediction_mode': 'direct_duration', 'allow_plain_fdm_oneshot': True, 'weight_mode': 'uniform', 'weights': {}}, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'branch_order': {'enabled': False, 'radial_weight': 0.0, 'local_radial_margin_weight': 0.0, 'local_radial_margin_alpha': 0.05, 'branch_weight': 0.0, 'z0_origin_weight': 0.0, 'prefix_weight': 0.0, 'radius_progress_weight': 1.0, 'radius_progress_mode': 'offset_margin', 'radius_progress_alpha': 0.02, 'branch_margin_deg': 10.0, 'eps': 1e-06}, 'latent_plan': {'enabled': False, 'total_horizon': 20, 'num_chunks': 1, 'chunk_dim': 128, 'plan_dim': 128}}, 'eval': {'type': 'robomimic', 'data_path': [], 'reset_mode': 'env_reset', 'num_eval_episodes': 20, 'max_steps': 500, 'record_video': True, 'checkpoint_path': None, 'checkpoint_strict': True, 'use_checkpoint_cfg': True, 'video_output_path': None, 'obs_keys': None, 'use_proprio': None, 'use_object': False, 'resize_hw': None, 'image_value_range': None, 'seed': 0}, 'agent': {'encoders': {'image': {'in_channels': 3, 'output_dim': 512, 'output_mode': 'global', 'type': 'resnet18', 'pretrained': False}, 'proprio': {'input_dim': 9, 'hidden_dim': 128, 'output_dim': 64}, 'type': 'group', 'modalities': ['agentview_image', 'robot0_eye_in_hand_image'], 'proj_dim': 128}, 'policies': {'decoder': {'type': 'mlp', 'hidden_dims': [256, 256]}, 'hidden_dims': [512, 512, 256, 64], 'action_dim': 256, 'emb_dim': 384, 'gt_action_dim': 7}, 'type': 'latent_action'}, 'probes': {'enabled': True, 'every': 10, 'steps_per_call': 1, 'sequence': {'enabled': True, 'horizons': [20], 'target_key': 'gt_action_seq_max'}, 'list': {'z_to_s_t': {'name': 'z_to_s_t', 'enabled': False, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 's_t', 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_s_tp': {'name': 'z_to_s_tp', 'enabled': False, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 's_tp', 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_action_t': {'name': 'z_to_action_t', 'probe_type': 'z_to_action', 'enabled': True, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 'gt_action', 'loss': 'mse', 'lr': 0.001, 'every': 1, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_action_seq_h20': {'name': 'z_to_action_seq_h20', 'probe_type': 'z_to_action_sequence', 'enabled': True, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 'gt_action_seq_max', 'sequence_horizon': 20, 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}, 'output_dim': 140}}}, 'logger': {'project': 'latent_action', 'run_name': 'latent_action_training', 'tags': ['debug']}, 'output_root': 'outputs/token_fdm_duration/dino_suite_all_k20_extra0', '_wandb': {}}
9
+ 2026-03-25 20:00:57,305 INFO MainThread:3245764 [wandb_init.py:init():892] starting backend
10
+ 2026-03-25 20:00:57,521 INFO MainThread:3245764 [wandb_init.py:init():895] sending inform_init request
11
+ 2026-03-25 20:00:57,524 INFO MainThread:3245764 [wandb_init.py:init():903] backend started and connected
12
+ 2026-03-25 20:00:57,526 INFO MainThread:3245764 [wandb_init.py:init():973] updated telemetry
13
+ 2026-03-25 20:00:57,532 INFO MainThread:3245764 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout
14
+ 2026-03-25 20:00:58,418 INFO MainThread:3245764 [wandb_init.py:init():1042] starting run threads in backend
15
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_console_start():2524] atexit reg
16
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2373] redirect: wrap_raw
17
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2442] Wrapping output streams.
18
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2465] Redirects installed.
19
+ 2026-03-25 20:00:58,527 INFO MainThread:3245764 [wandb_init.py:init():1082] run started, returning control to user process
20
+ 2026-03-25 22:44:40,660 INFO MainThread:3245764 [wandb_run.py:_finish():2291] finishing run joonstack/latent_action_stage1/qudlwnz5
21
+ 2026-03-25 22:44:40,661 INFO MainThread:3245764 [wandb_run.py:_atexit_cleanup():2490] got exitcode: 0
22
+ 2026-03-25 22:44:40,662 INFO MainThread:3245764 [wandb_run.py:_restore():2472] restore
23
+ 2026-03-25 22:44:40,662 INFO MainThread:3245764 [wandb_run.py:_restore():2478] restore done
24
+ 2026-03-25 22:44:41,910 INFO MainThread:3245764 [wandb_run.py:_footer_sync_info():3868] logging synced files
wandb/run-20260325_200057-qudlwnz5/files/config.yaml ADDED
@@ -0,0 +1,524 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ _wandb:
2
+ value:
3
+ cli_version: 0.25.1
4
+ e:
5
+ zgphb5mlnbcfb9jpehhh8zgxm0bu2zcl:
6
+ args:
7
+ - --config-name
8
+ - dino_lam
9
+ - data=libero_cosmos_policy
10
+ - data.task_suite_name=null
11
+ - data.hf.allow_patterns=[success_only/*_regen/*.hdf5]
12
+ - data.image_chw=[3,224,224]
13
+ - data.temporal_index_mode=clip
14
+ - model.fdm.type=token_fdm_duration
15
+ - objective.idm_input=future
16
+ - objective.temporal.max_offset=20
17
+ - objective.temporal.anchor_mode=fixed
18
+ - objective.temporal.extra_random_count=0
19
+ - train.use_aug=true
20
+ - train.use_amp=true
21
+ - train.stage1.batch_size=256
22
+ - train.stage1.num_workers=16
23
+ - train.stage1.prefetch_factor=2
24
+ - train.stage1.total_steps=20000
25
+ - train.stage1.log_interval=100
26
+ - train.checkpoint.enabled=true
27
+ - train.checkpoint.save_interval=1000
28
+ - train.checkpoint.save_last=true
29
+ - train.checkpoint.latest_only=true
30
+ - output_root=outputs/token_fdm_duration/dino_suite_all_k20_extra0
31
+ codePath: run.py
32
+ cpu_count: 32
33
+ cpu_count_logical: 64
34
+ cudaVersion: "12.4"
35
+ disk:
36
+ /:
37
+ total: "1889053200384"
38
+ used: "1645352988672"
39
+ email: zuni1218@gmail.com
40
+ executable: /home/jovyan/youngjoonjeong/latent_action/.venv/bin/python3
41
+ git:
42
+ commit: 84bdcca892435da456b8a676dae358493a0a6e59
43
+ remote: https://github.com/joon-stack/latent_action.git
44
+ gpu: NVIDIA H100 NVL
45
+ gpu_count: 1
46
+ gpu_nvidia:
47
+ - architecture: Hopper
48
+ cudaCores: 16896
49
+ memoryTotal: "100485038080"
50
+ name: NVIDIA H100 NVL
51
+ uuid: GPU-c6a0d739-1597-848e-b639-5dba9b4deb79
52
+ host: 91b1e4a5838d
53
+ memory:
54
+ total: "540748169216"
55
+ os: Linux-5.15.0-171-generic-x86_64-with-glibc2.35
56
+ program: /home/jovyan/youngjoonjeong/latent_action/run.py
57
+ python: CPython 3.10.18
58
+ root: /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52
59
+ startedAt: "2026-03-25T20:00:57.302961Z"
60
+ writerId: zgphb5mlnbcfb9jpehhh8zgxm0bu2zcl
61
+ m: []
62
+ python_version: 3.10.18
63
+ t:
64
+ "1":
65
+ - 1
66
+ - 5
67
+ - 11
68
+ - 41
69
+ - 49
70
+ - 50
71
+ - 53
72
+ - 83
73
+ "2":
74
+ - 1
75
+ - 5
76
+ - 11
77
+ - 41
78
+ - 49
79
+ - 50
80
+ - 53
81
+ - 83
82
+ "3":
83
+ - 2
84
+ - 13
85
+ - 15
86
+ - 16
87
+ - 61
88
+ "4": 3.10.18
89
+ "5": 0.25.1
90
+ "6": 4.41.2
91
+ "10":
92
+ - 21
93
+ "12": 0.25.1
94
+ "13": linux-x86_64
95
+ agent:
96
+ value:
97
+ encoders:
98
+ image:
99
+ in_channels: 3
100
+ output_dim: 512
101
+ output_mode: global
102
+ pretrained: false
103
+ type: resnet18
104
+ modalities:
105
+ - agentview_image
106
+ - robot0_eye_in_hand_image
107
+ proj_dim: 128
108
+ proprio:
109
+ hidden_dim: 128
110
+ input_dim: 9
111
+ output_dim: 64
112
+ type: group
113
+ policies:
114
+ action_dim: 256
115
+ decoder:
116
+ hidden_dims:
117
+ - 256
118
+ - 256
119
+ type: mlp
120
+ emb_dim: 384
121
+ gt_action_dim: 7
122
+ hidden_dims:
123
+ - 512
124
+ - 512
125
+ - 256
126
+ - 64
127
+ type: latent_action
128
+ data:
129
+ value:
130
+ action_dim: 7
131
+ action_sequence_targets:
132
+ enabled: true
133
+ horizons:
134
+ - 20
135
+ target_key: gt_action_seq_max
136
+ backend: robomimic
137
+ duration_focus: null
138
+ emit_duration_label: false
139
+ emit_future_offset_fields: false
140
+ emit_states: false
141
+ frame_stack: 1
142
+ hf:
143
+ allow_patterns:
144
+ - success_only/*_regen/*.hdf5
145
+ local_files_only: false
146
+ repo_id: nvidia/LIBERO-Cosmos-Policy
147
+ repo_type: dataset
148
+ horizon: 1
149
+ image_chw:
150
+ - 3
151
+ - 224
152
+ - 224
153
+ image_transport_dtype: uint8
154
+ image_value_range: zero_to_one
155
+ multiscale:
156
+ enabled: true
157
+ name: libero_cosmos_policy
158
+ observation_source_keys:
159
+ image: agentview_rgb_jpeg
160
+ observations_keys:
161
+ - image
162
+ paths:
163
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE3_turn_on_the_stove_and_put_the_moka_pot_on_it_demo.hdf5
164
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE4_put_the_black_bowl_in_the_bottom_drawer_of_the_cabinet_and_close_it_demo.hdf5
165
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE6_put_the_yellow_and_white_mug_in_the_microwave_and_close_it_demo.hdf5
166
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE8_put_both_moka_pots_on_the_stove_demo.hdf5
167
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE1_put_both_the_alphabet_soup_and_the_cream_cheese_box_in_the_basket_demo.hdf5
168
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_alphabet_soup_and_the_tomato_sauce_in_the_basket_demo.hdf5
169
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_cream_cheese_box_and_the_butter_in_the_basket_demo.hdf5
170
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE5_put_the_white_mug_on_the_left_plate_and_put_the_yellow_and_white_mug_on_the_right_plate_demo.hdf5
171
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE6_put_the_white_mug_on_the_plate_and_put_the_chocolate_pudding_to_the_right_of_the_plate_demo.hdf5
172
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/STUDY_SCENE1_pick_up_the_book_and_place_it_in_the_back_compartment_of_the_caddy_demo.hdf5
173
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_middle_drawer_of_the_cabinet_demo.hdf5
174
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_top_drawer_and_put_the_bowl_inside_demo.hdf5
175
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/push_the_plate_to_the_front_of_the_stove_demo.hdf5
176
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_plate_demo.hdf5
177
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_stove_demo.hdf5
178
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_top_of_the_cabinet_demo.hdf5
179
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_cream_cheese_in_the_bowl_demo.hdf5
180
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_the_rack_demo.hdf5
181
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_top_of_the_cabinet_demo.hdf5
182
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/turn_on_the_stove_demo.hdf5
183
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_alphabet_soup_and_place_it_in_the_basket_demo.hdf5
184
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_bbq_sauce_and_place_it_in_the_basket_demo.hdf5
185
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_butter_and_place_it_in_the_basket_demo.hdf5
186
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_chocolate_pudding_and_place_it_in_the_basket_demo.hdf5
187
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_cream_cheese_and_place_it_in_the_basket_demo.hdf5
188
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_ketchup_and_place_it_in_the_basket_demo.hdf5
189
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_milk_and_place_it_in_the_basket_demo.hdf5
190
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_orange_juice_and_place_it_in_the_basket_demo.hdf5
191
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_salad_dressing_and_place_it_in_the_basket_demo.hdf5
192
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_tomato_sauce_and_place_it_in_the_basket_demo.hdf5
193
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_between_the_plate_and_the_ramekin_and_place_it_on_the_plate_demo.hdf5
194
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_from_table_center_and_place_it_on_the_plate_demo.hdf5
195
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_in_the_top_drawer_of_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5
196
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_cookie_box_and_place_it_on_the_plate_demo.hdf5
197
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_plate_and_place_it_on_the_plate_demo.hdf5
198
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_ramekin_and_place_it_on_the_plate_demo.hdf5
199
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_cookie_box_and_place_it_on_the_plate_demo.hdf5
200
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_ramekin_and_place_it_on_the_plate_demo.hdf5
201
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_stove_and_place_it_on_the_plate_demo.hdf5
202
+ - /home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5
203
+ proprio_source: robot_states
204
+ sample_transform:
205
+ weak_augmentation:
206
+ enabled: false
207
+ task_suite_name: null
208
+ temporal:
209
+ anchor_mode: fixed
210
+ extra_random_count: 0
211
+ load_full_context: false
212
+ max_offset: 20
213
+ temporal_index_mode: clip
214
+ type: mg
215
+ use_aug: false
216
+ use_proprio: false
217
+ eval:
218
+ value:
219
+ checkpoint_path: null
220
+ checkpoint_strict: true
221
+ data_path: []
222
+ image_value_range: null
223
+ max_steps: 500
224
+ num_eval_episodes: 20
225
+ obs_keys: null
226
+ record_video: true
227
+ reset_mode: env_reset
228
+ resize_hw: null
229
+ seed: 0
230
+ type: robomimic
231
+ use_checkpoint_cfg: true
232
+ use_object: false
233
+ use_proprio: null
234
+ video_output_path: null
235
+ logger:
236
+ value:
237
+ project: latent_action
238
+ run_name: latent_action_training
239
+ tags:
240
+ - debug
241
+ model:
242
+ value:
243
+ branch_order:
244
+ branch_margin_deg: 10
245
+ branch_margin_rad: 0.17453292519943295
246
+ branch_weight: 0
247
+ enabled: false
248
+ eps: 1e-06
249
+ local_radial_margin_alpha: 0.05
250
+ local_radial_margin_weight: 0
251
+ prefix_weight: 0
252
+ radial_weight: 0
253
+ radius_progress_alpha: 0.02
254
+ radius_progress_mode: offset_margin
255
+ radius_progress_weight: 1
256
+ z0_origin_weight: 0
257
+ encoders:
258
+ drop_cls_token: true
259
+ freeze_backbone: true
260
+ image_key: image
261
+ input_value_range: zero_to_one
262
+ mean:
263
+ - 0.485
264
+ - 0.456
265
+ - 0.406
266
+ model_id: facebook/dinov2-base
267
+ output_dim: 768
268
+ std:
269
+ - 0.229
270
+ - 0.224
271
+ - 0.225
272
+ type: dino
273
+ fdm:
274
+ action_dim: 128
275
+ dropout: 0
276
+ model_dim: 512
277
+ num_action_tokens: 4
278
+ num_blocks: 4
279
+ num_heads: 8
280
+ prediction_mode: direct
281
+ token_dim: 768
282
+ type: token_fdm_duration
283
+ fdm_target: future
284
+ hyperbolic_latent:
285
+ backend: geoopt
286
+ curvature: 1
287
+ enabled: false
288
+ eps: 1e-06
289
+ fdm_input_mode: logmap0
290
+ learnable_curvature: false
291
+ lift_max_norm: 5
292
+ manifold: poincare
293
+ prelift_mode: none
294
+ prelift_scale: 1
295
+ tangent_max_norm: 5
296
+ idm:
297
+ action_dim: 128
298
+ dropout: 0
299
+ latent_dim: 32
300
+ model_dim: 512
301
+ num_action_tokens: 4
302
+ num_blocks: 4
303
+ num_heads: 8
304
+ token_dim: 768
305
+ type: token_idm
306
+ idm_input: future
307
+ latent_action_decoders: null
308
+ multiscale_loss:
309
+ allow_plain_fdm_oneshot: true
310
+ consistency:
311
+ enabled: false
312
+ num_pairs: 4
313
+ sample_source: all_horizons
314
+ teacher_mode: direct_teacher
315
+ weight: 10
316
+ direct_duration_backend: duration_aware
317
+ enabled: true
318
+ prediction_mode: direct_duration
319
+ weight_mode: uniform
320
+ pixel_decoders: null
321
+ temporal:
322
+ anchor_mode: fixed
323
+ extra_random_count: 0
324
+ load_full_context: false
325
+ max_offset: 20
326
+ type: dino_lam
327
+ objective:
328
+ value:
329
+ branch_order:
330
+ branch_margin_deg: 10
331
+ branch_weight: 0
332
+ enabled: false
333
+ eps: 1e-06
334
+ local_radial_margin_alpha: 0.05
335
+ local_radial_margin_weight: 0
336
+ prefix_weight: 0
337
+ radial_weight: 0
338
+ radius_progress_alpha: 0.02
339
+ radius_progress_mode: offset_margin
340
+ radius_progress_weight: 1
341
+ z0_origin_weight: 0
342
+ fdm_target: future
343
+ idm_input: future
344
+ latent_plan:
345
+ chunk_dim: 128
346
+ enabled: false
347
+ num_chunks: 1
348
+ plan_dim: 128
349
+ total_horizon: 20
350
+ multiscale:
351
+ allow_plain_fdm_oneshot: true
352
+ consistency:
353
+ enabled: false
354
+ num_pairs: 4
355
+ sample_source: all_horizons
356
+ teacher_mode: direct_teacher
357
+ weight: 10
358
+ enabled: true
359
+ prediction_mode: direct_duration
360
+ weight_mode: uniform
361
+ temporal:
362
+ anchor_mode: fixed
363
+ extra_random_count: 0
364
+ load_full_context: false
365
+ max_offset: 20
366
+ output_root:
367
+ value: outputs/token_fdm_duration/dino_suite_all_k20_extra0
368
+ probes:
369
+ value:
370
+ enabled: true
371
+ every: 10
372
+ list:
373
+ z_to_action_seq_h20:
374
+ enabled: true
375
+ every: 10
376
+ input: z_t
377
+ loss: mse
378
+ lr: 0.001
379
+ mlp:
380
+ hidden_dims:
381
+ - 128
382
+ - 64
383
+ name: z_to_action_seq_h20
384
+ output_dim: 140
385
+ probe_type: z_to_action_sequence
386
+ sequence_horizon: 20
387
+ shuffle: true
388
+ target: gt_action_seq_max
389
+ type: regression
390
+ z_to_action_t:
391
+ enabled: true
392
+ every: 1
393
+ input: z_t
394
+ loss: mse
395
+ lr: 0.001
396
+ mlp:
397
+ hidden_dims:
398
+ - 128
399
+ - 64
400
+ name: z_to_action_t
401
+ probe_type: z_to_action
402
+ shuffle: true
403
+ target: gt_action
404
+ type: regression
405
+ z_to_s_t:
406
+ enabled: false
407
+ every: 10
408
+ input: z_t
409
+ loss: mse
410
+ lr: 0.001
411
+ mlp:
412
+ hidden_dims:
413
+ - 128
414
+ - 64
415
+ name: z_to_s_t
416
+ shuffle: true
417
+ target: s_t
418
+ type: regression
419
+ z_to_s_tp:
420
+ enabled: false
421
+ every: 10
422
+ input: z_t
423
+ loss: mse
424
+ lr: 0.001
425
+ mlp:
426
+ hidden_dims:
427
+ - 128
428
+ - 64
429
+ name: z_to_s_tp
430
+ shuffle: true
431
+ target: s_tp
432
+ type: regression
433
+ sequence:
434
+ enabled: true
435
+ horizons:
436
+ - 20
437
+ target_key: gt_action_seq_max
438
+ steps_per_call: 1
439
+ train:
440
+ value:
441
+ aug_mode: default
442
+ batch_size: 256
443
+ checkpoint:
444
+ base_dir: null
445
+ enabled: true
446
+ latest_only: true
447
+ load:
448
+ stage1:
449
+ mode: none
450
+ path: null
451
+ stage2:
452
+ mode: handoff
453
+ path: null
454
+ teacher_path: null
455
+ stage3:
456
+ mode: handoff
457
+ path: null
458
+ save_interval: 1000
459
+ save_last: true
460
+ decoder_dataloader:
461
+ batch_size: 64
462
+ enabled: false
463
+ num_workers: 4
464
+ prefetch_factor: null
465
+ shuffle: true
466
+ device_transfer_non_blocking: true
467
+ eval_interval: 500
468
+ log_interval: 100
469
+ num_workers: 4
470
+ optimizer:
471
+ lr: 0.0001
472
+ type: adamw
473
+ weight_decay: 1e-06
474
+ prefetch_factor: null
475
+ scheduler:
476
+ min_lr_scale: 0
477
+ num_cycles: 0.5
478
+ type: cosine
479
+ warmup_steps: 500
480
+ seed: 42
481
+ stage1:
482
+ batch_size: 256
483
+ eval_interval: 500
484
+ log_interval: 100
485
+ num_workers: 16
486
+ optimizer:
487
+ lr: 0.0001
488
+ weight_decay: 1e-06
489
+ prefetch_factor: 2
490
+ total_steps: 20000
491
+ stage2:
492
+ action_probe:
493
+ enabled: true
494
+ batch_size: 256
495
+ eval_interval: 500
496
+ latent_target: auto
497
+ log_interval: 100
498
+ num_workers: 4
499
+ optimizer:
500
+ lr: 0.0001
501
+ weight_decay: 1e-06
502
+ prefetch_factor: null
503
+ total_steps: 5000
504
+ stage3:
505
+ batch_size: 256
506
+ eval_interval: 500
507
+ final_eval_num_episodes: 100
508
+ log_eval_video: false
509
+ log_interval: 100
510
+ non_decoder_lr_scale: 1
511
+ num_workers: 4
512
+ optimizer:
513
+ lr: 0.0001
514
+ weight_decay: 1e-06
515
+ prefetch_factor: null
516
+ total_steps: 5000
517
+ trainable_scope: all
518
+ stages:
519
+ stage1: true
520
+ stage2: false
521
+ stage3: false
522
+ total_steps: 5000
523
+ use_amp: true
524
+ use_aug: true
wandb/run-20260325_200057-qudlwnz5/files/output.log ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ wandb: Detected [huggingface_hub.inference] in use.
2
+ wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script.
3
+ wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/
4
+ wandb: WARNING The get_url method is deprecated and will be removed in a future release. Please use `run.url` instead.
5
+ [checkpoint] stage=stage1, path=/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1
6
+ [checkpoint] stage=stage1, config_yaml=/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/stages/stage1/hydra_resolved.yaml
7
+
wandb/run-20260325_200057-qudlwnz5/files/requirements.txt ADDED
@@ -0,0 +1,175 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ joblib==1.5.3
2
+ fastjsonschema==2.21.2
3
+ exceptiongroup==1.3.1
4
+ fonttools==4.62.1
5
+ easydict==1.13
6
+ egl_probe==1.0.2
7
+ xyzservices==2025.11.0
8
+ Werkzeug==3.1.6
9
+ decorator==5.2.1
10
+ pytz==2026.1.post1
11
+ regex==2026.2.28
12
+ rpds-py==0.30.0
13
+ scikit-learn==1.7.2
14
+ tzdata==2025.3
15
+ antlr4-python3-runtime==4.9.3
16
+ evdev==1.9.3
17
+ gitdb==4.0.12
18
+ PyYAML==6.0.3
19
+ tomli==2.4.0
20
+ pandas==2.3.3
21
+ soundfile==0.13.1
22
+ tokenizers==0.19.1
23
+ future==1.0.0
24
+ attrs==26.1.0
25
+ MarkupSafe==3.0.3
26
+ platformdirs==4.9.4
27
+ triton==3.1.0
28
+ annotated-types==0.7.0
29
+ rdkit==2025.9.6
30
+ narwhals==2.18.0
31
+ Markdown==3.10.2
32
+ python-xlib==0.33
33
+ transformers==4.41.2
34
+ typing-inspection==0.4.2
35
+ threadpoolctl==3.6.0
36
+ traitlets==5.14.3
37
+ pycparser==3.0
38
+ python-dateutil==2.9.0.post0
39
+ sentry-sdk==2.55.0
40
+ nbformat==5.10.4
41
+ aiohappyeyeballs==2.6.1
42
+ GitPython==3.1.46
43
+ pydantic==2.12.5
44
+ pyarrow-hotfix==0.7
45
+ ImageIO==2.37.3
46
+ nvidia-cublas-cu12==12.4.5.8
47
+ typing_extensions==4.15.0
48
+ nvidia-cuda-cupti-cu12==12.4.127
49
+ tensorboard-data-server==0.7.2
50
+ importlib_resources==6.5.2
51
+ cloudpickle==3.1.2
52
+ pynput==1.8.1
53
+ multidict==6.7.1
54
+ diffusers==0.11.1
55
+ iniconfig==2.3.0
56
+ requests==2.32.5
57
+ vector-quantize-pytorch==1.28.0
58
+ nvidia-cudnn-cu12==9.1.0.70
59
+ torchinfo==1.8.0
60
+ matplotlib==3.9.4
61
+ six==1.17.0
62
+ tqdm==4.67.3
63
+ nvidia-cuda-runtime-cu12==12.4.127
64
+ wandb==0.25.1
65
+ robomimic==0.5.0
66
+ tensorboardX==2.6.4
67
+ async-timeout==5.0.1
68
+ python-dotenv==1.2.2
69
+ mink==1.1.0
70
+ nvidia-curand-cu12==10.3.5.147
71
+ urllib3==2.6.3
72
+ cffi==2.0.0
73
+ nvidia-cusolver-cu12==11.6.1.9
74
+ tensorboard==2.20.0
75
+ nvidia-nvjitlink-cu12==12.4.127
76
+ smmap==5.0.3
77
+ datasets==2.19.2
78
+ frozenlist==1.8.0
79
+ nvidia-cusparse-cu12==12.3.1.170
80
+ importlib_metadata==9.0.0
81
+ gym-notices==0.1.0
82
+ termcolor==3.3.0
83
+ jupyter_core==5.9.1
84
+ packaging==26.0
85
+ PyOpenGL==3.1.10
86
+ numpy==1.26.4
87
+ jsonschema==4.26.0
88
+ bokeh==3.9.0
89
+ nvidia-nccl-cu12==2.21.5
90
+ filelock==3.25.2
91
+ torch==2.5.1
92
+ nltk==3.9.3
93
+ pytest==9.0.2
94
+ aiosignal==1.4.0
95
+ scipy==1.15.3
96
+ daqp==0.8.3
97
+ tornado==6.5.5
98
+ proglog==0.1.12
99
+ huggingface-hub==0.23.4
100
+ pyparsing==3.3.2
101
+ imageio-ffmpeg==0.6.0
102
+ referencing==0.37.0
103
+ pluggy==1.6.0
104
+ einops==0.8.2
105
+ yarl==1.23.0
106
+ dill==0.3.8
107
+ torchvision==0.20.1
108
+ jsonschema-specifications==2025.9.1
109
+ pip==23.0.1
110
+ moviepy==2.2.1
111
+ mdit-py-plugins==0.5.0
112
+ etils==1.13.0
113
+ nvidia-nvtx-cu12==12.4.127
114
+ numba==0.64.0
115
+ safetensors==0.7.0
116
+ kiwisolver==1.5.0
117
+ contourpy==1.3.2
118
+ networkx==3.4.2
119
+ cycler==0.12.1
120
+ aiohttp==3.13.3
121
+ zipp==3.23.0
122
+ mpmath==1.3.0
123
+ gym==0.26.2
124
+ opencv-python==4.11.0.86
125
+ pillow==11.3.0
126
+ xxhash==3.6.0
127
+ psutil==7.2.2
128
+ hydra-core==1.3.2
129
+ absl-py==2.4.0
130
+ glfw==2.10.0
131
+ idna==3.11
132
+ einx==0.4.2
133
+ Pygments==2.19.2
134
+ PyOpenGL-accelerate==3.1.10
135
+ frozendict==2.4.7
136
+ sympy==1.13.1
137
+ h5py==3.16.0
138
+ Cython==0.29.37
139
+ qpsolvers==4.11.0
140
+ certifi==2026.2.25
141
+ geoopt==0.5.1
142
+ nvidia-cufft-cu12==11.2.1.3
143
+ charset-normalizer==3.4.6
144
+ mdurl==0.1.2
145
+ pydantic_core==2.41.5
146
+ nvidia-cuda-nvrtc-cu12==12.4.127
147
+ protobuf==6.33.6
148
+ grpcio==1.78.0
149
+ jupytext==1.19.1
150
+ robosuite==1.5.1
151
+ bddl==3.6.0
152
+ propcache==0.4.1
153
+ Jinja2==3.1.6
154
+ click==8.3.1
155
+ markdown-it-py==4.0.0
156
+ fsspec==2024.3.1
157
+ omegaconf==2.3.0
158
+ llvmlite==0.46.0
159
+ setuptools==82.0.1
160
+ pyarrow==19.0.1
161
+ multiprocess==0.70.16
162
+ mujoco==3.6.0
163
+ plotly==6.6.0
164
+ jaraco.functools==4.4.0
165
+ platformdirs==4.4.0
166
+ tomli==2.4.0
167
+ backports.tarfile==1.2.0
168
+ jaraco.context==6.1.0
169
+ autocommand==2.2.2
170
+ jaraco.text==4.0.0
171
+ importlib_metadata==8.7.1
172
+ more-itertools==10.8.0
173
+ packaging==26.0
174
+ zipp==3.23.0
175
+ wheel==0.46.3
wandb/run-20260325_200057-qudlwnz5/files/wandb-metadata.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-171-generic-x86_64-with-glibc2.35",
3
+ "python": "CPython 3.10.18",
4
+ "startedAt": "2026-03-25T20:00:57.302961Z",
5
+ "args": [
6
+ "--config-name",
7
+ "dino_lam",
8
+ "data=libero_cosmos_policy",
9
+ "data.task_suite_name=null",
10
+ "data.hf.allow_patterns=[success_only/*_regen/*.hdf5]",
11
+ "data.image_chw=[3,224,224]",
12
+ "data.temporal_index_mode=clip",
13
+ "model.fdm.type=token_fdm_duration",
14
+ "objective.idm_input=future",
15
+ "objective.temporal.max_offset=20",
16
+ "objective.temporal.anchor_mode=fixed",
17
+ "objective.temporal.extra_random_count=0",
18
+ "train.use_aug=true",
19
+ "train.use_amp=true",
20
+ "train.stage1.batch_size=256",
21
+ "train.stage1.num_workers=16",
22
+ "train.stage1.prefetch_factor=2",
23
+ "train.stage1.total_steps=20000",
24
+ "train.stage1.log_interval=100",
25
+ "train.checkpoint.enabled=true",
26
+ "train.checkpoint.save_interval=1000",
27
+ "train.checkpoint.save_last=true",
28
+ "train.checkpoint.latest_only=true",
29
+ "output_root=outputs/token_fdm_duration/dino_suite_all_k20_extra0"
30
+ ],
31
+ "program": "/home/jovyan/youngjoonjeong/latent_action/run.py",
32
+ "codePath": "run.py",
33
+ "git": {
34
+ "remote": "https://github.com/joon-stack/latent_action.git",
35
+ "commit": "84bdcca892435da456b8a676dae358493a0a6e59"
36
+ },
37
+ "email": "zuni1218@gmail.com",
38
+ "root": "/home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52",
39
+ "host": "91b1e4a5838d",
40
+ "executable": "/home/jovyan/youngjoonjeong/latent_action/.venv/bin/python3",
41
+ "cpu_count": 32,
42
+ "cpu_count_logical": 64,
43
+ "gpu": "NVIDIA H100 NVL",
44
+ "gpu_count": 1,
45
+ "disk": {
46
+ "/": {
47
+ "total": "1889053200384",
48
+ "used": "1645352988672"
49
+ }
50
+ },
51
+ "memory": {
52
+ "total": "540748169216"
53
+ },
54
+ "gpu_nvidia": [
55
+ {
56
+ "name": "NVIDIA H100 NVL",
57
+ "memoryTotal": "100485038080",
58
+ "cudaCores": 16896,
59
+ "architecture": "Hopper",
60
+ "uuid": "GPU-c6a0d739-1597-848e-b639-5dba9b4deb79"
61
+ }
62
+ ],
63
+ "cudaVersion": "12.4",
64
+ "writerId": "zgphb5mlnbcfb9jpehhh8zgxm0bu2zcl"
65
+ }
wandb/run-20260325_200057-qudlwnz5/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"time/data_wait_s":0.0005364101380109787,"loss/total_loss":0.27370309829711914,"probe/z_to_action_seq_h20/l2":0.03549542278051376,"_timestamp":1.77447867603798e+09,"time/iter_s":0.4869440640322864,"_wandb":{"runtime":9822},"probe/z_to_action_seq_h20_shuffled/valid_ratio":0.944140613079071,"time/step_s":0.4864076538942754,"probe/z_to_action_t_shuffled/l2":0.2077900469303131,"probe/z_to_action_seq_h20_shuffled/l2":0.21182116866111755,"probe/z_to_action_t/l2":0.027867570519447327,"loss/fdm_fit_loss":0.27370309829711914,"loss/fdm_h20":0.27370309829711914,"probe/z_to_action_seq_h20/valid_ratio":0.944140613079071,"_step":19999,"_runtime":9822.244018516}
wandb/run-20260325_200057-qudlwnz5/logs/debug-core.log ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"time":"2026-03-25T20:00:57.333745886Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpr17fz98x/port-3245764.txt","pid":3245764,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false}
2
+ {"time":"2026-03-25T20:00:57.334247558Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":3245764}
3
+ {"time":"2026-03-25T20:00:57.334229645Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-3245764-3246101-3854211172/socket","Net":"unix"}}
4
+ {"time":"2026-03-25T20:00:57.521004148Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"}
5
+ {"time":"2026-03-25T20:00:57.525759429Z","level":"INFO","msg":"handleInformInit: received","streamId":"qudlwnz5","id":"1(@)"}
6
+ {"time":"2026-03-25T20:00:57.863985537Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"qudlwnz5","id":"1(@)"}
7
+ {"time":"2026-03-25T20:01:03.533019493Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"2webd6hskw9a"}
8
+ {"time":"2026-03-25T22:44:40.662595918Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"2webd6hskw9a"}
9
+ {"time":"2026-03-25T22:44:41.91056233Z","level":"INFO","msg":"connection: cancelling request","id":"1(@)","requestId":"2webd6hskw9a"}
10
+ {"time":"2026-03-25T22:44:41.91105048Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"qudlwnz5","id":"1(@)"}
11
+ {"time":"2026-03-25T22:44:41.912031578Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"qudlwnz5","id":"1(@)"}
12
+ {"time":"2026-03-25T22:44:42.151131844Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"}
13
+ {"time":"2026-03-25T22:44:42.151173852Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"}
14
+ {"time":"2026-03-25T22:44:42.151183039Z","level":"INFO","msg":"server is shutting down"}
15
+ {"time":"2026-03-25T22:44:42.151208807Z","level":"INFO","msg":"connection: closing","id":"1(@)"}
16
+ {"time":"2026-03-25T22:44:42.151268228Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-3245764-3246101-3854211172/socket","Net":"unix"}}
17
+ {"time":"2026-03-25T22:44:42.151299827Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"}
18
+ {"time":"2026-03-25T22:44:42.151310276Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"}
19
+ {"time":"2026-03-25T22:44:42.151320816Z","level":"INFO","msg":"server is closed"}
wandb/run-20260325_200057-qudlwnz5/logs/debug-internal.log ADDED
The diff for this file is too large to render. See raw diff
 
wandb/run-20260325_200057-qudlwnz5/logs/debug.log ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Current SDK version is 0.25.1
2
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Configure stats pid to 3245764
3
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_setup.py:_flush():81] Loading settings from environment variables
4
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/wandb/run-20260325_200057-qudlwnz5/logs/debug.log
5
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /home/jovyan/youngjoonjeong/latent_action/outputs/token_fdm_duration/dino_suite_all_k20_extra0/libero_cosmos_policy/2026-03-25/20-00-52/wandb/run-20260325_200057-qudlwnz5/logs/debug-internal.log
6
+ 2026-03-25 20:00:57,304 INFO MainThread:3245764 [wandb_init.py:init():844] calling init triggers
7
+ 2026-03-25 20:00:57,305 INFO MainThread:3245764 [wandb_init.py:init():849] wandb.init called with sweep_config: {}
8
+ config: {'data': {'name': 'libero_cosmos_policy', 'type': 'mg', 'backend': 'robomimic', 'paths': ['/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE3_turn_on_the_stove_and_put_the_moka_pot_on_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE4_put_the_black_bowl_in_the_bottom_drawer_of_the_cabinet_and_close_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE6_put_the_yellow_and_white_mug_in_the_microwave_and_close_it_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/KITCHEN_SCENE8_put_both_moka_pots_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE1_put_both_the_alphabet_soup_and_the_cream_cheese_box_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_alphabet_soup_and_the_tomato_sauce_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE2_put_both_the_cream_cheese_box_and_the_butter_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE5_put_the_white_mug_on_the_left_plate_and_put_the_yellow_and_white_mug_on_the_right_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/LIVING_ROOM_SCENE6_put_the_white_mug_on_the_plate_and_put_the_chocolate_pudding_to_the_right_of_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_10_regen/STUDY_SCENE1_pick_up_the_book_and_place_it_in_the_back_compartment_of_the_caddy_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_middle_drawer_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/open_the_top_drawer_and_put_the_bowl_inside_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/push_the_plate_to_the_front_of_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_bowl_on_top_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_cream_cheese_in_the_bowl_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_the_rack_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/put_the_wine_bottle_on_top_of_the_cabinet_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_goal_regen/turn_on_the_stove_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_alphabet_soup_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_bbq_sauce_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_butter_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_chocolate_pudding_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_cream_cheese_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_ketchup_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_milk_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_orange_juice_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_salad_dressing_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_object_regen/pick_up_the_tomato_sauce_and_place_it_in_the_basket_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_between_the_plate_and_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_from_table_center_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_in_the_top_drawer_of_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_cookie_box_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_plate_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_next_to_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_cookie_box_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_ramekin_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_stove_and_place_it_on_the_plate_demo.hdf5', '/home/jovyan/.cache/huggingface/hub/datasets--nvidia--LIBERO-Cosmos-Policy/snapshots/b463cbd5d114909e4daea65eb03bed9787290042/success_only/libero_spatial_regen/pick_up_the_black_bowl_on_the_wooden_cabinet_and_place_it_on_the_plate_demo.hdf5'], 'task_suite_name': None, 'observations_keys': ['image'], 'observation_source_keys': {'image': 'agentview_rgb_jpeg'}, 'action_dim': 7, 'frame_stack': 1, 'horizon': 1, 'temporal_index_mode': 'clip', 'use_proprio': False, 'proprio_source': 'robot_states', 'image_chw': [3, 224, 224], 'image_value_range': 'zero_to_one', 'image_transport_dtype': 'uint8', 'duration_focus': None, 'hf': {'repo_id': 'nvidia/LIBERO-Cosmos-Policy', 'repo_type': 'dataset', 'allow_patterns': ['success_only/*_regen/*.hdf5'], 'local_files_only': False}, 'action_sequence_targets': {'enabled': True, 'horizons': [20], 'target_key': 'gt_action_seq_max'}, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'multiscale': {'enabled': True}, 'use_aug': False, 'emit_states': False, 'emit_duration_label': False, 'emit_future_offset_fields': False, 'sample_transform': {'weak_augmentation': {'enabled': False}}}, 'train': {'optimizer': {'type': 'adamw', 'lr': 0.0001, 'weight_decay': 1e-06}, 'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'use_aug': True, 'aug_mode': 'default', 'use_amp': True, 'device_transfer_non_blocking': True, 'seed': 42, 'scheduler': {'type': 'cosine', 'warmup_steps': 500, 'num_cycles': 0.5, 'min_lr_scale': 0.0}, 'decoder_dataloader': {'enabled': False, 'batch_size': 64, 'num_workers': 4, 'prefetch_factor': None, 'shuffle': True}, 'stages': {'stage1': True, 'stage2': False, 'stage3': False}, 'stage1': {'batch_size': 256, 'num_workers': 16, 'prefetch_factor': 2, 'log_interval': 100, 'total_steps': 20000, 'eval_interval': 500, 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}}, 'stage2': {'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'latent_target': 'auto', 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}, 'action_probe': {'enabled': True}}, 'stage3': {'batch_size': 256, 'num_workers': 4, 'prefetch_factor': None, 'log_interval': 100, 'total_steps': 5000, 'eval_interval': 500, 'final_eval_num_episodes': 100, 'log_eval_video': False, 'optimizer': {'lr': 0.0001, 'weight_decay': 1e-06}, 'trainable_scope': 'all', 'non_decoder_lr_scale': 1.0}, 'checkpoint': {'enabled': True, 'base_dir': None, 'save_interval': 1000, 'save_last': True, 'latest_only': True, 'load': {'stage1': {'mode': 'none', 'path': None}, 'stage2': {'mode': 'handoff', 'path': None, 'teacher_path': None}, 'stage3': {'mode': 'handoff', 'path': None}}}}, 'model': {'idm': {'type': 'token_idm', 'action_dim': 128, 'token_dim': 768, 'model_dim': 512, 'latent_dim': 32, 'num_action_tokens': 4, 'num_blocks': 4, 'num_heads': 8, 'dropout': 0.0}, 'fdm': {'type': 'token_fdm_duration', 'action_dim': 128, 'token_dim': 768, 'model_dim': 512, 'num_action_tokens': 4, 'num_blocks': 4, 'num_heads': 8, 'dropout': 0.0, 'prediction_mode': 'direct'}, 'hyperbolic_latent': {'enabled': False, 'backend': 'geoopt', 'manifold': 'poincare', 'curvature': 1.0, 'learnable_curvature': False, 'fdm_input_mode': 'logmap0', 'prelift_mode': 'none', 'prelift_scale': 1.0, 'lift_max_norm': 5.0, 'tangent_max_norm': 5.0, 'eps': 1e-06}, 'encoders': {'type': 'dino', 'image_key': 'image', 'model_id': 'facebook/dinov2-base', 'input_value_range': 'zero_to_one', 'freeze_backbone': True, 'drop_cls_token': True, 'output_dim': 768, 'mean': [0.485, 0.456, 0.406], 'std': [0.229, 0.224, 0.225]}, 'type': 'dino_lam', 'idm_input': 'future', 'fdm_target': 'future', 'pixel_decoders': None, 'latent_action_decoders': None, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'multiscale_loss': {'enabled': True, 'prediction_mode': 'direct_duration', 'weight_mode': 'uniform', 'weights': {}, 'allow_plain_fdm_oneshot': True, 'direct_duration_backend': 'duration_aware', 'consistency': {'enabled': False, 'weight': 10.0, 'num_pairs': 4, 'sample_source': 'all_horizons', 'teacher_mode': 'direct_teacher'}}, 'branch_order': {'enabled': False, 'radial_weight': 0.0, 'local_radial_margin_weight': 0.0, 'local_radial_margin_alpha': 0.05, 'branch_weight': 0.0, 'z0_origin_weight': 0.0, 'prefix_weight': 0.0, 'radius_progress_weight': 1.0, 'radius_progress_mode': 'offset_margin', 'radius_progress_alpha': 0.02, 'branch_margin_deg': 10.0, 'branch_margin_rad': 0.17453292519943295, 'eps': 1e-06}}, 'objective': {'fdm_target': 'future', 'idm_input': 'future', 'multiscale': {'enabled': True, 'consistency': {'enabled': False, 'weight': 10.0, 'num_pairs': 4, 'sample_source': 'all_horizons', 'teacher_mode': 'direct_teacher'}, 'prediction_mode': 'direct_duration', 'allow_plain_fdm_oneshot': True, 'weight_mode': 'uniform', 'weights': {}}, 'temporal': {'max_offset': 20, 'anchor_mode': 'fixed', 'extra_random_count': 0, 'load_full_context': False}, 'branch_order': {'enabled': False, 'radial_weight': 0.0, 'local_radial_margin_weight': 0.0, 'local_radial_margin_alpha': 0.05, 'branch_weight': 0.0, 'z0_origin_weight': 0.0, 'prefix_weight': 0.0, 'radius_progress_weight': 1.0, 'radius_progress_mode': 'offset_margin', 'radius_progress_alpha': 0.02, 'branch_margin_deg': 10.0, 'eps': 1e-06}, 'latent_plan': {'enabled': False, 'total_horizon': 20, 'num_chunks': 1, 'chunk_dim': 128, 'plan_dim': 128}}, 'eval': {'type': 'robomimic', 'data_path': [], 'reset_mode': 'env_reset', 'num_eval_episodes': 20, 'max_steps': 500, 'record_video': True, 'checkpoint_path': None, 'checkpoint_strict': True, 'use_checkpoint_cfg': True, 'video_output_path': None, 'obs_keys': None, 'use_proprio': None, 'use_object': False, 'resize_hw': None, 'image_value_range': None, 'seed': 0}, 'agent': {'encoders': {'image': {'in_channels': 3, 'output_dim': 512, 'output_mode': 'global', 'type': 'resnet18', 'pretrained': False}, 'proprio': {'input_dim': 9, 'hidden_dim': 128, 'output_dim': 64}, 'type': 'group', 'modalities': ['agentview_image', 'robot0_eye_in_hand_image'], 'proj_dim': 128}, 'policies': {'decoder': {'type': 'mlp', 'hidden_dims': [256, 256]}, 'hidden_dims': [512, 512, 256, 64], 'action_dim': 256, 'emb_dim': 384, 'gt_action_dim': 7}, 'type': 'latent_action'}, 'probes': {'enabled': True, 'every': 10, 'steps_per_call': 1, 'sequence': {'enabled': True, 'horizons': [20], 'target_key': 'gt_action_seq_max'}, 'list': {'z_to_s_t': {'name': 'z_to_s_t', 'enabled': False, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 's_t', 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_s_tp': {'name': 'z_to_s_tp', 'enabled': False, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 's_tp', 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_action_t': {'name': 'z_to_action_t', 'probe_type': 'z_to_action', 'enabled': True, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 'gt_action', 'loss': 'mse', 'lr': 0.001, 'every': 1, 'mlp': {'hidden_dims': [128, 64]}}, 'z_to_action_seq_h20': {'name': 'z_to_action_seq_h20', 'probe_type': 'z_to_action_sequence', 'enabled': True, 'shuffle': True, 'type': 'regression', 'input': 'z_t', 'target': 'gt_action_seq_max', 'sequence_horizon': 20, 'loss': 'mse', 'lr': 0.001, 'every': 10, 'mlp': {'hidden_dims': [128, 64]}, 'output_dim': 140}}}, 'logger': {'project': 'latent_action', 'run_name': 'latent_action_training', 'tags': ['debug']}, 'output_root': 'outputs/token_fdm_duration/dino_suite_all_k20_extra0', '_wandb': {}}
9
+ 2026-03-25 20:00:57,305 INFO MainThread:3245764 [wandb_init.py:init():892] starting backend
10
+ 2026-03-25 20:00:57,521 INFO MainThread:3245764 [wandb_init.py:init():895] sending inform_init request
11
+ 2026-03-25 20:00:57,524 INFO MainThread:3245764 [wandb_init.py:init():903] backend started and connected
12
+ 2026-03-25 20:00:57,526 INFO MainThread:3245764 [wandb_init.py:init():973] updated telemetry
13
+ 2026-03-25 20:00:57,532 INFO MainThread:3245764 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout
14
+ 2026-03-25 20:00:58,418 INFO MainThread:3245764 [wandb_init.py:init():1042] starting run threads in backend
15
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_console_start():2524] atexit reg
16
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2373] redirect: wrap_raw
17
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2442] Wrapping output streams.
18
+ 2026-03-25 20:00:58,525 INFO MainThread:3245764 [wandb_run.py:_redirect():2465] Redirects installed.
19
+ 2026-03-25 20:00:58,527 INFO MainThread:3245764 [wandb_init.py:init():1082] run started, returning control to user process
20
+ 2026-03-25 22:44:40,660 INFO MainThread:3245764 [wandb_run.py:_finish():2291] finishing run joonstack/latent_action_stage1/qudlwnz5
21
+ 2026-03-25 22:44:40,661 INFO MainThread:3245764 [wandb_run.py:_atexit_cleanup():2490] got exitcode: 0
22
+ 2026-03-25 22:44:40,662 INFO MainThread:3245764 [wandb_run.py:_restore():2472] restore
23
+ 2026-03-25 22:44:40,662 INFO MainThread:3245764 [wandb_run.py:_restore():2478] restore done
24
+ 2026-03-25 22:44:41,910 INFO MainThread:3245764 [wandb_run.py:_footer_sync_info():3868] logging synced files
wandb/run-20260325_200057-qudlwnz5/run-qudlwnz5.wandb ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6838dfeb86abfb1f6ca625eb16a905847270272d4cd7b40c5c7758190e2037f
3
+ size 22197604