lsnu committed on Mar 24

Commit

ddc5223

verified ·

1 Parent(s): d5d49c1

Add files using upload-large-folder tool

Browse files

Files changed (39) hide show

artifacts/data/reveal_proxy/proxy_train_clip224_v5_actionhist.pt +3 -0
artifacts/data/reveal_proxy/proxy_train_smoke_v5_actionhist.pt +3 -0
artifacts/data/reveal_proxy/proxy_train_v5_actionhist.pt +3 -0
artifacts/data/reveal_proxy/proxy_val_clip224_v5_actionhist.pt +3 -0
artifacts/data/reveal_proxy/proxy_val_smoke_v5_actionhist.pt +3 -0
artifacts/data/reveal_proxy/proxy_val_v5_actionhist.pt +3 -0
artifacts/outputs/interaction_debug/ablation_no_interaction_head_actionhist/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/ablation_no_interaction_head_actionhist/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/ablation_no_world_model_actionhist/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/ablation_none_actionhist/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/ablation_none_actionhist/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt +3 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/config_resolved.yaml +123 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/diagnostics/proxy_diagnostics.json +7 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/metrics.json +432 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/checkpoint_best.pt +3 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/config_resolved.yaml +123 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_clip_actionhist/checkpoint_best.pt +3 -0
artifacts/outputs/interaction_debug/proxy_interaction_state_recency_oracleft/checkpoint_best.pt +3 -0
artifacts/outputs/interaction_debug/reveal_eval_commit8_compare/reveal_benchmark.json +41 -0
artifacts/outputs/interaction_debug/reveal_eval_commit8_compare/reveal_benchmark.md +37 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_commit4/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_commit4/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke_commit4_short/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke_commit4_short/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_full_commit4/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_full_commit4/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_smoke_commit4_short/reveal_benchmark.json +15 -0
artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_smoke_commit4_short/reveal_benchmark.md +13 -0
artifacts/outputs/interaction_debug/reveal_eval_old_no_leak_baselines_commit4/reveal_benchmark.json +28 -0
artifacts/outputs/interaction_debug/reveal_eval_old_no_leak_baselines_commit4/reveal_benchmark.md +25 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_clipped/rollout_eval.json +23 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_clipped/rollout_eval.md +11 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_recovered/rollout_eval.json +31 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_recovered/rollout_eval.md +11 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_rerun/rollout_eval.json +23 -0
artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_rerun/rollout_eval.md +11 -0

artifacts/data/reveal_proxy/proxy_train_clip224_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ec73ee20b3f68ad49efbeb571f779a3554a657d75270fd2398f8ddd78c53524e
+size 13366472

artifacts/data/reveal_proxy/proxy_train_smoke_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:208036101fb18e4c55e015d89599343370f883f0da87e1f63880ea389a4005da
+size 822400

artifacts/data/reveal_proxy/proxy_train_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:86bedaa237f1d35268462d39491f4d223cf3b0b0e9c1d2b9c0d6151a6124854b
+size 13294184

artifacts/data/reveal_proxy/proxy_val_clip224_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e10909f7dd6c30f1c74f7d740b26b3202ad484f1219aa1dee8d23310bfb265b9
+size 4408000

artifacts/data/reveal_proxy/proxy_val_smoke_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0e93133295b1914e188baabd36e48adb5264c70fd5c27be202f339807608bd62
+size 303736

artifacts/data/reveal_proxy/proxy_val_v5_actionhist.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1cc98e332deb8194e0539aec72d1dead90b778b50f8021e890bb392b26bb6fa1
+size 4581536

artifacts/outputs/interaction_debug/ablation_no_interaction_head_actionhist/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.16666666666666666,
+      "bag_proxy": 0.5,
+      "cloth_proxy": 0.5
+    },
+    "mean_success": 0.38888888888888884,
+    "visibility_integral": 42.193298303418686,
+    "corridor_availability": 0.9207814501391517,
+    "reocclusion_rate": 0.016840277777777777,
+    "persistence_horizon_mae": 0.0,
+    "disturbance_cost": 0.5719093395810988
+  }
+}

artifacts/outputs/interaction_debug/ablation_no_interaction_head_actionhist/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt
+- mean_success: 0.389
+- visibility_integral: 42.193
+- corridor_availability: 0.921
+- reocclusion_rate: 0.017
+- persistence_horizon_mae: 0.000
+- disturbance_cost: 0.572
+- foliage_proxy_success: 0.167
+- bag_proxy_success: 0.500
+- cloth_proxy_success: 0.500

artifacts/outputs/interaction_debug/ablation_no_world_model_actionhist/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5416666666666666,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5277777777777778,
+    "visibility_integral": 32.94181125528283,
+    "corridor_availability": 0.8710797395971086,
+    "reocclusion_rate": 0.003125,
+    "persistence_horizon_mae": 1.1577362408331497,
+    "disturbance_cost": 0.42711537962572443
+  }
+}

artifacts/outputs/interaction_debug/ablation_none_actionhist/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5416666666666666,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5277777777777778,
+    "visibility_integral": 32.84789120488696,
+    "corridor_availability": 0.8711970953477753,
+    "reocclusion_rate": 0.003125,
+    "persistence_horizon_mae": 1.1544888946683267,
+    "disturbance_cost": 0.4288607043110662
+  }
+}

artifacts/outputs/interaction_debug/ablation_none_actionhist/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt
+- mean_success: 0.528
+- visibility_integral: 32.848
+- corridor_availability: 0.871
+- reocclusion_rate: 0.003
+- persistence_horizon_mae: 1.154
+- disturbance_cost: 0.429
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.542
+- cloth_proxy_success: 0.625

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:34a4ab95f18c0b0b1f6b3dee49341ac2cf46b05e8f3cfe8a9c4cefeb948bb495
+size 14262770

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,123 @@

+experiment_name: proxy_interaction_state_actionhist
+output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction_debug
+device: cuda
+seed: 13
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 96
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v5_actionhist.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v5_actionhist.pt
+  rebuild_dataset: true
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 13
+optim:
+  epochs: 10
+  batch_size: 16
+  num_workers: 0
+  lr: 0.001
+  weight_decay: 0.0001
+trainer:
+  policy_type: interaction_state
+  use_bf16: true
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 128
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: true
+  fusion:
+    hidden_dim: 128
+    num_cameras: 3
+    num_layers: 2
+    num_heads: 4
+    ff_dim: 256
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 128
+    action_dim: 14
+    history_steps: 6
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    num_heads: 4
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 128
+    num_heads: 4
+    num_layers: 2
+    ff_dim: 256
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+  reveal_head:
+    hidden_dim: 128
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 4
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 128
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 4
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  planner:
+    hidden_dim: 128
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 4
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+loss_weights:
+  action: 1.0
+  phase: 0.15
+  arm_role: 0.2
+  support_mode: 0.15
+  corridor: 0.2
+  persistence: 0.1
+  disturbance: 0.1
+  world_model: 0.25
+  belief: 0.05
+  planner_success: 0.2
+  planner_risk: 0.1
+  planner_ranking: 0.1
+  proposal_reconstruction: 0.2
+  proposal_success: 0.1
+  proposal_ranking: 0.1

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/diagnostics/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "planner_top1_accuracy": 0.1984732824427481,
+  "planner_regret": 0.07150506228208542,
+  "risk_calibration_mse": 0.009851997718214989,
+  "role_collapse_rate": 0.0,
+  "num_samples": 131
+}

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/metrics.json ADDED Viewed

	@@ -0,0 +1,432 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.10911335345978539,
+      "arm_role": 0.16803828751047453,
+      "belief": 0.19615339611967406,
+      "corridor": 0.3072426902751128,
+      "disturbance": 0.022138183771555003,
+      "persistence": 4.085065553585689,
+      "phase": 0.6928596496582031,
+      "planner_ranking": 0.13037589440743128,
+      "planner_risk": 0.02288868693479647,
+      "planner_success": 0.6770538414518038,
+      "proposal_ranking": 0.11255756175766389,
+      "proposal_reconstruction": 0.18574035447090864,
+      "proposal_success": 0.6725843846797943,
+      "reocclusion": 0.5957262838880221,
+      "support_mode": 0.5480141110407809,
+      "total": 1.8947660674651463,
+      "uncertainty": 0.21132264643286666,
+      "world_model": 3.2140407264232635
+    },
+    "val": {
+      "action": 0.03260375331673357,
+      "arm_role": 0.00019734147483379475,
+      "belief": 0.12217340038882361,
+      "corridor": 0.2606741752889421,
+      "disturbance": 0.0038526968952889242,
+      "persistence": 4.259798420800103,
+      "phase": 0.4765485127766927,
+      "planner_ranking": 0.09453996519247691,
+      "planner_risk": 0.014876836703883277,
+      "planner_success": 0.7184285786416795,
+      "proposal_ranking": 0.09570289817121294,
+      "proposal_reconstruction": 0.08512727750672235,
+      "proposal_success": 0.6778848502371047,
+      "reocclusion": 0.30221917231877643,
+      "support_mode": 0.02004129211935732,
+      "total": 1.6661332448323567,
+      "uncertainty": 0.08814782814847098,
+      "world_model": 3.2738216982947455
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.027130307474484045,
+      "arm_role": 8.922153043992391e-05,
+      "belief": 0.11714147465924422,
+      "corridor": 0.24812329125901064,
+      "disturbance": 0.0032305579976916,
+      "persistence": 4.067985733350118,
+      "phase": 0.4347850941121578,
+      "planner_ranking": 0.10891644563525915,
+      "planner_risk": 0.014627174474298954,
+      "planner_success": 0.5990801006555557,
+      "proposal_ranking": 0.09713093843311071,
+      "proposal_reconstruction": 0.080568744490544,
+      "proposal_success": 0.6738408307234446,
+      "reocclusion": 0.30479869805276394,
+      "support_mode": 0.00354524122303701,
+      "total": 1.5207980622847874,
+      "uncertainty": 0.043511384554828204,
+      "world_model": 2.9335382282733917
+    },
+    "val": {
+      "action": 0.020881797497471172,
+      "arm_role": 4.6685139548369785e-05,
+      "belief": 0.11459854990243912,
+      "corridor": 0.25242144697242314,
+      "disturbance": 0.0016878885928437943,
+      "persistence": 3.9848385651906333,
+      "phase": 0.5357780622111427,
+      "planner_ranking": 0.12248502175013225,
+      "planner_risk": 0.014007404032680724,
+      "planner_success": 0.5618854893578423,
+      "proposal_ranking": 0.08806857880618837,
+      "proposal_reconstruction": 0.07101386454370287,
+      "proposal_success": 0.6761446727646722,
+      "reocclusion": 0.2807581913140085,
+      "support_mode": 0.00033569296485640935,
+      "total": 1.5498341586854723,
+      "uncertainty": 0.03854438621136877,
+      "world_model": 3.084032244152493
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.021659845563893516,
+      "arm_role": 4.9689525894791586e-05,
+      "belief": 0.11830708974351485,
+      "corridor": 0.2507151396324237,
+      "disturbance": 0.004413674871708888,
+      "persistence": 2.643252914150556,
+      "phase": 0.43942634264628094,
+      "planner_ranking": 0.10935842959831159,
+      "planner_risk": 0.014072448286848763,
+      "planner_success": 0.5583219341933727,
+      "proposal_ranking": 0.09152727667242289,
+      "proposal_reconstruction": 0.0724022975191474,
+      "proposal_success": 0.6700933004419009,
+      "reocclusion": 0.31216587871313095,
+      "support_mode": 0.000645008350450856,
+      "total": 1.2870350579420726,
+      "uncertainty": 0.028561103138296556,
+      "world_model": 2.6294024040301642
+    },
+    "val": {
+      "action": 0.02809068684776624,
+      "arm_role": 5.452130871061753e-05,
+      "belief": 0.10888734211524327,
+      "corridor": 0.23266181018617418,
+      "disturbance": 0.0027104780440115267,
+      "persistence": 2.1311826043658786,
+      "phase": 0.48636723723676467,
+      "planner_ranking": 0.08748033228847715,
+      "planner_risk": 0.013984487702449163,
+      "planner_success": 0.5531185136901008,
+      "proposal_ranking": 0.08530248867140876,
+      "proposal_reconstruction": 0.07563025090429518,
+      "proposal_success": 0.6710293292999268,
+      "reocclusion": 0.31506533589628005,
+      "support_mode": 0.0013758842574639453,
+      "total": 1.145080222023858,
+      "uncertainty": 0.013753527258005407,
+      "world_model": 2.241931358973185
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.02241998988514145,
+      "arm_role": 7.662544400470021e-05,
+      "belief": 0.1198031771928072,
+      "corridor": 0.23061849611500898,
+      "disturbance": 0.008813309230996916,
+      "persistence": 1.791534848511219,
+      "phase": 0.4151729643344879,
+      "planner_ranking": 0.10807953278223674,
+      "planner_risk": 0.013897615058037141,
+      "planner_success": 0.5403684402505556,
+      "proposal_ranking": 0.09165094265093406,
+      "proposal_reconstruction": 0.07184119118998449,
+      "proposal_success": 0.6651807849605879,
+      "reocclusion": 0.27597781488051015,
+      "support_mode": 0.0006089698921035355,
+      "total": 1.035346123079459,
+      "uncertainty": 0.02133664352974544,
+      "world_model": 2.009356458981832
+    },
+    "val": {
+      "action": 0.024748968995279737,
+      "arm_role": 0.00046029978289475874,
+      "belief": 0.1361072982350985,
+      "corridor": 0.2555284963713752,
+      "disturbance": 0.01113364020259016,
+      "persistence": 1.8078472415606182,
+      "phase": 0.49851488404803806,
+      "planner_ranking": 0.09051681806643803,
+      "planner_risk": 0.012982964619166322,
+      "planner_success": 0.5361581941445669,
+      "proposal_ranking": 0.08841735952430302,
+      "proposal_reconstruction": 0.07644655058781306,
+      "proposal_success": 0.6653637025091383,
+      "reocclusion": 0.3103545730312665,
+      "support_mode": 0.0022364634981689355,
+      "total": 1.2436118059688144,
+      "uncertainty": 0.044811665597889155,
+      "world_model": 2.755778524610731
+    }
+  },
+  {
+    "epoch": 4,
+    "train": {
+      "action": 0.030993331456556916,
+      "arm_role": 8.697735347595881e-05,
+      "belief": 0.11502061566958825,
+      "corridor": 0.2168644548704227,
+      "disturbance": 0.005981470370898023,
+      "persistence": 1.325400508319338,
+      "phase": 0.4057002601524194,
+      "planner_ranking": 0.10196248659243186,
+      "planner_risk": 0.013080424706762036,
+      "planner_success": 0.5429841242730618,
+      "proposal_ranking": 0.09320679493248463,
+      "proposal_reconstruction": 0.08633392583578825,
+      "proposal_success": 0.6598697329560915,
+      "reocclusion": 0.23775681791206202,
+      "support_mode": 0.0005070095260938009,
+      "total": 0.9538104037443796,
+      "uncertainty": 0.01720601328027745,
+      "world_model": 1.8480148315429688
+    },
+    "val": {
+      "action": 0.02140410254812903,
+      "arm_role": 5.1328555046994654e-05,
+      "belief": 0.10880060328377618,
+      "corridor": 0.21354658570554522,
+      "disturbance": 0.0037805813287074366,
+      "persistence": 1.2975979381137424,
+      "phase": 0.47454749047756195,
+      "planner_ranking": 0.08853000981940164,
+      "planner_risk": 0.011068900529709127,
+      "planner_success": 0.5381979445616404,
+      "proposal_ranking": 0.09127837005588743,
+      "proposal_reconstruction": 0.07022183057334688,
+      "proposal_success": 0.6659399072329203,
+      "reocclusion": 0.19952762044138378,
+      "support_mode": 0.00027834434553773864,
+      "total": 0.952674925327301,
+      "uncertainty": 0.01160443677670426,
+      "world_model": 1.8811089727613661
+    }
+  },
+  {
+    "epoch": 5,
+    "train": {
+      "action": 0.02381352987140417,
+      "arm_role": 6.333578160896043e-05,
+      "belief": 0.1099607174595197,
+      "corridor": 0.21310261078178883,
+      "disturbance": 0.002459915580402594,
+      "persistence": 1.6992873040338357,
+      "phase": 0.4683965767423312,
+      "planner_ranking": 0.10114171418050925,
+      "planner_risk": 0.011117635760456324,
+      "planner_success": 0.5304318008323511,
+      "proposal_ranking": 0.09141425788402557,
+      "proposal_reconstruction": 0.07442743517458439,
+      "proposal_success": 0.6563858091831207,
+      "reocclusion": 0.331877409790953,
+      "support_mode": 0.3825794731577237,
+      "total": 0.9921379586060842,
+      "uncertainty": 0.010878979364254823,
+      "world_model": 1.6345916986465454
+    },
+    "val": {
+      "action": 0.02524013713830047,
+      "arm_role": 9.413575834413577e-05,
+      "belief": 0.12235430793629752,
+      "corridor": 0.249200153681967,
+      "disturbance": 0.004427346711357434,
+      "persistence": 3.935940318637424,
+      "phase": 0.6591929793357849,
+      "planner_ranking": 0.09305098156134288,
+      "planner_risk": 0.010506668748954931,
+      "planner_success": 0.5443058278825548,
+      "proposal_ranking": 0.08850305030743282,
+      "proposal_reconstruction": 0.07236838009622362,
+      "proposal_success": 0.6759181155098809,
+      "reocclusion": 0.7287290294965109,
+      "support_mode": 1.1460433138741388,
+      "total": 1.4354194932513766,
+      "uncertainty": 0.024242303644617397,
+      "world_model": 1.8577234480116103
+    }
+  },
+  {
+    "epoch": 6,
+    "train": {
+      "action": 0.02330849994905293,
+      "arm_role": 0.00015805537501970926,
+      "belief": 0.1124286272873481,
+      "corridor": 0.23743322926263014,
+      "disturbance": 0.0031262978930802396,
+      "persistence": 3.8017045756181083,
+      "phase": 0.6851730346679688,
+      "planner_ranking": 0.09221760835498571,
+      "planner_risk": 0.01065190702987214,
+      "planner_success": 0.52338948721687,
+      "proposal_ranking": 0.09460213221609592,
+      "proposal_reconstruction": 0.0690260889629523,
+      "proposal_success": 0.6765442565083504,
+      "reocclusion": 0.6601327558358511,
+      "support_mode": 0.7531089782714844,
+      "total": 1.3313229431708653,
+      "uncertainty": 0.016478817832345765,
+      "world_model": 1.75758895277977
+    },
+    "val": {
+      "action": 0.023909604797760647,
+      "arm_role": 0.000182229990362733,
+      "belief": 0.10623268286387126,
+      "corridor": 0.2390136702193154,
+      "disturbance": 0.0034688233410836095,
+      "persistence": 3.879435486263699,
+      "phase": 0.6545324060651991,
+      "planner_ranking": 0.09108450180954403,
+      "planner_risk": 0.00950968601844377,
+      "planner_success": 0.5444046192699008,
+      "proposal_ranking": 0.09340034839179781,
+      "proposal_reconstruction": 0.06825375143024656,
+      "proposal_success": 0.6806784537103441,
+      "reocclusion": 0.6431198517481486,
+      "support_mode": 0.6673565440707736,
+      "total": 1.3279486762152777,
+      "uncertainty": 0.008409220777038071,
+      "world_model": 1.7654762268066406
+    }
+  },
+  {
+    "epoch": 7,
+    "train": {
+      "action": 0.0222570748689274,
+      "arm_role": 0.00010212738478306467,
+      "belief": 0.11000798580547173,
+      "corridor": 0.23306679725646973,
+      "disturbance": 0.0033048741412737095,
+      "persistence": 3.4312864542007446,
+      "phase": 0.6377454921603203,
+      "planner_ranking": 0.09635432902723551,
+      "planner_risk": 0.011387234243253866,
+      "planner_success": 0.5442424913247427,
+      "proposal_ranking": 0.08986945698658626,
+      "proposal_reconstruction": 0.06708647248645623,
+      "proposal_success": 0.673826314508915,
+      "reocclusion": 0.5967350701491038,
+      "support_mode": 0.6117285092671713,
+      "total": 1.236641672750314,
+      "uncertainty": 0.01299802268234392,
+      "world_model": 1.639583835999171
+    },
+    "val": {
+      "action": 0.022002756595611572,
+      "arm_role": 2.9528787207608628e-05,
+      "belief": 0.12314293947484758,
+      "corridor": 0.24459290835592482,
+      "disturbance": 0.004033175555782186,
+      "persistence": 2.5022888514730663,
+      "phase": 0.5651864541901482,
+      "planner_ranking": 0.08950987623797522,
+      "planner_risk": 0.009576339947266711,
+      "planner_success": 0.5564733445644379,
+      "proposal_ranking": 0.08564452992545234,
+      "proposal_reconstruction": 0.0668929773900244,
+      "proposal_success": 0.6727176573541429,
+      "reocclusion": 0.44570984774165684,
+      "support_mode": 0.46422717306349015,
+      "total": 1.1864347391658359,
+      "uncertainty": 0.029489829101496272,
+      "world_model": 1.938715272479587
+    }
+  },
+  {
+    "epoch": 8,
+    "train": {
+      "action": 0.019501756915512185,
+      "arm_role": 4.518414956085811e-05,
+      "belief": 0.11856034491211176,
+      "corridor": 0.22101152688264847,
+      "disturbance": 0.005134509168177222,
+      "persistence": 2.0068868373831115,
+      "phase": 0.48705990488330525,
+      "planner_ranking": 0.09284681857873996,
+      "planner_risk": 0.01043116363386313,
+      "planner_success": 0.5206327053407828,
+      "proposal_ranking": 0.08962376570949952,
+      "proposal_reconstruction": 0.06520200536275904,
+      "proposal_success": 0.6658588672677676,
+      "reocclusion": 0.3816298767924309,
+      "support_mode": 0.28521304662960273,
+      "total": 0.9868118191758791,
+      "uncertainty": 0.015137382831502086,
+      "world_model": 1.557202582557996
+    },
+    "val": {
+      "action": 0.01789842639118433,
+      "arm_role": 4.689901551399897e-05,
+      "belief": 0.11476549340618981,
+      "corridor": 0.20894784231980643,
+      "disturbance": 0.006007373902118868,
+      "persistence": 1.3287181854248047,
+      "phase": 0.4533460769388411,
+      "planner_ranking": 0.09486487342251672,
+      "planner_risk": 0.009565845442314943,
+      "planner_success": 0.5391222304768033,
+      "proposal_ranking": 0.09564895927906036,
+      "proposal_reconstruction": 0.06366962691148122,
+      "proposal_success": 0.6531099279721578,
+      "reocclusion": 0.20913477883570725,
+      "support_mode": 0.020122037941796914,
+      "total": 0.8832472761472067,
+      "uncertainty": 0.004256232098365824,
+      "world_model": 1.6128649711608887
+    }
+  },
+  {
+    "epoch": 9,
+    "train": {
+      "action": 0.016334226393761735,
+      "arm_role": 6.246064898126254e-05,
+      "belief": 0.10857280095418294,
+      "corridor": 0.19824294683833918,
+      "disturbance": 0.003975103861497094,
+      "persistence": 1.1797814977665741,
+      "phase": 0.40182892481486004,
+      "planner_ranking": 0.09200050433476765,
+      "planner_risk": 0.009777653632530322,
+      "planner_success": 0.4811691368619601,
+      "proposal_ranking": 0.09789401820550363,
+      "proposal_reconstruction": 0.06257841860254605,
+      "proposal_success": 0.6470200767119726,
+      "reocclusion": 0.24410315960024795,
+      "support_mode": 0.004229606854399511,
+      "total": 0.8042063365379969,
+      "uncertainty": 0.004445769324471864,
+      "world_model": 1.4606107970078785
+    },
+    "val": {
+      "action": 0.016275615017447207,
+      "arm_role": 6.341466885512798e-05,
+      "belief": 0.10352056639062034,
+      "corridor": 0.19860318468676674,
+      "disturbance": 0.0032389340146134296,
+      "persistence": 1.292702876859241,
+      "phase": 0.44613948629962075,
+      "planner_ranking": 0.09405012097623613,
+      "planner_risk": 0.00965356407687068,
+      "planner_success": 0.5550677445199754,
+      "proposal_ranking": 0.09946481055683559,
+      "proposal_reconstruction": 0.062025451825724706,
+      "proposal_success": 0.637408435344696,
+      "reocclusion": 0.1942617915984657,
+      "support_mode": 0.0015144004525306325,
+      "total": 0.8655187752511766,
+      "uncertainty": 0.002816161386565202,
+      "world_model": 1.5848071972529094
+    }
+  }
+]

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/checkpoint_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:54df000293b3795beb34e6696ed2e18664ea87df6aaf81cf39ec9b23c589580a
+size 3810162

artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,123 @@

+experiment_name: proxy_interaction_state_actionhist_smoke
+output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction_debug
+device: cuda
+seed: 13
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 64
+  train_episodes_per_proxy: 6
+  val_episodes_per_proxy: 2
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_smoke_v5_actionhist.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_smoke_v5_actionhist.pt
+  rebuild_dataset: true
+  chunk_horizon: 4
+  rollout_horizon: 3
+  history_steps: 6
+  planner_candidates: 4
+  seed: 13
+optim:
+  epochs: 4
+  batch_size: 8
+  num_workers: 0
+  lr: 0.001
+  weight_decay: 0.0001
+trainer:
+  policy_type: interaction_state
+  use_bf16: true
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 64
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: true
+  fusion:
+    hidden_dim: 64
+    num_cameras: 3
+    num_layers: 2
+    num_heads: 4
+    ff_dim: 128
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 64
+    action_dim: 14
+    history_steps: 6
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    num_heads: 4
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 64
+    num_heads: 4
+    num_layers: 2
+    ff_dim: 128
+    dropout: 0.1
+    chunk_size: 4
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 4
+    num_phases: 5
+    num_arm_roles: 4
+  reveal_head:
+    hidden_dim: 64
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 3
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 4
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 64
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 3
+    field_size: 16
+    num_heads: 4
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  planner:
+    hidden_dim: 64
+    num_candidates: 4
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 4
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+loss_weights:
+  action: 1.0
+  phase: 0.15
+  arm_role: 0.2
+  support_mode: 0.15
+  corridor: 0.2
+  persistence: 0.1
+  disturbance: 0.1
+  world_model: 0.25
+  belief: 0.05
+  planner_success: 0.2
+  planner_risk: 0.1
+  planner_ranking: 0.1
+  proposal_reconstruction: 0.2
+  proposal_success: 0.1
+  proposal_ranking: 0.1

artifacts/outputs/interaction_debug/proxy_interaction_state_clip_actionhist/checkpoint_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e4adeddd399c964ef4536e44b963d3e061fe4734a9e0ae84d6961ffc81b1331
+size 942404672

artifacts/outputs/interaction_debug/proxy_interaction_state_recency_oracleft/checkpoint_best.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be03ccc29ab53e41e5b6065bd5cc4ae35edd53da600a4ae7e2e4beb5693c76ab
+size 14260274

artifacts/outputs/interaction_debug/reveal_eval_commit8_compare/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,41 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.2916666666666667,
+      "bag_proxy": 0.5416666666666666,
+      "cloth_proxy": 0.7083333333333334
+    },
+    "mean_success": 0.5138888888888888,
+    "visibility_integral": 24.377886186043423,
+    "corridor_availability": 0.7185707421352466,
+    "reocclusion_rate": 0.035547913343965974,
+    "persistence_horizon_mae": 1.5261633908191676,
+    "disturbance_cost": 0.33828365347451633
+  },
+  "backbone": {
+    "per_task_success": {
+      "foliage_proxy": 0.2916666666666667,
+      "bag_proxy": 0.3333333333333333,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.4166666666666667,
+    "visibility_integral": 16.212429179085625,
+    "corridor_availability": 0.5099402347372638,
+    "reocclusion_rate": 0.035937500000000004,
+    "persistence_horizon_mae": 0.0,
+    "disturbance_cost": 0.14064574577949113
+  },
+  "reveal": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5555555555555555,
+    "visibility_integral": 32.11319461464882,
+    "corridor_availability": 0.8064262109498183,
+    "reocclusion_rate": 0.05781655348648813,
+    "persistence_horizon_mae": 1.9629322701129155,
+    "disturbance_cost": 0.22681122702649897
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_commit8_compare/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,37 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt
+- mean_success: 0.514
+- visibility_integral: 24.378
+- corridor_availability: 0.719
+- reocclusion_rate: 0.036
+- persistence_horizon_mae: 1.526
+- disturbance_cost: 0.338
+- foliage_proxy_success: 0.292
+- bag_proxy_success: 0.542
+- cloth_proxy_success: 0.708
+## backbone
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only/checkpoint_best.pt
+- mean_success: 0.417
+- visibility_integral: 16.212
+- corridor_availability: 0.510
+- reocclusion_rate: 0.036
+- persistence_horizon_mae: 0.000
+- disturbance_cost: 0.141
+- foliage_proxy_success: 0.292
+- bag_proxy_success: 0.333
+- cloth_proxy_success: 0.625
+## reveal
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_reveal_state/checkpoint_best.pt
+- mean_success: 0.556
+- visibility_integral: 32.113
+- corridor_availability: 0.806
+- reocclusion_rate: 0.058
+- persistence_horizon_mae: 1.963
+- disturbance_cost: 0.227
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_commit4/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5416666666666666,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5277777777777778,
+    "visibility_integral": 32.84789120488696,
+    "corridor_availability": 0.8711970953477753,
+    "reocclusion_rate": 0.003125,
+    "persistence_horizon_mae": 1.1544888946683267,
+    "disturbance_cost": 0.4288607043110662
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_commit4/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist/checkpoint_best.pt
+- mean_success: 0.528
+- visibility_integral: 32.848
+- corridor_availability: 0.871
+- reocclusion_rate: 0.003
+- persistence_horizon_mae: 1.154
+- disturbance_cost: 0.429
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.542
+- cloth_proxy_success: 0.625

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.0,
+      "bag_proxy": 0.0,
+      "cloth_proxy": 0.0
+    },
+    "mean_success": 0.0,
+    "visibility_integral": 63.63303746117486,
+    "corridor_availability": 0.9842249751091003,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.931804162517397,
+    "disturbance_cost": 0.8506438152657615
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/checkpoint_best.pt
+- mean_success: 0.000
+- visibility_integral: 63.633
+- corridor_availability: 0.984
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.932
+- disturbance_cost: 0.851
+- foliage_proxy_success: 0.000
+- bag_proxy_success: 0.000
+- cloth_proxy_success: 0.000

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke_commit4_short/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.5,
+      "bag_proxy": 0.75,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.625,
+    "visibility_integral": 26.89287617057562,
+    "corridor_availability": 0.8617658143242201,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.787702427190893,
+    "disturbance_cost": 0.3262111305569609
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_interaction_actionhist_smoke_commit4_short/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_debug/proxy_interaction_state_actionhist_smoke/checkpoint_best.pt
+- mean_success: 0.625
+- visibility_integral: 26.893
+- corridor_availability: 0.862
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.788
+- disturbance_cost: 0.326
+- foliage_proxy_success: 0.500
+- bag_proxy_success: 0.750
+- cloth_proxy_success: 0.625

artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_full_commit4/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.2916666666666667,
+      "bag_proxy": 0.041666666666666664,
+      "cloth_proxy": 0.16666666666666666
+    },
+    "mean_success": 0.16666666666666666,
+    "visibility_integral": 17.456528491444057,
+    "corridor_availability": 0.48336762624482316,
+    "reocclusion_rate": 0.11013933982683982,
+    "persistence_horizon_mae": 1.8837784738524963,
+    "disturbance_cost": 0.2859070710207258
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_full_commit4/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/checkpoint_best.pt
+- mean_success: 0.167
+- visibility_integral: 17.457
+- corridor_availability: 0.483
+- reocclusion_rate: 0.110
+- persistence_horizon_mae: 1.884
+- disturbance_cost: 0.286
+- foliage_proxy_success: 0.292
+- bag_proxy_success: 0.042
+- cloth_proxy_success: 0.167

artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_smoke_commit4_short/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "interaction": {
+    "per_task_success": {
+      "foliage_proxy": 0.375,
+      "bag_proxy": 0.375,
+      "cloth_proxy": 0.25
+    },
+    "mean_success": 0.3333333333333333,
+    "visibility_integral": 43.64047184586525,
+    "corridor_availability": 0.9287551492452621,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.8099890020956475,
+    "disturbance_cost": 0.6381748262792826
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_interaction_rolefix_smoke_commit4_short/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## interaction
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/checkpoint_best.pt
+- mean_success: 0.333
+- visibility_integral: 43.640
+- corridor_availability: 0.929
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.810
+- disturbance_cost: 0.638
+- foliage_proxy_success: 0.375
+- bag_proxy_success: 0.375
+- cloth_proxy_success: 0.250

artifacts/outputs/interaction_debug/reveal_eval_old_no_leak_baselines_commit4/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,28 @@

+{
+  "backbone": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5555555555555555,
+    "visibility_integral": 29.27436817354626,
+    "corridor_availability": 0.7935162136952082,
+    "reocclusion_rate": 0.07854136604136604,
+    "persistence_horizon_mae": 0.0,
+    "disturbance_cost": 0.4006388829503622
+  },
+  "reveal": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5416666666666666,
+    "visibility_integral": 30.107333534293705,
+    "corridor_availability": 0.8134206715557311,
+    "reocclusion_rate": 0.05241552429052429,
+    "persistence_horizon_mae": 2.0996421982129196,
+    "disturbance_cost": 0.42389288420478505
+  }
+}

artifacts/outputs/interaction_debug/reveal_eval_old_no_leak_baselines_commit4/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,25 @@

+# Reveal Proxy Benchmark
+## backbone
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only/checkpoint_best.pt
+- mean_success: 0.556
+- visibility_integral: 29.274
+- corridor_availability: 0.794
+- reocclusion_rate: 0.079
+- persistence_horizon_mae: 0.000
+- disturbance_cost: 0.401
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667
+## reveal
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_reveal_state/checkpoint_best.pt
+- mean_success: 0.542
+- visibility_integral: 30.107
+- corridor_availability: 0.813
+- reocclusion_rate: 0.052
+- persistence_horizon_mae: 2.100
+- disturbance_cost: 0.424
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.625

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_clipped/rollout_eval.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt",
+  "plan_requested": true,
+  "plan_applied": true,
+  "planner_mode": "proxy_pretrained",
+  "support_mode_conditioning": true,
+  "episodes_per_task": 1,
+  "episode_length": 5,
+  "resolution": 128,
+  "cameras": [
+    "front",
+    "wrist_left",
+    "wrist_right"
+  ],
+  "tasks": {
+    "open_drawer": {
+      "error": "A path could not be found. Most likely due to the target being inaccessible or a collison was detected.",
+      "mean_success": 0.0,
+      "mean_return": 0.0
+    }
+  },
+  "mean_success": 0.0
+}

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_clipped/rollout_eval.md ADDED Viewed

	@@ -0,0 +1,11 @@

+# RLBench Rollout Eval
+- Checkpoint: `/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt`
+- Plan requested: `True`
+- Plan applied: `True`
+- Support-mode conditioning: `True`
+- Mean success: `0.000`
+## Per-task
+- `open_drawer`: error=A path could not be found. Most likely due to the target being inaccessible or a collison was detected.

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_recovered/rollout_eval.json ADDED Viewed

	@@ -0,0 +1,31 @@

+{
+  "checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt",
+  "plan_requested": true,
+  "plan_applied": true,
+  "planner_mode": "proxy_pretrained",
+  "support_mode_conditioning": true,
+  "episodes_per_task": 1,
+  "episode_length": 5,
+  "resolution": 128,
+  "cameras": [
+    "front",
+    "wrist_left",
+    "wrist_right"
+  ],
+  "tasks": {
+    "open_drawer": {
+      "task_class": "OpenDrawer",
+      "successes": [
+        0.0
+      ],
+      "returns": [
+        0.0
+      ],
+      "path_recoveries": 0,
+      "noop_fallbacks": 0,
+      "mean_success": 0.0,
+      "mean_return": 0.0
+    }
+  },
+  "mean_success": 0.0
+}

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_recovered/rollout_eval.md ADDED Viewed

	@@ -0,0 +1,11 @@

+# RLBench Rollout Eval
+- Checkpoint: `/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt`
+- Plan requested: `True`
+- Plan applied: `True`
+- Support-mode conditioning: `True`
+- Mean success: `0.000`
+## Per-task
+- `open_drawer`: mean_success=0.000, returns=[0.0]

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_rerun/rollout_eval.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt",
+  "plan_requested": true,
+  "plan_applied": true,
+  "planner_mode": "proxy_pretrained",
+  "support_mode_conditioning": true,
+  "episodes_per_task": 1,
+  "episode_length": 5,
+  "resolution": 128,
+  "cameras": [
+    "front",
+    "wrist_left",
+    "wrist_right"
+  ],
+  "tasks": {
+    "open_drawer": {
+      "error": "A path could not be found because the target is outside of workspace.",
+      "mean_success": 0.0,
+      "mean_return": 0.0
+    }
+  },
+  "mean_success": 0.0
+}

artifacts/outputs/interaction_debug/rlbench_open_drawer_rollout_eval_commit4_rerun/rollout_eval.md ADDED Viewed

	@@ -0,0 +1,11 @@

+# RLBench Rollout Eval
+- Checkpoint: `/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt`
+- Plan requested: `True`
+- Plan applied: `True`
+- Support-mode conditioning: `True`
+- Mean success: `0.000`
+## Per-task
+- `open_drawer`: error=A path could not be found because the target is outside of workspace.