Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.02867290366350942,0.011463257366429714,-0.02887656604578487,-0.02600612910926127,27.234100594973334,10.972999999998995,0.72,5056.6,-0.4,-323.98,217.46,0.6708195781707764,450000
|
| 3 |
+
0.0,0.0,-0.0488876627715917,0.029199732070436933,-0.046781637220506544,0.02339874869809982,30.924384212662204,6.997999999999383,0.86,14901.74,-0.24,-226.58,137.96,0.4372998046875,500000
|
| 4 |
+
0.0,0.0,-0.03574048522523012,0.047686374001355364,-0.03288299381366747,0.02639781711342885,33.63589021187137,5.403999999999642,0.92,21621.9,-0.14,-162.52,106.08,0.3397250270843506,550000
|
| 5 |
+
0.0,0.0,-0.03021578923036463,0.0394976072294332,-0.027182995475428965,0.04382907760796754,33.35598161165096,5.011999999999664,0.92,26354.74,-0.16,-165.74,98.24,0.3102375030517578,600000
|
| 6 |
+
0.0,0.0,-0.046524057758791516,0.052021306978465985,-0.04276920476237997,0.05582660234860478,35.489654628825754,3.515999999999815,0.96,31097.68,-0.06,-102.68,68.32,0.22407721996307373,650000
|
| 7 |
+
0.0,0.0,-0.04960850795848323,0.05351060405942106,-0.04591604539822911,0.04705534775815299,34.55363053605605,2.954999999999944,1.0,34128.74,0.0,-85.9,57.1,0.1833690023422241,700000
|
| 8 |
+
0.0,0.0,-0.04936068078573048,0.05831210187676398,-0.04556115923074419,0.06058237165215024,35.652750134571484,2.7019999999999236,1.0,36914.78,0.0,-76.34,52.04,0.175793137550354,750000
|
| 9 |
+
0.0,0.0,-0.04387414746665861,0.06582031519898665,-0.040122722990781116,0.06399927349208273,34.111627533222105,3.854999999999768,0.94,40472.76,-0.08,-111.76,75.1,0.2414384078979492,800000
|
| 10 |
+
0.0,0.0,-0.04896650897225149,0.0584491363024676,-0.04537151845582367,0.06050740348977812,35.56282834898023,2.947999999999887,0.98,44257.28,-0.02,-81.0,56.96,0.18764180183410645,850000
|
| 11 |
+
0.0,0.0,-0.04472016123840982,0.06184074474297109,-0.040681187702692065,0.06725994341997119,35.844154673332625,2.5549999999999597,1.0,46761.82,0.0,-70.64,49.1,0.1693114709854126,900000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.02867290366350942,0.011463257366429714,-0.02887656604578487,-0.02600612910926127,27.234100594973334,10.972999999998995,0.72,5056.6,-0.4,-323.98,217.46,0.6708195781707764,450000
|
| 3 |
+
0.0,0.0,-0.0488876627715917,0.029199732070436933,-0.046781637220506544,0.02339874869809982,30.924384212662204,6.997999999999383,0.86,14901.74,-0.24,-226.58,137.96,0.4372998046875,500000
|
| 4 |
+
0.0,0.0,-0.03574048522523012,0.047686374001355364,-0.03288299381366747,0.02639781711342885,33.63589021187137,5.403999999999642,0.92,21621.9,-0.14,-162.52,106.08,0.3397250270843506,550000
|
| 5 |
+
0.0,0.0,-0.03021578923036463,0.0394976072294332,-0.027182995475428965,0.04382907760796754,33.35598161165096,5.011999999999664,0.92,26354.74,-0.16,-165.74,98.24,0.3102375030517578,600000
|
| 6 |
+
0.0,0.0,-0.046524057758791516,0.052021306978465985,-0.04276920476237997,0.05582660234860478,35.489654628825754,3.515999999999815,0.96,31097.68,-0.06,-102.68,68.32,0.22407721996307373,650000
|
| 7 |
+
0.0,0.0,-0.04960850795848323,0.05351060405942106,-0.04591604539822911,0.04705534775815299,34.55363053605605,2.954999999999944,1.0,34128.74,0.0,-85.9,57.1,0.1833690023422241,700000
|
| 8 |
+
0.0,0.0,-0.04936068078573048,0.05831210187676398,-0.04556115923074419,0.06058237165215024,35.652750134571484,2.7019999999999236,1.0,36914.78,0.0,-76.34,52.04,0.175793137550354,750000
|
| 9 |
+
0.0,0.0,-0.04387414746665861,0.06582031519898665,-0.040122722990781116,0.06399927349208273,34.111627533222105,3.854999999999768,0.94,40472.76,-0.08,-111.76,75.1,0.2414384078979492,800000
|
| 10 |
+
0.0,0.0,-0.04896650897225149,0.0584491363024676,-0.04537151845582367,0.06050740348977812,35.56282834898023,2.947999999999887,0.98,44257.28,-0.02,-81.0,56.96,0.18764180183410645,850000
|
| 11 |
+
0.0,0.0,-0.04472016123840982,0.06184074474297109,-0.040681187702692065,0.06725994341997119,35.844154673332625,2.5549999999999597,1.0,46761.82,0.0,-70.64,49.1,0.1693114709854126,900000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.99999994,0.025157133,2.5157132,1.0251571,0.53231317,-26.891712,-103.67446,-172.2503,0.13399374,-0.14884958,10.510901,405000
|
| 3 |
+
1.0,1.0,0.025113257,2.5113258,1.0251132,0.77921313,-19.04549,-103.03257,-172.13354,0.3299345,-0.15223771,11.391849,410000
|
| 4 |
+
1.0,0.9999999,0.023235314,2.3235314,1.0232352,0.7512946,-27.673769,-105.85537,-178.86087,0.50038725,-0.4437714,11.955674,415000
|
| 5 |
+
1.0,1.0,0.022527503,2.2527504,1.0225275,1.2428778,-22.596699,-105.58801,-186.42746,0.3160805,-0.28271976,14.373287,420000
|
| 6 |
+
1.0,1.0,0.023217924,2.3217926,1.0232179,0.9237636,-39.350384,-106.337845,-187.28612,0.25962913,-0.15568459,14.160808,425000
|
| 7 |
+
1.0,1.0,0.023621818,2.362182,1.0236218,4.3968186,-25.211662,-104.02071,-187.45119,0.5784953,-0.5873601,33.55614,430000
|
| 8 |
+
1.0,1.0,0.0251925,2.5192497,1.0251925,1.3648342,-24.053425,-103.02919,-187.50647,0.35545927,-0.34532136,21.68988,435000
|
| 9 |
+
1.0,1.0,0.02521493,2.521493,1.0252149,1.604153,-26.96808,-101.5722,-191.61823,0.92516464,-0.96857643,29.963015,440000
|
| 10 |
+
1.0,0.99999994,0.023334352,2.3334353,1.0233343,1.2581676,-37.785847,-102.24515,-202.25917,0.15806566,-0.21556772,16.773167,445000
|
| 11 |
+
1.0,1.0,0.026809376,2.6809375,1.0268093,1.4568628,-4.5243387,-101.99981,-181.94754,0.3197963,-0.3033229,22.476076,450000
|
| 12 |
+
1.0,1.0,0.026387896,2.6387897,1.0263879,1.2023535,-6.2533994,-97.68756,-178.05121,0.1526876,-0.2164221,16.206255,455000
|
| 13 |
+
1.0,1.0,0.026118184,2.6118183,1.0261182,1.2065241,-18.78402,-95.51681,-191.9236,0.42062873,-0.4463129,15.317608,460000
|
| 14 |
+
1.0,0.9999999,0.028214788,2.8214788,1.0282147,1.289976,-20.51815,-94.15615,-194.60336,0.15496647,-0.17340407,14.155297,465000
|
| 15 |
+
1.0,1.0,0.02640535,2.640535,1.0264053,1.4825348,-9.145197,-92.48812,-194.21062,0.27726346,-0.3197029,20.028833,470000
|
| 16 |
+
1.0,1.0,0.027353358,2.7353358,1.0273534,1.1836166,-8.634992,-96.52739,-198.756,0.22825176,-0.17488514,16.71601,475000
|
| 17 |
+
1.0,1.0,0.02695355,2.695355,1.0269536,1.5686903,-9.323476,-96.56451,-192.85529,0.37681964,-0.22715092,18.565798,480000
|
| 18 |
+
1.0,1.0,0.026193237,2.6193237,1.0261933,1.1369078,-12.74843,-96.366196,-181.73361,0.1317066,-0.26755702,14.013101,485000
|
| 19 |
+
1.0,1.0,0.028329657,2.8329659,1.0283296,2.538432,-9.117981,-93.268196,-190.5664,0.1780087,-0.17786413,18.999344,490000
|
| 20 |
+
1.0,0.99999994,0.028367547,2.836755,1.0283675,2.0601337,-21.544312,-93.60598,-193.21124,0.46069407,-0.41348884,32.147987,495000
|
| 21 |
+
1.0,1.0,0.02745549,2.745549,1.0274554,1.1408931,-16.635332,-92.632034,-184.18936,0.13581789,-0.21753965,15.989874,500000
|
| 22 |
+
1.0,0.99999994,0.028493382,2.8493383,1.0284933,1.5111655,-5.97856,-92.368164,-195.51163,0.23915003,-0.19570182,16.69968,505000
|
| 23 |
+
1.0,0.9999999,0.027989589,2.798959,1.0279895,1.5369517,-13.603284,-91.58053,-176.48103,0.28107885,-0.4413799,21.673958,510000
|
| 24 |
+
1.0,0.9999901,0.027572297,2.7572298,1.0275624,1.0297557,0.82993084,-88.66686,-171.9292,0.21027854,-0.21160015,15.316832,515000
|
| 25 |
+
1.0,1.0,0.026589934,2.6589935,1.02659,1.1302769,-1.9311945,-89.384605,-179.8292,0.16891453,-0.26917547,16.111519,520000
|
| 26 |
+
1.0,1.0000001,0.02797164,2.797164,1.0279717,1.7714993,-5.1349754,-91.82836,-169.75162,0.1795532,-0.16546644,15.686453,525000
|
| 27 |
+
1.0,1.0,0.02972116,2.972116,1.0297211,3.9209125,-11.591069,-92.44326,-179.12503,0.7461984,-0.34941038,32.133583,530000
|
| 28 |
+
1.0,0.9999396,0.028732024,2.8732023,1.0286716,2.7485232,2.2264824,-90.89141,-179.37616,0.421374,-0.4223844,28.846163,535000
|
| 29 |
+
1.0,0.9999999,0.029354481,2.9354482,1.0293543,1.4808971,-0.39686167,-86.62581,-170.97238,0.3301482,-0.24302964,22.01601,540000
|
| 30 |
+
1.0,1.0,0.02824355,2.8243551,1.0282435,1.196995,-8.212218,-89.84618,-192.50697,0.17205356,-0.21746291,17.68002,545000
|
| 31 |
+
1.0,0.99999994,0.027313815,2.7313814,1.0273137,1.3159078,-5.526501,-88.45916,-177.21669,0.34176654,-0.21142854,18.370007,550000
|
| 32 |
+
1.0,0.99998313,0.026809677,2.6809678,1.0267928,1.505472,0.64103436,-87.57682,-171.60443,0.8050131,-0.8677561,24.70426,555000
|
| 33 |
+
1.0,1.0,0.028479535,2.8479536,1.0284796,1.8479054,-2.3692818,-90.33882,-190.21123,0.6045487,-0.53351456,32.414917,560000
|
| 34 |
+
1.0,1.0,0.027306596,2.7306597,1.0273066,1.6418797,1.5755324,-86.00034,-175.61833,0.48290777,-0.23012751,26.27731,565000
|
| 35 |
+
1.0,1.0,0.028812345,2.8812346,1.0288123,1.4088321,-6.6962147,-86.68374,-188.03596,0.26674983,-0.3705712,22.354813,570000
|
| 36 |
+
1.0,1.0,0.027958095,2.7958097,1.0279582,2.1789005,-7.0649147,-91.747116,-189.65019,0.4352608,-0.25116655,28.023155,575000
|
| 37 |
+
1.0,0.9999589,0.027199455,2.7199454,1.0271584,0.9810616,2.1859703,-88.72465,-184.81218,0.21929246,-0.19292563,13.493492,580000
|
| 38 |
+
1.0,1.0,0.030407228,3.0407228,1.0304072,1.1152725,-1.1895856,-83.35737,-163.9159,0.3662737,-0.20014341,16.979311,585000
|
| 39 |
+
1.0,1.0,0.029095434,2.9095435,1.0290954,1.4334427,-0.33924088,-86.0289,-191.83453,0.3218287,-0.3722298,24.570652,590000
|
| 40 |
+
1.0,1.0,0.029855452,2.9855456,1.0298555,1.1751639,-1.6925819,-85.66372,-187.55261,0.15117049,-0.2987684,15.508531,595000
|
| 41 |
+
1.0,1.0000001,0.028974392,2.897439,1.0289745,1.361495,0.43888986,-86.19103,-190.31033,0.1818742,-0.28831422,18.0083,600000
|
| 42 |
+
1.0,1.0,0.030579604,3.0579605,1.0305796,1.3688914,-5.1868277,-84.06667,-160.24855,0.22067493,-0.15921643,15.408772,605000
|
| 43 |
+
1.0,0.99999994,0.0290608,2.9060802,1.0290607,1.0749149,-0.18576913,-85.88476,-167.7035,0.22567034,-0.19181833,14.963071,610000
|
| 44 |
+
1.0,1.0,0.029777136,2.9777136,1.0297772,1.4772668,-1.2207552,-86.17348,-185.10791,0.3131353,-0.1445865,18.562372,615000
|
| 45 |
+
1.0,1.0,0.027791819,2.779182,1.0277919,1.2263137,-7.468808,-86.70676,-183.23918,0.24187972,-0.124534935,14.215077,620000
|
| 46 |
+
1.0,0.99999994,0.029488675,2.9488678,1.0294886,2.3008575,-2.9173937,-81.540085,-162.2597,0.45000547,-0.45436323,27.43052,625000
|
| 47 |
+
1.0,0.9999999,0.03304253,3.304253,1.0330424,1.1009369,-8.010798,-86.10673,-166.99625,0.23161161,-0.15467167,14.42505,630000
|
| 48 |
+
1.0,1.0,0.028398268,2.8398268,1.0283983,1.2683347,2.4165225,-81.82644,-166.50897,0.4698519,-0.22387849,17.060617,635000
|
| 49 |
+
1.0,0.99999297,0.028513413,2.8513415,1.0285064,1.0603459,0.8634237,-83.07632,-184.48326,0.13762239,-0.17841047,13.7100315,640000
|
| 50 |
+
1.0,1.0000001,0.030850738,3.0850737,1.0308509,1.0063349,-6.119576,-84.837,-173.29623,0.13152419,-0.2876541,14.184723,645000
|
| 51 |
+
1.0,0.9999999,0.027130157,2.7130156,1.02713,1.744371,-3.694085,-77.00824,-179.12402,0.30397892,-0.34729686,24.008179,650000
|
| 52 |
+
1.0,0.99999994,0.02846169,2.846169,1.0284616,1.6476061,-1.03453,-82.62798,-172.2966,0.45145506,-0.4111906,28.578028,655000
|
| 53 |
+
1.0,0.9999999,0.029099101,2.9099102,1.029099,1.0226222,1.0894544,-80.10908,-184.60036,0.17011172,-0.11648369,12.606863,660000
|
| 54 |
+
1.0,0.99999994,0.030114004,3.0114005,1.0301139,1.0247539,-3.7409632,-82.38372,-180.51791,0.34927693,-0.19711797,15.946648,665000
|
| 55 |
+
1.0,1.0,0.029359099,2.93591,1.0293591,1.1407241,-0.8996131,-82.0368,-165.055,0.18203667,-0.36729115,20.570862,670000
|
| 56 |
+
1.0,1.0,0.027800802,2.7800803,1.0278008,0.94336385,-2.3100398,-79.81594,-183.07901,0.1770483,-0.26989076,12.1538105,675000
|
| 57 |
+
1.0,1.0,0.028826227,2.8826227,1.0288262,0.96859473,-3.0086403,-81.17747,-173.3624,0.14399034,-0.23791951,12.935832,680000
|
| 58 |
+
1.0,0.99999994,0.029899344,2.9899344,1.0298992,1.8025011,0.89308864,-81.68165,-159.62326,0.5098676,-0.5711018,34.44747,685000
|
| 59 |
+
1.0,1.0000001,0.02909045,2.909045,1.0290905,1.4307975,-1.3456149,-78.490685,-176.74768,0.5574124,-0.5478476,27.587158,690000
|
| 60 |
+
1.0,0.99991804,0.031072412,3.1072412,1.0309905,1.3462108,1.7484103,-78.277824,-179.27621,0.36681306,-0.20657629,17.481045,695000
|
| 61 |
+
1.0,1.0,0.02866352,2.866352,1.0286635,1.310079,-1.9671917,-82.247,-167.81079,0.6681708,-0.7706908,25.66786,700000
|
| 62 |
+
1.0,1.0,0.03066139,3.0661392,1.0306613,1.8792429,-0.48563617,-81.46601,-179.0039,0.24187243,-0.15345678,16.47634,705000
|
| 63 |
+
1.0,1.0,0.03255529,3.255529,1.0325553,1.0426214,-4.326896,-78.38122,-177.68349,0.16984126,-0.3232741,15.097506,710000
|
| 64 |
+
1.0,1.0,0.028775923,2.8775926,1.0287759,1.0344267,-2.201786,-78.27268,-168.79538,0.21650673,-0.24039692,13.591915,715000
|
| 65 |
+
1.0,1.0,0.030905962,3.0905964,1.030906,1.4879193,-0.04249753,-80.4499,-173.50764,0.17480858,-0.14259417,17.908833,720000
|
| 66 |
+
1.0,1.0,0.030289765,3.0289767,1.0302898,1.153807,-3.2742999,-78.48632,-172.845,0.36190283,-0.20452476,14.627241,725000
|
| 67 |
+
1.0,0.99999994,0.029811835,2.9811838,1.0298117,1.6162747,0.19062641,-79.489685,-167.67587,0.23334767,-0.26864174,18.429594,730000
|
| 68 |
+
1.0,1.0,0.029936913,2.9936912,1.0299369,1.2919143,-2.3219457,-76.75367,-173.92172,0.18950911,-0.37761837,20.501825,735000
|
| 69 |
+
1.0,1.0,0.030583125,3.0583124,1.0305831,1.0020924,-3.8779254,-78.95847,-166.17645,0.17481792,-0.14044605,13.936207,740000
|
| 70 |
+
1.0,1.0000001,0.029932035,2.9932036,1.0299321,1.2503451,-1.8170642,-80.866325,-165.38596,0.27001324,-0.25996187,18.59056,745000
|
| 71 |
+
1.0,1.0,0.026945347,2.6945348,1.0269454,1.0872494,-3.4809084,-75.342735,-183.88287,0.17580277,-0.31675202,15.2077055,750000
|
| 72 |
+
1.0,0.9999999,0.028875742,2.8875744,1.0288756,1.158755,-0.32245803,-81.822685,-179.0785,0.19723153,-0.13587615,13.791277,755000
|
| 73 |
+
1.0,1.0000001,0.029557452,2.9557452,1.0295576,1.2797717,-2.7225082,-75.676956,-183.25209,0.48249784,-0.44401678,21.209183,760000
|
| 74 |
+
1.0,0.9999999,0.030168341,3.0168343,1.0301682,1.039604,-0.29801273,-78.17334,-181.96777,0.1791617,-0.268606,16.297937,765000
|
| 75 |
+
1.0,1.0,0.03026244,3.0262442,1.0302625,1.0960665,-0.9961767,-76.904564,-181.67613,0.1472198,-0.2133097,14.638384,770000
|
| 76 |
+
1.0,1.0,0.029020883,2.9020882,1.0290209,1.9126447,1.1025565,-73.928055,-168.68607,0.8830315,-0.8811148,28.69691,775000
|
| 77 |
+
1.0,0.9999999,0.026768215,2.6768217,1.0267681,2.168081,-2.507389,-78.297935,-177.02034,0.9942874,-0.8256104,33.560005,780000
|
| 78 |
+
1.0,1.0,0.029241005,2.9241004,1.029241,1.3147159,0.18927641,-76.90078,-179.8806,0.3238694,-0.6623882,22.157047,785000
|
| 79 |
+
1.0,0.99999994,0.03273215,3.2732153,1.0327321,3.245547,-6.440209,-78.10644,-167.83926,1.4206494,-1.4985799,67.45865,790000
|
| 80 |
+
1.0,1.0000001,0.0309261,3.0926101,1.0309262,1.7712936,-6.7748995,-78.68036,-149.60652,0.3127793,-0.50636345,32.42936,795000
|
| 81 |
+
1.0,1.0,0.028302658,2.8302658,1.0283027,1.5178775,-4.623312,-74.289856,-162.8892,0.47776693,-0.2178857,19.766258,800000
|
| 82 |
+
1.0,1.0,0.027624436,2.7624438,1.0276245,0.9988994,-3.718313,-77.24389,-180.65868,0.18850729,-0.21744314,13.770182,805000
|
| 83 |
+
1.0,1.0,0.030929865,3.0929866,1.0309299,1.2587565,-1.5539808,-77.31718,-160.09221,0.18924849,-0.44038606,23.902521,810000
|
| 84 |
+
1.0,0.9999999,0.029325422,2.9325423,1.0293252,1.3022418,2.9071474,-74.15098,-151.52704,0.23969454,-0.25326788,16.678091,815000
|
| 85 |
+
1.0,1.0,0.032281272,3.2281272,1.0322813,1.1061958,-2.2815404,-73.260765,-171.6884,0.2074157,-0.19928178,13.576932,820000
|
| 86 |
+
1.0,1.0,0.027961243,2.7961245,1.0279613,1.3516855,-2.8398328,-73.7302,-182.4437,0.2295364,-0.42085585,17.26958,825000
|
| 87 |
+
1.0,1.0,0.030254275,3.0254276,1.0302542,1.6477684,-5.554787,-74.28219,-158.6764,0.2948131,-0.59618485,23.41027,830000
|
| 88 |
+
1.0,1.0,0.03004852,3.0048523,1.0300485,1.4816443,-6.275089,-75.81646,-179.62883,0.4856126,-0.4701814,21.868565,835000
|
| 89 |
+
1.0,1.0000001,0.028501328,2.850133,1.0285014,1.1150454,0.891432,-73.28914,-171.41383,0.27181777,-0.29515952,16.80836,840000
|
| 90 |
+
1.0,1.0,0.029717376,2.9717376,1.0297173,0.9611149,-1.1746378,-77.93211,-160.30507,0.164268,-0.14209498,14.242855,845000
|
| 91 |
+
1.0,1.0,0.029581558,2.958156,1.0295815,2.8112862,-1.0053928,-77.28289,-157.81905,2.0261583,-2.030685,50.976357,850000
|
| 92 |
+
1.0,1.0,0.029129354,2.9129353,1.0291294,1.4264927,-2.0379643,-74.056175,-164.71466,0.35019082,-0.15869084,16.734995,855000
|
| 93 |
+
1.0,1.0,0.029617704,2.9617705,1.0296177,1.2352985,-5.7739,-74.17617,-157.48624,0.29675552,-0.3497808,19.456741,860000
|
| 94 |
+
1.0,0.9999999,0.03141515,3.1415153,1.031415,1.159293,0.46420175,-72.782616,-168.17328,0.19167876,-0.18615498,15.760767,865000
|
| 95 |
+
1.0,1.0,0.031298604,3.1298604,1.0312986,1.1478783,-0.4238211,-72.408554,-155.93524,0.4366696,-0.41830447,14.587732,870000
|
| 96 |
+
1.0,0.99999994,0.028046932,2.8046932,1.0280468,1.7066001,-0.69876814,-73.606834,-169.63846,0.22007403,-0.16337667,16.09037,875000
|
| 97 |
+
1.0,0.9999949,0.030467726,3.0467725,1.0304626,1.3358862,1.2025062,-72.44623,-156.06421,0.51550955,-0.56755215,22.389702,880000
|
| 98 |
+
1.0,0.99999994,0.031030923,3.1030922,1.0310309,1.5794549,-0.2063334,-71.77701,-180.00485,0.5333202,-0.60327566,21.14301,885000
|
| 99 |
+
1.0,1.0,0.028529227,2.852923,1.0285292,4.000989,-4.5180883,-73.07194,-158.98949,0.6402899,-0.93612427,40.81414,890000
|
| 100 |
+
1.0,0.99999994,0.028406568,2.8406568,1.0284065,1.4421934,-0.7852998,-68.89236,-175.58554,0.32959756,-0.4134327,22.533663,895000
|
| 101 |
+
1.0,0.9999999,0.027761918,2.7761917,1.0277618,1.1799005,-0.6992659,-67.682594,-170.13539,0.22685947,-0.26550597,16.37744,900000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,0.99999994,0.025157133,2.5157132,1.0251571,0.53231317,-26.891712,-103.67446,-172.2503,0.13399374,-0.14884958,10.510901,405000
|
| 3 |
+
1.0,1.0,0.025113257,2.5113258,1.0251132,0.77921313,-19.04549,-103.03257,-172.13354,0.3299345,-0.15223771,11.391849,410000
|
| 4 |
+
1.0,0.9999999,0.023235314,2.3235314,1.0232352,0.7512946,-27.673769,-105.85537,-178.86087,0.50038725,-0.4437714,11.955674,415000
|
| 5 |
+
1.0,1.0,0.022527503,2.2527504,1.0225275,1.2428778,-22.596699,-105.58801,-186.42746,0.3160805,-0.28271976,14.373287,420000
|
| 6 |
+
1.0,1.0,0.023217924,2.3217926,1.0232179,0.9237636,-39.350384,-106.337845,-187.28612,0.25962913,-0.15568459,14.160808,425000
|
| 7 |
+
1.0,1.0,0.023621818,2.362182,1.0236218,4.3968186,-25.211662,-104.02071,-187.45119,0.5784953,-0.5873601,33.55614,430000
|
| 8 |
+
1.0,1.0,0.0251925,2.5192497,1.0251925,1.3648342,-24.053425,-103.02919,-187.50647,0.35545927,-0.34532136,21.68988,435000
|
| 9 |
+
1.0,1.0,0.02521493,2.521493,1.0252149,1.604153,-26.96808,-101.5722,-191.61823,0.92516464,-0.96857643,29.963015,440000
|
| 10 |
+
1.0,0.99999994,0.023334352,2.3334353,1.0233343,1.2581676,-37.785847,-102.24515,-202.25917,0.15806566,-0.21556772,16.773167,445000
|
| 11 |
+
1.0,1.0,0.026809376,2.6809375,1.0268093,1.4568628,-4.5243387,-101.99981,-181.94754,0.3197963,-0.3033229,22.476076,450000
|
| 12 |
+
1.0,1.0,0.026387896,2.6387897,1.0263879,1.2023535,-6.2533994,-97.68756,-178.05121,0.1526876,-0.2164221,16.206255,455000
|
| 13 |
+
1.0,1.0,0.026118184,2.6118183,1.0261182,1.2065241,-18.78402,-95.51681,-191.9236,0.42062873,-0.4463129,15.317608,460000
|
| 14 |
+
1.0,0.9999999,0.028214788,2.8214788,1.0282147,1.289976,-20.51815,-94.15615,-194.60336,0.15496647,-0.17340407,14.155297,465000
|
| 15 |
+
1.0,1.0,0.02640535,2.640535,1.0264053,1.4825348,-9.145197,-92.48812,-194.21062,0.27726346,-0.3197029,20.028833,470000
|
| 16 |
+
1.0,1.0,0.027353358,2.7353358,1.0273534,1.1836166,-8.634992,-96.52739,-198.756,0.22825176,-0.17488514,16.71601,475000
|
| 17 |
+
1.0,1.0,0.02695355,2.695355,1.0269536,1.5686903,-9.323476,-96.56451,-192.85529,0.37681964,-0.22715092,18.565798,480000
|
| 18 |
+
1.0,1.0,0.026193237,2.6193237,1.0261933,1.1369078,-12.74843,-96.366196,-181.73361,0.1317066,-0.26755702,14.013101,485000
|
| 19 |
+
1.0,1.0,0.028329657,2.8329659,1.0283296,2.538432,-9.117981,-93.268196,-190.5664,0.1780087,-0.17786413,18.999344,490000
|
| 20 |
+
1.0,0.99999994,0.028367547,2.836755,1.0283675,2.0601337,-21.544312,-93.60598,-193.21124,0.46069407,-0.41348884,32.147987,495000
|
| 21 |
+
1.0,1.0,0.02745549,2.745549,1.0274554,1.1408931,-16.635332,-92.632034,-184.18936,0.13581789,-0.21753965,15.989874,500000
|
| 22 |
+
1.0,0.99999994,0.028493382,2.8493383,1.0284933,1.5111655,-5.97856,-92.368164,-195.51163,0.23915003,-0.19570182,16.69968,505000
|
| 23 |
+
1.0,0.9999999,0.027989589,2.798959,1.0279895,1.5369517,-13.603284,-91.58053,-176.48103,0.28107885,-0.4413799,21.673958,510000
|
| 24 |
+
1.0,0.9999901,0.027572297,2.7572298,1.0275624,1.0297557,0.82993084,-88.66686,-171.9292,0.21027854,-0.21160015,15.316832,515000
|
| 25 |
+
1.0,1.0,0.026589934,2.6589935,1.02659,1.1302769,-1.9311945,-89.384605,-179.8292,0.16891453,-0.26917547,16.111519,520000
|
| 26 |
+
1.0,1.0000001,0.02797164,2.797164,1.0279717,1.7714993,-5.1349754,-91.82836,-169.75162,0.1795532,-0.16546644,15.686453,525000
|
| 27 |
+
1.0,1.0,0.02972116,2.972116,1.0297211,3.9209125,-11.591069,-92.44326,-179.12503,0.7461984,-0.34941038,32.133583,530000
|
| 28 |
+
1.0,0.9999396,0.028732024,2.8732023,1.0286716,2.7485232,2.2264824,-90.89141,-179.37616,0.421374,-0.4223844,28.846163,535000
|
| 29 |
+
1.0,0.9999999,0.029354481,2.9354482,1.0293543,1.4808971,-0.39686167,-86.62581,-170.97238,0.3301482,-0.24302964,22.01601,540000
|
| 30 |
+
1.0,1.0,0.02824355,2.8243551,1.0282435,1.196995,-8.212218,-89.84618,-192.50697,0.17205356,-0.21746291,17.68002,545000
|
| 31 |
+
1.0,0.99999994,0.027313815,2.7313814,1.0273137,1.3159078,-5.526501,-88.45916,-177.21669,0.34176654,-0.21142854,18.370007,550000
|
| 32 |
+
1.0,0.99998313,0.026809677,2.6809678,1.0267928,1.505472,0.64103436,-87.57682,-171.60443,0.8050131,-0.8677561,24.70426,555000
|
| 33 |
+
1.0,1.0,0.028479535,2.8479536,1.0284796,1.8479054,-2.3692818,-90.33882,-190.21123,0.6045487,-0.53351456,32.414917,560000
|
| 34 |
+
1.0,1.0,0.027306596,2.7306597,1.0273066,1.6418797,1.5755324,-86.00034,-175.61833,0.48290777,-0.23012751,26.27731,565000
|
| 35 |
+
1.0,1.0,0.028812345,2.8812346,1.0288123,1.4088321,-6.6962147,-86.68374,-188.03596,0.26674983,-0.3705712,22.354813,570000
|
| 36 |
+
1.0,1.0,0.027958095,2.7958097,1.0279582,2.1789005,-7.0649147,-91.747116,-189.65019,0.4352608,-0.25116655,28.023155,575000
|
| 37 |
+
1.0,0.9999589,0.027199455,2.7199454,1.0271584,0.9810616,2.1859703,-88.72465,-184.81218,0.21929246,-0.19292563,13.493492,580000
|
| 38 |
+
1.0,1.0,0.030407228,3.0407228,1.0304072,1.1152725,-1.1895856,-83.35737,-163.9159,0.3662737,-0.20014341,16.979311,585000
|
| 39 |
+
1.0,1.0,0.029095434,2.9095435,1.0290954,1.4334427,-0.33924088,-86.0289,-191.83453,0.3218287,-0.3722298,24.570652,590000
|
| 40 |
+
1.0,1.0,0.029855452,2.9855456,1.0298555,1.1751639,-1.6925819,-85.66372,-187.55261,0.15117049,-0.2987684,15.508531,595000
|
| 41 |
+
1.0,1.0000001,0.028974392,2.897439,1.0289745,1.361495,0.43888986,-86.19103,-190.31033,0.1818742,-0.28831422,18.0083,600000
|
| 42 |
+
1.0,1.0,0.030579604,3.0579605,1.0305796,1.3688914,-5.1868277,-84.06667,-160.24855,0.22067493,-0.15921643,15.408772,605000
|
| 43 |
+
1.0,0.99999994,0.0290608,2.9060802,1.0290607,1.0749149,-0.18576913,-85.88476,-167.7035,0.22567034,-0.19181833,14.963071,610000
|
| 44 |
+
1.0,1.0,0.029777136,2.9777136,1.0297772,1.4772668,-1.2207552,-86.17348,-185.10791,0.3131353,-0.1445865,18.562372,615000
|
| 45 |
+
1.0,1.0,0.027791819,2.779182,1.0277919,1.2263137,-7.468808,-86.70676,-183.23918,0.24187972,-0.124534935,14.215077,620000
|
| 46 |
+
1.0,0.99999994,0.029488675,2.9488678,1.0294886,2.3008575,-2.9173937,-81.540085,-162.2597,0.45000547,-0.45436323,27.43052,625000
|
| 47 |
+
1.0,0.9999999,0.03304253,3.304253,1.0330424,1.1009369,-8.010798,-86.10673,-166.99625,0.23161161,-0.15467167,14.42505,630000
|
| 48 |
+
1.0,1.0,0.028398268,2.8398268,1.0283983,1.2683347,2.4165225,-81.82644,-166.50897,0.4698519,-0.22387849,17.060617,635000
|
| 49 |
+
1.0,0.99999297,0.028513413,2.8513415,1.0285064,1.0603459,0.8634237,-83.07632,-184.48326,0.13762239,-0.17841047,13.7100315,640000
|
| 50 |
+
1.0,1.0000001,0.030850738,3.0850737,1.0308509,1.0063349,-6.119576,-84.837,-173.29623,0.13152419,-0.2876541,14.184723,645000
|
| 51 |
+
1.0,0.9999999,0.027130157,2.7130156,1.02713,1.744371,-3.694085,-77.00824,-179.12402,0.30397892,-0.34729686,24.008179,650000
|
| 52 |
+
1.0,0.99999994,0.02846169,2.846169,1.0284616,1.6476061,-1.03453,-82.62798,-172.2966,0.45145506,-0.4111906,28.578028,655000
|
| 53 |
+
1.0,0.9999999,0.029099101,2.9099102,1.029099,1.0226222,1.0894544,-80.10908,-184.60036,0.17011172,-0.11648369,12.606863,660000
|
| 54 |
+
1.0,0.99999994,0.030114004,3.0114005,1.0301139,1.0247539,-3.7409632,-82.38372,-180.51791,0.34927693,-0.19711797,15.946648,665000
|
| 55 |
+
1.0,1.0,0.029359099,2.93591,1.0293591,1.1407241,-0.8996131,-82.0368,-165.055,0.18203667,-0.36729115,20.570862,670000
|
| 56 |
+
1.0,1.0,0.027800802,2.7800803,1.0278008,0.94336385,-2.3100398,-79.81594,-183.07901,0.1770483,-0.26989076,12.1538105,675000
|
| 57 |
+
1.0,1.0,0.028826227,2.8826227,1.0288262,0.96859473,-3.0086403,-81.17747,-173.3624,0.14399034,-0.23791951,12.935832,680000
|
| 58 |
+
1.0,0.99999994,0.029899344,2.9899344,1.0298992,1.8025011,0.89308864,-81.68165,-159.62326,0.5098676,-0.5711018,34.44747,685000
|
| 59 |
+
1.0,1.0000001,0.02909045,2.909045,1.0290905,1.4307975,-1.3456149,-78.490685,-176.74768,0.5574124,-0.5478476,27.587158,690000
|
| 60 |
+
1.0,0.99991804,0.031072412,3.1072412,1.0309905,1.3462108,1.7484103,-78.277824,-179.27621,0.36681306,-0.20657629,17.481045,695000
|
| 61 |
+
1.0,1.0,0.02866352,2.866352,1.0286635,1.310079,-1.9671917,-82.247,-167.81079,0.6681708,-0.7706908,25.66786,700000
|
| 62 |
+
1.0,1.0,0.03066139,3.0661392,1.0306613,1.8792429,-0.48563617,-81.46601,-179.0039,0.24187243,-0.15345678,16.47634,705000
|
| 63 |
+
1.0,1.0,0.03255529,3.255529,1.0325553,1.0426214,-4.326896,-78.38122,-177.68349,0.16984126,-0.3232741,15.097506,710000
|
| 64 |
+
1.0,1.0,0.028775923,2.8775926,1.0287759,1.0344267,-2.201786,-78.27268,-168.79538,0.21650673,-0.24039692,13.591915,715000
|
| 65 |
+
1.0,1.0,0.030905962,3.0905964,1.030906,1.4879193,-0.04249753,-80.4499,-173.50764,0.17480858,-0.14259417,17.908833,720000
|
| 66 |
+
1.0,1.0,0.030289765,3.0289767,1.0302898,1.153807,-3.2742999,-78.48632,-172.845,0.36190283,-0.20452476,14.627241,725000
|
| 67 |
+
1.0,0.99999994,0.029811835,2.9811838,1.0298117,1.6162747,0.19062641,-79.489685,-167.67587,0.23334767,-0.26864174,18.429594,730000
|
| 68 |
+
1.0,1.0,0.029936913,2.9936912,1.0299369,1.2919143,-2.3219457,-76.75367,-173.92172,0.18950911,-0.37761837,20.501825,735000
|
| 69 |
+
1.0,1.0,0.030583125,3.0583124,1.0305831,1.0020924,-3.8779254,-78.95847,-166.17645,0.17481792,-0.14044605,13.936207,740000
|
| 70 |
+
1.0,1.0000001,0.029932035,2.9932036,1.0299321,1.2503451,-1.8170642,-80.866325,-165.38596,0.27001324,-0.25996187,18.59056,745000
|
| 71 |
+
1.0,1.0,0.026945347,2.6945348,1.0269454,1.0872494,-3.4809084,-75.342735,-183.88287,0.17580277,-0.31675202,15.2077055,750000
|
| 72 |
+
1.0,0.9999999,0.028875742,2.8875744,1.0288756,1.158755,-0.32245803,-81.822685,-179.0785,0.19723153,-0.13587615,13.791277,755000
|
| 73 |
+
1.0,1.0000001,0.029557452,2.9557452,1.0295576,1.2797717,-2.7225082,-75.676956,-183.25209,0.48249784,-0.44401678,21.209183,760000
|
| 74 |
+
1.0,0.9999999,0.030168341,3.0168343,1.0301682,1.039604,-0.29801273,-78.17334,-181.96777,0.1791617,-0.268606,16.297937,765000
|
| 75 |
+
1.0,1.0,0.03026244,3.0262442,1.0302625,1.0960665,-0.9961767,-76.904564,-181.67613,0.1472198,-0.2133097,14.638384,770000
|
| 76 |
+
1.0,1.0,0.029020883,2.9020882,1.0290209,1.9126447,1.1025565,-73.928055,-168.68607,0.8830315,-0.8811148,28.69691,775000
|
| 77 |
+
1.0,0.9999999,0.026768215,2.6768217,1.0267681,2.168081,-2.507389,-78.297935,-177.02034,0.9942874,-0.8256104,33.560005,780000
|
| 78 |
+
1.0,1.0,0.029241005,2.9241004,1.029241,1.3147159,0.18927641,-76.90078,-179.8806,0.3238694,-0.6623882,22.157047,785000
|
| 79 |
+
1.0,0.99999994,0.03273215,3.2732153,1.0327321,3.245547,-6.440209,-78.10644,-167.83926,1.4206494,-1.4985799,67.45865,790000
|
| 80 |
+
1.0,1.0000001,0.0309261,3.0926101,1.0309262,1.7712936,-6.7748995,-78.68036,-149.60652,0.3127793,-0.50636345,32.42936,795000
|
| 81 |
+
1.0,1.0,0.028302658,2.8302658,1.0283027,1.5178775,-4.623312,-74.289856,-162.8892,0.47776693,-0.2178857,19.766258,800000
|
| 82 |
+
1.0,1.0,0.027624436,2.7624438,1.0276245,0.9988994,-3.718313,-77.24389,-180.65868,0.18850729,-0.21744314,13.770182,805000
|
| 83 |
+
1.0,1.0,0.030929865,3.0929866,1.0309299,1.2587565,-1.5539808,-77.31718,-160.09221,0.18924849,-0.44038606,23.902521,810000
|
| 84 |
+
1.0,0.9999999,0.029325422,2.9325423,1.0293252,1.3022418,2.9071474,-74.15098,-151.52704,0.23969454,-0.25326788,16.678091,815000
|
| 85 |
+
1.0,1.0,0.032281272,3.2281272,1.0322813,1.1061958,-2.2815404,-73.260765,-171.6884,0.2074157,-0.19928178,13.576932,820000
|
| 86 |
+
1.0,1.0,0.027961243,2.7961245,1.0279613,1.3516855,-2.8398328,-73.7302,-182.4437,0.2295364,-0.42085585,17.26958,825000
|
| 87 |
+
1.0,1.0,0.030254275,3.0254276,1.0302542,1.6477684,-5.554787,-74.28219,-158.6764,0.2948131,-0.59618485,23.41027,830000
|
| 88 |
+
1.0,1.0,0.03004852,3.0048523,1.0300485,1.4816443,-6.275089,-75.81646,-179.62883,0.4856126,-0.4701814,21.868565,835000
|
| 89 |
+
1.0,1.0000001,0.028501328,2.850133,1.0285014,1.1150454,0.891432,-73.28914,-171.41383,0.27181777,-0.29515952,16.80836,840000
|
| 90 |
+
1.0,1.0,0.029717376,2.9717376,1.0297173,0.9611149,-1.1746378,-77.93211,-160.30507,0.164268,-0.14209498,14.242855,845000
|
| 91 |
+
1.0,1.0,0.029581558,2.958156,1.0295815,2.8112862,-1.0053928,-77.28289,-157.81905,2.0261583,-2.030685,50.976357,850000
|
| 92 |
+
1.0,1.0,0.029129354,2.9129353,1.0291294,1.4264927,-2.0379643,-74.056175,-164.71466,0.35019082,-0.15869084,16.734995,855000
|
| 93 |
+
1.0,1.0,0.029617704,2.9617705,1.0296177,1.2352985,-5.7739,-74.17617,-157.48624,0.29675552,-0.3497808,19.456741,860000
|
| 94 |
+
1.0,0.9999999,0.03141515,3.1415153,1.031415,1.159293,0.46420175,-72.782616,-168.17328,0.19167876,-0.18615498,15.760767,865000
|
| 95 |
+
1.0,1.0,0.031298604,3.1298604,1.0312986,1.1478783,-0.4238211,-72.408554,-155.93524,0.4366696,-0.41830447,14.587732,870000
|
| 96 |
+
1.0,0.99999994,0.028046932,2.8046932,1.0280468,1.7066001,-0.69876814,-73.606834,-169.63846,0.22007403,-0.16337667,16.09037,875000
|
| 97 |
+
1.0,0.9999949,0.030467726,3.0467725,1.0304626,1.3358862,1.2025062,-72.44623,-156.06421,0.51550955,-0.56755215,22.389702,880000
|
| 98 |
+
1.0,0.99999994,0.031030923,3.1030922,1.0310309,1.5794549,-0.2063334,-71.77701,-180.00485,0.5333202,-0.60327566,21.14301,885000
|
| 99 |
+
1.0,1.0,0.028529227,2.852923,1.0285292,4.000989,-4.5180883,-73.07194,-158.98949,0.6402899,-0.93612427,40.81414,890000
|
| 100 |
+
1.0,0.99999994,0.028406568,2.8406568,1.0284065,1.4421934,-0.7852998,-68.89236,-175.58554,0.32959756,-0.4134327,22.533663,895000
|
| 101 |
+
1.0,0.9999999,0.027761918,2.7761917,1.0277618,1.1799005,-0.6992659,-67.682594,-170.13539,0.22685947,-0.26550597,16.37744,900000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:031969951a1a53eab0d7a83e67961663bcc7cdcab064a0ee42e01d6d77372a49
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9280162d513eb505b43d5ecbb9dc007352801f7821825effc4d269e996d690b
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:025655c25699331d525428dd01d06404a41f713a13d51b693f07be2388812d6d
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6534d843f0954f60f924c5b143ffb588eb86bc5aefdcbc21c45d1e9455c56711
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:42fa0c68d091fa39eaa78f1620e0ffbe2b8e3ee118fe78e314bcf84b4f313677
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26771145b35671424c21788949eec8cac9af3b11d7471b739fb186f320182a01
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5383ba085305c0f1682ea97486843289252c86b47b9c6d3a6def5a9c99c54e7
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10a24e27600fa849295d384675b53dbaf174d276869627bc92e703d5ea92a376
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc136429cadc15437ae127245d5a0234dff0e48bb8c51bc732ddf28012ad0e79
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:482d1eafacf52a249554a05204b1f72a61104811411f6076374d0f3130de1a0f
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_135906/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/mnqpkari
|