Tiredsheep commited on
Commit
c967bad
·
verified ·
1 Parent(s): 2831946

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1250000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1300000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1350000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1400000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.04395587688391045,-0.0046724608866270095,-0.04414237831069874,-0.0030387849568712507,33.6158618123947,9.81199999999954,0.94,4827.64,-0.1,-285.74,194.24,0.6276545143127441,950000
3
+ 0.0,0.0,-0.06255814754407822,-0.0025368629037142393,-0.06273168246742349,-0.002566260971497481,35.38073590530668,8.076999999999684,1.0,14084.34,0.0,-221.2,159.54,0.5230940294265747,1000000
4
+ 0.0,0.0,-0.04715658437612465,0.004496944834171452,-0.04715431004691945,0.004669846587075216,34.643521148462895,7.578999999999516,0.98,22220.1,-0.02,-213.98,149.58,0.4945098638534546,1050000
5
+ 0.0,0.0,-0.06629859921254976,0.02010809958354512,-0.06579550296648665,0.013939138004612169,34.90255491550737,7.722999999999497,0.98,30224.68,-0.02,-218.86,152.46,0.4977445363998413,1100000
6
+ 0.0,0.0,-0.048488840469412,0.012901082005943419,-0.047810918034473245,0.009556930251329131,35.72064921667856,6.6839999999996,1.0,37280.44,0.0,-182.04,131.68,0.4346970701217651,1150000
7
+ 0.0,0.0,-0.059238360119033856,0.02337451922957046,-0.057998033379288924,0.016237456420364324,35.74187628477433,5.5949999999996605,1.0,43573.62,0.0,-149.76,109.9,0.35562374114990236,1200000
8
+ 0.0,0.0,-0.07028911763733357,0.04333195667367342,-0.06860053374480364,0.01543295208393365,35.72176234859575,5.754999999999658,1.0,49312.04,0.0,-154.58,113.1,0.37191976070404054,1250000
9
+ 0.0,0.0,-0.05611143637472586,0.047859722252675534,-0.053946605465976065,0.035673214190999315,35.196986059369046,5.071999999999669,1.0,54890.54,0.0,-136.52,99.44,0.32304242610931394,1300000
10
+ 0.0,0.0,-0.04965420830665132,0.06776338743082404,-0.04652062883226989,0.061774033504765145,35.71069556624927,5.299999999999678,1.0,60239.76,0.0,-143.7,104.0,0.3364095640182495,1350000
11
+ 0.0,0.0,-0.07157599356763898,0.060066214015188815,-0.06855477352691795,0.05294852729524083,35.47510979519125,4.995999999999683,1.0,65522.74,0.0,-137.24,97.92,0.3263733196258545,1400000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.04395587688391045,-0.0046724608866270095,-0.04414237831069874,-0.0030387849568712507,33.6158618123947,9.81199999999954,0.94,4827.64,-0.1,-285.74,194.24,0.6276545143127441,950000
3
+ 0.0,0.0,-0.06255814754407822,-0.0025368629037142393,-0.06273168246742349,-0.002566260971497481,35.38073590530668,8.076999999999684,1.0,14084.34,0.0,-221.2,159.54,0.5230940294265747,1000000
4
+ 0.0,0.0,-0.04715658437612465,0.004496944834171452,-0.04715431004691945,0.004669846587075216,34.643521148462895,7.578999999999516,0.98,22220.1,-0.02,-213.98,149.58,0.4945098638534546,1050000
5
+ 0.0,0.0,-0.06629859921254976,0.02010809958354512,-0.06579550296648665,0.013939138004612169,34.90255491550737,7.722999999999497,0.98,30224.68,-0.02,-218.86,152.46,0.4977445363998413,1100000
6
+ 0.0,0.0,-0.048488840469412,0.012901082005943419,-0.047810918034473245,0.009556930251329131,35.72064921667856,6.6839999999996,1.0,37280.44,0.0,-182.04,131.68,0.4346970701217651,1150000
7
+ 0.0,0.0,-0.059238360119033856,0.02337451922957046,-0.057998033379288924,0.016237456420364324,35.74187628477433,5.5949999999996605,1.0,43573.62,0.0,-149.76,109.9,0.35562374114990236,1200000
8
+ 0.0,0.0,-0.07028911763733357,0.04333195667367342,-0.06860053374480364,0.01543295208393365,35.72176234859575,5.754999999999658,1.0,49312.04,0.0,-154.58,113.1,0.37191976070404054,1250000
9
+ 0.0,0.0,-0.05611143637472586,0.047859722252675534,-0.053946605465976065,0.035673214190999315,35.196986059369046,5.071999999999669,1.0,54890.54,0.0,-136.52,99.44,0.32304242610931394,1300000
10
+ 0.0,0.0,-0.04965420830665132,0.06776338743082404,-0.04652062883226989,0.061774033504765145,35.71069556624927,5.299999999999678,1.0,60239.76,0.0,-143.7,104.0,0.3364095640182495,1350000
11
+ 0.0,0.0,-0.07157599356763898,0.060066214015188815,-0.06855477352691795,0.05294852729524083,35.47510979519125,4.995999999999683,1.0,65522.74,0.0,-137.24,97.92,0.3263733196258545,1400000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.35384,0.19249357,0.007770369,6.58582,-53.74494,-165.0678,-203.50235,1.6031954,-1.7419716,79.70168,905000
3
+ 161.30551,0.18625227,0.0060079233,4.4041667,-55.66566,-161.4088,-203.78929,1.532397,-1.0643984,49.036037,910000
4
+ 163.08809,0.19845608,0.006727549,7.543176,-53.052185,-162.90364,-204.173,4.082272,-5.3158216,115.18416,915000
5
+ 158.1781,0.16802564,0.0071092956,5.5443926,-8.327219,-158.76512,-205.0339,0.8558831,-0.8714752,48.884377,920000
6
+ 155.52771,0.1713854,0.008352493,6.053041,-23.815002,-155.70793,-204.70848,1.127246,-1.124135,64.629166,925000
7
+ 152.06133,0.17145331,0.0073566847,7.524129,-41.23899,-152.88145,-204.56575,0.8964363,-1.1451147,61.11857,930000
8
+ 149.83594,0.1803364,0.008790902,7.7498736,-45.063766,-150.20776,-203.82796,3.509069,-3.5147192,89.302605,935000
9
+ 149.5607,0.20280463,0.009612958,6.8334856,-24.417372,-150.94003,-204.91963,3.0950012,-2.8674936,67.84175,940000
10
+ 148.4985,0.18241727,0.008267394,8.1861725,-8.888016,-149.36986,-204.51761,1.8397074,-1.6061592,60.73094,945000
11
+ 147.52367,0.20088136,0.008151255,7.402987,-10.244517,-148.0107,-204.79916,0.9304893,-0.97088933,54.688972,950000
12
+ 143.56883,0.18420404,0.009935757,7.65927,-33.570087,-143.90617,-205.77675,2.1481764,-1.954714,71.31974,955000
13
+ 140.50473,0.18353721,0.009034023,10.003334,-6.899066,-141.50706,-204.45882,2.3218563,-2.1177132,89.6899,960000
14
+ 140.86827,0.19169515,0.00873826,6.1282787,-20.099512,-141.24901,-204.73389,2.097323,-2.3658607,73.331215,965000
15
+ 133.24712,0.2044832,0.0080394605,6.998862,-18.181164,-133.5415,-204.82544,1.1354997,-1.0513916,63.707905,970000
16
+ 138.23293,0.17395627,0.008893515,10.011843,-26.327015,-139.1704,-204.43372,1.0042871,-0.91034365,68.66486,975000
17
+ 139.95505,0.17388406,0.008608251,8.397376,-24.971413,-141.06729,-204.42427,0.88487273,-0.85679305,78.84661,980000
18
+ 138.11952,0.18121415,0.007454627,6.617312,-2.286418,-138.45305,-204.6408,1.2324009,-1.4579124,75.45209,985000
19
+ 136.69553,0.18409255,0.0077873264,4.9231005,-16.449682,-137.45674,-205.57774,0.7699649,-0.7889032,51.980633,990000
20
+ 135.0892,0.18599859,0.0073972903,6.534096,-15.310221,-135.9928,-204.57947,1.4197326,-1.2449795,52.555878,995000
21
+ 133.84328,0.15790679,0.0074588805,6.176026,-24.920626,-134.23738,-205.08252,1.4580928,-1.3260189,61.999012,1000000
22
+ 135.9403,0.16526023,0.008853927,7.5152583,-9.843519,-136.64513,-205.18268,0.9162817,-0.9287502,62.178963,1005000
23
+ 133.00636,0.16373888,0.009327448,5.7370205,-9.679812,-133.20242,-205.10013,1.4809129,-1.3777207,65.49522,1010000
24
+ 131.31737,0.17614953,0.009833027,6.8011446,0.44977948,-132.2384,-205.21361,0.8757323,-0.84109807,58.083996,1015000
25
+ 132.6769,0.19671392,0.009304004,7.7583575,-7.5679865,-132.85564,-205.56125,1.1106526,-1.1302464,62.587097,1020000
26
+ 136.29216,0.19468361,0.007202892,4.316631,-13.412692,-136.23668,-204.78107,1.2378619,-1.8016083,55.080322,1025000
27
+ 132.58589,0.17286482,0.007960161,7.8117676,-3.974147,-133.32843,-204.035,1.1498295,-1.2971356,61.288387,1030000
28
+ 131.92265,0.18066767,0.010194618,5.9516973,1.1160746,-133.08842,-205.24673,1.8830292,-1.9613106,60.232594,1035000
29
+ 125.43835,0.13114768,0.010049034,6.8024507,-5.4824266,-126.37444,-204.46071,1.1276397,-0.98911256,56.011444,1040000
30
+ 129.42825,0.17633379,0.008275352,5.363934,-8.22134,-130.33502,-204.58716,2.6631427,-2.3259883,66.26548,1045000
31
+ 128.22829,0.16920784,0.008020184,5.981501,-4.91882,-128.83025,-204.99014,1.3767065,-1.3102366,60.640915,1050000
32
+ 129.51364,0.15813297,0.008091707,7.3004594,-3.2301173,-130.27403,-204.49486,0.61105406,-1.0386959,57.509415,1055000
33
+ 131.73218,0.16491951,0.009221079,6.045532,-11.940039,-132.37364,-204.56549,1.8071177,-1.4184339,68.185295,1060000
34
+ 127.18691,0.17609477,0.008411485,5.1467166,-0.8599102,-128.2216,-205.45007,1.605079,-1.5572289,75.24091,1065000
35
+ 128.17374,0.18773189,0.008309239,4.971126,4.977595,-128.74515,-204.04645,0.7039795,-1.134066,59.56628,1070000
36
+ 131.42209,0.19230947,0.008908474,4.2319093,-11.561111,-131.44896,-206.06213,1.6499243,-2.467966,59.163795,1075000
37
+ 130.67915,0.18537472,0.008177911,7.8364625,1.306133,-130.6593,-204.52751,4.662506,-4.843952,128.42903,1080000
38
+ 128.72247,0.17985852,0.009645946,3.9643764,-10.882951,-128.81346,-205.39714,1.272903,-1.2669238,55.561558,1085000
39
+ 124.53374,0.15078236,0.009034043,9.1371155,0.5214578,-125.756615,-205.01498,1.0251436,-1.0340463,78.61074,1090000
40
+ 126.62999,0.16598094,0.007968062,4.5141144,-4.7191715,-127.09072,-205.27386,1.0467231,-0.9555151,48.153603,1095000
41
+ 124.449646,0.17655548,0.008169063,5.950261,3.7617226,-125.83645,-205.5127,2.116946,-2.2074964,57.66382,1100000
42
+ 125.245865,0.1755177,0.008023412,5.8275957,-2.5088444,-125.845604,-205.02585,1.3084191,-1.0014406,56.377815,1105000
43
+ 122.32312,0.15201762,0.007978394,5.0393887,-1.2282438,-122.49487,-204.74857,1.6467142,-1.1833669,53.540558,1110000
44
+ 124.10023,0.15129492,0.008503178,5.954429,-6.7570553,-125.145035,-205.17693,2.0245624,-1.9941581,67.38858,1115000
45
+ 123.348724,0.17540583,0.008242016,7.28213,-7.306597,-123.86242,-203.98964,0.9375634,-2.0541139,62.459965,1120000
46
+ 119.06789,0.20035912,0.008388883,4.553475,-2.3925657,-118.47119,-205.14757,1.6689473,-1.4924892,59.441273,1125000
47
+ 124.46796,0.17597538,0.008915433,5.176701,1.105353,-124.5657,-206.11343,1.942518,-1.7522928,83.52775,1130000
48
+ 119.30797,0.18162036,0.006384587,4.7405396,-2.3766642,-119.74257,-204.90999,1.9274054,-1.6507739,52.391068,1135000
49
+ 119.62998,0.19260982,0.0067399973,5.1095786,0.73357147,-120.257645,-204.62932,4.187487,-4.760984,81.22744,1140000
50
+ 124.12055,0.18441787,0.007152339,7.0881586,-4.9621716,-124.972466,-205.49547,0.76552916,-1.0113406,60.234013,1145000
51
+ 112.607574,0.15815255,0.0080004055,4.632175,3.9198837,-113.13069,-204.66347,2.5602794,-2.6488607,60.82058,1150000
52
+ 122.34386,0.1859411,0.008195676,5.835515,0.3258428,-123.48919,-204.79335,0.7488897,-1.3516988,58.098892,1155000
53
+ 118.11235,0.1897581,0.008541355,4.915752,2.4517705,-118.79815,-202.86876,0.96476674,-1.5926819,52.670597,1160000
54
+ 118.88825,0.20507573,0.008145185,5.8590083,1.2881073,-119.49867,-204.32893,1.1029332,-0.99951774,57.96861,1165000
55
+ 120.43708,0.1519637,0.0079764,5.3759522,-4.376928,-121.156425,-203.74635,0.770964,-1.083133,56.967266,1170000
56
+ 115.63388,0.16045557,0.0072580734,4.873628,-4.501936,-115.95361,-204.50009,1.3101119,-1.4046469,61.396797,1175000
57
+ 122.075195,0.18575504,0.007618339,5.97732,-8.417744,-123.41227,-205.15355,0.7100805,-0.7338216,56.85481,1180000
58
+ 116.293106,0.16064498,0.008710623,5.9768195,-1.0301247,-116.90603,-204.35484,0.89136976,-0.8388106,65.25387,1185000
59
+ 112.62344,0.16036052,0.00820703,5.5262837,0.37087974,-113.399,-204.69923,1.1049311,-0.9752369,62.027645,1190000
60
+ 116.838585,0.157792,0.0070597637,9.760907,2.6417568,-117.731155,-205.67369,1.0974985,-1.4022645,89.71819,1195000
61
+ 120.31503,0.14792916,0.0067887553,7.3677964,-2.0286143,-121.15618,-204.1944,0.9663435,-0.9875132,61.003235,1200000
62
+ 119.81793,0.1477694,0.007957104,4.5387535,-3.794629,-121.14949,-204.19508,0.51047766,-0.85113096,53.37684,1205000
63
+ 117.84337,0.16362554,0.0075195506,5.884616,-7.3767104,-118.47774,-205.31549,0.86717564,-0.96378416,62.393364,1210000
64
+ 117.9749,0.18570288,0.0066981474,6.308931,1.1155423,-118.815285,-203.83084,0.7170324,-1.6288724,62.717224,1215000
65
+ 115.78006,0.20372117,0.009187139,4.299127,-0.8975496,-116.85547,-204.79233,2.4127445,-2.321821,69.12787,1220000
66
+ 116.37621,0.17429519,0.007449516,3.9735913,-0.88833654,-116.95849,-205.18504,0.95632565,-1.1096663,63.03396,1225000
67
+ 115.13277,0.18509041,0.008210552,5.223481,-6.108655,-115.76713,-204.54373,0.7875296,-0.61897314,50.976326,1230000
68
+ 115.34971,0.20440719,0.008953433,4.522362,-4.8343496,-115.91853,-205.75249,0.9560551,-0.9342625,53.595833,1235000
69
+ 116.820595,0.19051114,0.0067870268,5.9080973,-5.161472,-116.887085,-203.79782,0.79255486,-0.8301557,52.619175,1240000
70
+ 118.55163,0.17872111,0.0073707043,7.6473145,3.7164812,-120.04746,-204.31609,1.847294,-1.6705362,85.413345,1245000
71
+ 110.07896,0.15848182,0.008088394,5.2652526,-1.2591634,-110.7843,-205.34755,0.92709196,-1.0271378,59.81132,1250000
72
+ 117.54774,0.18604773,0.006550691,5.1019907,-3.1277788,-118.13686,-203.77339,0.90504456,-0.8046166,59.725803,1255000
73
+ 110.658966,0.1677107,0.00709772,6.8620086,-1.4236423,-111.82863,-204.68039,1.6074998,-2.0646043,89.53706,1260000
74
+ 112.24578,0.15926337,0.007884959,6.6828227,-0.71543634,-113.1413,-204.31476,0.9540906,-0.92020506,65.268005,1265000
75
+ 115.533516,0.1497755,0.0074196896,5.2163553,-5.543919,-115.9719,-204.39677,0.95114833,-0.78046143,47.016052,1270000
76
+ 111.81009,0.20559406,0.008322258,5.238183,2.181495,-112.934135,-204.51266,1.5942748,-1.5941174,70.047134,1275000
77
+ 111.74407,0.1836397,0.00790907,5.1881957,0.63402563,-112.91951,-205.06187,0.9460753,-1.0415655,52.484024,1280000
78
+ 113.855194,0.18637943,0.006927648,6.275719,-5.3573847,-114.73181,-202.26292,1.9436496,-2.0857384,74.49002,1285000
79
+ 115.638504,0.1666273,0.007983913,5.0924263,1.0549327,-115.95666,-207.0923,1.539261,-1.9723704,48.714622,1290000
80
+ 115.06765,0.18666074,0.008157566,6.2165146,0.938483,-115.837425,-205.0854,1.109473,-1.1111164,52.30749,1295000
81
+ 109.0475,0.1665621,0.0074106776,5.730331,-0.4202602,-109.60952,-203.82901,2.0804553,-2.0480754,79.138374,1300000
82
+ 113.911,0.15270585,0.005847259,4.333595,3.4692166,-114.53279,-205.07956,0.5352533,-0.6555701,46.48408,1305000
83
+ 114.888,0.17471373,0.0070131994,4.6105123,-5.1173058,-115.47186,-205.50684,2.3075671,-2.5588768,55.30629,1310000
84
+ 108.97417,0.15383805,0.0069264686,5.26074,-2.837904,-109.85982,-202.865,3.600068,-1.3964006,69.05847,1315000
85
+ 112.90842,0.15415582,0.009207127,5.6951356,-3.0009348,-113.490685,-204.55064,1.5475748,-1.4696823,79.99646,1320000
86
+ 110.514366,0.15044664,0.008889281,8.9555,-2.7042425,-111.75899,-204.60526,4.245118,-4.6006784,123.19461,1325000
87
+ 108.01134,0.1727444,0.00673504,4.8928447,-4.786161,-108.74275,-200.3279,1.9893712,-1.97926,59.8917,1330000
88
+ 113.18684,0.18908855,0.007813259,3.8326683,-3.5601606,-113.20701,-205.4978,0.78067183,-0.7605536,47.305923,1335000
89
+ 104.00043,0.18143648,0.007918213,5.4499035,-0.7205053,-104.88936,-205.99068,1.4734535,-1.5429156,60.724037,1340000
90
+ 112.6907,0.1644724,0.008843426,5.284168,-2.9074032,-113.10394,-203.87149,1.1754233,-1.3953984,59.708298,1345000
91
+ 104.54939,0.16575001,0.008032056,5.3594027,2.1418009,-105.01438,-204.98898,2.7207992,-3.1214101,62.879013,1350000
92
+ 108.36536,0.19535765,0.0067700855,5.475462,-2.6027486,-108.981705,-204.86029,0.9055296,-0.67667246,60.074146,1355000
93
+ 104.422775,0.16989961,0.005918505,8.229198,5.272963,-105.12241,-206.86488,2.0649767,-1.8050832,69.663895,1360000
94
+ 106.546,0.1601247,0.0076816953,5.8064103,-1.9945128,-107.08047,-204.27335,1.298056,-1.4829637,63.44338,1365000
95
+ 106.810486,0.18074608,0.0073745423,5.5348725,1.5285338,-107.32703,-204.65146,1.0403116,-0.96361315,61.281685,1370000
96
+ 104.51191,0.15660766,0.0075011533,3.0119116,-1.4115148,-104.96016,-202.63663,0.7530803,-0.8521373,45.467308,1375000
97
+ 104.854935,0.12605783,0.008237808,4.1866245,1.3761406,-105.30175,-204.42854,2.15268,-2.5172741,49.931805,1380000
98
+ 103.64504,0.16453752,0.007288437,4.1709766,0.41837674,-104.38562,-204.4823,1.1535867,-0.93013275,48.08878,1385000
99
+ 106.31976,0.1390172,0.0065704254,13.765357,-0.9348085,-106.85347,-204.86087,0.96755034,-1.4604136,76.18604,1390000
100
+ 100.47064,0.15317082,0.0076385005,4.2788186,-1.1335741,-101.11723,-204.02966,1.1773278,-2.597566,67.595604,1395000
101
+ 100.17121,0.1513519,0.007039368,5.6033225,-1.8426675,-101.23663,-203.34409,1.5856206,-1.576081,67.12921,1400000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 165.35384,0.19249357,0.007770369,6.58582,-53.74494,-165.0678,-203.50235,1.6031954,-1.7419716,79.70168,905000
3
+ 161.30551,0.18625227,0.0060079233,4.4041667,-55.66566,-161.4088,-203.78929,1.532397,-1.0643984,49.036037,910000
4
+ 163.08809,0.19845608,0.006727549,7.543176,-53.052185,-162.90364,-204.173,4.082272,-5.3158216,115.18416,915000
5
+ 158.1781,0.16802564,0.0071092956,5.5443926,-8.327219,-158.76512,-205.0339,0.8558831,-0.8714752,48.884377,920000
6
+ 155.52771,0.1713854,0.008352493,6.053041,-23.815002,-155.70793,-204.70848,1.127246,-1.124135,64.629166,925000
7
+ 152.06133,0.17145331,0.0073566847,7.524129,-41.23899,-152.88145,-204.56575,0.8964363,-1.1451147,61.11857,930000
8
+ 149.83594,0.1803364,0.008790902,7.7498736,-45.063766,-150.20776,-203.82796,3.509069,-3.5147192,89.302605,935000
9
+ 149.5607,0.20280463,0.009612958,6.8334856,-24.417372,-150.94003,-204.91963,3.0950012,-2.8674936,67.84175,940000
10
+ 148.4985,0.18241727,0.008267394,8.1861725,-8.888016,-149.36986,-204.51761,1.8397074,-1.6061592,60.73094,945000
11
+ 147.52367,0.20088136,0.008151255,7.402987,-10.244517,-148.0107,-204.79916,0.9304893,-0.97088933,54.688972,950000
12
+ 143.56883,0.18420404,0.009935757,7.65927,-33.570087,-143.90617,-205.77675,2.1481764,-1.954714,71.31974,955000
13
+ 140.50473,0.18353721,0.009034023,10.003334,-6.899066,-141.50706,-204.45882,2.3218563,-2.1177132,89.6899,960000
14
+ 140.86827,0.19169515,0.00873826,6.1282787,-20.099512,-141.24901,-204.73389,2.097323,-2.3658607,73.331215,965000
15
+ 133.24712,0.2044832,0.0080394605,6.998862,-18.181164,-133.5415,-204.82544,1.1354997,-1.0513916,63.707905,970000
16
+ 138.23293,0.17395627,0.008893515,10.011843,-26.327015,-139.1704,-204.43372,1.0042871,-0.91034365,68.66486,975000
17
+ 139.95505,0.17388406,0.008608251,8.397376,-24.971413,-141.06729,-204.42427,0.88487273,-0.85679305,78.84661,980000
18
+ 138.11952,0.18121415,0.007454627,6.617312,-2.286418,-138.45305,-204.6408,1.2324009,-1.4579124,75.45209,985000
19
+ 136.69553,0.18409255,0.0077873264,4.9231005,-16.449682,-137.45674,-205.57774,0.7699649,-0.7889032,51.980633,990000
20
+ 135.0892,0.18599859,0.0073972903,6.534096,-15.310221,-135.9928,-204.57947,1.4197326,-1.2449795,52.555878,995000
21
+ 133.84328,0.15790679,0.0074588805,6.176026,-24.920626,-134.23738,-205.08252,1.4580928,-1.3260189,61.999012,1000000
22
+ 135.9403,0.16526023,0.008853927,7.5152583,-9.843519,-136.64513,-205.18268,0.9162817,-0.9287502,62.178963,1005000
23
+ 133.00636,0.16373888,0.009327448,5.7370205,-9.679812,-133.20242,-205.10013,1.4809129,-1.3777207,65.49522,1010000
24
+ 131.31737,0.17614953,0.009833027,6.8011446,0.44977948,-132.2384,-205.21361,0.8757323,-0.84109807,58.083996,1015000
25
+ 132.6769,0.19671392,0.009304004,7.7583575,-7.5679865,-132.85564,-205.56125,1.1106526,-1.1302464,62.587097,1020000
26
+ 136.29216,0.19468361,0.007202892,4.316631,-13.412692,-136.23668,-204.78107,1.2378619,-1.8016083,55.080322,1025000
27
+ 132.58589,0.17286482,0.007960161,7.8117676,-3.974147,-133.32843,-204.035,1.1498295,-1.2971356,61.288387,1030000
28
+ 131.92265,0.18066767,0.010194618,5.9516973,1.1160746,-133.08842,-205.24673,1.8830292,-1.9613106,60.232594,1035000
29
+ 125.43835,0.13114768,0.010049034,6.8024507,-5.4824266,-126.37444,-204.46071,1.1276397,-0.98911256,56.011444,1040000
30
+ 129.42825,0.17633379,0.008275352,5.363934,-8.22134,-130.33502,-204.58716,2.6631427,-2.3259883,66.26548,1045000
31
+ 128.22829,0.16920784,0.008020184,5.981501,-4.91882,-128.83025,-204.99014,1.3767065,-1.3102366,60.640915,1050000
32
+ 129.51364,0.15813297,0.008091707,7.3004594,-3.2301173,-130.27403,-204.49486,0.61105406,-1.0386959,57.509415,1055000
33
+ 131.73218,0.16491951,0.009221079,6.045532,-11.940039,-132.37364,-204.56549,1.8071177,-1.4184339,68.185295,1060000
34
+ 127.18691,0.17609477,0.008411485,5.1467166,-0.8599102,-128.2216,-205.45007,1.605079,-1.5572289,75.24091,1065000
35
+ 128.17374,0.18773189,0.008309239,4.971126,4.977595,-128.74515,-204.04645,0.7039795,-1.134066,59.56628,1070000
36
+ 131.42209,0.19230947,0.008908474,4.2319093,-11.561111,-131.44896,-206.06213,1.6499243,-2.467966,59.163795,1075000
37
+ 130.67915,0.18537472,0.008177911,7.8364625,1.306133,-130.6593,-204.52751,4.662506,-4.843952,128.42903,1080000
38
+ 128.72247,0.17985852,0.009645946,3.9643764,-10.882951,-128.81346,-205.39714,1.272903,-1.2669238,55.561558,1085000
39
+ 124.53374,0.15078236,0.009034043,9.1371155,0.5214578,-125.756615,-205.01498,1.0251436,-1.0340463,78.61074,1090000
40
+ 126.62999,0.16598094,0.007968062,4.5141144,-4.7191715,-127.09072,-205.27386,1.0467231,-0.9555151,48.153603,1095000
41
+ 124.449646,0.17655548,0.008169063,5.950261,3.7617226,-125.83645,-205.5127,2.116946,-2.2074964,57.66382,1100000
42
+ 125.245865,0.1755177,0.008023412,5.8275957,-2.5088444,-125.845604,-205.02585,1.3084191,-1.0014406,56.377815,1105000
43
+ 122.32312,0.15201762,0.007978394,5.0393887,-1.2282438,-122.49487,-204.74857,1.6467142,-1.1833669,53.540558,1110000
44
+ 124.10023,0.15129492,0.008503178,5.954429,-6.7570553,-125.145035,-205.17693,2.0245624,-1.9941581,67.38858,1115000
45
+ 123.348724,0.17540583,0.008242016,7.28213,-7.306597,-123.86242,-203.98964,0.9375634,-2.0541139,62.459965,1120000
46
+ 119.06789,0.20035912,0.008388883,4.553475,-2.3925657,-118.47119,-205.14757,1.6689473,-1.4924892,59.441273,1125000
47
+ 124.46796,0.17597538,0.008915433,5.176701,1.105353,-124.5657,-206.11343,1.942518,-1.7522928,83.52775,1130000
48
+ 119.30797,0.18162036,0.006384587,4.7405396,-2.3766642,-119.74257,-204.90999,1.9274054,-1.6507739,52.391068,1135000
49
+ 119.62998,0.19260982,0.0067399973,5.1095786,0.73357147,-120.257645,-204.62932,4.187487,-4.760984,81.22744,1140000
50
+ 124.12055,0.18441787,0.007152339,7.0881586,-4.9621716,-124.972466,-205.49547,0.76552916,-1.0113406,60.234013,1145000
51
+ 112.607574,0.15815255,0.0080004055,4.632175,3.9198837,-113.13069,-204.66347,2.5602794,-2.6488607,60.82058,1150000
52
+ 122.34386,0.1859411,0.008195676,5.835515,0.3258428,-123.48919,-204.79335,0.7488897,-1.3516988,58.098892,1155000
53
+ 118.11235,0.1897581,0.008541355,4.915752,2.4517705,-118.79815,-202.86876,0.96476674,-1.5926819,52.670597,1160000
54
+ 118.88825,0.20507573,0.008145185,5.8590083,1.2881073,-119.49867,-204.32893,1.1029332,-0.99951774,57.96861,1165000
55
+ 120.43708,0.1519637,0.0079764,5.3759522,-4.376928,-121.156425,-203.74635,0.770964,-1.083133,56.967266,1170000
56
+ 115.63388,0.16045557,0.0072580734,4.873628,-4.501936,-115.95361,-204.50009,1.3101119,-1.4046469,61.396797,1175000
57
+ 122.075195,0.18575504,0.007618339,5.97732,-8.417744,-123.41227,-205.15355,0.7100805,-0.7338216,56.85481,1180000
58
+ 116.293106,0.16064498,0.008710623,5.9768195,-1.0301247,-116.90603,-204.35484,0.89136976,-0.8388106,65.25387,1185000
59
+ 112.62344,0.16036052,0.00820703,5.5262837,0.37087974,-113.399,-204.69923,1.1049311,-0.9752369,62.027645,1190000
60
+ 116.838585,0.157792,0.0070597637,9.760907,2.6417568,-117.731155,-205.67369,1.0974985,-1.4022645,89.71819,1195000
61
+ 120.31503,0.14792916,0.0067887553,7.3677964,-2.0286143,-121.15618,-204.1944,0.9663435,-0.9875132,61.003235,1200000
62
+ 119.81793,0.1477694,0.007957104,4.5387535,-3.794629,-121.14949,-204.19508,0.51047766,-0.85113096,53.37684,1205000
63
+ 117.84337,0.16362554,0.0075195506,5.884616,-7.3767104,-118.47774,-205.31549,0.86717564,-0.96378416,62.393364,1210000
64
+ 117.9749,0.18570288,0.0066981474,6.308931,1.1155423,-118.815285,-203.83084,0.7170324,-1.6288724,62.717224,1215000
65
+ 115.78006,0.20372117,0.009187139,4.299127,-0.8975496,-116.85547,-204.79233,2.4127445,-2.321821,69.12787,1220000
66
+ 116.37621,0.17429519,0.007449516,3.9735913,-0.88833654,-116.95849,-205.18504,0.95632565,-1.1096663,63.03396,1225000
67
+ 115.13277,0.18509041,0.008210552,5.223481,-6.108655,-115.76713,-204.54373,0.7875296,-0.61897314,50.976326,1230000
68
+ 115.34971,0.20440719,0.008953433,4.522362,-4.8343496,-115.91853,-205.75249,0.9560551,-0.9342625,53.595833,1235000
69
+ 116.820595,0.19051114,0.0067870268,5.9080973,-5.161472,-116.887085,-203.79782,0.79255486,-0.8301557,52.619175,1240000
70
+ 118.55163,0.17872111,0.0073707043,7.6473145,3.7164812,-120.04746,-204.31609,1.847294,-1.6705362,85.413345,1245000
71
+ 110.07896,0.15848182,0.008088394,5.2652526,-1.2591634,-110.7843,-205.34755,0.92709196,-1.0271378,59.81132,1250000
72
+ 117.54774,0.18604773,0.006550691,5.1019907,-3.1277788,-118.13686,-203.77339,0.90504456,-0.8046166,59.725803,1255000
73
+ 110.658966,0.1677107,0.00709772,6.8620086,-1.4236423,-111.82863,-204.68039,1.6074998,-2.0646043,89.53706,1260000
74
+ 112.24578,0.15926337,0.007884959,6.6828227,-0.71543634,-113.1413,-204.31476,0.9540906,-0.92020506,65.268005,1265000
75
+ 115.533516,0.1497755,0.0074196896,5.2163553,-5.543919,-115.9719,-204.39677,0.95114833,-0.78046143,47.016052,1270000
76
+ 111.81009,0.20559406,0.008322258,5.238183,2.181495,-112.934135,-204.51266,1.5942748,-1.5941174,70.047134,1275000
77
+ 111.74407,0.1836397,0.00790907,5.1881957,0.63402563,-112.91951,-205.06187,0.9460753,-1.0415655,52.484024,1280000
78
+ 113.855194,0.18637943,0.006927648,6.275719,-5.3573847,-114.73181,-202.26292,1.9436496,-2.0857384,74.49002,1285000
79
+ 115.638504,0.1666273,0.007983913,5.0924263,1.0549327,-115.95666,-207.0923,1.539261,-1.9723704,48.714622,1290000
80
+ 115.06765,0.18666074,0.008157566,6.2165146,0.938483,-115.837425,-205.0854,1.109473,-1.1111164,52.30749,1295000
81
+ 109.0475,0.1665621,0.0074106776,5.730331,-0.4202602,-109.60952,-203.82901,2.0804553,-2.0480754,79.138374,1300000
82
+ 113.911,0.15270585,0.005847259,4.333595,3.4692166,-114.53279,-205.07956,0.5352533,-0.6555701,46.48408,1305000
83
+ 114.888,0.17471373,0.0070131994,4.6105123,-5.1173058,-115.47186,-205.50684,2.3075671,-2.5588768,55.30629,1310000
84
+ 108.97417,0.15383805,0.0069264686,5.26074,-2.837904,-109.85982,-202.865,3.600068,-1.3964006,69.05847,1315000
85
+ 112.90842,0.15415582,0.009207127,5.6951356,-3.0009348,-113.490685,-204.55064,1.5475748,-1.4696823,79.99646,1320000
86
+ 110.514366,0.15044664,0.008889281,8.9555,-2.7042425,-111.75899,-204.60526,4.245118,-4.6006784,123.19461,1325000
87
+ 108.01134,0.1727444,0.00673504,4.8928447,-4.786161,-108.74275,-200.3279,1.9893712,-1.97926,59.8917,1330000
88
+ 113.18684,0.18908855,0.007813259,3.8326683,-3.5601606,-113.20701,-205.4978,0.78067183,-0.7605536,47.305923,1335000
89
+ 104.00043,0.18143648,0.007918213,5.4499035,-0.7205053,-104.88936,-205.99068,1.4734535,-1.5429156,60.724037,1340000
90
+ 112.6907,0.1644724,0.008843426,5.284168,-2.9074032,-113.10394,-203.87149,1.1754233,-1.3953984,59.708298,1345000
91
+ 104.54939,0.16575001,0.008032056,5.3594027,2.1418009,-105.01438,-204.98898,2.7207992,-3.1214101,62.879013,1350000
92
+ 108.36536,0.19535765,0.0067700855,5.475462,-2.6027486,-108.981705,-204.86029,0.9055296,-0.67667246,60.074146,1355000
93
+ 104.422775,0.16989961,0.005918505,8.229198,5.272963,-105.12241,-206.86488,2.0649767,-1.8050832,69.663895,1360000
94
+ 106.546,0.1601247,0.0076816953,5.8064103,-1.9945128,-107.08047,-204.27335,1.298056,-1.4829637,63.44338,1365000
95
+ 106.810486,0.18074608,0.0073745423,5.5348725,1.5285338,-107.32703,-204.65146,1.0403116,-0.96361315,61.281685,1370000
96
+ 104.51191,0.15660766,0.0075011533,3.0119116,-1.4115148,-104.96016,-202.63663,0.7530803,-0.8521373,45.467308,1375000
97
+ 104.854935,0.12605783,0.008237808,4.1866245,1.3761406,-105.30175,-204.42854,2.15268,-2.5172741,49.931805,1380000
98
+ 103.64504,0.16453752,0.007288437,4.1709766,0.41837674,-104.38562,-204.4823,1.1535867,-0.93013275,48.08878,1385000
99
+ 106.31976,0.1390172,0.0065704254,13.765357,-0.9348085,-106.85347,-204.86087,0.96755034,-1.4604136,76.18604,1390000
100
+ 100.47064,0.15317082,0.0076385005,4.2788186,-1.1335741,-101.11723,-204.02966,1.1773278,-2.597566,67.595604,1395000
101
+ 100.17121,0.1513519,0.007039368,5.6033225,-1.8426675,-101.23663,-203.34409,1.5856206,-1.576081,67.12921,1400000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edceccf0f37f0253a26fed88ca7a1b82b99cc4edc29dea1c827e266ef8bcf127
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75212f6a0944ec2d0c9852b5a7d834b5d4eb2597fa093051f2a263faab5e20e3
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b019f2b21edce7297bde6b9363aa2f097b83c13814fbfc55c52124cb073d0cba
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa4a39c3be4058ae521135337d5f0847f0ef2b78e50bbf9a30d2cdd7a5120beb
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:220e7a91732ae282b15eefad61c308fc8e6acfa8ca74af2a64393966362e51d8
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8252e1b49bac0ab9810faa26bc738e93dd2e0b3e8a9530b8ec69570b180810f
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce264985ed6d178a710508d52be42439d5696b3f33301a5aed52dab690798042
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6687721ced5b87682c78ddb8b2bd9cac689f9f0cf0004d22557d1a1b9bf7662b
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_1400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5cfb20c2fd36676176a0624d8378bc642ae7306fe1976f027475615c8b75179d
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:456d3203733da39f7962d2ff3ca6fcd252e9c904ecbf0d665e7aeb66db368e4b
3
+ size 217969454
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fql/20260319_193947/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/1uulhonp