Tiredsheep commited on
Commit
a7e1090
·
verified ·
1 Parent(s): 32eaac9

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1250000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1300000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.10352139262235185,0.128379727634799,-0.10784426173180967,-0.05327560924200364,13.839698466689956,23.62099999999718,0.08,12034.56,-1.66,-867.46,470.42,1.3739963531494142,850000
3
+ 0.0,0.0,-0.13838789452413353,0.08797870103114924,-0.13851289059084793,0.014254026983851904,19.96796032847928,17.2999999999982,0.44,32868.2,-0.86,-536.4,344.0,1.011380157470703,900000
4
+ 0.0,0.0,-0.03841693491052887,-0.025421959263906373,-0.03944278995228158,-0.0202870922771738,23.55730846026877,12.414999999998964,0.68,48472.24,-0.42,-343.82,246.3,0.7421352767944336,950000
5
+ 0.0,0.0,-0.032424596160613585,-0.00042195693038945837,-0.03006331956050519,0.053232332006066786,32.09363715766298,5.991999999999514,0.9,58212.68,-0.14,-166.22,117.84,0.36720908641815186,1000000
6
+ 0.0,0.0,-0.04687638198657792,0.019647110765000537,-0.043074649440791604,0.06267947051538775,31.694779353045494,8.934999999999203,0.78,65612.16,-0.32,-270.96,176.7,0.5415661811828614,1050000
7
+ 0.0,0.0,-0.049933097977266326,0.03187741813585734,-0.0472918592291476,0.05396146172616802,33.60619266235892,6.0709999999995325,0.88,73669.08,-0.2,-188.76,119.42,0.37201735496520993,1100000
8
+ 0.0,0.0,-0.06645443846100155,0.047660515972262264,-0.06290678548201366,0.06096403193993084,32.72585040778398,4.636999999999671,0.92,78260.68,-0.08,-119.78,90.74,0.28289925575256347,1150000
9
+ 0.0,0.0,-0.0594221271425904,0.04934284558337315,-0.055676437746766984,0.0813382845427583,35.058891677627344,3.4579999999998834,0.98,82986.42,-0.02,-95.24,67.16,0.22137309074401856,1200000
10
+ 0.0,0.0,-0.0651962160868236,0.07010230716831953,-0.06062025254812616,0.06013440495511496,35.395068147048626,2.9479999999998876,0.98,86211.22,-0.04,-88.18,56.96,0.19020536422729492,1250000
11
+ 0.0,0.0,-0.05095507186235843,0.07858477468116172,-0.04661419455892938,0.08276811154561721,35.31222914897923,2.9279999999999573,1.0,89121.76,0.0,-85.32,56.56,0.19211469650268553,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.10352139262235185,0.128379727634799,-0.10784426173180967,-0.05327560924200364,13.839698466689956,23.62099999999718,0.08,12034.56,-1.66,-867.46,470.42,1.3739963531494142,850000
3
+ 0.0,0.0,-0.13838789452413353,0.08797870103114924,-0.13851289059084793,0.014254026983851904,19.96796032847928,17.2999999999982,0.44,32868.2,-0.86,-536.4,344.0,1.011380157470703,900000
4
+ 0.0,0.0,-0.03841693491052887,-0.025421959263906373,-0.03944278995228158,-0.0202870922771738,23.55730846026877,12.414999999998964,0.68,48472.24,-0.42,-343.82,246.3,0.7421352767944336,950000
5
+ 0.0,0.0,-0.032424596160613585,-0.00042195693038945837,-0.03006331956050519,0.053232332006066786,32.09363715766298,5.991999999999514,0.9,58212.68,-0.14,-166.22,117.84,0.36720908641815186,1000000
6
+ 0.0,0.0,-0.04687638198657792,0.019647110765000537,-0.043074649440791604,0.06267947051538775,31.694779353045494,8.934999999999203,0.78,65612.16,-0.32,-270.96,176.7,0.5415661811828614,1050000
7
+ 0.0,0.0,-0.049933097977266326,0.03187741813585734,-0.0472918592291476,0.05396146172616802,33.60619266235892,6.0709999999995325,0.88,73669.08,-0.2,-188.76,119.42,0.37201735496520993,1100000
8
+ 0.0,0.0,-0.06645443846100155,0.047660515972262264,-0.06290678548201366,0.06096403193993084,32.72585040778398,4.636999999999671,0.92,78260.68,-0.08,-119.78,90.74,0.28289925575256347,1150000
9
+ 0.0,0.0,-0.0594221271425904,0.04934284558337315,-0.055676437746766984,0.0813382845427583,35.058891677627344,3.4579999999998834,0.98,82986.42,-0.02,-95.24,67.16,0.22137309074401856,1200000
10
+ 0.0,0.0,-0.0651962160868236,0.07010230716831953,-0.06062025254812616,0.06013440495511496,35.395068147048626,2.9479999999998876,0.98,86211.22,-0.04,-88.18,56.96,0.19020536422729492,1250000
11
+ 0.0,0.0,-0.05095507186235843,0.07858477468116172,-0.04661419455892938,0.08276811154561721,35.31222914897923,2.9279999999999573,1.0,89121.76,0.0,-85.32,56.56,0.19211469650268553,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 495.99207,1.1101215,0.8150509,-16.05046,-57.195618,-86.371056,1.4003832,-1.5226834,56.826515,805000
3
+ 554.2454,1.2131835,1.0532545,-11.21657,-62.72782,-105.15777,3.30673,-4.057695,97.07875,810000
4
+ 661.34534,1.1061945,3.522588,-13.334948,-72.254684,-135.86647,18.922474,-26.04649,298.47644,815000
5
+ 661.9577,1.1282265,2.9135442,-6.288627,-73.272644,-153.13406,4.485008,-8.682096,164.60582,820000
6
+ 678.25195,0.7011699,2.2532182,-22.950811,-74.69488,-168.4775,10.868331,-6.960555,128.36691,825000
7
+ 648.3005,0.82132035,1.3596662,-14.483994,-71.89868,-161.14105,6.503849,-7.34711,123.127815,830000
8
+ 687.9663,1.1604054,1.7035767,-18.910204,-75.43679,-165.08083,5.3896446,-7.1854024,132.96695,835000
9
+ 712.8274,1.1939896,2.2195156,-22.285522,-78.09523,-165.93262,2.4662147,-2.6519744,113.39424,840000
10
+ 717.92676,1.1240668,1.3888335,-22.755442,-78.35243,-169.17528,2.9819832,-2.8529685,66.267166,845000
11
+ 734.43475,1.0558674,2.8618848,-23.139477,-80.13013,-173.22949,3.727578,-2.8121367,125.75826,850000
12
+ 743.23254,0.7096477,2.4694195,-18.154518,-80.951225,-173.53812,3.7625604,-2.934411,111.253395,855000
13
+ 712.5369,0.7924253,1.5428652,-16.126797,-78.27468,-177.37537,2.6921954,-2.712731,85.5621,860000
14
+ 740.818,0.654428,1.0454358,-18.997822,-80.26351,-164.51334,3.9096043,-2.618484,89.29201,865000
15
+ 723.918,0.85592103,2.0283687,-11.5717745,-78.58379,-178.41426,3.946836,-6.681331,118.66484,870000
16
+ 732.8173,0.6779248,2.871698,-17.095385,-80.23073,-166.80525,5.3967857,-5.8230133,124.586296,875000
17
+ 813.3512,0.86248064,1.8234755,-11.638717,-87.925125,-170.82732,4.9167004,-6.2621894,124.03568,880000
18
+ 791.9729,1.2004921,2.1165094,-26.280643,-85.628136,-172.11635,8.834045,-4.114396,211.41898,885000
19
+ 787.48083,0.84504926,4.2821417,-11.089632,-84.95324,-166.47737,38.0045,-54.762943,462.36713,890000
20
+ 791.90765,0.993324,3.4808426,-12.412878,-85.577225,-175.17444,4.673593,-5.2622733,102.156265,895000
21
+ 797.4648,0.8177344,2.0916939,-17.741398,-85.41981,-176.03726,12.421966,-5.0682673,127.558304,900000
22
+ 790.1657,1.037001,1.7883469,-19.290497,-85.1224,-179.22078,14.193974,-15.27946,289.30106,905000
23
+ 798.2363,0.93483424,2.6098568,-11.733601,-86.0994,-177.39397,3.2225142,-3.0373368,99.12155,910000
24
+ 803.43427,0.78593045,1.8067178,0.7049498,-86.30429,-179.22772,33.769672,-21.629042,236.77316,915000
25
+ 794.20337,1.0699096,5.1488986,-14.854172,-85.5191,-171.79997,4.2205257,-3.9241729,157.67099,920000
26
+ 824.0342,1.1054736,2.760262,-14.924266,-88.45291,-182.77365,3.3793218,-2.6330385,94.3656,925000
27
+ 805.9598,0.85648376,3.4407945,-14.450289,-86.706535,-182.28748,3.8499923,-4.841858,143.21774,930000
28
+ 803.6637,1.0663261,1.6453342,1.6349056,-86.64656,-175.13692,7.0403214,-9.652274,154.98013,935000
29
+ 767.89716,0.9122956,1.9189751,-15.059327,-83.63141,-178.83064,3.0079038,-3.2468936,90.73688,940000
30
+ 831.2569,1.107042,2.5834157,-12.650701,-89.30788,-177.4691,10.435488,-6.0111256,195.06407,945000
31
+ 806.28,1.0457842,2.1262398,-14.83214,-86.44993,-182.16754,9.329617,-6.083772,126.497665,950000
32
+ 847.6068,0.87694013,2.386401,-20.150913,-90.79541,-178.01413,4.574854,-5.7824426,100.97228,955000
33
+ 828.77765,1.0018892,7.3589706,-25.608566,-88.82137,-177.11345,6.687269,-9.359185,144.07068,960000
34
+ 846.9209,0.9605074,4.0373545,-1.6337848,-90.92859,-184.4716,3.7849681,-4.3665643,170.79062,965000
35
+ 836.8085,1.0965109,4.3295207,-14.433735,-89.94496,-175.13228,4.180462,-3.706887,131.65924,970000
36
+ 848.7352,0.89281875,2.4156196,-33.20197,-90.90341,-178.88573,2.8132942,-2.4718018,102.69275,975000
37
+ 833.5195,1.1054094,2.602039,1.8522328,-89.24038,-180.2193,8.369759,-7.34324,234.44145,980000
38
+ 839.5759,1.342891,3.1944056,-16.14565,-90.125694,-179.80475,4.9571037,-3.8437276,124.00153,985000
39
+ 843.1656,1.3001372,10.898775,-12.82538,-90.088844,-176.99353,5.3011894,-7.368275,203.7788,990000
40
+ 838.6386,0.8561298,2.8923287,-3.4495802,-89.8773,-172.94353,14.958263,-5.957302,168.41048,995000
41
+ 802.13245,1.0295317,4.020566,-19.208582,-86.65328,-173.59227,3.7031918,-3.149852,134.7378,1000000
42
+ 801.6256,0.9175568,3.363098,-14.648968,-86.6406,-177.25215,5.5503016,-5.8421016,140.99612,1005000
43
+ 820.4108,1.2167917,3.222747,-12.81268,-88.07385,-176.44405,13.726787,-23.487625,262.04028,1010000
44
+ 797.0431,0.92550874,3.777296,-17.13564,-85.898796,-167.1295,2.8474042,-2.1726182,110.66528,1015000
45
+ 813.19507,1.4076732,4.8627396,-22.733257,-87.27537,-177.61763,3.7006989,-2.587369,129.78127,1020000
46
+ 810.3045,0.9618168,5.2326827,-15.483628,-86.78679,-180.68405,5.3722296,-7.56349,134.2527,1025000
47
+ 817.24506,1.5527664,2.9041452,-4.6853456,-87.78588,-181.26813,120.29186,-141.1069,3238.1262,1030000
48
+ 836.64795,1.0582694,3.7570832,-12.091255,-89.316826,-177.56784,10.424301,-6.0978556,128.89423,1035000
49
+ 823.7908,0.97902614,3.4160004,2.3279848,-88.25373,-183.6692,3.0976908,-2.8189042,115.19182,1040000
50
+ 798.55554,1.1901212,3.5560403,-13.153055,-86.343956,-174.86792,26.39819,-13.345137,291.17355,1045000
51
+ 797.33185,1.043385,5.7424703,-4.4969215,-85.618706,-176.43597,7.5206747,-11.651613,228.62762,1050000
52
+ 841.61676,1.1297226,3.316241,-4.9757595,-90.506615,-179.88034,26.739223,-27.966568,308.8093,1055000
53
+ 790.8652,1.2079511,2.8749306,1.8727717,-85.26554,-182.42188,7.4579463,-3.4529777,111.85513,1060000
54
+ 786.0732,0.98899066,3.5581472,-13.273149,-84.47259,-177.8419,17.253654,-9.502105,258.75992,1065000
55
+ 804.9975,1.2383344,3.554072,-23.369892,-86.60333,-180.77118,5.7122974,-4.263166,142.67517,1070000
56
+ 803.4244,1.2835586,4.2000327,1.044414,-86.48839,-188.46259,19.850164,-19.439198,241.94925,1075000
57
+ 781.9972,1.295928,2.6303928,-1.2125851,-84.253716,-181.12677,4.100351,-4.036431,127.25157,1080000
58
+ 809.4057,0.89361334,4.3800054,-7.754722,-86.72374,-177.46828,5.5093217,-10.610435,189.33392,1085000
59
+ 799.76184,0.923196,7.593226,-3.8593874,-86.04334,-175.94632,11.217593,-19.70889,426.90378,1090000
60
+ 783.0883,1.044889,5.4393992,1.4429818,-84.34159,-180.00175,4.481303,-4.1372466,161.04167,1095000
61
+ 785.6536,1.2632331,2.931921,-4.6527643,-84.06786,-181.40613,3.7222288,-3.9863515,140.59203,1100000
62
+ 778.95276,0.8170933,4.0168962,-5.443469,-84.01243,-179.83575,7.1548367,-7.2420993,199.20123,1105000
63
+ 772.06696,1.1824639,4.1782675,-5.3451843,-83.748436,-170.02606,15.687768,-12.478111,286.57108,1110000
64
+ 782.19684,0.9816873,2.4696534,1.2894354,-84.127014,-175.293,9.307882,-4.444647,126.724014,1115000
65
+ 776.3691,1.2387382,2.2661576,-1.0073384,-83.57532,-176.0021,5.8763285,-8.273937,152.7439,1120000
66
+ 791.2848,0.9452822,6.6361847,-7.880264,-85.628265,-179.78622,4.3938565,-3.9460833,151.9069,1125000
67
+ 771.0732,0.8204881,7.463618,3.6851163,-83.38474,-184.29271,4.9538965,-5.3603787,232.39905,1130000
68
+ 775.9731,1.1108972,3.1357915,-9.183345,-83.92842,-179.84889,3.9168978,-3.923197,123.15297,1135000
69
+ 767.287,0.9203185,3.6907067,3.8557491,-82.62396,-178.16171,3.9175477,-3.0672698,131.5567,1140000
70
+ 781.29425,1.2260283,2.7022583,-5.663058,-84.21873,-176.72456,11.998911,-9.828073,183.50839,1145000
71
+ 772.778,1.029633,2.5452225,-4.680327,-83.520096,-177.67838,4.8151655,-4.602126,121.955986,1150000
72
+ 795.447,1.0160997,5.887579,-7.2001667,-85.41984,-167.80774,3.268656,-4.0980883,154.6984,1155000
73
+ 760.1841,0.86940897,3.214594,-3.0994046,-82.15309,-175.04897,4.694355,-4.1011176,145.34048,1160000
74
+ 748.5935,1.0312291,3.849646,-5.3824544,-81.013794,-174.48058,27.012358,-26.235317,276.64352,1165000
75
+ 758.92413,1.0735043,3.2500694,-2.4357698,-81.67332,-176.9547,4.8392925,-4.7071104,135.73714,1170000
76
+ 751.32074,1.0022668,3.7428882,1.5551171,-81.226616,-175.28296,5.958193,-6.775138,215.84204,1175000
77
+ 759.2299,1.1644071,5.131988,-5.7491684,-81.73871,-173.32045,6.371247,-3.9358885,169.26344,1180000
78
+ 753.952,0.9082321,4.825657,-10.408127,-81.69944,-166.32591,8.466126,-21.011932,179.15985,1185000
79
+ 743.271,1.1377146,2.493597,-2.6539848,-80.67716,-168.40321,3.6956606,-3.8058505,124.111336,1190000
80
+ 758.9781,1.0564542,4.677419,-3.5533717,-82.24623,-171.6071,119.36896,-320.3938,1461.875,1195000
81
+ 746.93524,1.0647848,2.7231743,-6.864749,-80.616394,-158.72786,65.71623,-182.65034,1189.4128,1200000
82
+ 767.75916,1.0816274,3.0933347,-3.2176213,-82.60192,-176.55215,11.832829,-13.138753,353.39545,1205000
83
+ 761.6563,1.1900755,14.290015,-0.8929901,-82.48486,-171.8401,4.0875163,-8.188893,186.13873,1210000
84
+ 760.38684,0.9317373,3.7572136,-2.3315434,-82.06951,-176.71396,7.0284076,-10.711316,248.26288,1215000
85
+ 731.14954,1.2056975,3.1892927,-5.788388,-79.39794,-182.65514,21.004568,-8.993567,165.97076,1220000
86
+ 762.89136,1.0071856,3.9019456,-2.9134629,-82.230545,-170.0335,4.309679,-3.2612095,122.018974,1225000
87
+ 749.91974,1.6261935,4.772939,-2.5183444,-81.08697,-178.21297,32.057995,-21.56175,390.87378,1230000
88
+ 737.7108,0.8967384,2.8276832,-0.6954473,-79.94657,-173.81274,6.0367002,-10.202065,146.07057,1235000
89
+ 765.9822,1.5436214,4.3459506,6.3161325,-83.0012,-178.23705,6.2899704,-4.457318,146.40645,1240000
90
+ 766.708,0.9892355,3.6498032,-3.4955423,-83.10931,-173.3748,12.401974,-6.8468757,177.60971,1245000
91
+ 719.95294,0.85688025,3.5418732,2.427655,-77.58185,-175.99135,5.052911,-4.4846306,132.60837,1250000
92
+ 735.0883,0.97809696,3.3993518,-4.9986143,-79.038124,-165.61761,3.0196621,-8.541936,108.28174,1255000
93
+ 725.3972,1.2126484,3.7404916,-2.5807652,-78.484314,-175.51297,11.559669,-7.322671,174.85265,1260000
94
+ 689.7187,1.0666238,2.9539802,5.585908,-75.19136,-177.10463,56.906372,-117.08369,754.57556,1265000
95
+ 693.73553,1.029602,2.9923368,-2.24476,-75.624,-162.65434,35.04773,-15.409193,307.37903,1270000
96
+ 745.81665,1.0739298,3.25494,4.414821,-80.43658,-176.90872,9.564619,-5.9622297,140.12483,1275000
97
+ 697.16235,1.2295022,3.8861902,1.5326827,-75.72579,-182.4202,3.8387227,-3.8171315,141.27127,1280000
98
+ 695.07336,0.9534003,2.5082905,-0.76858425,-75.414665,-180.28471,12.559613,-23.497595,182.00546,1285000
99
+ 695.5378,1.0541568,3.9947503,0.6256002,-75.0334,-175.19408,6.670271,-4.183338,148.5298,1290000
100
+ 666.5467,0.9674996,3.9375103,-3.807946,-72.53786,-174.53499,101.46597,-127.90569,1858.8547,1295000
101
+ 711.6652,1.5143703,6.334327,-4.126182,-76.59834,-177.60052,6.770572,-5.1564264,179.31479,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 495.99207,1.1101215,0.8150509,-16.05046,-57.195618,-86.371056,1.4003832,-1.5226834,56.826515,805000
3
+ 554.2454,1.2131835,1.0532545,-11.21657,-62.72782,-105.15777,3.30673,-4.057695,97.07875,810000
4
+ 661.34534,1.1061945,3.522588,-13.334948,-72.254684,-135.86647,18.922474,-26.04649,298.47644,815000
5
+ 661.9577,1.1282265,2.9135442,-6.288627,-73.272644,-153.13406,4.485008,-8.682096,164.60582,820000
6
+ 678.25195,0.7011699,2.2532182,-22.950811,-74.69488,-168.4775,10.868331,-6.960555,128.36691,825000
7
+ 648.3005,0.82132035,1.3596662,-14.483994,-71.89868,-161.14105,6.503849,-7.34711,123.127815,830000
8
+ 687.9663,1.1604054,1.7035767,-18.910204,-75.43679,-165.08083,5.3896446,-7.1854024,132.96695,835000
9
+ 712.8274,1.1939896,2.2195156,-22.285522,-78.09523,-165.93262,2.4662147,-2.6519744,113.39424,840000
10
+ 717.92676,1.1240668,1.3888335,-22.755442,-78.35243,-169.17528,2.9819832,-2.8529685,66.267166,845000
11
+ 734.43475,1.0558674,2.8618848,-23.139477,-80.13013,-173.22949,3.727578,-2.8121367,125.75826,850000
12
+ 743.23254,0.7096477,2.4694195,-18.154518,-80.951225,-173.53812,3.7625604,-2.934411,111.253395,855000
13
+ 712.5369,0.7924253,1.5428652,-16.126797,-78.27468,-177.37537,2.6921954,-2.712731,85.5621,860000
14
+ 740.818,0.654428,1.0454358,-18.997822,-80.26351,-164.51334,3.9096043,-2.618484,89.29201,865000
15
+ 723.918,0.85592103,2.0283687,-11.5717745,-78.58379,-178.41426,3.946836,-6.681331,118.66484,870000
16
+ 732.8173,0.6779248,2.871698,-17.095385,-80.23073,-166.80525,5.3967857,-5.8230133,124.586296,875000
17
+ 813.3512,0.86248064,1.8234755,-11.638717,-87.925125,-170.82732,4.9167004,-6.2621894,124.03568,880000
18
+ 791.9729,1.2004921,2.1165094,-26.280643,-85.628136,-172.11635,8.834045,-4.114396,211.41898,885000
19
+ 787.48083,0.84504926,4.2821417,-11.089632,-84.95324,-166.47737,38.0045,-54.762943,462.36713,890000
20
+ 791.90765,0.993324,3.4808426,-12.412878,-85.577225,-175.17444,4.673593,-5.2622733,102.156265,895000
21
+ 797.4648,0.8177344,2.0916939,-17.741398,-85.41981,-176.03726,12.421966,-5.0682673,127.558304,900000
22
+ 790.1657,1.037001,1.7883469,-19.290497,-85.1224,-179.22078,14.193974,-15.27946,289.30106,905000
23
+ 798.2363,0.93483424,2.6098568,-11.733601,-86.0994,-177.39397,3.2225142,-3.0373368,99.12155,910000
24
+ 803.43427,0.78593045,1.8067178,0.7049498,-86.30429,-179.22772,33.769672,-21.629042,236.77316,915000
25
+ 794.20337,1.0699096,5.1488986,-14.854172,-85.5191,-171.79997,4.2205257,-3.9241729,157.67099,920000
26
+ 824.0342,1.1054736,2.760262,-14.924266,-88.45291,-182.77365,3.3793218,-2.6330385,94.3656,925000
27
+ 805.9598,0.85648376,3.4407945,-14.450289,-86.706535,-182.28748,3.8499923,-4.841858,143.21774,930000
28
+ 803.6637,1.0663261,1.6453342,1.6349056,-86.64656,-175.13692,7.0403214,-9.652274,154.98013,935000
29
+ 767.89716,0.9122956,1.9189751,-15.059327,-83.63141,-178.83064,3.0079038,-3.2468936,90.73688,940000
30
+ 831.2569,1.107042,2.5834157,-12.650701,-89.30788,-177.4691,10.435488,-6.0111256,195.06407,945000
31
+ 806.28,1.0457842,2.1262398,-14.83214,-86.44993,-182.16754,9.329617,-6.083772,126.497665,950000
32
+ 847.6068,0.87694013,2.386401,-20.150913,-90.79541,-178.01413,4.574854,-5.7824426,100.97228,955000
33
+ 828.77765,1.0018892,7.3589706,-25.608566,-88.82137,-177.11345,6.687269,-9.359185,144.07068,960000
34
+ 846.9209,0.9605074,4.0373545,-1.6337848,-90.92859,-184.4716,3.7849681,-4.3665643,170.79062,965000
35
+ 836.8085,1.0965109,4.3295207,-14.433735,-89.94496,-175.13228,4.180462,-3.706887,131.65924,970000
36
+ 848.7352,0.89281875,2.4156196,-33.20197,-90.90341,-178.88573,2.8132942,-2.4718018,102.69275,975000
37
+ 833.5195,1.1054094,2.602039,1.8522328,-89.24038,-180.2193,8.369759,-7.34324,234.44145,980000
38
+ 839.5759,1.342891,3.1944056,-16.14565,-90.125694,-179.80475,4.9571037,-3.8437276,124.00153,985000
39
+ 843.1656,1.3001372,10.898775,-12.82538,-90.088844,-176.99353,5.3011894,-7.368275,203.7788,990000
40
+ 838.6386,0.8561298,2.8923287,-3.4495802,-89.8773,-172.94353,14.958263,-5.957302,168.41048,995000
41
+ 802.13245,1.0295317,4.020566,-19.208582,-86.65328,-173.59227,3.7031918,-3.149852,134.7378,1000000
42
+ 801.6256,0.9175568,3.363098,-14.648968,-86.6406,-177.25215,5.5503016,-5.8421016,140.99612,1005000
43
+ 820.4108,1.2167917,3.222747,-12.81268,-88.07385,-176.44405,13.726787,-23.487625,262.04028,1010000
44
+ 797.0431,0.92550874,3.777296,-17.13564,-85.898796,-167.1295,2.8474042,-2.1726182,110.66528,1015000
45
+ 813.19507,1.4076732,4.8627396,-22.733257,-87.27537,-177.61763,3.7006989,-2.587369,129.78127,1020000
46
+ 810.3045,0.9618168,5.2326827,-15.483628,-86.78679,-180.68405,5.3722296,-7.56349,134.2527,1025000
47
+ 817.24506,1.5527664,2.9041452,-4.6853456,-87.78588,-181.26813,120.29186,-141.1069,3238.1262,1030000
48
+ 836.64795,1.0582694,3.7570832,-12.091255,-89.316826,-177.56784,10.424301,-6.0978556,128.89423,1035000
49
+ 823.7908,0.97902614,3.4160004,2.3279848,-88.25373,-183.6692,3.0976908,-2.8189042,115.19182,1040000
50
+ 798.55554,1.1901212,3.5560403,-13.153055,-86.343956,-174.86792,26.39819,-13.345137,291.17355,1045000
51
+ 797.33185,1.043385,5.7424703,-4.4969215,-85.618706,-176.43597,7.5206747,-11.651613,228.62762,1050000
52
+ 841.61676,1.1297226,3.316241,-4.9757595,-90.506615,-179.88034,26.739223,-27.966568,308.8093,1055000
53
+ 790.8652,1.2079511,2.8749306,1.8727717,-85.26554,-182.42188,7.4579463,-3.4529777,111.85513,1060000
54
+ 786.0732,0.98899066,3.5581472,-13.273149,-84.47259,-177.8419,17.253654,-9.502105,258.75992,1065000
55
+ 804.9975,1.2383344,3.554072,-23.369892,-86.60333,-180.77118,5.7122974,-4.263166,142.67517,1070000
56
+ 803.4244,1.2835586,4.2000327,1.044414,-86.48839,-188.46259,19.850164,-19.439198,241.94925,1075000
57
+ 781.9972,1.295928,2.6303928,-1.2125851,-84.253716,-181.12677,4.100351,-4.036431,127.25157,1080000
58
+ 809.4057,0.89361334,4.3800054,-7.754722,-86.72374,-177.46828,5.5093217,-10.610435,189.33392,1085000
59
+ 799.76184,0.923196,7.593226,-3.8593874,-86.04334,-175.94632,11.217593,-19.70889,426.90378,1090000
60
+ 783.0883,1.044889,5.4393992,1.4429818,-84.34159,-180.00175,4.481303,-4.1372466,161.04167,1095000
61
+ 785.6536,1.2632331,2.931921,-4.6527643,-84.06786,-181.40613,3.7222288,-3.9863515,140.59203,1100000
62
+ 778.95276,0.8170933,4.0168962,-5.443469,-84.01243,-179.83575,7.1548367,-7.2420993,199.20123,1105000
63
+ 772.06696,1.1824639,4.1782675,-5.3451843,-83.748436,-170.02606,15.687768,-12.478111,286.57108,1110000
64
+ 782.19684,0.9816873,2.4696534,1.2894354,-84.127014,-175.293,9.307882,-4.444647,126.724014,1115000
65
+ 776.3691,1.2387382,2.2661576,-1.0073384,-83.57532,-176.0021,5.8763285,-8.273937,152.7439,1120000
66
+ 791.2848,0.9452822,6.6361847,-7.880264,-85.628265,-179.78622,4.3938565,-3.9460833,151.9069,1125000
67
+ 771.0732,0.8204881,7.463618,3.6851163,-83.38474,-184.29271,4.9538965,-5.3603787,232.39905,1130000
68
+ 775.9731,1.1108972,3.1357915,-9.183345,-83.92842,-179.84889,3.9168978,-3.923197,123.15297,1135000
69
+ 767.287,0.9203185,3.6907067,3.8557491,-82.62396,-178.16171,3.9175477,-3.0672698,131.5567,1140000
70
+ 781.29425,1.2260283,2.7022583,-5.663058,-84.21873,-176.72456,11.998911,-9.828073,183.50839,1145000
71
+ 772.778,1.029633,2.5452225,-4.680327,-83.520096,-177.67838,4.8151655,-4.602126,121.955986,1150000
72
+ 795.447,1.0160997,5.887579,-7.2001667,-85.41984,-167.80774,3.268656,-4.0980883,154.6984,1155000
73
+ 760.1841,0.86940897,3.214594,-3.0994046,-82.15309,-175.04897,4.694355,-4.1011176,145.34048,1160000
74
+ 748.5935,1.0312291,3.849646,-5.3824544,-81.013794,-174.48058,27.012358,-26.235317,276.64352,1165000
75
+ 758.92413,1.0735043,3.2500694,-2.4357698,-81.67332,-176.9547,4.8392925,-4.7071104,135.73714,1170000
76
+ 751.32074,1.0022668,3.7428882,1.5551171,-81.226616,-175.28296,5.958193,-6.775138,215.84204,1175000
77
+ 759.2299,1.1644071,5.131988,-5.7491684,-81.73871,-173.32045,6.371247,-3.9358885,169.26344,1180000
78
+ 753.952,0.9082321,4.825657,-10.408127,-81.69944,-166.32591,8.466126,-21.011932,179.15985,1185000
79
+ 743.271,1.1377146,2.493597,-2.6539848,-80.67716,-168.40321,3.6956606,-3.8058505,124.111336,1190000
80
+ 758.9781,1.0564542,4.677419,-3.5533717,-82.24623,-171.6071,119.36896,-320.3938,1461.875,1195000
81
+ 746.93524,1.0647848,2.7231743,-6.864749,-80.616394,-158.72786,65.71623,-182.65034,1189.4128,1200000
82
+ 767.75916,1.0816274,3.0933347,-3.2176213,-82.60192,-176.55215,11.832829,-13.138753,353.39545,1205000
83
+ 761.6563,1.1900755,14.290015,-0.8929901,-82.48486,-171.8401,4.0875163,-8.188893,186.13873,1210000
84
+ 760.38684,0.9317373,3.7572136,-2.3315434,-82.06951,-176.71396,7.0284076,-10.711316,248.26288,1215000
85
+ 731.14954,1.2056975,3.1892927,-5.788388,-79.39794,-182.65514,21.004568,-8.993567,165.97076,1220000
86
+ 762.89136,1.0071856,3.9019456,-2.9134629,-82.230545,-170.0335,4.309679,-3.2612095,122.018974,1225000
87
+ 749.91974,1.6261935,4.772939,-2.5183444,-81.08697,-178.21297,32.057995,-21.56175,390.87378,1230000
88
+ 737.7108,0.8967384,2.8276832,-0.6954473,-79.94657,-173.81274,6.0367002,-10.202065,146.07057,1235000
89
+ 765.9822,1.5436214,4.3459506,6.3161325,-83.0012,-178.23705,6.2899704,-4.457318,146.40645,1240000
90
+ 766.708,0.9892355,3.6498032,-3.4955423,-83.10931,-173.3748,12.401974,-6.8468757,177.60971,1245000
91
+ 719.95294,0.85688025,3.5418732,2.427655,-77.58185,-175.99135,5.052911,-4.4846306,132.60837,1250000
92
+ 735.0883,0.97809696,3.3993518,-4.9986143,-79.038124,-165.61761,3.0196621,-8.541936,108.28174,1255000
93
+ 725.3972,1.2126484,3.7404916,-2.5807652,-78.484314,-175.51297,11.559669,-7.322671,174.85265,1260000
94
+ 689.7187,1.0666238,2.9539802,5.585908,-75.19136,-177.10463,56.906372,-117.08369,754.57556,1265000
95
+ 693.73553,1.029602,2.9923368,-2.24476,-75.624,-162.65434,35.04773,-15.409193,307.37903,1270000
96
+ 745.81665,1.0739298,3.25494,4.414821,-80.43658,-176.90872,9.564619,-5.9622297,140.12483,1275000
97
+ 697.16235,1.2295022,3.8861902,1.5326827,-75.72579,-182.4202,3.8387227,-3.8171315,141.27127,1280000
98
+ 695.07336,0.9534003,2.5082905,-0.76858425,-75.414665,-180.28471,12.559613,-23.497595,182.00546,1285000
99
+ 695.5378,1.0541568,3.9947503,0.6256002,-75.0334,-175.19408,6.670271,-4.183338,148.5298,1290000
100
+ 666.5467,0.9674996,3.9375103,-3.807946,-72.53786,-174.53499,101.46597,-127.90569,1858.8547,1295000
101
+ 711.6652,1.5143703,6.334327,-4.126182,-76.59834,-177.60052,6.770572,-5.1564264,179.31479,1300000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3d7b504dd10793ee64d68a2b62b8d559613a3aaca340c81bad9491dfa045148
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8f7c5856e0995f00dc76496f1ca6671b711ed19595418bd8a2aadf4a4297a3b
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db5ec85b9dcb51e939ce988aca2b529a7f0b4364fee3a3a58281b43640010f1b
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09a0fa90836329f482fbdd332baf25ce8b7bb41443683a27646e94b06bf8cd64
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e511587eb715e17d56ba77013ae6509e82ad09200318fed6836f6653bba15ea
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0068658efc55849ee29532a4b6b836bd6dc35e291a46d5efbdffaca57dd822fc
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_1300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8020e886b83dfbc0698383e1db4da7c8fc55e02ba93343ad23de820a8cbb4a78
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0f2e09cd791e749e8bc3c5d57c1efe2919959845333e52892bee163783c9397
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbbe71eb9aee1688b88d2facf7bc072ca42a8a3a44f36077d02d711fe76a9ae0
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b7b85ff7fa7c540f06f6022dd55cda5bcfdfa651ab2e19861e9447c16ea3dac
3
+ size 207971010
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/20260311_185319/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/f0sipdpp