Tiredsheep commited on
Commit
730431e
·
verified ·
1 Parent(s): 93dd06d

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1000000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_750000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_800000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_850000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_900000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_950000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.059672004456001466,-0.005321301096767039,-0.060078756740816724,0.022532321247265417,34.57652686943968,9.179999999999676,0.96,4591.8,-0.04,-250.2,181.6,0.7989863777160644,750000
3
+ 0.0,0.0,-0.042854757305147886,0.00043513539551527983,-0.04243136241475851,-0.001831091747422063,35.31255388782405,6.262999999999671,1.0,12571.72,0.0,-174.28,123.26,0.5245273542404175,800000
4
+ 0.0,0.0,-0.046495703208519625,0.012403196594178479,-0.04553132309566376,0.012978002228288545,35.418025068768245,5.419999999999615,0.98,18497.14,-0.02,-155.82,106.4,0.4659257316589355,850000
5
+ 0.0,0.0,-0.041699877960187814,0.03628828542809035,-0.04060128754648773,0.03269661644720851,35.75350142579296,4.151999999999791,1.0,23287.0,0.0,-118.94,81.04,0.3779515314102173,900000
6
+ 0.0,0.0,-0.045866135713358076,0.034297098386190404,-0.04416375091394265,0.030409189263884695,35.807720123725296,4.062999999999869,1.0,27381.06,0.0,-114.0,79.26,0.3318508338928223,950000
7
+ 0.0,0.0,-0.04434587369095829,0.034480959660084035,-0.04254366862017066,0.03259725015803834,35.81899903081824,3.332999999999855,1.0,31243.82,0.0,-94.54,64.66,0.2802790260314941,1000000
8
+ 0.0,0.0,-0.05111058239111145,0.03948552843611305,-0.048966784814802156,0.03806396281964957,35.75075800652552,3.0689999999998836,1.0,34448.2,0.0,-85.68,59.38,0.256507043838501,1050000
9
+ 0.0,0.0,-0.04741478877742001,0.05160943519616167,-0.04531630496468076,0.04085649210924963,35.76359120706619,3.158999999999874,1.0,37489.68,0.0,-90.22,61.18,0.25731958866119387,1100000
10
+ 0.0,0.0,-0.05256772069486735,0.048550291558614074,-0.05017440136822972,0.043533183106418356,35.83567921512307,2.7999999999999132,1.0,40556.7,0.0,-79.16,54.0,0.2489496326446533,1150000
11
+ 0.0,0.0,-0.04482270721728975,0.046558629048735825,-0.04267874611487351,0.04580989589838766,35.81204965586466,2.9289999999999003,1.0,43366.4,0.0,-83.42,56.58,0.24325576305389404,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.059672004456001466,-0.005321301096767039,-0.060078756740816724,0.022532321247265417,34.57652686943968,9.179999999999676,0.96,4591.8,-0.04,-250.2,181.6,0.7989863777160644,750000
3
+ 0.0,0.0,-0.042854757305147886,0.00043513539551527983,-0.04243136241475851,-0.001831091747422063,35.31255388782405,6.262999999999671,1.0,12571.72,0.0,-174.28,123.26,0.5245273542404175,800000
4
+ 0.0,0.0,-0.046495703208519625,0.012403196594178479,-0.04553132309566376,0.012978002228288545,35.418025068768245,5.419999999999615,0.98,18497.14,-0.02,-155.82,106.4,0.4659257316589355,850000
5
+ 0.0,0.0,-0.041699877960187814,0.03628828542809035,-0.04060128754648773,0.03269661644720851,35.75350142579296,4.151999999999791,1.0,23287.0,0.0,-118.94,81.04,0.3779515314102173,900000
6
+ 0.0,0.0,-0.045866135713358076,0.034297098386190404,-0.04416375091394265,0.030409189263884695,35.807720123725296,4.062999999999869,1.0,27381.06,0.0,-114.0,79.26,0.3318508338928223,950000
7
+ 0.0,0.0,-0.04434587369095829,0.034480959660084035,-0.04254366862017066,0.03259725015803834,35.81899903081824,3.332999999999855,1.0,31243.82,0.0,-94.54,64.66,0.2802790260314941,1000000
8
+ 0.0,0.0,-0.05111058239111145,0.03948552843611305,-0.048966784814802156,0.03806396281964957,35.75075800652552,3.0689999999998836,1.0,34448.2,0.0,-85.68,59.38,0.256507043838501,1050000
9
+ 0.0,0.0,-0.04741478877742001,0.05160943519616167,-0.04531630496468076,0.04085649210924963,35.76359120706619,3.158999999999874,1.0,37489.68,0.0,-90.22,61.18,0.25731958866119387,1100000
10
+ 0.0,0.0,-0.05256772069486735,0.048550291558614074,-0.05017440136822972,0.043533183106418356,35.83567921512307,2.7999999999999132,1.0,40556.7,0.0,-79.16,54.0,0.2489496326446533,1150000
11
+ 0.0,0.0,-0.04482270721728975,0.046558629048735825,-0.04267874611487351,0.04580989589838766,35.81204965586466,2.9289999999999003,1.0,43366.4,0.0,-83.42,56.58,0.24325576305389404,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 143.24338,0.19989698,-0.000650192,-12.54815,0.16944334,142.8747,5.805947,-58.620934,-146.27722,-195.43533,0.43510792,-0.2937581,26.864637,705000
3
+ 140.75133,0.19247857,-0.016914524,-13.80895,0.17844208,140.39734,6.244582,-45.508625,-143.98157,-193.45952,0.5746646,-0.5700803,23.499434,710000
4
+ 139.15038,0.18578112,0.01691627,-11.224378,0.14884861,138.79883,9.093493,-39.36615,-142.10399,-195.59486,0.361628,-0.38040793,28.857105,715000
5
+ 135.89314,0.18123262,-0.005536721,-12.891151,0.18247335,135.53497,16.932331,-38.65701,-139.16434,-199.34853,0.5343741,-0.3791757,37.456978,720000
6
+ 134.19977,0.16840418,-0.011284253,-13.322781,0.18271898,133.85992,9.345061,-49.36395,-137.39969,-195.82143,0.56337845,-0.53394794,32.710373,725000
7
+ 130.38258,0.18323682,0.004467943,-12.186083,0.17344299,130.02142,21.619999,-41.806328,-133.70312,-196.87373,1.3798554,-1.5403186,56.702015,730000
8
+ 128.28625,0.17592318,-0.011293327,-13.250734,0.19933134,127.922295,10.934464,-31.849844,-131.23907,-196.17152,0.48323804,-0.4308199,36.4692,735000
9
+ 128.0825,0.16864602,0.012799918,-11.665903,0.17902309,127.72203,20.642797,-38.782986,-131.93175,-198.19284,0.74908656,-0.7708781,40.002968,740000
10
+ 127.44369,0.16571823,0.020249426,-11.151848,0.16750225,127.09022,11.366492,-32.363686,-130.33653,-198.70703,0.7870549,-0.52342826,39.099045,745000
11
+ 123.487686,0.16362211,0.018215196,-11.334921,0.17721355,123.12863,14.519134,-7.198034,-127.097466,-192.42073,0.5135766,-0.56461054,43.316563,750000
12
+ 122.872246,0.19266,-0.014821706,-13.418064,0.21662824,122.47778,17.242853,-25.688562,-126.715965,-184.5637,1.2538145,-1.4397972,49.318653,755000
13
+ 119.55019,0.2219942,-0.005850949,-12.872129,0.20238702,119.13167,19.038351,-20.691517,-123.73385,-194.57407,0.7815171,-0.8820027,41.136444,760000
14
+ 120.507545,0.1968646,-0.015612692,-13.453938,0.2201949,120.1061,19.05223,-13.17992,-123.839294,-189.07959,0.52738315,-0.5145303,44.7053,765000
15
+ 115.277695,0.19137323,-0.0022495317,-12.638767,0.20488484,114.88368,20.496885,-19.899834,-118.801476,-183.52397,1.1733876,-1.2055821,55.5823,770000
16
+ 116.2462,0.19368513,-0.031678364,-14.3787365,0.24244745,115.84174,13.482691,-5.4247932,-120.462135,-192.3615,0.786741,-0.8745104,34.838943,775000
17
+ 116.66929,0.18398404,-0.010193375,-13.110031,0.21906336,116.276436,18.407728,0.5695484,-120.36316,-187.8383,0.7263323,-0.9720404,75.08022,780000
18
+ 117.10655,0.1973767,0.0026575201,-12.33829,0.20276606,116.70375,17.872862,-8.099065,-120.419876,-189.42554,1.2809018,-0.69807166,74.79434,785000
19
+ 112.697014,0.20080325,-0.035155766,-14.546399,0.2498974,112.28146,20.956364,-6.456405,-116.60231,-184.2158,0.7658976,-0.8621071,45.134907,790000
20
+ 114.80585,0.17635123,-0.009287545,-13.049894,0.22040868,114.41837,22.36116,-9.940298,-118.56719,-186.51523,1.8186404,-1.8271033,47.47959,795000
21
+ 110.43433,0.20909193,0.008118267,-12.021498,0.20395666,110.01317,16.043701,-16.291426,-113.72327,-180.9479,1.557753,-1.5332563,52.94129,800000
22
+ 113.62493,0.20592405,-0.011149182,-13.150124,0.22551577,113.204636,20.968643,-5.8580303,-118.74762,-179.64642,1.309894,-1.2717696,59.330185,805000
23
+ 112.027725,0.18620653,0.0114921685,-11.816631,0.19871958,111.63131,12.98674,-6.4324636,-115.74507,-180.22029,0.5359064,-0.68487465,41.779747,810000
24
+ 109.76496,0.19843492,-0.006021448,-12.850253,0.22091776,109.35163,15.083831,-0.090815336,-113.10213,-181.73434,0.6195259,-0.5628696,42.23914,815000
25
+ 109.5396,0.17959952,0.028310075,-10.882659,0.19049099,109.1412,12.233838,1.2067,-113.30794,-174.36491,1.119206,-1.235274,43.01207,820000
26
+ 111.98229,0.18702218,0.0148449065,-11.649199,0.2032569,111.57717,14.539578,-5.24266,-116.173,-184.0633,0.66925144,-0.6946125,45.8323,825000
27
+ 111.4262,0.18882212,0.003295881,-12.30957,0.21304911,111.021034,19.582144,-13.540382,-115.858864,-183.36145,0.94196796,-0.98712534,45.608276,830000
28
+ 113.11764,0.19298604,-0.0057553267,-12.846699,0.2132599,112.71715,15.318008,2.199626,-116.346085,-185.37892,0.603306,-0.83544433,45.37868,835000
29
+ 107.08641,0.20535856,-0.024540074,-13.940073,0.23755077,106.668045,12.278824,-8.819062,-112.06115,-182.30676,1.2913761,-1.2254298,63.775158,840000
30
+ 108.08579,0.18955791,0.0018401697,-12.392855,0.21284136,107.68155,12.666359,-5.851499,-111.97011,-183.08746,0.60328287,-0.75809944,39.881474,845000
31
+ 109.30752,0.16996798,-0.005263148,-12.810545,0.21711442,108.9257,14.474396,-3.5133302,-113.023705,-193.42642,1.0522512,-1.0368619,45.506256,850000
32
+ 107.46971,0.18413825,0.03207102,-10.66763,0.18671001,107.066795,8.391327,0.8176983,-110.38843,-177.76823,1.1034086,-0.98285323,38.60845,855000
33
+ 110.28901,0.20610814,-0.0036405043,-12.709152,0.22121555,109.865326,15.082148,-12.369663,-113.40051,-187.28484,0.48625976,-0.5535434,50.928696,860000
34
+ 109.66538,0.18569948,-0.01338129,-13.252753,0.23558709,109.25748,12.532963,-1.146238,-113.195145,-189.0224,5.6620684,-5.71383,108.323456,865000
35
+ 108.07965,0.17485034,0.007489231,-12.081216,0.21605167,107.68126,17.508291,0.20536643,-111.75795,-183.69722,3.651266,-3.5517268,116.40412,870000
36
+ 110.06438,0.20146027,0.044238564,-9.962213,0.17366073,109.64502,12.989514,-7.640959,-112.72532,-186.83052,2.7251992,-2.7118075,67.05034,875000
37
+ 110.15913,0.20032978,0.007839506,-12.050196,0.21001926,109.74093,27.527632,1.3190007,-113.687515,-187.72707,10.775192,-10.752937,208.61453,880000
38
+ 106.51428,0.16372564,-0.00808014,-12.966527,0.22457725,106.134056,8.580919,-2.8969274,-109.64837,-179.08182,0.56050956,-0.5416616,36.156937,885000
39
+ 103.55584,0.19391379,-0.032195028,-14.345027,0.25031534,103.14381,17.878164,-5.1129436,-107.48164,-189.63815,0.8338474,-0.8588891,62.207012,890000
40
+ 105.142105,0.17426372,-0.010745027,-13.11314,0.22980237,104.74878,14.626014,-17.111176,-108.65252,-188.42131,0.72546196,-0.65720093,46.77413,895000
41
+ 104.072205,0.20559163,0.00045756757,-12.473717,0.217156,103.649,18.918823,-4.857683,-107.735405,-184.18343,1.4071808,-1.4083467,56.64585,900000
42
+ 107.96043,0.20296264,-0.020983692,-13.686897,0.24197684,107.53647,16.83411,-1.9557312,-111.38772,-178.27951,1.1511309,-0.97685766,63.743675,905000
43
+ 105.105515,0.1972226,-0.032383565,-14.345575,0.25171602,104.688965,15.079738,-4.860751,-109.31001,-173.91458,0.70476276,-0.55690986,48.513893,910000
44
+ 105.665085,0.21972722,0.0014680871,-12.416531,0.21838604,105.22551,12.612208,-6.3610535,-109.19594,-193.54947,0.84566677,-0.769173,48.811058,915000
45
+ 104.68888,0.19894885,0.005782432,-12.167549,0.21163435,104.272514,13.46273,-6.7367997,-108.30969,-178.67041,0.7109406,-0.49433568,54.182453,920000
46
+ 100.71279,0.19259149,0.033379007,-10.593416,0.1854614,100.30136,18.671152,-4.527279,-104.29262,-180.00333,0.8119329,-0.7853733,53.68466,925000
47
+ 104.914474,0.20850275,0.04057095,-10.194553,0.17940243,104.48599,10.5253525,-3.1517742,-108.6289,-187.31413,2.522317,-1.6447421,78.08299,930000
48
+ 101.32387,0.23234876,0.042420927,-10.079323,0.17663412,100.87247,13.030298,-2.2977874,-104.57183,-181.60071,0.5876783,-0.6900239,48.096127,935000
49
+ 100.82217,0.25537607,0.010832245,-11.869657,0.20397615,100.351974,13.658869,1.5755441,-105.70042,-188.81168,0.4026378,-0.861259,46.488285,940000
50
+ 103.79609,0.2001425,-0.008950044,-13.0207405,0.2237894,103.3811,16.466833,0.46831816,-107.490135,-183.81458,0.8950846,-0.8657018,52.34742,945000
51
+ 94.59795,0.23303512,0.005788022,-12.162393,0.20851499,94.15062,13.322395,-0.30389297,-98.777725,-185.67325,2.5620189,-2.5344934,71.36698,950000
52
+ 104.17459,0.20453288,-0.014228743,-13.324652,0.2299068,103.75438,19.363184,-2.787429,-107.83887,-187.02307,1.0793276,-1.074904,67.80327,955000
53
+ 99.17654,0.18779045,-0.008071817,-12.96126,0.22681558,98.770004,13.764876,2.1780794,-103.24876,-180.98038,0.51673424,-0.46852162,44.053505,960000
54
+ 102.68635,0.21244022,0.02002893,-11.341882,0.19615074,102.25773,11.5754385,-2.7444673,-106.57424,-189.57924,0.6665708,-0.6627389,39.82159,965000
55
+ 101.96707,0.20620099,-0.0067791343,-12.892012,0.22294408,101.54471,13.539374,-6.9162927,-105.206116,-172.18164,0.53825045,-0.56321347,38.89672,970000
56
+ 100.468704,0.19342145,0.008043028,-12.035046,0.20818862,100.05905,17.571646,7.8771987,-103.67627,-192.6252,0.722188,-0.75011915,60.05138,975000
57
+ 102.22275,0.20232272,-0.021616245,-13.768598,0.23460975,101.80743,16.051214,-1.0436859,-106.60217,-187.0432,0.61146986,-0.5997852,52.50157,980000
58
+ 98.09878,0.19350743,-0.0032609955,-12.689234,0.21866885,97.689865,18.451849,-1.4083269,-101.47848,-171.81209,0.87464845,-0.69817483,62.83828,985000
59
+ 95.50525,0.21642657,-0.022702297,-13.810203,0.23929377,95.072235,14.172942,1.5561073,-99.172455,-176.60258,0.47797674,-0.6181435,47.040768,990000
60
+ 96.40601,0.20995158,-0.0056037647,-12.827617,0.21941173,95.98225,15.416697,0.70334476,-99.615906,-185.03203,0.67762774,-0.6551002,44.476048,995000
61
+ 102.1322,0.15990433,0.018208677,-11.452137,0.19900335,101.75508,17.616068,-3.8916163,-105.530205,-181.91403,1.0973096,-1.3771132,76.39444,1000000
62
+ 101.379,0.18030137,0.006528652,-12.118965,0.20764638,100.98452,8.814192,-3.5457757,-105.111626,-186.6195,0.44646713,-0.62805176,43.022194,1005000
63
+ 98.12865,0.17040157,-0.034496874,-14.538613,0.24601856,97.74673,13.562335,1.1152229,-102.67242,-181.81822,0.8308118,-0.60992,53.726547,1010000
64
+ 100.19075,0.19877169,-0.0032809621,-12.693709,0.21500035,99.78026,12.372888,0.91791743,-103.5249,-173.07971,1.077771,-0.90506816,57.044266,1015000
65
+ 99.96716,0.21775782,-0.022492155,-13.804496,0.23801753,99.53388,22.297956,3.914031,-104.43328,-175.57663,0.8408448,-1.8859677,73.90494,1020000
66
+ 97.9935,0.21881917,-0.01371278,-13.306172,0.2263345,97.56206,10.478633,1.5624208,-102.110535,-190.0389,0.51770854,-0.65151274,48.041233,1025000
67
+ 93.54993,0.19507097,0.033179857,-10.55598,0.18016577,93.14151,13.452647,7.106862,-96.62587,-164.20612,1.1325071,-1.0218036,48.724976,1030000
68
+ 98.51479,0.22194564,0.016840378,-11.506008,0.19493672,98.08107,11.642682,-3.2102747,-101.59455,-190.60384,0.47254115,-0.659932,46.221462,1035000
69
+ 100.12888,0.154725,-0.020382324,-13.679017,0.23647678,99.75807,14.156305,-2.7081199,-103.0602,-185.62938,0.9976122,-0.9832604,45.73042,1040000
70
+ 102.19601,0.19263396,-0.04581565,-15.16657,0.2605843,101.788605,13.431735,-4.2467947,-106.89434,-188.14247,0.72572154,-0.82316065,50.999615,1045000
71
+ 93.26083,0.2163777,0.005537141,-12.178487,0.20973948,92.82918,23.283028,-7.1024737,-97.09084,-194.79253,1.093219,-1.4707829,89.21389,1050000
72
+ 98.359856,0.18841222,0.04515686,-9.822727,0.16567737,97.9606,14.02805,-4.197053,-101.72678,-178.30872,0.6156518,-0.63397247,40.215946,1055000
73
+ 95.04121,0.18714033,-0.007896469,-12.9604435,0.22226773,94.639694,14.6420965,-1.3463639,-99.06178,-184.26382,0.5196904,-0.53407955,51.862434,1060000
74
+ 98.28111,0.20013268,-0.014354504,-13.34869,0.22577596,97.86955,17.898314,-0.42865515,-102.15301,-189.42982,0.8102983,-0.8149522,54.71112,1065000
75
+ 95.762184,0.20504701,-0.012680881,-13.242498,0.22616418,95.34365,15.601172,-4.371675,-99.71288,-178.45547,0.910553,-0.52336335,51.12021,1070000
76
+ 93.43696,0.20459192,-0.025720341,-14.025553,0.23646641,93.02162,10.622826,1.2622138,-97.16232,-188.80962,0.7393695,-0.6720529,55.345837,1075000
77
+ 95.93614,0.21458502,0.0075806063,-12.051549,0.20371911,95.510254,23.125776,-1.3286319,-98.476776,-188.18388,3.3082821,-3.636525,102.24527,1080000
78
+ 96.57496,0.18715264,-0.0146622425,-13.365331,0.22646338,96.17601,13.625092,0.12639038,-100.37607,-189.68312,0.5691552,-0.65001726,40.623028,1085000
79
+ 96.84541,0.1854386,-0.00073824247,-12.543513,0.21281205,96.4479,14.8043585,0.85526025,-101.23281,-184.64291,0.6376718,-0.7976411,51.414253,1090000
80
+ 94.91413,0.19243327,0.011752033,-11.81019,0.20120582,94.50874,10.378472,-5.751059,-98.57018,-180.75093,0.8820506,-0.9933844,57.515556,1095000
81
+ 93.4106,0.2114522,0.015097091,-11.600264,0.19464616,92.9894,10.552869,-5.3074255,-97.173485,-176.01775,0.6783555,-0.8464374,54.278816,1100000
82
+ 93.89324,0.21755898,-0.006071975,-12.861081,0.2162732,93.465485,19.275465,1.5600411,-97.551186,-182.10197,1.1788987,-1.081755,61.367584,1105000
83
+ 96.965034,0.18791611,0.036112722,-10.353616,0.17419866,96.5668,17.901445,-2.8864717,-99.99039,-176.68948,0.5750501,-0.493349,48.730324,1110000
84
+ 93.456726,0.16489717,0.0074540977,-12.058872,0.20376866,93.08061,10.717723,-1.2171718,-97.11376,-170.2137,3.4300125,-3.4340768,87.32214,1115000
85
+ 94.30181,0.20229489,-0.016430274,-13.4797945,0.22604404,93.88991,14.600532,1.5851539,-98.34783,-180.82681,0.5326016,-0.5023383,46.590076,1120000
86
+ 89.715645,0.21705791,-0.010901286,-13.149556,0.22068465,89.2888,8.803906,-1.491808,-93.73819,-192.05281,0.6533648,-0.5264318,48.94047,1125000
87
+ 89.21835,0.1963191,0.00038872095,-12.476799,0.2090425,88.8126,16.476843,-3.129145,-92.76949,-179.49681,0.60456824,-0.5877307,48.387283,1130000
88
+ 95.4777,0.19496173,-0.00743403,-12.944334,0.21656808,95.0736,13.819107,4.6149607,-98.998985,-186.60115,1.259044,-1.5035669,73.56267,1135000
89
+ 87.37485,0.23146187,-0.0014548195,-12.588297,0.20741047,86.93743,13.733116,-0.13821247,-90.50585,-191.04172,0.41827372,-0.818612,44.491486,1140000
90
+ 96.508705,0.20934656,0.00054604316,-12.467057,0.20664781,96.09216,8.359951,-1.7350986,-100.855415,-183.85497,0.50803417,-0.3245686,34.99338,1145000
91
+ 88.217926,0.19647789,0.0067764823,-12.084265,0.19697344,87.817696,15.729733,3.2972174,-92.22025,-185.25067,0.72052324,-0.67722756,57.288853,1150000
92
+ 94.412445,0.22223283,-0.020654876,-13.743717,0.22824705,93.98261,13.026938,-3.0048401,-97.57395,-186.39317,0.6643415,-0.6456518,45.95528,1155000
93
+ 89.90588,0.21781674,0.015110418,-11.5896845,0.19237833,89.480576,10.043729,-2.7002654,-94.4284,-176.09454,0.37240833,-0.43474856,38.75659,1160000
94
+ 90.97263,0.2386708,0.0029790485,-12.317854,0.20146185,90.529526,11.438765,-2.249203,-94.279076,-179.54677,0.6578934,-0.7195803,41.48974,1165000
95
+ 90.3946,0.16901137,-0.0015426363,-12.593044,0.20878756,90.01834,10.329692,-3.2134495,-94.152504,-170.67253,0.5240084,-0.42568824,36.586483,1170000
96
+ 91.71376,0.17481697,-0.006728522,-12.906614,0.21357447,91.33209,10.903536,-2.3036215,-95.308464,-185.10503,0.30186132,-0.34922674,34.506813,1175000
97
+ 92.17102,0.21712066,-0.015253309,-13.442293,0.21759625,91.75156,14.482721,2.6239147,-95.73756,-173.57048,0.79640794,-1.6571417,71.23872,1180000
98
+ 89.16049,0.20341958,0.022078289,-11.129726,0.17932576,88.75566,9.446093,-2.6180906,-93.15319,-191.3892,2.1442728,-2.21547,61.68827,1185000
99
+ 89.68239,0.18363932,-0.015772048,-13.482857,0.21636142,89.29816,11.463333,14.914861,-93.36916,-183.41405,0.80111736,-0.80603194,47.26907,1190000
100
+ 83.73791,0.18281493,0.0050842585,-12.189062,0.1993078,83.3507,13.024744,-2.4575193,-88.12901,-186.69722,0.8053094,-0.8865109,56.916203,1195000
101
+ 84.54124,0.20237322,0.0063008033,-12.106695,0.19395112,84.13861,6.6703386,-0.6526278,-87.72396,-190.60056,0.27259058,-0.36264923,32.13459,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/edit_alpha_loss,actor/edit_entropy,actor/edit_entropy_loss,actor/edit_q_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 143.24338,0.19989698,-0.000650192,-12.54815,0.16944334,142.8747,5.805947,-58.620934,-146.27722,-195.43533,0.43510792,-0.2937581,26.864637,705000
3
+ 140.75133,0.19247857,-0.016914524,-13.80895,0.17844208,140.39734,6.244582,-45.508625,-143.98157,-193.45952,0.5746646,-0.5700803,23.499434,710000
4
+ 139.15038,0.18578112,0.01691627,-11.224378,0.14884861,138.79883,9.093493,-39.36615,-142.10399,-195.59486,0.361628,-0.38040793,28.857105,715000
5
+ 135.89314,0.18123262,-0.005536721,-12.891151,0.18247335,135.53497,16.932331,-38.65701,-139.16434,-199.34853,0.5343741,-0.3791757,37.456978,720000
6
+ 134.19977,0.16840418,-0.011284253,-13.322781,0.18271898,133.85992,9.345061,-49.36395,-137.39969,-195.82143,0.56337845,-0.53394794,32.710373,725000
7
+ 130.38258,0.18323682,0.004467943,-12.186083,0.17344299,130.02142,21.619999,-41.806328,-133.70312,-196.87373,1.3798554,-1.5403186,56.702015,730000
8
+ 128.28625,0.17592318,-0.011293327,-13.250734,0.19933134,127.922295,10.934464,-31.849844,-131.23907,-196.17152,0.48323804,-0.4308199,36.4692,735000
9
+ 128.0825,0.16864602,0.012799918,-11.665903,0.17902309,127.72203,20.642797,-38.782986,-131.93175,-198.19284,0.74908656,-0.7708781,40.002968,740000
10
+ 127.44369,0.16571823,0.020249426,-11.151848,0.16750225,127.09022,11.366492,-32.363686,-130.33653,-198.70703,0.7870549,-0.52342826,39.099045,745000
11
+ 123.487686,0.16362211,0.018215196,-11.334921,0.17721355,123.12863,14.519134,-7.198034,-127.097466,-192.42073,0.5135766,-0.56461054,43.316563,750000
12
+ 122.872246,0.19266,-0.014821706,-13.418064,0.21662824,122.47778,17.242853,-25.688562,-126.715965,-184.5637,1.2538145,-1.4397972,49.318653,755000
13
+ 119.55019,0.2219942,-0.005850949,-12.872129,0.20238702,119.13167,19.038351,-20.691517,-123.73385,-194.57407,0.7815171,-0.8820027,41.136444,760000
14
+ 120.507545,0.1968646,-0.015612692,-13.453938,0.2201949,120.1061,19.05223,-13.17992,-123.839294,-189.07959,0.52738315,-0.5145303,44.7053,765000
15
+ 115.277695,0.19137323,-0.0022495317,-12.638767,0.20488484,114.88368,20.496885,-19.899834,-118.801476,-183.52397,1.1733876,-1.2055821,55.5823,770000
16
+ 116.2462,0.19368513,-0.031678364,-14.3787365,0.24244745,115.84174,13.482691,-5.4247932,-120.462135,-192.3615,0.786741,-0.8745104,34.838943,775000
17
+ 116.66929,0.18398404,-0.010193375,-13.110031,0.21906336,116.276436,18.407728,0.5695484,-120.36316,-187.8383,0.7263323,-0.9720404,75.08022,780000
18
+ 117.10655,0.1973767,0.0026575201,-12.33829,0.20276606,116.70375,17.872862,-8.099065,-120.419876,-189.42554,1.2809018,-0.69807166,74.79434,785000
19
+ 112.697014,0.20080325,-0.035155766,-14.546399,0.2498974,112.28146,20.956364,-6.456405,-116.60231,-184.2158,0.7658976,-0.8621071,45.134907,790000
20
+ 114.80585,0.17635123,-0.009287545,-13.049894,0.22040868,114.41837,22.36116,-9.940298,-118.56719,-186.51523,1.8186404,-1.8271033,47.47959,795000
21
+ 110.43433,0.20909193,0.008118267,-12.021498,0.20395666,110.01317,16.043701,-16.291426,-113.72327,-180.9479,1.557753,-1.5332563,52.94129,800000
22
+ 113.62493,0.20592405,-0.011149182,-13.150124,0.22551577,113.204636,20.968643,-5.8580303,-118.74762,-179.64642,1.309894,-1.2717696,59.330185,805000
23
+ 112.027725,0.18620653,0.0114921685,-11.816631,0.19871958,111.63131,12.98674,-6.4324636,-115.74507,-180.22029,0.5359064,-0.68487465,41.779747,810000
24
+ 109.76496,0.19843492,-0.006021448,-12.850253,0.22091776,109.35163,15.083831,-0.090815336,-113.10213,-181.73434,0.6195259,-0.5628696,42.23914,815000
25
+ 109.5396,0.17959952,0.028310075,-10.882659,0.19049099,109.1412,12.233838,1.2067,-113.30794,-174.36491,1.119206,-1.235274,43.01207,820000
26
+ 111.98229,0.18702218,0.0148449065,-11.649199,0.2032569,111.57717,14.539578,-5.24266,-116.173,-184.0633,0.66925144,-0.6946125,45.8323,825000
27
+ 111.4262,0.18882212,0.003295881,-12.30957,0.21304911,111.021034,19.582144,-13.540382,-115.858864,-183.36145,0.94196796,-0.98712534,45.608276,830000
28
+ 113.11764,0.19298604,-0.0057553267,-12.846699,0.2132599,112.71715,15.318008,2.199626,-116.346085,-185.37892,0.603306,-0.83544433,45.37868,835000
29
+ 107.08641,0.20535856,-0.024540074,-13.940073,0.23755077,106.668045,12.278824,-8.819062,-112.06115,-182.30676,1.2913761,-1.2254298,63.775158,840000
30
+ 108.08579,0.18955791,0.0018401697,-12.392855,0.21284136,107.68155,12.666359,-5.851499,-111.97011,-183.08746,0.60328287,-0.75809944,39.881474,845000
31
+ 109.30752,0.16996798,-0.005263148,-12.810545,0.21711442,108.9257,14.474396,-3.5133302,-113.023705,-193.42642,1.0522512,-1.0368619,45.506256,850000
32
+ 107.46971,0.18413825,0.03207102,-10.66763,0.18671001,107.066795,8.391327,0.8176983,-110.38843,-177.76823,1.1034086,-0.98285323,38.60845,855000
33
+ 110.28901,0.20610814,-0.0036405043,-12.709152,0.22121555,109.865326,15.082148,-12.369663,-113.40051,-187.28484,0.48625976,-0.5535434,50.928696,860000
34
+ 109.66538,0.18569948,-0.01338129,-13.252753,0.23558709,109.25748,12.532963,-1.146238,-113.195145,-189.0224,5.6620684,-5.71383,108.323456,865000
35
+ 108.07965,0.17485034,0.007489231,-12.081216,0.21605167,107.68126,17.508291,0.20536643,-111.75795,-183.69722,3.651266,-3.5517268,116.40412,870000
36
+ 110.06438,0.20146027,0.044238564,-9.962213,0.17366073,109.64502,12.989514,-7.640959,-112.72532,-186.83052,2.7251992,-2.7118075,67.05034,875000
37
+ 110.15913,0.20032978,0.007839506,-12.050196,0.21001926,109.74093,27.527632,1.3190007,-113.687515,-187.72707,10.775192,-10.752937,208.61453,880000
38
+ 106.51428,0.16372564,-0.00808014,-12.966527,0.22457725,106.134056,8.580919,-2.8969274,-109.64837,-179.08182,0.56050956,-0.5416616,36.156937,885000
39
+ 103.55584,0.19391379,-0.032195028,-14.345027,0.25031534,103.14381,17.878164,-5.1129436,-107.48164,-189.63815,0.8338474,-0.8588891,62.207012,890000
40
+ 105.142105,0.17426372,-0.010745027,-13.11314,0.22980237,104.74878,14.626014,-17.111176,-108.65252,-188.42131,0.72546196,-0.65720093,46.77413,895000
41
+ 104.072205,0.20559163,0.00045756757,-12.473717,0.217156,103.649,18.918823,-4.857683,-107.735405,-184.18343,1.4071808,-1.4083467,56.64585,900000
42
+ 107.96043,0.20296264,-0.020983692,-13.686897,0.24197684,107.53647,16.83411,-1.9557312,-111.38772,-178.27951,1.1511309,-0.97685766,63.743675,905000
43
+ 105.105515,0.1972226,-0.032383565,-14.345575,0.25171602,104.688965,15.079738,-4.860751,-109.31001,-173.91458,0.70476276,-0.55690986,48.513893,910000
44
+ 105.665085,0.21972722,0.0014680871,-12.416531,0.21838604,105.22551,12.612208,-6.3610535,-109.19594,-193.54947,0.84566677,-0.769173,48.811058,915000
45
+ 104.68888,0.19894885,0.005782432,-12.167549,0.21163435,104.272514,13.46273,-6.7367997,-108.30969,-178.67041,0.7109406,-0.49433568,54.182453,920000
46
+ 100.71279,0.19259149,0.033379007,-10.593416,0.1854614,100.30136,18.671152,-4.527279,-104.29262,-180.00333,0.8119329,-0.7853733,53.68466,925000
47
+ 104.914474,0.20850275,0.04057095,-10.194553,0.17940243,104.48599,10.5253525,-3.1517742,-108.6289,-187.31413,2.522317,-1.6447421,78.08299,930000
48
+ 101.32387,0.23234876,0.042420927,-10.079323,0.17663412,100.87247,13.030298,-2.2977874,-104.57183,-181.60071,0.5876783,-0.6900239,48.096127,935000
49
+ 100.82217,0.25537607,0.010832245,-11.869657,0.20397615,100.351974,13.658869,1.5755441,-105.70042,-188.81168,0.4026378,-0.861259,46.488285,940000
50
+ 103.79609,0.2001425,-0.008950044,-13.0207405,0.2237894,103.3811,16.466833,0.46831816,-107.490135,-183.81458,0.8950846,-0.8657018,52.34742,945000
51
+ 94.59795,0.23303512,0.005788022,-12.162393,0.20851499,94.15062,13.322395,-0.30389297,-98.777725,-185.67325,2.5620189,-2.5344934,71.36698,950000
52
+ 104.17459,0.20453288,-0.014228743,-13.324652,0.2299068,103.75438,19.363184,-2.787429,-107.83887,-187.02307,1.0793276,-1.074904,67.80327,955000
53
+ 99.17654,0.18779045,-0.008071817,-12.96126,0.22681558,98.770004,13.764876,2.1780794,-103.24876,-180.98038,0.51673424,-0.46852162,44.053505,960000
54
+ 102.68635,0.21244022,0.02002893,-11.341882,0.19615074,102.25773,11.5754385,-2.7444673,-106.57424,-189.57924,0.6665708,-0.6627389,39.82159,965000
55
+ 101.96707,0.20620099,-0.0067791343,-12.892012,0.22294408,101.54471,13.539374,-6.9162927,-105.206116,-172.18164,0.53825045,-0.56321347,38.89672,970000
56
+ 100.468704,0.19342145,0.008043028,-12.035046,0.20818862,100.05905,17.571646,7.8771987,-103.67627,-192.6252,0.722188,-0.75011915,60.05138,975000
57
+ 102.22275,0.20232272,-0.021616245,-13.768598,0.23460975,101.80743,16.051214,-1.0436859,-106.60217,-187.0432,0.61146986,-0.5997852,52.50157,980000
58
+ 98.09878,0.19350743,-0.0032609955,-12.689234,0.21866885,97.689865,18.451849,-1.4083269,-101.47848,-171.81209,0.87464845,-0.69817483,62.83828,985000
59
+ 95.50525,0.21642657,-0.022702297,-13.810203,0.23929377,95.072235,14.172942,1.5561073,-99.172455,-176.60258,0.47797674,-0.6181435,47.040768,990000
60
+ 96.40601,0.20995158,-0.0056037647,-12.827617,0.21941173,95.98225,15.416697,0.70334476,-99.615906,-185.03203,0.67762774,-0.6551002,44.476048,995000
61
+ 102.1322,0.15990433,0.018208677,-11.452137,0.19900335,101.75508,17.616068,-3.8916163,-105.530205,-181.91403,1.0973096,-1.3771132,76.39444,1000000
62
+ 101.379,0.18030137,0.006528652,-12.118965,0.20764638,100.98452,8.814192,-3.5457757,-105.111626,-186.6195,0.44646713,-0.62805176,43.022194,1005000
63
+ 98.12865,0.17040157,-0.034496874,-14.538613,0.24601856,97.74673,13.562335,1.1152229,-102.67242,-181.81822,0.8308118,-0.60992,53.726547,1010000
64
+ 100.19075,0.19877169,-0.0032809621,-12.693709,0.21500035,99.78026,12.372888,0.91791743,-103.5249,-173.07971,1.077771,-0.90506816,57.044266,1015000
65
+ 99.96716,0.21775782,-0.022492155,-13.804496,0.23801753,99.53388,22.297956,3.914031,-104.43328,-175.57663,0.8408448,-1.8859677,73.90494,1020000
66
+ 97.9935,0.21881917,-0.01371278,-13.306172,0.2263345,97.56206,10.478633,1.5624208,-102.110535,-190.0389,0.51770854,-0.65151274,48.041233,1025000
67
+ 93.54993,0.19507097,0.033179857,-10.55598,0.18016577,93.14151,13.452647,7.106862,-96.62587,-164.20612,1.1325071,-1.0218036,48.724976,1030000
68
+ 98.51479,0.22194564,0.016840378,-11.506008,0.19493672,98.08107,11.642682,-3.2102747,-101.59455,-190.60384,0.47254115,-0.659932,46.221462,1035000
69
+ 100.12888,0.154725,-0.020382324,-13.679017,0.23647678,99.75807,14.156305,-2.7081199,-103.0602,-185.62938,0.9976122,-0.9832604,45.73042,1040000
70
+ 102.19601,0.19263396,-0.04581565,-15.16657,0.2605843,101.788605,13.431735,-4.2467947,-106.89434,-188.14247,0.72572154,-0.82316065,50.999615,1045000
71
+ 93.26083,0.2163777,0.005537141,-12.178487,0.20973948,92.82918,23.283028,-7.1024737,-97.09084,-194.79253,1.093219,-1.4707829,89.21389,1050000
72
+ 98.359856,0.18841222,0.04515686,-9.822727,0.16567737,97.9606,14.02805,-4.197053,-101.72678,-178.30872,0.6156518,-0.63397247,40.215946,1055000
73
+ 95.04121,0.18714033,-0.007896469,-12.9604435,0.22226773,94.639694,14.6420965,-1.3463639,-99.06178,-184.26382,0.5196904,-0.53407955,51.862434,1060000
74
+ 98.28111,0.20013268,-0.014354504,-13.34869,0.22577596,97.86955,17.898314,-0.42865515,-102.15301,-189.42982,0.8102983,-0.8149522,54.71112,1065000
75
+ 95.762184,0.20504701,-0.012680881,-13.242498,0.22616418,95.34365,15.601172,-4.371675,-99.71288,-178.45547,0.910553,-0.52336335,51.12021,1070000
76
+ 93.43696,0.20459192,-0.025720341,-14.025553,0.23646641,93.02162,10.622826,1.2622138,-97.16232,-188.80962,0.7393695,-0.6720529,55.345837,1075000
77
+ 95.93614,0.21458502,0.0075806063,-12.051549,0.20371911,95.510254,23.125776,-1.3286319,-98.476776,-188.18388,3.3082821,-3.636525,102.24527,1080000
78
+ 96.57496,0.18715264,-0.0146622425,-13.365331,0.22646338,96.17601,13.625092,0.12639038,-100.37607,-189.68312,0.5691552,-0.65001726,40.623028,1085000
79
+ 96.84541,0.1854386,-0.00073824247,-12.543513,0.21281205,96.4479,14.8043585,0.85526025,-101.23281,-184.64291,0.6376718,-0.7976411,51.414253,1090000
80
+ 94.91413,0.19243327,0.011752033,-11.81019,0.20120582,94.50874,10.378472,-5.751059,-98.57018,-180.75093,0.8820506,-0.9933844,57.515556,1095000
81
+ 93.4106,0.2114522,0.015097091,-11.600264,0.19464616,92.9894,10.552869,-5.3074255,-97.173485,-176.01775,0.6783555,-0.8464374,54.278816,1100000
82
+ 93.89324,0.21755898,-0.006071975,-12.861081,0.2162732,93.465485,19.275465,1.5600411,-97.551186,-182.10197,1.1788987,-1.081755,61.367584,1105000
83
+ 96.965034,0.18791611,0.036112722,-10.353616,0.17419866,96.5668,17.901445,-2.8864717,-99.99039,-176.68948,0.5750501,-0.493349,48.730324,1110000
84
+ 93.456726,0.16489717,0.0074540977,-12.058872,0.20376866,93.08061,10.717723,-1.2171718,-97.11376,-170.2137,3.4300125,-3.4340768,87.32214,1115000
85
+ 94.30181,0.20229489,-0.016430274,-13.4797945,0.22604404,93.88991,14.600532,1.5851539,-98.34783,-180.82681,0.5326016,-0.5023383,46.590076,1120000
86
+ 89.715645,0.21705791,-0.010901286,-13.149556,0.22068465,89.2888,8.803906,-1.491808,-93.73819,-192.05281,0.6533648,-0.5264318,48.94047,1125000
87
+ 89.21835,0.1963191,0.00038872095,-12.476799,0.2090425,88.8126,16.476843,-3.129145,-92.76949,-179.49681,0.60456824,-0.5877307,48.387283,1130000
88
+ 95.4777,0.19496173,-0.00743403,-12.944334,0.21656808,95.0736,13.819107,4.6149607,-98.998985,-186.60115,1.259044,-1.5035669,73.56267,1135000
89
+ 87.37485,0.23146187,-0.0014548195,-12.588297,0.20741047,86.93743,13.733116,-0.13821247,-90.50585,-191.04172,0.41827372,-0.818612,44.491486,1140000
90
+ 96.508705,0.20934656,0.00054604316,-12.467057,0.20664781,96.09216,8.359951,-1.7350986,-100.855415,-183.85497,0.50803417,-0.3245686,34.99338,1145000
91
+ 88.217926,0.19647789,0.0067764823,-12.084265,0.19697344,87.817696,15.729733,3.2972174,-92.22025,-185.25067,0.72052324,-0.67722756,57.288853,1150000
92
+ 94.412445,0.22223283,-0.020654876,-13.743717,0.22824705,93.98261,13.026938,-3.0048401,-97.57395,-186.39317,0.6643415,-0.6456518,45.95528,1155000
93
+ 89.90588,0.21781674,0.015110418,-11.5896845,0.19237833,89.480576,10.043729,-2.7002654,-94.4284,-176.09454,0.37240833,-0.43474856,38.75659,1160000
94
+ 90.97263,0.2386708,0.0029790485,-12.317854,0.20146185,90.529526,11.438765,-2.249203,-94.279076,-179.54677,0.6578934,-0.7195803,41.48974,1165000
95
+ 90.3946,0.16901137,-0.0015426363,-12.593044,0.20878756,90.01834,10.329692,-3.2134495,-94.152504,-170.67253,0.5240084,-0.42568824,36.586483,1170000
96
+ 91.71376,0.17481697,-0.006728522,-12.906614,0.21357447,91.33209,10.903536,-2.3036215,-95.308464,-185.10503,0.30186132,-0.34922674,34.506813,1175000
97
+ 92.17102,0.21712066,-0.015253309,-13.442293,0.21759625,91.75156,14.482721,2.6239147,-95.73756,-173.57048,0.79640794,-1.6571417,71.23872,1180000
98
+ 89.16049,0.20341958,0.022078289,-11.129726,0.17932576,88.75566,9.446093,-2.6180906,-93.15319,-191.3892,2.1442728,-2.21547,61.68827,1185000
99
+ 89.68239,0.18363932,-0.015772048,-13.482857,0.21636142,89.29816,11.463333,14.914861,-93.36916,-183.41405,0.80111736,-0.80603194,47.26907,1190000
100
+ 83.73791,0.18281493,0.0050842585,-12.189062,0.1993078,83.3507,13.024744,-2.4575193,-88.12901,-186.69722,0.8053094,-0.8865109,56.916203,1195000
101
+ 84.54124,0.20237322,0.0063008033,-12.106695,0.19395112,84.13861,6.6703386,-0.6526278,-87.72396,-190.60056,0.27259058,-0.36264923,32.13459,1200000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebb21a8b723794009912b2b7ce755f9d5da892c770d0d73f063e7a30ff56e06b
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9f3fd850fba39431ad62ad2da123a26039fc6a82a8b2517fa51d42ed2fecda2
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dd920412aeefadbb9f47d2c8c0cddefeac52967e61a93536d30adf9838b9c8a
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce32a9bb315fc254a56a9089b0df06c2e1872fa2bc14f513f44d81b4919f0ef3
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1696fe5b5427e79d5e1b3b197524eb4255f442aa9071a03f83c8200c4da1cce
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73f3cc9939605c8c76df1325281952e857fe37e172c1c541f730295f545f04c9
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f9c63e997d63a86aa236b2327c3fd4a41c74777c8efd4b593ac4acf719d2020
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28229ca05b0bbe7677fa6ac688c71dbab48192ab98691ddf3b43dd5ff09ad999
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0eb8a6eed85aa1e0f90036088f7cc5e2cda6d78345a9f6e195f99bb95c7e2dc4
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:815b9568000a5526cf2f0bed67f232b9686fc44c91c2d8c8c036d8717ac96550
3
+ size 218123833
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/fedit/20260319_024021/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/s1rqjyrt