Tiredsheep commited on
Commit
261a9df
·
verified ·
1 Parent(s): 1b5cda8

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_450000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_500000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_550000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_600000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_650000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_700000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_750000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_800000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_850000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_900000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.02377714327148179,-0.0030835040608588843,-0.02377774537435422,0.021889877096774996,34.50436720586021,9.539999999999665,0.94,4368.46,-0.12,-266.14,188.8,0.6211354207992553,450000
3
+ 0.0,0.0,-0.02659536650337673,-0.005162665740298093,-0.026586085782689655,-0.0037204354803506505,34.90050007180478,6.768999999999564,1.0,13274.06,0.0,-184.16,133.38,0.45239766120910646,500000
4
+ 0.0,0.0,-0.024759027818477084,-0.004310037917494797,-0.02476189332426275,-0.003808717895224875,35.49581052495901,6.4909999999995955,1.0,20050.58,0.0,-181.12,127.82,0.42732916355133055,550000
5
+ 0.0,0.0,-0.02443000061625475,-0.005181079487394602,-0.0245529571260191,-0.004783656051665413,35.411418724173025,5.870999999999596,1.0,26305.82,0.0,-161.76,115.42,0.38958216667175294,600000
6
+ 0.0,0.0,-0.03480618410169093,-0.003355971294305817,-0.034389137245746694,-0.02626080200706025,35.51019612744988,6.088999999999571,0.98,32583.48,-0.02,-166.6,119.78,0.40638222217559816,650000
7
+ 0.0,0.0,-0.02794108827666889,0.0003782997086809447,-0.027601149086877382,0.0057758683019884715,35.50139037791774,5.245999999999676,1.0,38242.14,0.0,-143.06,102.92,0.351343035697937,700000
8
+ 0.0,0.0,-0.042612335597431564,0.002333934623337618,-0.04158536574895959,0.054310359634030914,35.369154324897806,4.925999999999679,1.0,43395.66,0.0,-133.08,96.52,0.323686466217041,750000
9
+ 0.0,0.0,-0.04598527306871166,0.025890167183520177,-0.04435652284821863,0.030707402599506887,35.72090966646393,4.921999999999696,1.0,48446.78,0.0,-134.08,96.44,0.32163807392120364,800000
10
+ 0.0,0.0,-0.0496186124390977,0.019040239561322718,-0.04846833855551509,0.008650228626125907,35.53331210405179,4.739999999999703,1.0,53350.54,0.0,-130.04,92.8,0.31548972606658937,850000
11
+ 0.0,0.0,-0.05889592110198165,0.03234751232470127,-0.05696908739749291,0.014877471742908746,35.56994111872831,4.420999999999735,1.0,58078.06,0.0,-119.52,86.42,0.3050522708892822,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.02377714327148179,-0.0030835040608588843,-0.02377774537435422,0.021889877096774996,34.50436720586021,9.539999999999665,0.94,4368.46,-0.12,-266.14,188.8,0.6211354207992553,450000
3
+ 0.0,0.0,-0.02659536650337673,-0.005162665740298093,-0.026586085782689655,-0.0037204354803506505,34.90050007180478,6.768999999999564,1.0,13274.06,0.0,-184.16,133.38,0.45239766120910646,500000
4
+ 0.0,0.0,-0.024759027818477084,-0.004310037917494797,-0.02476189332426275,-0.003808717895224875,35.49581052495901,6.4909999999995955,1.0,20050.58,0.0,-181.12,127.82,0.42732916355133055,550000
5
+ 0.0,0.0,-0.02443000061625475,-0.005181079487394602,-0.0245529571260191,-0.004783656051665413,35.411418724173025,5.870999999999596,1.0,26305.82,0.0,-161.76,115.42,0.38958216667175294,600000
6
+ 0.0,0.0,-0.03480618410169093,-0.003355971294305817,-0.034389137245746694,-0.02626080200706025,35.51019612744988,6.088999999999571,0.98,32583.48,-0.02,-166.6,119.78,0.40638222217559816,650000
7
+ 0.0,0.0,-0.02794108827666889,0.0003782997086809447,-0.027601149086877382,0.0057758683019884715,35.50139037791774,5.245999999999676,1.0,38242.14,0.0,-143.06,102.92,0.351343035697937,700000
8
+ 0.0,0.0,-0.042612335597431564,0.002333934623337618,-0.04158536574895959,0.054310359634030914,35.369154324897806,4.925999999999679,1.0,43395.66,0.0,-133.08,96.52,0.323686466217041,750000
9
+ 0.0,0.0,-0.04598527306871166,0.025890167183520177,-0.04435652284821863,0.030707402599506887,35.72090966646393,4.921999999999696,1.0,48446.78,0.0,-134.08,96.44,0.32163807392120364,800000
10
+ 0.0,0.0,-0.0496186124390977,0.019040239561322718,-0.04846833855551509,0.008650228626125907,35.53331210405179,4.739999999999703,1.0,53350.54,0.0,-130.04,92.8,0.31548972606658937,850000
11
+ 0.0,0.0,-0.05889592110198165,0.03234751232470127,-0.05696908739749291,0.014877471742908746,35.56994111872831,4.420999999999735,1.0,58078.06,0.0,-119.52,86.42,0.3050522708892822,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 86.76055,49.861343,0.7707269,1.9539603,86.76055,0.19666895,10.385406,-53.113827,-154.51414,-203.27692,10.19539,-9.1399555,385.02078,405000
3
+ 48.539413,19.55403,0.63407737,1.2433679,48.539413,0.1920048,8.542559,-43.776485,-151.97423,-201.05693,7.0402575,-7.0290394,323.6214,410000
4
+ 2004.3916,37.884445,0.8076503,1.8904638,2004.3916,0.20436707,8.311284,-45.20519,-146.6446,-202.72662,47.575886,-50.516747,920.4609,415000
5
+ 193.10661,58.378536,0.8596481,2.1484008,193.10661,0.17471789,10.82828,-25.147114,-145.7794,-204.58176,11.669531,-16.094416,486.02808,420000
6
+ 251.25024,36.26434,0.7655731,1.5405751,251.25024,0.1979292,8.145107,-28.126,-142.41824,-205.6413,46.625366,-36.459736,716.5912,425000
7
+ 167.2634,49.49997,0.8207501,1.7801094,167.2634,0.19358754,13.692172,-5.031059,-141.46605,-204.27429,24.445301,-23.931833,607.86414,430000
8
+ 322.48798,68.505516,0.8921101,2.1750078,322.48798,0.16801569,9.738695,-3.4721322,-141.32384,-203.74269,33.009987,-35.674694,661.16693,435000
9
+ 131.8713,78.030716,0.83360624,1.9946803,131.8713,0.20521924,11.480783,-13.639171,-140.31654,-204.0829,14.023985,-14.000687,469.03534,440000
10
+ 153.56944,43.687527,0.90746987,2.3212888,153.56944,0.18083999,14.553995,-44.577194,-140.98058,-205.3806,27.615467,-24.96814,518.81757,445000
11
+ 262.27997,53.152508,0.82393646,1.9804348,262.27997,0.17297733,11.6861315,-5.831638,-138.01659,-201.86264,80.0005,-87.84236,1080.9366,450000
12
+ 145.64963,34.21648,0.8749255,1.8952103,145.64963,0.19335562,16.078495,-16.628712,-136.67393,-204.1581,17.493553,-23.533833,456.63998,455000
13
+ 191.65433,45.62201,0.7913238,1.7571174,191.65433,0.21365204,14.673685,-8.181197,-133.13762,-203.70212,34.182434,-41.5903,738.6018,460000
14
+ 183.56538,60.963543,0.90161955,2.3571253,183.56538,0.16566738,12.603721,-21.388607,-134.91492,-204.65512,29.759548,-35.906067,607.17664,465000
15
+ 95.85333,44.90395,0.86582726,1.8071203,95.85333,0.19787367,10.809168,-30.677471,-130.87431,-204.68475,12.345491,-13.247326,409.80798,470000
16
+ 124.46897,72.116844,0.8378605,2.0972788,124.46897,0.18534864,11.361556,-4.922303,-133.46776,-206.1163,28.215479,-23.999641,512.9966,475000
17
+ 220.37343,52.287247,0.8305226,1.7476124,220.37343,0.19430783,8.615044,-8.373473,-132.4973,-203.30751,56.18585,-59.548523,986.3743,480000
18
+ 166.44421,49.319817,0.7845539,1.7455887,166.44421,0.15435845,10.494006,-7.5985575,-131.03763,-204.17188,9.891394,-12.056726,459.18707,485000
19
+ 170.4057,57.12674,0.7864415,1.6727812,170.4057,0.17337225,10.395865,-12.12813,-131.19551,-204.27066,38.169777,-44.52569,638.95483,490000
20
+ 376.91724,59.710796,0.82769376,2.007429,376.91724,0.16940233,7.6939683,-12.047846,-130.9403,-204.10411,43.023495,-55.12059,800.7657,495000
21
+ 252.10968,41.04834,0.8416476,1.8681723,252.10968,0.17287064,17.669851,-14.048727,-125.58013,-203.14201,11.117022,-11.196056,489.71884,500000
22
+ 167.95314,57.593372,1.0041864,2.3973758,167.95314,0.19690216,16.935734,-3.910102,-131.06047,-204.23686,21.324236,-26.239773,547.6936,505000
23
+ 148.11151,30.559856,0.7769653,1.5532324,148.11151,0.21604237,9.273035,-7.024894,-126.65684,-201.46051,24.74365,-17.693644,454.0313,510000
24
+ 118.17131,49.870564,0.80726683,1.844088,118.17131,0.16739662,10.562599,1.3522202,-125.19375,-199.65826,15.727909,-13.741228,454.8081,515000
25
+ 90.891426,50.959164,0.80113477,1.9999256,90.891426,0.16837241,11.821422,-4.2139416,-126.58099,-201.88377,12.378007,-16.504837,453.60956,520000
26
+ 105.64703,52.17998,0.8396826,1.9652401,105.64703,0.18844861,12.123694,-7.132643,-131.00829,-201.36742,15.913022,-14.301994,505.20294,525000
27
+ 2824.5752,97.15428,0.93127424,2.6820102,2824.5752,0.17798367,6.9892335,-10.505265,-129.2521,-200.17354,64.79989,-62.840317,1141.9713,530000
28
+ 148.57877,84.13823,0.84770125,2.128266,148.57877,0.21422404,9.153096,3.5068667,-126.36841,-203.8383,29.736588,-22.527374,712.939,535000
29
+ 86.157196,32.91439,0.77671176,1.5137819,86.157196,0.15359977,13.352674,-7.597601,-121.04508,-195.09772,12.89443,-15.036761,461.3312,540000
30
+ 325.28128,24.25648,0.79467016,1.5356939,325.28128,0.188502,9.114272,-4.2086234,-125.936455,-200.29196,19.64609,-19.542809,599.65405,545000
31
+ 98.81268,45.281364,0.9166644,2.2224672,98.81268,0.15397128,8.221522,-10.317914,-126.81907,-202.9265,23.282362,-21.25297,488.44702,550000
32
+ 74.271126,82.07189,0.7588385,2.14183,74.271126,0.19408485,5.326196,-3.4962926,-122.816826,-198.06873,21.510199,-22.886654,441.48483,555000
33
+ 206.77046,65.97543,0.8321261,1.9983091,206.77046,0.16807464,13.430371,-0.78099996,-124.67468,-204.83952,50.892185,-63.840252,821.8871,560000
34
+ 53.472572,29.778868,0.76892257,1.3199195,53.472572,0.18676871,8.916557,1.562844,-122.06521,-198.2188,16.895971,-14.970745,430.0307,565000
35
+ 141.30952,36.45471,0.8453834,1.6479328,141.30952,0.16558246,7.2023787,-4.2103944,-123.01116,-202.76141,25.277813,-24.416021,517.7953,570000
36
+ 236.82422,34.09146,0.7810327,1.7124931,236.82422,0.19607496,11.654233,-12.373093,-124.03584,-203.61874,22.996206,-23.239647,579.3907,575000
37
+ 71.19495,54.485897,0.784582,1.6616151,71.19495,0.16492005,5.8231883,2.5909474,-125.45894,-201.69586,13.660369,-17.416079,453.10638,580000
38
+ 135.43332,31.706285,0.8276289,1.7856169,135.43332,0.18574303,10.4809065,-5.4789605,-119.11604,-200.8079,36.15436,-31.452065,555.0348,585000
39
+ 11107.981,43.24849,0.8608014,1.7966231,11107.981,0.17431693,8.99974,-7.6762514,-119.92187,-199.13554,209.87726,-304.13098,4322.2627,590000
40
+ 65.15948,29.16358,0.7870973,1.508655,65.15948,0.16912042,9.501841,-4.308037,-119.44463,-199.11212,12.439478,-11.864088,356.12714,595000
41
+ 225.41008,57.93618,0.83851457,2.286039,225.41008,0.16601261,11.087802,-4.866708,-117.846825,-201.19824,36.81086,-44.482548,705.2883,600000
42
+ 53.65919,35.397846,0.75204784,1.417531,53.65919,0.1617565,9.187911,6.6932297,-119.53625,-200.27304,9.460438,-10.919937,346.2781,605000
43
+ 78.89143,54.695686,0.80115426,1.7950382,78.89143,0.16985641,8.291246,2.5299482,-118.13621,-191.29579,7.8952394,-9.7974205,369.45282,610000
44
+ 162.51306,50.971607,0.90130657,2.1431584,162.51306,0.16641557,9.404892,2.6019385,-121.40039,-201.90442,21.52706,-24.545925,637.68463,615000
45
+ 121.73536,45.375927,0.90850425,2.1753542,121.73536,0.16466206,7.6159472,1.9994882,-116.72394,-194.34999,37.747433,-39.22865,741.2898,620000
46
+ 1572.2479,75.08517,0.88554734,2.7784607,1572.2479,0.17115118,11.109553,0.35834354,-111.790855,-197.93999,39.084076,-38.995834,1021.56775,625000
47
+ 149.74261,53.635105,0.77755827,1.5737491,149.74261,0.16422462,10.437612,-4.941439,-119.67759,-196.3246,15.207573,-15.494997,550.8223,630000
48
+ 115.214424,53.373398,0.8185452,1.91571,115.214424,0.15744674,12.060712,-2.136906,-115.46655,-195.4451,14.476638,-17.81947,579.963,635000
49
+ 109.214424,60.17381,0.8106496,1.7204959,109.214424,0.16897012,13.861101,1.3281,-116.87959,-204.5616,23.783184,-31.577477,576.8968,640000
50
+ 87.35207,36.72392,0.84988666,1.7274338,87.35207,0.16441911,15.559819,-3.9314632,-118.7022,-199.03973,11.80836,-11.010994,418.52057,645000
51
+ 60.336807,33.736324,0.77881926,1.6178837,60.336807,0.17404112,8.651348,-1.8561277,-108.20396,-203.48102,14.184042,-14.00252,410.03357,650000
52
+ 219.70517,48.073303,0.88226295,2.2026227,219.70517,0.21190715,17.498272,-4.3203945,-120.00103,-200.24722,82.567856,-80.48458,909.6892,655000
53
+ 214.61548,53.365513,0.8842369,1.9991301,214.61548,0.20165762,7.5032783,2.637326,-114.63409,-202.52791,29.083536,-30.462141,685.2683,660000
54
+ 77.478424,50.097645,0.80954576,1.7930717,77.478424,0.1751527,12.629466,-4.7822065,-116.21222,-202.4437,11.356047,-10.999591,388.64478,665000
55
+ 98.787224,102.497795,0.92810535,2.7608192,98.787224,0.16610013,13.662272,-5.8530416,-117.78751,-189.79305,47.783813,-50.135857,695.56714,670000
56
+ 111.98629,53.211597,0.87802345,2.0271297,111.98629,0.18979448,7.9366226,-5.677345,-112.83327,-199.41003,12.9851265,-14.167629,415.1293,675000
57
+ 102.288284,44.745937,0.88853896,1.8634785,102.288284,0.17549348,8.231489,-4.953134,-119.046486,-205.13297,17.862284,-19.256863,504.40558,680000
58
+ 128.80757,73.25266,0.95456696,2.567134,128.80757,0.15692025,8.6904545,-3.0060446,-110.05403,-197.1196,13.252465,-22.745546,544.0449,685000
59
+ 117.82396,53.860695,0.8930046,2.0138917,117.82396,0.1537868,11.130305,-1.7845068,-110.05615,-196.57077,40.787548,-37.48084,693.18884,690000
60
+ 105.67265,64.25056,0.7991775,1.9248774,105.67265,0.19052058,12.5813055,0.9990264,-109.53979,-197.85089,30.758734,-31.351265,532.2217,695000
61
+ 73.62953,34.760235,0.82267356,1.7164525,73.62953,0.18141797,9.9320755,-2.0488794,-113.9943,-200.4835,11.280344,-11.289507,434.24002,700000
62
+ 444.0855,34.514256,0.7945845,1.5268414,444.0855,0.16277626,14.190712,3.4057307,-114.49003,-199.43954,35.93206,-34.636364,671.70166,705000
63
+ 155.22147,74.261086,0.89583814,2.3942745,155.22147,0.15872064,14.741773,-7.705519,-112.026245,-202.2133,37.340076,-31.448704,689.2561,710000
64
+ 117.42753,39.231644,0.87228435,1.8751873,117.42753,0.15410128,6.9006805,1.4601039,-113.49617,-195.97632,16.850758,-14.409643,528.2014,715000
65
+ 211.26733,57.51436,0.83794844,1.7964967,211.26733,0.17044975,10.484345,-1.4841467,-114.1947,-202.90932,51.143646,-50.328903,845.9622,720000
66
+ 85.59852,41.39444,0.82458556,1.8794248,85.59852,0.14426851,8.257953,-4.6157484,-110.212,-204.89268,18.17035,-17.893116,539.30115,725000
67
+ 1485.729,40.20817,0.89509964,1.8838731,1485.729,0.16656947,14.3474,0.4780103,-106.90098,-189.0825,90.98428,-84.88474,1534.3496,730000
68
+ 99.83242,53.378242,0.8487402,1.9278957,99.83242,0.16948247,7.79297,-13.728922,-110.24352,-202.52406,21.647297,-20.317188,441.95398,735000
69
+ 99.119194,53.944637,0.78580093,1.7170434,99.119194,0.1416137,12.41339,-0.43244407,-112.47522,-201.63286,22.87611,-23.349527,488.61804,740000
70
+ 275.3968,37.95932,0.9248816,1.9667214,275.3968,0.14355257,10.418777,2.5734255,-115.27844,-196.67198,30.189121,-32.865826,766.7648,745000
71
+ 96.776306,57.63674,0.9066711,2.4694338,96.776306,0.12972793,7.000381,4.001671,-105.165825,-203.95721,33.125443,-40.68482,561.25977,750000
72
+ 147.29152,60.56502,0.8677707,2.15635,147.29152,0.15750909,6.691724,-0.73619205,-111.91869,-203.05545,22.74366,-32.29527,549.895,755000
73
+ 92.904816,34.749973,0.9011559,1.851046,92.904816,0.18954413,8.4139,-2.8444052,-105.158325,-202.7722,31.93391,-28.178223,524.7628,760000
74
+ 78.95353,28.67589,0.8307759,1.502874,78.95353,0.16407743,13.128372,-0.55677605,-110.998535,-203.80725,22.828667,-21.19104,420.0838,765000
75
+ 68.26767,61.82445,0.78049904,1.6376331,68.26767,0.16288455,12.600085,-3.271187,-109.95829,-201.58946,19.885237,-18.122328,529.54535,770000
76
+ 116.234314,65.231674,0.8858239,2.2032328,116.234314,0.14618103,7.3779054,3.7518888,-108.357315,-193.30634,22.849852,-26.34189,564.54047,775000
77
+ 111.56714,61.21972,0.85787445,2.285712,111.56714,0.15923944,5.4256897,-0.7641851,-105.81585,-201.63141,32.201027,-30.683802,638.9723,780000
78
+ 68.94369,36.880203,0.75768495,1.4432372,68.94369,0.17281981,11.3914,0.44302523,-107.02665,-204.0154,15.815756,-15.601738,467.15002,785000
79
+ 97.629456,40.757603,0.8352906,1.800172,97.629456,0.1712864,10.103554,5.6479883,-110.206474,-203.61633,35.11548,-32.41894,561.9246,790000
80
+ 192.9202,159.40433,1.0045291,3.392467,192.9202,0.16091299,10.724608,-2.4582977,-108.288895,-186.4092,66.60034,-61.321022,1030.6265,795000
81
+ 68.384544,30.03999,0.8074574,1.5505537,68.384544,0.15102692,11.174011,-0.6601643,-104.300735,-201.7715,18.700703,-18.958744,476.71872,800000
82
+ 89.29743,37.008118,0.8102723,1.592759,89.29743,0.17262001,7.2873836,2.1533349,-106.88063,-202.33817,30.042044,-24.543226,638.7739,805000
83
+ 1094.1271,74.70503,0.84853834,2.359577,1094.1271,0.1765312,6.900866,1.492358,-109.940384,-197.52808,77.64395,-93.50113,1163.0153,810000
84
+ 89.09611,63.993736,0.85438263,2.134264,89.09611,0.17704964,6.009826,0.19066283,-105.27051,-194.68106,32.047028,-37.26977,520.3405,815000
85
+ 114.73842,54.030552,0.7869628,1.6803685,114.73842,0.16132866,10.160247,0.26987964,-107.96963,-199.6928,18.405111,-21.853361,472.1546,820000
86
+ 132.14291,63.23186,0.92450637,2.251877,132.14291,0.15696986,11.503676,-2.015034,-105.15574,-201.76349,53.167953,-74.20234,723.7092,825000
87
+ 151.47333,70.337746,0.91880506,2.3777988,151.47333,0.16246901,17.1891,-0.19840404,-101.00689,-187.01707,44.254974,-49.985264,658.8837,830000
88
+ 91.03414,95.36042,0.84299123,2.1802638,91.03414,0.16507986,8.553807,-4.105972,-107.19324,-196.59267,14.57362,-15.73753,416.10272,835000
89
+ 91.773705,52.24922,0.8513324,1.918158,91.773705,0.16238584,6.408912,-1.281793,-100.49275,-202.28986,43.152706,-42.90877,841.08936,840000
90
+ 183.94156,71.940544,0.8225818,1.8261507,183.94156,0.14935112,9.79703,-5.6597953,-107.58474,-199.25052,40.100716,-36.082863,706.4858,845000
91
+ 262.8415,51.751534,0.9674818,2.2986205,262.8415,0.16149297,8.430525,-1.9528822,-102.1751,-193.4369,56.013172,-58.15065,1016.97723,850000
92
+ 79.465744,51.969406,0.86491555,1.7832155,79.465744,0.16518033,4.718362,1.7035462,-102.82647,-187.25613,15.611069,-16.11784,442.11792,855000
93
+ 72.28282,36.11667,0.8596591,1.7259125,72.28282,0.15558843,12.240811,-0.22230653,-103.29187,-189.11089,26.20269,-14.263849,536.4213,860000
94
+ 74.21773,31.582613,0.81827384,1.5982858,74.21773,0.14877744,8.29953,-8.29796,-103.80991,-200.83502,14.710085,-16.316425,472.72015,865000
95
+ 129.20549,54.238045,0.76372343,1.6602442,129.20549,0.14603506,9.519709,0.5411986,-103.47544,-198.55577,42.909855,-38.181892,745.5835,870000
96
+ 172.40979,96.06824,0.9197341,2.5109484,172.40979,0.1276635,9.76579,1.5378928,-104.94861,-202.20413,41.657845,-51.197777,703.6059,875000
97
+ 146.2342,51.0099,0.9642503,2.1406536,146.2342,0.16175365,8.873911,1.8397624,-104.49678,-193.4828,57.103577,-50.630272,750.29297,880000
98
+ 134.33023,80.35818,0.950881,2.3958628,134.33023,0.1343015,9.747345,-1.606576,-101.39943,-195.86034,20.560127,-21.113775,555.06134,885000
99
+ 83.67289,62.037334,0.83476377,2.0009582,83.67289,0.15629144,7.0584793,-3.4934356,-99.08268,-195.20522,11.277386,-13.491167,361.20862,890000
100
+ 91.766205,41.192978,0.8217626,1.6899042,91.766205,0.12320092,7.849726,5.2755256,-95.58921,-201.87364,42.74396,-37.305283,710.4884,895000
101
+ 158.59805,58.72584,0.96264285,2.143373,158.59805,0.15878642,6.490504,-2.6413412,-97.490105,-202.4374,13.267875,-12.019755,508.95087,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/adj_loss,actor/adj_max,actor/adj_mean,actor/adj_std,actor/fast_loss,actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 86.76055,49.861343,0.7707269,1.9539603,86.76055,0.19666895,10.385406,-53.113827,-154.51414,-203.27692,10.19539,-9.1399555,385.02078,405000
3
+ 48.539413,19.55403,0.63407737,1.2433679,48.539413,0.1920048,8.542559,-43.776485,-151.97423,-201.05693,7.0402575,-7.0290394,323.6214,410000
4
+ 2004.3916,37.884445,0.8076503,1.8904638,2004.3916,0.20436707,8.311284,-45.20519,-146.6446,-202.72662,47.575886,-50.516747,920.4609,415000
5
+ 193.10661,58.378536,0.8596481,2.1484008,193.10661,0.17471789,10.82828,-25.147114,-145.7794,-204.58176,11.669531,-16.094416,486.02808,420000
6
+ 251.25024,36.26434,0.7655731,1.5405751,251.25024,0.1979292,8.145107,-28.126,-142.41824,-205.6413,46.625366,-36.459736,716.5912,425000
7
+ 167.2634,49.49997,0.8207501,1.7801094,167.2634,0.19358754,13.692172,-5.031059,-141.46605,-204.27429,24.445301,-23.931833,607.86414,430000
8
+ 322.48798,68.505516,0.8921101,2.1750078,322.48798,0.16801569,9.738695,-3.4721322,-141.32384,-203.74269,33.009987,-35.674694,661.16693,435000
9
+ 131.8713,78.030716,0.83360624,1.9946803,131.8713,0.20521924,11.480783,-13.639171,-140.31654,-204.0829,14.023985,-14.000687,469.03534,440000
10
+ 153.56944,43.687527,0.90746987,2.3212888,153.56944,0.18083999,14.553995,-44.577194,-140.98058,-205.3806,27.615467,-24.96814,518.81757,445000
11
+ 262.27997,53.152508,0.82393646,1.9804348,262.27997,0.17297733,11.6861315,-5.831638,-138.01659,-201.86264,80.0005,-87.84236,1080.9366,450000
12
+ 145.64963,34.21648,0.8749255,1.8952103,145.64963,0.19335562,16.078495,-16.628712,-136.67393,-204.1581,17.493553,-23.533833,456.63998,455000
13
+ 191.65433,45.62201,0.7913238,1.7571174,191.65433,0.21365204,14.673685,-8.181197,-133.13762,-203.70212,34.182434,-41.5903,738.6018,460000
14
+ 183.56538,60.963543,0.90161955,2.3571253,183.56538,0.16566738,12.603721,-21.388607,-134.91492,-204.65512,29.759548,-35.906067,607.17664,465000
15
+ 95.85333,44.90395,0.86582726,1.8071203,95.85333,0.19787367,10.809168,-30.677471,-130.87431,-204.68475,12.345491,-13.247326,409.80798,470000
16
+ 124.46897,72.116844,0.8378605,2.0972788,124.46897,0.18534864,11.361556,-4.922303,-133.46776,-206.1163,28.215479,-23.999641,512.9966,475000
17
+ 220.37343,52.287247,0.8305226,1.7476124,220.37343,0.19430783,8.615044,-8.373473,-132.4973,-203.30751,56.18585,-59.548523,986.3743,480000
18
+ 166.44421,49.319817,0.7845539,1.7455887,166.44421,0.15435845,10.494006,-7.5985575,-131.03763,-204.17188,9.891394,-12.056726,459.18707,485000
19
+ 170.4057,57.12674,0.7864415,1.6727812,170.4057,0.17337225,10.395865,-12.12813,-131.19551,-204.27066,38.169777,-44.52569,638.95483,490000
20
+ 376.91724,59.710796,0.82769376,2.007429,376.91724,0.16940233,7.6939683,-12.047846,-130.9403,-204.10411,43.023495,-55.12059,800.7657,495000
21
+ 252.10968,41.04834,0.8416476,1.8681723,252.10968,0.17287064,17.669851,-14.048727,-125.58013,-203.14201,11.117022,-11.196056,489.71884,500000
22
+ 167.95314,57.593372,1.0041864,2.3973758,167.95314,0.19690216,16.935734,-3.910102,-131.06047,-204.23686,21.324236,-26.239773,547.6936,505000
23
+ 148.11151,30.559856,0.7769653,1.5532324,148.11151,0.21604237,9.273035,-7.024894,-126.65684,-201.46051,24.74365,-17.693644,454.0313,510000
24
+ 118.17131,49.870564,0.80726683,1.844088,118.17131,0.16739662,10.562599,1.3522202,-125.19375,-199.65826,15.727909,-13.741228,454.8081,515000
25
+ 90.891426,50.959164,0.80113477,1.9999256,90.891426,0.16837241,11.821422,-4.2139416,-126.58099,-201.88377,12.378007,-16.504837,453.60956,520000
26
+ 105.64703,52.17998,0.8396826,1.9652401,105.64703,0.18844861,12.123694,-7.132643,-131.00829,-201.36742,15.913022,-14.301994,505.20294,525000
27
+ 2824.5752,97.15428,0.93127424,2.6820102,2824.5752,0.17798367,6.9892335,-10.505265,-129.2521,-200.17354,64.79989,-62.840317,1141.9713,530000
28
+ 148.57877,84.13823,0.84770125,2.128266,148.57877,0.21422404,9.153096,3.5068667,-126.36841,-203.8383,29.736588,-22.527374,712.939,535000
29
+ 86.157196,32.91439,0.77671176,1.5137819,86.157196,0.15359977,13.352674,-7.597601,-121.04508,-195.09772,12.89443,-15.036761,461.3312,540000
30
+ 325.28128,24.25648,0.79467016,1.5356939,325.28128,0.188502,9.114272,-4.2086234,-125.936455,-200.29196,19.64609,-19.542809,599.65405,545000
31
+ 98.81268,45.281364,0.9166644,2.2224672,98.81268,0.15397128,8.221522,-10.317914,-126.81907,-202.9265,23.282362,-21.25297,488.44702,550000
32
+ 74.271126,82.07189,0.7588385,2.14183,74.271126,0.19408485,5.326196,-3.4962926,-122.816826,-198.06873,21.510199,-22.886654,441.48483,555000
33
+ 206.77046,65.97543,0.8321261,1.9983091,206.77046,0.16807464,13.430371,-0.78099996,-124.67468,-204.83952,50.892185,-63.840252,821.8871,560000
34
+ 53.472572,29.778868,0.76892257,1.3199195,53.472572,0.18676871,8.916557,1.562844,-122.06521,-198.2188,16.895971,-14.970745,430.0307,565000
35
+ 141.30952,36.45471,0.8453834,1.6479328,141.30952,0.16558246,7.2023787,-4.2103944,-123.01116,-202.76141,25.277813,-24.416021,517.7953,570000
36
+ 236.82422,34.09146,0.7810327,1.7124931,236.82422,0.19607496,11.654233,-12.373093,-124.03584,-203.61874,22.996206,-23.239647,579.3907,575000
37
+ 71.19495,54.485897,0.784582,1.6616151,71.19495,0.16492005,5.8231883,2.5909474,-125.45894,-201.69586,13.660369,-17.416079,453.10638,580000
38
+ 135.43332,31.706285,0.8276289,1.7856169,135.43332,0.18574303,10.4809065,-5.4789605,-119.11604,-200.8079,36.15436,-31.452065,555.0348,585000
39
+ 11107.981,43.24849,0.8608014,1.7966231,11107.981,0.17431693,8.99974,-7.6762514,-119.92187,-199.13554,209.87726,-304.13098,4322.2627,590000
40
+ 65.15948,29.16358,0.7870973,1.508655,65.15948,0.16912042,9.501841,-4.308037,-119.44463,-199.11212,12.439478,-11.864088,356.12714,595000
41
+ 225.41008,57.93618,0.83851457,2.286039,225.41008,0.16601261,11.087802,-4.866708,-117.846825,-201.19824,36.81086,-44.482548,705.2883,600000
42
+ 53.65919,35.397846,0.75204784,1.417531,53.65919,0.1617565,9.187911,6.6932297,-119.53625,-200.27304,9.460438,-10.919937,346.2781,605000
43
+ 78.89143,54.695686,0.80115426,1.7950382,78.89143,0.16985641,8.291246,2.5299482,-118.13621,-191.29579,7.8952394,-9.7974205,369.45282,610000
44
+ 162.51306,50.971607,0.90130657,2.1431584,162.51306,0.16641557,9.404892,2.6019385,-121.40039,-201.90442,21.52706,-24.545925,637.68463,615000
45
+ 121.73536,45.375927,0.90850425,2.1753542,121.73536,0.16466206,7.6159472,1.9994882,-116.72394,-194.34999,37.747433,-39.22865,741.2898,620000
46
+ 1572.2479,75.08517,0.88554734,2.7784607,1572.2479,0.17115118,11.109553,0.35834354,-111.790855,-197.93999,39.084076,-38.995834,1021.56775,625000
47
+ 149.74261,53.635105,0.77755827,1.5737491,149.74261,0.16422462,10.437612,-4.941439,-119.67759,-196.3246,15.207573,-15.494997,550.8223,630000
48
+ 115.214424,53.373398,0.8185452,1.91571,115.214424,0.15744674,12.060712,-2.136906,-115.46655,-195.4451,14.476638,-17.81947,579.963,635000
49
+ 109.214424,60.17381,0.8106496,1.7204959,109.214424,0.16897012,13.861101,1.3281,-116.87959,-204.5616,23.783184,-31.577477,576.8968,640000
50
+ 87.35207,36.72392,0.84988666,1.7274338,87.35207,0.16441911,15.559819,-3.9314632,-118.7022,-199.03973,11.80836,-11.010994,418.52057,645000
51
+ 60.336807,33.736324,0.77881926,1.6178837,60.336807,0.17404112,8.651348,-1.8561277,-108.20396,-203.48102,14.184042,-14.00252,410.03357,650000
52
+ 219.70517,48.073303,0.88226295,2.2026227,219.70517,0.21190715,17.498272,-4.3203945,-120.00103,-200.24722,82.567856,-80.48458,909.6892,655000
53
+ 214.61548,53.365513,0.8842369,1.9991301,214.61548,0.20165762,7.5032783,2.637326,-114.63409,-202.52791,29.083536,-30.462141,685.2683,660000
54
+ 77.478424,50.097645,0.80954576,1.7930717,77.478424,0.1751527,12.629466,-4.7822065,-116.21222,-202.4437,11.356047,-10.999591,388.64478,665000
55
+ 98.787224,102.497795,0.92810535,2.7608192,98.787224,0.16610013,13.662272,-5.8530416,-117.78751,-189.79305,47.783813,-50.135857,695.56714,670000
56
+ 111.98629,53.211597,0.87802345,2.0271297,111.98629,0.18979448,7.9366226,-5.677345,-112.83327,-199.41003,12.9851265,-14.167629,415.1293,675000
57
+ 102.288284,44.745937,0.88853896,1.8634785,102.288284,0.17549348,8.231489,-4.953134,-119.046486,-205.13297,17.862284,-19.256863,504.40558,680000
58
+ 128.80757,73.25266,0.95456696,2.567134,128.80757,0.15692025,8.6904545,-3.0060446,-110.05403,-197.1196,13.252465,-22.745546,544.0449,685000
59
+ 117.82396,53.860695,0.8930046,2.0138917,117.82396,0.1537868,11.130305,-1.7845068,-110.05615,-196.57077,40.787548,-37.48084,693.18884,690000
60
+ 105.67265,64.25056,0.7991775,1.9248774,105.67265,0.19052058,12.5813055,0.9990264,-109.53979,-197.85089,30.758734,-31.351265,532.2217,695000
61
+ 73.62953,34.760235,0.82267356,1.7164525,73.62953,0.18141797,9.9320755,-2.0488794,-113.9943,-200.4835,11.280344,-11.289507,434.24002,700000
62
+ 444.0855,34.514256,0.7945845,1.5268414,444.0855,0.16277626,14.190712,3.4057307,-114.49003,-199.43954,35.93206,-34.636364,671.70166,705000
63
+ 155.22147,74.261086,0.89583814,2.3942745,155.22147,0.15872064,14.741773,-7.705519,-112.026245,-202.2133,37.340076,-31.448704,689.2561,710000
64
+ 117.42753,39.231644,0.87228435,1.8751873,117.42753,0.15410128,6.9006805,1.4601039,-113.49617,-195.97632,16.850758,-14.409643,528.2014,715000
65
+ 211.26733,57.51436,0.83794844,1.7964967,211.26733,0.17044975,10.484345,-1.4841467,-114.1947,-202.90932,51.143646,-50.328903,845.9622,720000
66
+ 85.59852,41.39444,0.82458556,1.8794248,85.59852,0.14426851,8.257953,-4.6157484,-110.212,-204.89268,18.17035,-17.893116,539.30115,725000
67
+ 1485.729,40.20817,0.89509964,1.8838731,1485.729,0.16656947,14.3474,0.4780103,-106.90098,-189.0825,90.98428,-84.88474,1534.3496,730000
68
+ 99.83242,53.378242,0.8487402,1.9278957,99.83242,0.16948247,7.79297,-13.728922,-110.24352,-202.52406,21.647297,-20.317188,441.95398,735000
69
+ 99.119194,53.944637,0.78580093,1.7170434,99.119194,0.1416137,12.41339,-0.43244407,-112.47522,-201.63286,22.87611,-23.349527,488.61804,740000
70
+ 275.3968,37.95932,0.9248816,1.9667214,275.3968,0.14355257,10.418777,2.5734255,-115.27844,-196.67198,30.189121,-32.865826,766.7648,745000
71
+ 96.776306,57.63674,0.9066711,2.4694338,96.776306,0.12972793,7.000381,4.001671,-105.165825,-203.95721,33.125443,-40.68482,561.25977,750000
72
+ 147.29152,60.56502,0.8677707,2.15635,147.29152,0.15750909,6.691724,-0.73619205,-111.91869,-203.05545,22.74366,-32.29527,549.895,755000
73
+ 92.904816,34.749973,0.9011559,1.851046,92.904816,0.18954413,8.4139,-2.8444052,-105.158325,-202.7722,31.93391,-28.178223,524.7628,760000
74
+ 78.95353,28.67589,0.8307759,1.502874,78.95353,0.16407743,13.128372,-0.55677605,-110.998535,-203.80725,22.828667,-21.19104,420.0838,765000
75
+ 68.26767,61.82445,0.78049904,1.6376331,68.26767,0.16288455,12.600085,-3.271187,-109.95829,-201.58946,19.885237,-18.122328,529.54535,770000
76
+ 116.234314,65.231674,0.8858239,2.2032328,116.234314,0.14618103,7.3779054,3.7518888,-108.357315,-193.30634,22.849852,-26.34189,564.54047,775000
77
+ 111.56714,61.21972,0.85787445,2.285712,111.56714,0.15923944,5.4256897,-0.7641851,-105.81585,-201.63141,32.201027,-30.683802,638.9723,780000
78
+ 68.94369,36.880203,0.75768495,1.4432372,68.94369,0.17281981,11.3914,0.44302523,-107.02665,-204.0154,15.815756,-15.601738,467.15002,785000
79
+ 97.629456,40.757603,0.8352906,1.800172,97.629456,0.1712864,10.103554,5.6479883,-110.206474,-203.61633,35.11548,-32.41894,561.9246,790000
80
+ 192.9202,159.40433,1.0045291,3.392467,192.9202,0.16091299,10.724608,-2.4582977,-108.288895,-186.4092,66.60034,-61.321022,1030.6265,795000
81
+ 68.384544,30.03999,0.8074574,1.5505537,68.384544,0.15102692,11.174011,-0.6601643,-104.300735,-201.7715,18.700703,-18.958744,476.71872,800000
82
+ 89.29743,37.008118,0.8102723,1.592759,89.29743,0.17262001,7.2873836,2.1533349,-106.88063,-202.33817,30.042044,-24.543226,638.7739,805000
83
+ 1094.1271,74.70503,0.84853834,2.359577,1094.1271,0.1765312,6.900866,1.492358,-109.940384,-197.52808,77.64395,-93.50113,1163.0153,810000
84
+ 89.09611,63.993736,0.85438263,2.134264,89.09611,0.17704964,6.009826,0.19066283,-105.27051,-194.68106,32.047028,-37.26977,520.3405,815000
85
+ 114.73842,54.030552,0.7869628,1.6803685,114.73842,0.16132866,10.160247,0.26987964,-107.96963,-199.6928,18.405111,-21.853361,472.1546,820000
86
+ 132.14291,63.23186,0.92450637,2.251877,132.14291,0.15696986,11.503676,-2.015034,-105.15574,-201.76349,53.167953,-74.20234,723.7092,825000
87
+ 151.47333,70.337746,0.91880506,2.3777988,151.47333,0.16246901,17.1891,-0.19840404,-101.00689,-187.01707,44.254974,-49.985264,658.8837,830000
88
+ 91.03414,95.36042,0.84299123,2.1802638,91.03414,0.16507986,8.553807,-4.105972,-107.19324,-196.59267,14.57362,-15.73753,416.10272,835000
89
+ 91.773705,52.24922,0.8513324,1.918158,91.773705,0.16238584,6.408912,-1.281793,-100.49275,-202.28986,43.152706,-42.90877,841.08936,840000
90
+ 183.94156,71.940544,0.8225818,1.8261507,183.94156,0.14935112,9.79703,-5.6597953,-107.58474,-199.25052,40.100716,-36.082863,706.4858,845000
91
+ 262.8415,51.751534,0.9674818,2.2986205,262.8415,0.16149297,8.430525,-1.9528822,-102.1751,-193.4369,56.013172,-58.15065,1016.97723,850000
92
+ 79.465744,51.969406,0.86491555,1.7832155,79.465744,0.16518033,4.718362,1.7035462,-102.82647,-187.25613,15.611069,-16.11784,442.11792,855000
93
+ 72.28282,36.11667,0.8596591,1.7259125,72.28282,0.15558843,12.240811,-0.22230653,-103.29187,-189.11089,26.20269,-14.263849,536.4213,860000
94
+ 74.21773,31.582613,0.81827384,1.5982858,74.21773,0.14877744,8.29953,-8.29796,-103.80991,-200.83502,14.710085,-16.316425,472.72015,865000
95
+ 129.20549,54.238045,0.76372343,1.6602442,129.20549,0.14603506,9.519709,0.5411986,-103.47544,-198.55577,42.909855,-38.181892,745.5835,870000
96
+ 172.40979,96.06824,0.9197341,2.5109484,172.40979,0.1276635,9.76579,1.5378928,-104.94861,-202.20413,41.657845,-51.197777,703.6059,875000
97
+ 146.2342,51.0099,0.9642503,2.1406536,146.2342,0.16175365,8.873911,1.8397624,-104.49678,-193.4828,57.103577,-50.630272,750.29297,880000
98
+ 134.33023,80.35818,0.950881,2.3958628,134.33023,0.1343015,9.747345,-1.606576,-101.39943,-195.86034,20.560127,-21.113775,555.06134,885000
99
+ 83.67289,62.037334,0.83476377,2.0009582,83.67289,0.15629144,7.0584793,-3.4934356,-99.08268,-195.20522,11.277386,-13.491167,361.20862,890000
100
+ 91.766205,41.192978,0.8217626,1.6899042,91.766205,0.12320092,7.849726,5.2755256,-95.58921,-201.87364,42.74396,-37.305283,710.4884,895000
101
+ 158.59805,58.72584,0.96264285,2.143373,158.59805,0.15878642,6.490504,-2.6413412,-97.490105,-202.4374,13.267875,-12.019755,508.95087,900000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54bdb026738322ab50eccb84ac0c7a0fd50666687ebf1a1b55b6c0c0e5e8a764
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549bea0380ffff114db53f35125f922ad6d7b317dab35d2eed7b51a2f7310a6e
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5bff9209a565bd13873edbb2d616f8549cfc39a9021a08657dc6b076a97e3ec
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a4e0098353eb6dc4dad68367a42db6e949df9c73750082ed412c2cf8e078e88
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:565b8e15bd76e2a566cd7e00f58e6f5a101bc1939fbd8aff7a02b00e71cb4134
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d896e2ec95f28f628bbeea568f8af91c89c3a45d568dce70316781ef270374c
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f75ff25ffc1cd7bb67b7c57640a0f928539bfb9732fe013a3ea161ba58cbec0
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:186e606d3b75e57f6ebd5cf9e29425f17d860c4191e9835ef27a95caf8139f2c
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9868cf38c265b11444316da2cfacc3be5165a25441ae17e99ec468afffe036f9
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b278a08f7a6f880f9e4ed42c8cd49612d3b0a4ce49576b60c1abb02b0769e8c
3
+ size 237984512
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/qam/20260319_080410/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/ed0tbmxm