Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1050000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1100000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0380179015797789,-0.00034942582813032326,-0.037502913899701604,0.0013935657645997928,24.489975697758204,10.00599999999905,0.76,5413.4,-0.28,-264.56,198.12,0.6001528549194336,650000
|
| 3 |
+
0.0,0.0,-0.04268233709771587,0.010527678019802037,-0.04209875798608167,-0.008928001203662212,29.0150279364035,9.191999999999279,0.78,14454.7,-0.28,-259.1,181.84,0.5735257768630981,700000
|
| 4 |
+
0.0,0.0,-0.04116180386027787,0.03627008925560146,-0.038882874330046065,0.030177844787185142,33.31086594858332,5.32099999999975,0.94,22065.04,-0.08,-146.02,104.42,0.33108964920043943,750000
|
| 5 |
+
0.0,0.0,-0.0792806951601339,0.047354595808763375,-0.07664137220006685,0.043021360085334324,33.747141803533815,4.652999999999777,0.94,27085.26,-0.08,-131.68,91.06,0.2994532108306885,800000
|
| 6 |
+
0.0,0.0,-0.059201509044742896,0.05044207060360424,-0.05639898319938114,0.04689336488522902,34.82636057388165,4.132999999999737,0.94,31482.88,-0.08,-119.6,80.66,0.26908241271972655,850000
|
| 7 |
+
0.0,0.0,-0.06074725754530125,0.05041782906927206,-0.05819743436799442,0.03607675465334038,33.87545859778418,3.39899999999984,0.98,35337.78,-0.02,-93.78,65.98,0.22236245155334472,900000
|
| 8 |
+
0.0,0.0,-0.0660211772872667,0.04924943851314269,-0.06355397334461593,0.03830256163854864,34.132775266739095,3.143999999999865,0.98,38241.24,-0.02,-84.46,60.88,0.22342996120452882,950000
|
| 9 |
+
0.0,0.0,-0.06614612979489382,0.05058609818540884,-0.06368615504449532,0.029640243935819228,33.59772555701199,4.231999999999796,0.94,42079.84,-0.08,-113.06,82.64,0.2723376131057739,1000000
|
| 10 |
+
0.0,0.0,-0.06485192787910284,0.04799759480846279,-0.062065081429655056,0.053987237747640755,34.457481198056016,2.9669999999998846,0.98,45676.04,-0.02,-89.86,57.34,0.19874478816986085,1050000
|
| 11 |
+
0.0,0.0,-0.07557052008065,0.0696740246224775,-0.0719038401043174,0.07736549782891781,33.848647564794376,2.520999999999944,1.0,48466.7,0.0,-71.32,48.42,0.16940658569335937,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.0380179015797789,-0.00034942582813032326,-0.037502913899701604,0.0013935657645997928,24.489975697758204,10.00599999999905,0.76,5413.4,-0.28,-264.56,198.12,0.6001528549194336,650000
|
| 3 |
+
0.0,0.0,-0.04268233709771587,0.010527678019802037,-0.04209875798608167,-0.008928001203662212,29.0150279364035,9.191999999999279,0.78,14454.7,-0.28,-259.1,181.84,0.5735257768630981,700000
|
| 4 |
+
0.0,0.0,-0.04116180386027787,0.03627008925560146,-0.038882874330046065,0.030177844787185142,33.31086594858332,5.32099999999975,0.94,22065.04,-0.08,-146.02,104.42,0.33108964920043943,750000
|
| 5 |
+
0.0,0.0,-0.0792806951601339,0.047354595808763375,-0.07664137220006685,0.043021360085334324,33.747141803533815,4.652999999999777,0.94,27085.26,-0.08,-131.68,91.06,0.2994532108306885,800000
|
| 6 |
+
0.0,0.0,-0.059201509044742896,0.05044207060360424,-0.05639898319938114,0.04689336488522902,34.82636057388165,4.132999999999737,0.94,31482.88,-0.08,-119.6,80.66,0.26908241271972655,850000
|
| 7 |
+
0.0,0.0,-0.06074725754530125,0.05041782906927206,-0.05819743436799442,0.03607675465334038,33.87545859778418,3.39899999999984,0.98,35337.78,-0.02,-93.78,65.98,0.22236245155334472,900000
|
| 8 |
+
0.0,0.0,-0.0660211772872667,0.04924943851314269,-0.06355397334461593,0.03830256163854864,34.132775266739095,3.143999999999865,0.98,38241.24,-0.02,-84.46,60.88,0.22342996120452882,950000
|
| 9 |
+
0.0,0.0,-0.06614612979489382,0.05058609818540884,-0.06368615504449532,0.029640243935819228,33.59772555701199,4.231999999999796,0.94,42079.84,-0.08,-113.06,82.64,0.2723376131057739,1000000
|
| 10 |
+
0.0,0.0,-0.06485192787910284,0.04799759480846279,-0.062065081429655056,0.053987237747640755,34.457481198056016,2.9669999999998846,0.98,45676.04,-0.02,-89.86,57.34,0.19874478816986085,1050000
|
| 11 |
+
0.0,0.0,-0.07557052008065,0.0696740246224775,-0.0719038401043174,0.07736549782891781,33.848647564794376,2.520999999999944,1.0,48466.7,0.0,-71.32,48.42,0.16940658569335937,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.024815034,2.4815035,1.0248151,0.3666931,-24.198751,-102.884926,-181.20018,0.19193716,-0.11091934,8.51194,605000
|
| 3 |
+
1.0,0.99999994,0.024872595,2.4872594,1.0248725,0.68319535,-19.728884,-102.68652,-174.64014,0.24901415,-0.22656584,11.091871,610000
|
| 4 |
+
1.0,0.99999994,0.02203678,2.2036781,1.0220367,0.8408438,-27.068047,-106.19684,-178.91734,0.18771432,-0.24076296,10.36423,615000
|
| 5 |
+
1.0,1.0,0.0208416,2.0841599,1.0208416,0.78311414,-20.8429,-107.599686,-191.68127,0.08344711,-0.12342457,8.493226,620000
|
| 6 |
+
1.0,1.0,0.02146972,2.146972,1.0214697,0.8043398,-38.866932,-108.75793,-189.0563,0.2235443,-0.13419862,10.498583,625000
|
| 7 |
+
1.0,1.0000001,0.021569917,2.1569917,1.0215701,0.83385605,-26.861532,-107.46399,-190.09727,0.1582477,-0.21159212,12.572064,630000
|
| 8 |
+
1.0,1.0,0.02338985,2.3389852,1.0233898,1.016264,-23.10069,-106.79955,-190.65068,0.55849355,-0.6607512,20.200058,635000
|
| 9 |
+
1.0,1.0,0.02347282,2.347282,1.0234728,1.3089417,-15.030339,-105.025475,-177.88438,0.89134127,-0.9374014,20.773636,640000
|
| 10 |
+
1.0,1.0,0.02202149,2.202149,1.0220215,1.0443696,-2.1652534,-105.6617,-202.48274,0.26967785,-0.13954163,13.495289,645000
|
| 11 |
+
1.0,1.0,0.025514234,2.5514235,1.0255142,2.0007029,-22.345577,-105.3116,-177.83101,0.49798405,-0.52658194,28.483624,650000
|
| 12 |
+
1.0,0.99999994,0.025430828,2.543083,1.0254308,1.289069,-25.627003,-104.16801,-190.30298,0.2734816,-0.26137617,16.549225,655000
|
| 13 |
+
1.0,1.0,0.025059368,2.5059366,1.0250593,1.237017,-10.044821,-99.13094,-185.25066,0.16622026,-0.238983,13.488863,660000
|
| 14 |
+
1.0,0.99999994,0.02396392,2.396392,1.0239638,1.1224693,-9.493827,-98.65179,-195.79085,0.19118328,-0.19028684,12.278523,665000
|
| 15 |
+
1.0,0.99999994,0.026226591,2.6226592,1.0262265,1.2415612,-7.5872555,-94.62333,-203.84235,0.16700162,-0.19428472,13.815616,670000
|
| 16 |
+
1.0,1.0,0.027785927,2.7785928,1.0277859,1.2928694,-11.749939,-97.796684,-185.42088,0.29437864,-0.23840144,18.380318,675000
|
| 17 |
+
1.0,0.99999994,0.028133925,2.8133926,1.0281339,1.2490613,-12.333711,-97.913605,-186.01971,0.24529383,-0.21620011,15.772633,680000
|
| 18 |
+
1.0,0.99999994,0.026637925,2.6637926,1.0266379,1.284335,-5.4739394,-94.723236,-189.5096,0.1552522,-0.22890593,17.811432,685000
|
| 19 |
+
1.0,1.0,0.027797244,2.7797246,1.0277972,1.8961948,-11.311711,-95.13237,-193.09128,0.37339672,-0.36991754,22.394474,690000
|
| 20 |
+
1.0,1.0,0.0290201,2.90201,1.0290201,1.2066398,-4.1415315,-94.6806,-199.86206,0.38267502,-0.20759256,19.022984,695000
|
| 21 |
+
1.0,1.0,0.025870197,2.58702,1.0258702,1.4049101,-0.597336,-89.364494,-170.3079,0.34688452,-0.42954943,22.302704,700000
|
| 22 |
+
1.0,1.0,0.028702859,2.870286,1.0287029,0.8554718,-21.083527,-95.6017,-179.14592,0.12138721,-0.21362394,11.400747,705000
|
| 23 |
+
1.0,1.0,0.027738169,2.773817,1.0277382,1.7025633,-11.445053,-92.478874,-180.1325,0.26024923,-0.19330414,18.128498,710000
|
| 24 |
+
1.0,0.9999515,0.026800107,2.6800108,1.0267516,1.4594078,1.4997178,-89.46349,-171.0341,1.2200351,-0.97659326,41.037106,715000
|
| 25 |
+
1.0,1.0000001,0.02772373,2.772373,1.0277238,1.6300217,-1.2981927,-88.589775,-160.89142,0.34486604,-0.68273026,24.284918,720000
|
| 26 |
+
1.0,1.0,0.028543115,2.8543115,1.0285431,1.075097,-13.743146,-92.93043,-181.75014,0.5752878,-0.55788195,17.979618,725000
|
| 27 |
+
1.0,1.0,0.027695708,2.7695708,1.0276957,1.3717239,-4.669609,-89.76309,-178.93031,0.33333752,-0.32401228,21.266794,730000
|
| 28 |
+
1.0,0.9999321,0.027869256,2.7869258,1.0278014,0.8543068,2.2758615,-88.905495,-170.26028,0.084789716,-0.1479711,9.450944,735000
|
| 29 |
+
1.0,1.0,0.029665526,2.9665527,1.0296655,2.408781,-7.0499196,-85.098915,-179.44843,0.54007787,-0.3435824,31.778362,740000
|
| 30 |
+
1.0,0.9999999,0.03092987,3.092987,1.0309298,1.8018528,-5.8581967,-89.693184,-198.16058,0.3735438,-0.32709354,26.693243,745000
|
| 31 |
+
1.0,1.0000001,0.0274479,2.74479,1.027448,1.1101294,-4.780729,-89.27441,-187.33295,0.17227732,-0.18912518,14.403259,750000
|
| 32 |
+
1.0,1.0,0.027567178,2.756718,1.0275671,0.97082615,1.5211284,-85.77029,-175.45271,0.18404084,-0.18975538,13.6040325,755000
|
| 33 |
+
1.0,0.9999866,0.028530037,2.853004,1.0285167,1.3774571,-4.649334,-89.181526,-194.8292,0.24975877,-0.24696442,18.680586,760000
|
| 34 |
+
1.0,1.0,0.029020157,2.902016,1.0290202,2.34171,-2.6184754,-88.470726,-172.51056,0.35466298,-0.53605914,29.614685,765000
|
| 35 |
+
1.0,1.0,0.029962573,2.9962575,1.0299625,1.1217546,-2.5699265,-83.64429,-184.14706,0.40592235,-0.17907876,15.705631,770000
|
| 36 |
+
1.0,1.0,0.028588535,2.8588536,1.0285885,1.4029318,-3.7928474,-89.63704,-194.04607,0.4912306,-0.41175148,21.64424,775000
|
| 37 |
+
1.0,0.99998796,0.028244566,2.8244565,1.0282326,1.0526441,3.3391223,-87.377396,-192.05365,0.20857796,-0.28159177,15.165477,780000
|
| 38 |
+
1.0,1.0,0.028367361,2.8367362,1.0283674,1.275322,0.3695038,-85.344475,-161.4191,0.1548892,-0.32059366,16.406881,785000
|
| 39 |
+
1.0,0.99999994,0.026297692,2.6297693,1.0262977,1.2674353,-6.5713215,-84.211464,-199.8247,0.27791992,-0.24333303,16.590584,790000
|
| 40 |
+
1.0,1.0,0.028843787,2.884379,1.0288438,1.744681,-2.2924156,-85.65918,-201.58391,1.156159,-1.0087198,37.487507,795000
|
| 41 |
+
1.0,0.9999999,0.03015241,3.0152414,1.0301523,1.5797462,2.9944963,-83.35614,-198.12369,0.36500883,-0.369054,20.69853,800000
|
| 42 |
+
1.0,1.0,0.029135026,2.9135027,1.029135,0.93589383,-5.7925487,-80.96902,-172.02705,0.3285348,-0.14963108,17.429224,805000
|
| 43 |
+
1.0,0.99999994,0.029536318,2.9536319,1.0295362,1.146423,-3.263936,-82.45394,-162.41779,0.33632,-0.31252956,16.880117,810000
|
| 44 |
+
1.0,1.0,0.03174019,3.1740189,1.0317402,2.3784883,1.434686,-83.948784,-165.7096,0.28298655,-0.22330444,22.354568,815000
|
| 45 |
+
1.0,1.0000001,0.029892066,2.9892068,1.0298922,1.678744,-2.1017718,-82.83461,-190.99829,0.11997774,-0.22886154,14.92853,820000
|
| 46 |
+
1.0,0.99999994,0.028205942,2.8205943,1.0282059,1.4769353,-2.5888424,-80.78572,-171.09837,0.4074059,-0.4009019,17.801382,825000
|
| 47 |
+
1.0,1.0,0.03125038,3.1250384,1.0312504,1.2141228,1.0687292,-82.23925,-159.53119,0.39669502,-0.39710626,15.653326,830000
|
| 48 |
+
1.0,0.9999999,0.027710889,2.7710886,1.0277108,2.6160824,-0.023082525,-80.552284,-165.16473,0.7412218,-0.27758107,34.688004,835000
|
| 49 |
+
1.0,0.9999999,0.029112386,2.9112387,1.0291122,0.9875744,1.927965,-79.79832,-192.95631,0.32844037,-0.114079244,13.376781,840000
|
| 50 |
+
1.0,1.0,0.03093367,3.093367,1.0309336,0.88982075,-0.843024,-82.73107,-170.51042,0.10912285,-0.1234206,10.806158,845000
|
| 51 |
+
1.0,1.0,0.027890356,2.7890356,1.0278903,1.660792,-4.364303,-75.46258,-188.57376,0.37819412,-0.40284482,23.890484,850000
|
| 52 |
+
1.0,1.0,0.029946357,2.994636,1.0299463,0.999986,-4.896181,-81.95036,-160.58205,0.1851584,-0.23036225,11.567949,855000
|
| 53 |
+
1.0,1.0,0.030525722,3.0525723,1.0305257,0.9974746,1.9100163,-79.87445,-164.50127,0.18420653,-0.25841975,14.637952,860000
|
| 54 |
+
1.0,1.0,0.029138573,2.9138575,1.0291386,2.4730167,0.22859217,-78.39559,-196.05235,0.952238,-0.9062966,45.682804,865000
|
| 55 |
+
1.0,1.0,0.030512689,3.051269,1.0305127,6.504473,-3.7329664,-81.2477,-161.78123,1.0812693,-0.8129737,67.11237,870000
|
| 56 |
+
1.0,1.0,0.029420162,2.9420161,1.0294201,1.2710308,-0.3803721,-78.227135,-198.60483,0.38114265,-0.42623514,24.486631,875000
|
| 57 |
+
1.0,0.9999003,0.030607376,3.0607378,1.0305077,0.9299766,-4.9270887,-78.18602,-167.58418,0.21976577,-0.28166535,12.981388,880000
|
| 58 |
+
1.0,1.0000001,0.029157545,2.9157546,1.0291576,1.4415811,1.924162,-76.013084,-165.07925,0.33494204,-0.31407282,19.635735,885000
|
| 59 |
+
1.0,1.0,0.030164275,3.0164278,1.0301642,3.228233,-1.6272675,-73.776855,-188.24402,0.56838024,-0.37059212,33.446564,890000
|
| 60 |
+
1.0,0.9999959,0.03009193,3.0091932,1.0300878,1.2442479,0.8585273,-75.08681,-163.28494,0.13663846,-0.35652632,17.464672,895000
|
| 61 |
+
1.0,1.0,0.029899975,2.9899979,1.0299,1.6651955,2.0981905,-76.0613,-161.67807,0.21541177,-0.3051875,21.620518,900000
|
| 62 |
+
1.0,1.0,0.03382951,3.3829513,1.0338295,1.61562,-0.71288854,-79.449135,-159.70755,0.42533553,-0.25124165,21.231493,905000
|
| 63 |
+
1.0,0.9999999,0.030801602,3.0801604,1.0308015,1.6140877,1.3606559,-74.69624,-168.69664,0.26083022,-0.25052127,20.440239,910000
|
| 64 |
+
1.0,0.99999994,0.029417798,2.9417796,1.0294178,0.8571071,0.3831859,-76.13492,-163.93777,0.20155005,-0.32797122,16.45071,915000
|
| 65 |
+
1.0,1.0,0.032023437,3.202344,1.0320234,1.3342617,-0.9439661,-75.18939,-151.32826,0.27451205,-0.2604828,18.238605,920000
|
| 66 |
+
1.0,1.0,0.033920743,3.392074,1.0339208,1.1794865,1.2676927,-75.44327,-171.4388,0.25025827,-0.23041706,16.728386,925000
|
| 67 |
+
1.0,1.0,0.030582936,3.0582938,1.0305829,2.4430752,-1.178472,-72.129555,-149.88414,0.3620799,-0.27957276,27.107368,930000
|
| 68 |
+
1.0,1.0,0.03083017,3.0830169,1.0308301,0.97503215,2.2528684,-75.41378,-179.7236,0.12304565,-0.21949956,12.076079,935000
|
| 69 |
+
1.0,1.0,0.03212049,3.2120488,1.0321205,0.88710254,0.72403604,-75.03179,-160.28148,0.19441615,-0.30782348,14.386883,940000
|
| 70 |
+
1.0,0.99999994,0.031449616,3.1449614,1.0314496,0.88351995,-0.07827644,-78.60188,-170.30186,0.30504578,-0.30423683,13.459339,945000
|
| 71 |
+
1.0,1.0000001,0.02924212,2.9242122,1.0292423,0.9203669,-0.77450526,-70.96956,-167.81752,0.1484165,-0.15512161,11.270857,950000
|
| 72 |
+
1.0,1.0,0.029689245,2.9689245,1.0296892,0.92100394,0.82146215,-76.792366,-159.91739,0.21005374,-0.14991367,13.730187,955000
|
| 73 |
+
1.0,1.0000001,0.030781507,3.0781507,1.0307816,1.3673706,-2.2457135,-71.88796,-170.44258,0.60151833,-0.60674965,25.20316,960000
|
| 74 |
+
1.0,1.0,0.030990513,3.0990515,1.0309905,1.5097321,-3.1074853,-73.78062,-161.8589,0.19264293,-0.19292884,15.608269,965000
|
| 75 |
+
1.0,1.0,0.030669479,3.0669482,1.0306695,1.0138245,-2.2876992,-71.081535,-159.77557,0.20310338,-0.22473824,13.705998,970000
|
| 76 |
+
1.0,0.99998796,0.03055593,3.055593,1.0305439,0.7910748,0.8451664,-70.39855,-170.21861,0.10616802,-0.21456546,11.890287,975000
|
| 77 |
+
1.0,1.0,0.028994082,2.899408,1.0289941,1.1881804,1.2889166,-71.78707,-155.99887,0.32204187,-0.17553496,14.464261,980000
|
| 78 |
+
1.0,1.0000001,0.030396145,3.0396147,1.0303962,1.0076854,0.8080372,-72.32439,-149.55403,0.20197594,-0.16508889,13.431903,985000
|
| 79 |
+
1.0,1.0,0.032394156,3.2394161,1.0323942,2.851364,-0.07765512,-74.85708,-158.39764,0.6163468,-0.49920332,35.897453,990000
|
| 80 |
+
1.0,0.99977285,0.030849434,3.0849435,1.0306222,1.449524,3.2696266,-72.480934,-149.20557,0.25384355,-0.22568831,18.087715,995000
|
| 81 |
+
1.0,1.0,0.030446537,3.044654,1.0304465,0.8001977,1.295736,-70.74902,-147.38843,0.13037589,-0.35703558,15.321369,1000000
|
| 82 |
+
1.0,1.0,0.029521894,2.9521894,1.029522,0.9073537,1.804283,-72.56652,-163.79276,0.27560493,-0.2750259,12.134148,1005000
|
| 83 |
+
1.0,0.99999994,0.030624975,3.0624974,1.0306249,1.2351993,-0.48483264,-73.13953,-142.39386,0.23881198,-0.27471095,17.204222,1010000
|
| 84 |
+
1.0,0.99999994,0.030485503,3.0485506,1.0304854,1.2219172,0.54306984,-72.00967,-151.51376,0.34237874,-0.24080196,16.613783,1015000
|
| 85 |
+
1.0,1.0,0.033992708,3.3992708,1.0339928,0.91650957,-0.7382773,-70.70718,-155.51399,0.15402462,-0.22110869,12.677833,1020000
|
| 86 |
+
1.0,1.0000001,0.029457474,2.9457474,1.0294576,1.1741233,-0.6850228,-69.70017,-159.70868,0.28886265,-0.13351043,13.302741,1025000
|
| 87 |
+
1.0,1.0,0.030109141,3.0109143,1.0301092,1.200968,-1.3691163,-68.5387,-151.12064,0.48537624,-0.5537471,27.22465,1030000
|
| 88 |
+
1.0,1.0,0.033670798,3.36708,1.0336708,0.9480209,-4.6147437,-69.79474,-171.34915,0.21607992,-0.17612582,13.041958,1035000
|
| 89 |
+
1.0,0.99999994,0.032592915,3.2592916,1.0325929,1.0285814,-2.0690825,-66.73834,-167.80032,0.2234381,-0.30573237,12.220416,1040000
|
| 90 |
+
1.0,1.0,0.0328943,3.2894297,1.0328943,1.5639404,-3.2496843,-72.99569,-136.8094,0.5372599,-0.5453766,30.224796,1045000
|
| 91 |
+
1.0,1.0,0.029591905,2.9591904,1.0295919,0.8755743,0.32315773,-68.3559,-157.0354,0.18134974,-0.1362086,11.693008,1050000
|
| 92 |
+
1.0,0.99999994,0.032282963,3.2282963,1.032283,1.0488411,0.6583621,-69.38667,-154.31189,0.15439567,-0.34856516,17.165802,1055000
|
| 93 |
+
1.0,1.0,0.032610036,3.261004,1.03261,1.399474,0.97662055,-67.33406,-138.71103,0.26802126,-0.4593436,21.819283,1060000
|
| 94 |
+
1.0,0.99999994,0.034048844,3.4048843,1.0340488,1.2439209,2.0829003,-67.11425,-135.1039,0.26112658,-0.37013003,18.052431,1065000
|
| 95 |
+
1.0,0.99999994,0.032085203,3.2085204,1.0320852,1.1371292,-2.0745292,-66.66137,-134.39859,0.2754921,-0.28958052,16.18332,1070000
|
| 96 |
+
1.0,1.0,0.0306753,3.0675302,1.0306753,1.3967011,-0.7854585,-69.66265,-157.90437,0.4143233,-0.39612597,17.085484,1075000
|
| 97 |
+
1.0,0.99998343,0.03275539,3.2755394,1.0327388,1.1819179,0.6322001,-66.52468,-141.4191,0.32188106,-0.28310126,17.762177,1080000
|
| 98 |
+
1.0,1.0,0.0319407,3.1940699,1.0319407,1.0487398,-1.8347744,-66.68598,-168.0207,0.17817639,-0.25144598,15.056358,1085000
|
| 99 |
+
1.0,1.0,0.030981576,3.0981576,1.0309815,0.8174259,-0.817459,-67.32993,-152.78893,0.1349187,-0.16325076,10.259439,1090000
|
| 100 |
+
1.0,0.9999999,0.029535025,2.9535027,1.0295349,1.4653295,-1.781519,-63.062275,-160.16127,0.4262811,-0.52346617,21.053352,1095000
|
| 101 |
+
1.0,1.0000001,0.03196525,3.1965253,1.0319654,1.3003924,-5.0377836,-65.45146,-156.04889,0.15104401,-0.23891333,14.160297,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.024815034,2.4815035,1.0248151,0.3666931,-24.198751,-102.884926,-181.20018,0.19193716,-0.11091934,8.51194,605000
|
| 3 |
+
1.0,0.99999994,0.024872595,2.4872594,1.0248725,0.68319535,-19.728884,-102.68652,-174.64014,0.24901415,-0.22656584,11.091871,610000
|
| 4 |
+
1.0,0.99999994,0.02203678,2.2036781,1.0220367,0.8408438,-27.068047,-106.19684,-178.91734,0.18771432,-0.24076296,10.36423,615000
|
| 5 |
+
1.0,1.0,0.0208416,2.0841599,1.0208416,0.78311414,-20.8429,-107.599686,-191.68127,0.08344711,-0.12342457,8.493226,620000
|
| 6 |
+
1.0,1.0,0.02146972,2.146972,1.0214697,0.8043398,-38.866932,-108.75793,-189.0563,0.2235443,-0.13419862,10.498583,625000
|
| 7 |
+
1.0,1.0000001,0.021569917,2.1569917,1.0215701,0.83385605,-26.861532,-107.46399,-190.09727,0.1582477,-0.21159212,12.572064,630000
|
| 8 |
+
1.0,1.0,0.02338985,2.3389852,1.0233898,1.016264,-23.10069,-106.79955,-190.65068,0.55849355,-0.6607512,20.200058,635000
|
| 9 |
+
1.0,1.0,0.02347282,2.347282,1.0234728,1.3089417,-15.030339,-105.025475,-177.88438,0.89134127,-0.9374014,20.773636,640000
|
| 10 |
+
1.0,1.0,0.02202149,2.202149,1.0220215,1.0443696,-2.1652534,-105.6617,-202.48274,0.26967785,-0.13954163,13.495289,645000
|
| 11 |
+
1.0,1.0,0.025514234,2.5514235,1.0255142,2.0007029,-22.345577,-105.3116,-177.83101,0.49798405,-0.52658194,28.483624,650000
|
| 12 |
+
1.0,0.99999994,0.025430828,2.543083,1.0254308,1.289069,-25.627003,-104.16801,-190.30298,0.2734816,-0.26137617,16.549225,655000
|
| 13 |
+
1.0,1.0,0.025059368,2.5059366,1.0250593,1.237017,-10.044821,-99.13094,-185.25066,0.16622026,-0.238983,13.488863,660000
|
| 14 |
+
1.0,0.99999994,0.02396392,2.396392,1.0239638,1.1224693,-9.493827,-98.65179,-195.79085,0.19118328,-0.19028684,12.278523,665000
|
| 15 |
+
1.0,0.99999994,0.026226591,2.6226592,1.0262265,1.2415612,-7.5872555,-94.62333,-203.84235,0.16700162,-0.19428472,13.815616,670000
|
| 16 |
+
1.0,1.0,0.027785927,2.7785928,1.0277859,1.2928694,-11.749939,-97.796684,-185.42088,0.29437864,-0.23840144,18.380318,675000
|
| 17 |
+
1.0,0.99999994,0.028133925,2.8133926,1.0281339,1.2490613,-12.333711,-97.913605,-186.01971,0.24529383,-0.21620011,15.772633,680000
|
| 18 |
+
1.0,0.99999994,0.026637925,2.6637926,1.0266379,1.284335,-5.4739394,-94.723236,-189.5096,0.1552522,-0.22890593,17.811432,685000
|
| 19 |
+
1.0,1.0,0.027797244,2.7797246,1.0277972,1.8961948,-11.311711,-95.13237,-193.09128,0.37339672,-0.36991754,22.394474,690000
|
| 20 |
+
1.0,1.0,0.0290201,2.90201,1.0290201,1.2066398,-4.1415315,-94.6806,-199.86206,0.38267502,-0.20759256,19.022984,695000
|
| 21 |
+
1.0,1.0,0.025870197,2.58702,1.0258702,1.4049101,-0.597336,-89.364494,-170.3079,0.34688452,-0.42954943,22.302704,700000
|
| 22 |
+
1.0,1.0,0.028702859,2.870286,1.0287029,0.8554718,-21.083527,-95.6017,-179.14592,0.12138721,-0.21362394,11.400747,705000
|
| 23 |
+
1.0,1.0,0.027738169,2.773817,1.0277382,1.7025633,-11.445053,-92.478874,-180.1325,0.26024923,-0.19330414,18.128498,710000
|
| 24 |
+
1.0,0.9999515,0.026800107,2.6800108,1.0267516,1.4594078,1.4997178,-89.46349,-171.0341,1.2200351,-0.97659326,41.037106,715000
|
| 25 |
+
1.0,1.0000001,0.02772373,2.772373,1.0277238,1.6300217,-1.2981927,-88.589775,-160.89142,0.34486604,-0.68273026,24.284918,720000
|
| 26 |
+
1.0,1.0,0.028543115,2.8543115,1.0285431,1.075097,-13.743146,-92.93043,-181.75014,0.5752878,-0.55788195,17.979618,725000
|
| 27 |
+
1.0,1.0,0.027695708,2.7695708,1.0276957,1.3717239,-4.669609,-89.76309,-178.93031,0.33333752,-0.32401228,21.266794,730000
|
| 28 |
+
1.0,0.9999321,0.027869256,2.7869258,1.0278014,0.8543068,2.2758615,-88.905495,-170.26028,0.084789716,-0.1479711,9.450944,735000
|
| 29 |
+
1.0,1.0,0.029665526,2.9665527,1.0296655,2.408781,-7.0499196,-85.098915,-179.44843,0.54007787,-0.3435824,31.778362,740000
|
| 30 |
+
1.0,0.9999999,0.03092987,3.092987,1.0309298,1.8018528,-5.8581967,-89.693184,-198.16058,0.3735438,-0.32709354,26.693243,745000
|
| 31 |
+
1.0,1.0000001,0.0274479,2.74479,1.027448,1.1101294,-4.780729,-89.27441,-187.33295,0.17227732,-0.18912518,14.403259,750000
|
| 32 |
+
1.0,1.0,0.027567178,2.756718,1.0275671,0.97082615,1.5211284,-85.77029,-175.45271,0.18404084,-0.18975538,13.6040325,755000
|
| 33 |
+
1.0,0.9999866,0.028530037,2.853004,1.0285167,1.3774571,-4.649334,-89.181526,-194.8292,0.24975877,-0.24696442,18.680586,760000
|
| 34 |
+
1.0,1.0,0.029020157,2.902016,1.0290202,2.34171,-2.6184754,-88.470726,-172.51056,0.35466298,-0.53605914,29.614685,765000
|
| 35 |
+
1.0,1.0,0.029962573,2.9962575,1.0299625,1.1217546,-2.5699265,-83.64429,-184.14706,0.40592235,-0.17907876,15.705631,770000
|
| 36 |
+
1.0,1.0,0.028588535,2.8588536,1.0285885,1.4029318,-3.7928474,-89.63704,-194.04607,0.4912306,-0.41175148,21.64424,775000
|
| 37 |
+
1.0,0.99998796,0.028244566,2.8244565,1.0282326,1.0526441,3.3391223,-87.377396,-192.05365,0.20857796,-0.28159177,15.165477,780000
|
| 38 |
+
1.0,1.0,0.028367361,2.8367362,1.0283674,1.275322,0.3695038,-85.344475,-161.4191,0.1548892,-0.32059366,16.406881,785000
|
| 39 |
+
1.0,0.99999994,0.026297692,2.6297693,1.0262977,1.2674353,-6.5713215,-84.211464,-199.8247,0.27791992,-0.24333303,16.590584,790000
|
| 40 |
+
1.0,1.0,0.028843787,2.884379,1.0288438,1.744681,-2.2924156,-85.65918,-201.58391,1.156159,-1.0087198,37.487507,795000
|
| 41 |
+
1.0,0.9999999,0.03015241,3.0152414,1.0301523,1.5797462,2.9944963,-83.35614,-198.12369,0.36500883,-0.369054,20.69853,800000
|
| 42 |
+
1.0,1.0,0.029135026,2.9135027,1.029135,0.93589383,-5.7925487,-80.96902,-172.02705,0.3285348,-0.14963108,17.429224,805000
|
| 43 |
+
1.0,0.99999994,0.029536318,2.9536319,1.0295362,1.146423,-3.263936,-82.45394,-162.41779,0.33632,-0.31252956,16.880117,810000
|
| 44 |
+
1.0,1.0,0.03174019,3.1740189,1.0317402,2.3784883,1.434686,-83.948784,-165.7096,0.28298655,-0.22330444,22.354568,815000
|
| 45 |
+
1.0,1.0000001,0.029892066,2.9892068,1.0298922,1.678744,-2.1017718,-82.83461,-190.99829,0.11997774,-0.22886154,14.92853,820000
|
| 46 |
+
1.0,0.99999994,0.028205942,2.8205943,1.0282059,1.4769353,-2.5888424,-80.78572,-171.09837,0.4074059,-0.4009019,17.801382,825000
|
| 47 |
+
1.0,1.0,0.03125038,3.1250384,1.0312504,1.2141228,1.0687292,-82.23925,-159.53119,0.39669502,-0.39710626,15.653326,830000
|
| 48 |
+
1.0,0.9999999,0.027710889,2.7710886,1.0277108,2.6160824,-0.023082525,-80.552284,-165.16473,0.7412218,-0.27758107,34.688004,835000
|
| 49 |
+
1.0,0.9999999,0.029112386,2.9112387,1.0291122,0.9875744,1.927965,-79.79832,-192.95631,0.32844037,-0.114079244,13.376781,840000
|
| 50 |
+
1.0,1.0,0.03093367,3.093367,1.0309336,0.88982075,-0.843024,-82.73107,-170.51042,0.10912285,-0.1234206,10.806158,845000
|
| 51 |
+
1.0,1.0,0.027890356,2.7890356,1.0278903,1.660792,-4.364303,-75.46258,-188.57376,0.37819412,-0.40284482,23.890484,850000
|
| 52 |
+
1.0,1.0,0.029946357,2.994636,1.0299463,0.999986,-4.896181,-81.95036,-160.58205,0.1851584,-0.23036225,11.567949,855000
|
| 53 |
+
1.0,1.0,0.030525722,3.0525723,1.0305257,0.9974746,1.9100163,-79.87445,-164.50127,0.18420653,-0.25841975,14.637952,860000
|
| 54 |
+
1.0,1.0,0.029138573,2.9138575,1.0291386,2.4730167,0.22859217,-78.39559,-196.05235,0.952238,-0.9062966,45.682804,865000
|
| 55 |
+
1.0,1.0,0.030512689,3.051269,1.0305127,6.504473,-3.7329664,-81.2477,-161.78123,1.0812693,-0.8129737,67.11237,870000
|
| 56 |
+
1.0,1.0,0.029420162,2.9420161,1.0294201,1.2710308,-0.3803721,-78.227135,-198.60483,0.38114265,-0.42623514,24.486631,875000
|
| 57 |
+
1.0,0.9999003,0.030607376,3.0607378,1.0305077,0.9299766,-4.9270887,-78.18602,-167.58418,0.21976577,-0.28166535,12.981388,880000
|
| 58 |
+
1.0,1.0000001,0.029157545,2.9157546,1.0291576,1.4415811,1.924162,-76.013084,-165.07925,0.33494204,-0.31407282,19.635735,885000
|
| 59 |
+
1.0,1.0,0.030164275,3.0164278,1.0301642,3.228233,-1.6272675,-73.776855,-188.24402,0.56838024,-0.37059212,33.446564,890000
|
| 60 |
+
1.0,0.9999959,0.03009193,3.0091932,1.0300878,1.2442479,0.8585273,-75.08681,-163.28494,0.13663846,-0.35652632,17.464672,895000
|
| 61 |
+
1.0,1.0,0.029899975,2.9899979,1.0299,1.6651955,2.0981905,-76.0613,-161.67807,0.21541177,-0.3051875,21.620518,900000
|
| 62 |
+
1.0,1.0,0.03382951,3.3829513,1.0338295,1.61562,-0.71288854,-79.449135,-159.70755,0.42533553,-0.25124165,21.231493,905000
|
| 63 |
+
1.0,0.9999999,0.030801602,3.0801604,1.0308015,1.6140877,1.3606559,-74.69624,-168.69664,0.26083022,-0.25052127,20.440239,910000
|
| 64 |
+
1.0,0.99999994,0.029417798,2.9417796,1.0294178,0.8571071,0.3831859,-76.13492,-163.93777,0.20155005,-0.32797122,16.45071,915000
|
| 65 |
+
1.0,1.0,0.032023437,3.202344,1.0320234,1.3342617,-0.9439661,-75.18939,-151.32826,0.27451205,-0.2604828,18.238605,920000
|
| 66 |
+
1.0,1.0,0.033920743,3.392074,1.0339208,1.1794865,1.2676927,-75.44327,-171.4388,0.25025827,-0.23041706,16.728386,925000
|
| 67 |
+
1.0,1.0,0.030582936,3.0582938,1.0305829,2.4430752,-1.178472,-72.129555,-149.88414,0.3620799,-0.27957276,27.107368,930000
|
| 68 |
+
1.0,1.0,0.03083017,3.0830169,1.0308301,0.97503215,2.2528684,-75.41378,-179.7236,0.12304565,-0.21949956,12.076079,935000
|
| 69 |
+
1.0,1.0,0.03212049,3.2120488,1.0321205,0.88710254,0.72403604,-75.03179,-160.28148,0.19441615,-0.30782348,14.386883,940000
|
| 70 |
+
1.0,0.99999994,0.031449616,3.1449614,1.0314496,0.88351995,-0.07827644,-78.60188,-170.30186,0.30504578,-0.30423683,13.459339,945000
|
| 71 |
+
1.0,1.0000001,0.02924212,2.9242122,1.0292423,0.9203669,-0.77450526,-70.96956,-167.81752,0.1484165,-0.15512161,11.270857,950000
|
| 72 |
+
1.0,1.0,0.029689245,2.9689245,1.0296892,0.92100394,0.82146215,-76.792366,-159.91739,0.21005374,-0.14991367,13.730187,955000
|
| 73 |
+
1.0,1.0000001,0.030781507,3.0781507,1.0307816,1.3673706,-2.2457135,-71.88796,-170.44258,0.60151833,-0.60674965,25.20316,960000
|
| 74 |
+
1.0,1.0,0.030990513,3.0990515,1.0309905,1.5097321,-3.1074853,-73.78062,-161.8589,0.19264293,-0.19292884,15.608269,965000
|
| 75 |
+
1.0,1.0,0.030669479,3.0669482,1.0306695,1.0138245,-2.2876992,-71.081535,-159.77557,0.20310338,-0.22473824,13.705998,970000
|
| 76 |
+
1.0,0.99998796,0.03055593,3.055593,1.0305439,0.7910748,0.8451664,-70.39855,-170.21861,0.10616802,-0.21456546,11.890287,975000
|
| 77 |
+
1.0,1.0,0.028994082,2.899408,1.0289941,1.1881804,1.2889166,-71.78707,-155.99887,0.32204187,-0.17553496,14.464261,980000
|
| 78 |
+
1.0,1.0000001,0.030396145,3.0396147,1.0303962,1.0076854,0.8080372,-72.32439,-149.55403,0.20197594,-0.16508889,13.431903,985000
|
| 79 |
+
1.0,1.0,0.032394156,3.2394161,1.0323942,2.851364,-0.07765512,-74.85708,-158.39764,0.6163468,-0.49920332,35.897453,990000
|
| 80 |
+
1.0,0.99977285,0.030849434,3.0849435,1.0306222,1.449524,3.2696266,-72.480934,-149.20557,0.25384355,-0.22568831,18.087715,995000
|
| 81 |
+
1.0,1.0,0.030446537,3.044654,1.0304465,0.8001977,1.295736,-70.74902,-147.38843,0.13037589,-0.35703558,15.321369,1000000
|
| 82 |
+
1.0,1.0,0.029521894,2.9521894,1.029522,0.9073537,1.804283,-72.56652,-163.79276,0.27560493,-0.2750259,12.134148,1005000
|
| 83 |
+
1.0,0.99999994,0.030624975,3.0624974,1.0306249,1.2351993,-0.48483264,-73.13953,-142.39386,0.23881198,-0.27471095,17.204222,1010000
|
| 84 |
+
1.0,0.99999994,0.030485503,3.0485506,1.0304854,1.2219172,0.54306984,-72.00967,-151.51376,0.34237874,-0.24080196,16.613783,1015000
|
| 85 |
+
1.0,1.0,0.033992708,3.3992708,1.0339928,0.91650957,-0.7382773,-70.70718,-155.51399,0.15402462,-0.22110869,12.677833,1020000
|
| 86 |
+
1.0,1.0000001,0.029457474,2.9457474,1.0294576,1.1741233,-0.6850228,-69.70017,-159.70868,0.28886265,-0.13351043,13.302741,1025000
|
| 87 |
+
1.0,1.0,0.030109141,3.0109143,1.0301092,1.200968,-1.3691163,-68.5387,-151.12064,0.48537624,-0.5537471,27.22465,1030000
|
| 88 |
+
1.0,1.0,0.033670798,3.36708,1.0336708,0.9480209,-4.6147437,-69.79474,-171.34915,0.21607992,-0.17612582,13.041958,1035000
|
| 89 |
+
1.0,0.99999994,0.032592915,3.2592916,1.0325929,1.0285814,-2.0690825,-66.73834,-167.80032,0.2234381,-0.30573237,12.220416,1040000
|
| 90 |
+
1.0,1.0,0.0328943,3.2894297,1.0328943,1.5639404,-3.2496843,-72.99569,-136.8094,0.5372599,-0.5453766,30.224796,1045000
|
| 91 |
+
1.0,1.0,0.029591905,2.9591904,1.0295919,0.8755743,0.32315773,-68.3559,-157.0354,0.18134974,-0.1362086,11.693008,1050000
|
| 92 |
+
1.0,0.99999994,0.032282963,3.2282963,1.032283,1.0488411,0.6583621,-69.38667,-154.31189,0.15439567,-0.34856516,17.165802,1055000
|
| 93 |
+
1.0,1.0,0.032610036,3.261004,1.03261,1.399474,0.97662055,-67.33406,-138.71103,0.26802126,-0.4593436,21.819283,1060000
|
| 94 |
+
1.0,0.99999994,0.034048844,3.4048843,1.0340488,1.2439209,2.0829003,-67.11425,-135.1039,0.26112658,-0.37013003,18.052431,1065000
|
| 95 |
+
1.0,0.99999994,0.032085203,3.2085204,1.0320852,1.1371292,-2.0745292,-66.66137,-134.39859,0.2754921,-0.28958052,16.18332,1070000
|
| 96 |
+
1.0,1.0,0.0306753,3.0675302,1.0306753,1.3967011,-0.7854585,-69.66265,-157.90437,0.4143233,-0.39612597,17.085484,1075000
|
| 97 |
+
1.0,0.99998343,0.03275539,3.2755394,1.0327388,1.1819179,0.6322001,-66.52468,-141.4191,0.32188106,-0.28310126,17.762177,1080000
|
| 98 |
+
1.0,1.0,0.0319407,3.1940699,1.0319407,1.0487398,-1.8347744,-66.68598,-168.0207,0.17817639,-0.25144598,15.056358,1085000
|
| 99 |
+
1.0,1.0,0.030981576,3.0981576,1.0309815,0.8174259,-0.817459,-67.32993,-152.78893,0.1349187,-0.16325076,10.259439,1090000
|
| 100 |
+
1.0,0.9999999,0.029535025,2.9535027,1.0295349,1.4653295,-1.781519,-63.062275,-160.16127,0.4262811,-0.52346617,21.053352,1095000
|
| 101 |
+
1.0,1.0000001,0.03196525,3.1965253,1.0319654,1.3003924,-5.0377836,-65.45146,-156.04889,0.15104401,-0.23891333,14.160297,1100000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ba823c34132a75f37c789f5469d288334533c6842ea26f6115bc3c8adee8391
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1050000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c04b675343bbbab983a97bf9af787f58bab01d8f61d61c7706bf3253a8e4ae9a
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_1100000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:164b8b9ac1721a56e829ddeb9972a521b128341240d08c6bca554cca9bfc6746
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:19ff0d8f2618a6d9b0fe0e7c8dc3ea4567f47abc394e08a2f5a5d0a7223b4fa6
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a64fbd7c975f87434672189358e680c927af70fb7ea388bfeb92c385b9618f7e
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8cccdcc1e76cdccf86c31d53698bc06cf0254718a4d3fdd4bf54d70c3faeed55
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7eee09af71e7fec79cf2e162d0ab20aae441208a82d8d32493199f55826e117e
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f07a9467219afc7ec654efd8bb59523beff8a088b13ffd21eda701ad1c28a46
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db9416388c3a8b80e4de46820e170f791ffa1109c9218ea85c53d97140d8f267
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:684a0aeba37bd70b0ac9798d6b02374939c5462e590f4856ed75af79bfe7a369
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_161705/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/11aj934o
|