Upload folder using huggingface_hub
Browse files- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/env.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/env_sv.csv +0 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/eval.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/online_agent.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_1000000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_750000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_800000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_850000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_900000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_950000.pkl +3 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/progress.tk +1 -0
- O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/token.tk +1 -0
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.027455182984970107,-0.016243476162429545,-0.02655822377977938,0.004606737676975518,27.880579936757943,11.923999999999014,0.72,6018.5,-0.34,-320.92,236.48,0.7212435579299927,550000
|
| 3 |
+
0.0,0.0,-0.04820476472961069,0.015163067781845495,-0.0471887235932262,-0.0036181416708732845,31.79327044021031,8.123999999999285,0.8,16288.22,-0.26,-234.9,160.48,0.5065046072006225,600000
|
| 4 |
+
0.0,0.0,-0.05266321517879578,0.03743369862221797,-0.050734723769969056,0.020061306807899425,33.52103240517475,5.578999999999564,0.9,22846.84,-0.16,-166.94,109.58,0.35276634216308594,650000
|
| 5 |
+
0.0,0.0,-0.06374074364712366,0.03579966317827975,-0.06134582087285001,0.0476647374867622,35.04908660168684,4.408999999999707,0.94,28018.6,-0.08,-122.24,86.18,0.2755628681182861,700000
|
| 6 |
+
0.0,0.0,-0.07120693246885947,0.06064182892097534,-0.06806423283852063,0.04458135832850559,34.50470492612419,4.152999999999735,0.94,33466.78,-0.1,-125.68,81.06,0.2579488706588745,750000
|
| 7 |
+
0.0,0.0,-0.06916772122931852,0.04896479284041979,-0.0667231795782509,0.04744183941903372,34.621356002130476,4.015999999999811,0.96,37706.98,-0.06,-118.56,78.32,0.25413339138031005,800000
|
| 8 |
+
0.0,0.0,-0.06318659032122738,0.06310402599320777,-0.06045968442607231,0.049428480407572584,35.44367030951644,3.783999999999787,0.96,41263.2,-0.06,-104.32,73.68,0.24591673374176026,850000
|
| 9 |
+
0.0,0.0,-0.06344932820089662,0.0593729858043898,-0.060145874801365275,0.05844700357082891,35.29355002538855,2.6089999999999343,1.0,44686.4,0.0,-74.1,50.18,0.16667794227600097,900000
|
| 10 |
+
0.0,0.0,-0.06345432247943285,0.054674498806359495,-0.060074136532753356,0.06519491198786527,35.77051941144731,2.8369999999999704,1.0,47412.64,0.0,-81.3,54.74,0.18300590991973878,950000
|
| 11 |
+
0.0,0.0,-0.06884639855905171,0.049966818111081376,-0.06576707292553005,0.058148765454996684,35.33225139427971,3.654999999999827,0.96,50846.2,-0.04,-95.16,71.1,0.23551222324371338,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,-0.027455182984970107,-0.016243476162429545,-0.02655822377977938,0.004606737676975518,27.880579936757943,11.923999999999014,0.72,6018.5,-0.34,-320.92,236.48,0.7212435579299927,550000
|
| 3 |
+
0.0,0.0,-0.04820476472961069,0.015163067781845495,-0.0471887235932262,-0.0036181416708732845,31.79327044021031,8.123999999999285,0.8,16288.22,-0.26,-234.9,160.48,0.5065046072006225,600000
|
| 4 |
+
0.0,0.0,-0.05266321517879578,0.03743369862221797,-0.050734723769969056,0.020061306807899425,33.52103240517475,5.578999999999564,0.9,22846.84,-0.16,-166.94,109.58,0.35276634216308594,650000
|
| 5 |
+
0.0,0.0,-0.06374074364712366,0.03579966317827975,-0.06134582087285001,0.0476647374867622,35.04908660168684,4.408999999999707,0.94,28018.6,-0.08,-122.24,86.18,0.2755628681182861,700000
|
| 6 |
+
0.0,0.0,-0.07120693246885947,0.06064182892097534,-0.06806423283852063,0.04458135832850559,34.50470492612419,4.152999999999735,0.94,33466.78,-0.1,-125.68,81.06,0.2579488706588745,750000
|
| 7 |
+
0.0,0.0,-0.06916772122931852,0.04896479284041979,-0.0667231795782509,0.04744183941903372,34.621356002130476,4.015999999999811,0.96,37706.98,-0.06,-118.56,78.32,0.25413339138031005,800000
|
| 8 |
+
0.0,0.0,-0.06318659032122738,0.06310402599320777,-0.06045968442607231,0.049428480407572584,35.44367030951644,3.783999999999787,0.96,41263.2,-0.06,-104.32,73.68,0.24591673374176026,850000
|
| 9 |
+
0.0,0.0,-0.06344932820089662,0.0593729858043898,-0.060145874801365275,0.05844700357082891,35.29355002538855,2.6089999999999343,1.0,44686.4,0.0,-74.1,50.18,0.16667794227600097,900000
|
| 10 |
+
0.0,0.0,-0.06345432247943285,0.054674498806359495,-0.060074136532753356,0.06519491198786527,35.77051941144731,2.8369999999999704,1.0,47412.64,0.0,-81.3,54.74,0.18300590991973878,950000
|
| 11 |
+
0.0,0.0,-0.06884639855905171,0.049966818111081376,-0.06576707292553005,0.058148765454996684,35.33225139427971,3.654999999999827,0.96,50846.2,-0.04,-95.16,71.1,0.23551222324371338,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.025410943,2.5410943,1.0254109,0.6865036,-24.974669,-102.93029,-179.41916,0.12654576,-0.10546045,9.12171,505000
|
| 3 |
+
1.0,1.0,0.025060683,2.5060682,1.0250607,0.782943,-21.23974,-102.35262,-175.97856,0.11903742,-0.2107001,11.693334,510000
|
| 4 |
+
1.0,0.99999994,0.022867696,2.2867696,1.0228677,0.71515316,-26.577238,-103.82975,-178.77844,0.18020111,-0.15395957,13.160402,515000
|
| 5 |
+
1.0,1.0000001,0.022416048,2.2416048,1.0224161,0.9619643,-18.120338,-105.88897,-191.63484,0.10565561,-0.15439466,9.745169,520000
|
| 6 |
+
1.0,1.0,0.023058593,2.3058596,1.0230587,0.80849755,-33.990444,-106.04723,-188.48236,0.0919208,-0.17733589,10.229068,525000
|
| 7 |
+
1.0,1.0,0.022428637,2.242864,1.0224286,0.88605195,-34.510475,-104.84872,-190.34796,0.26262304,-0.2718877,12.804092,530000
|
| 8 |
+
1.0,1.0,0.022158973,2.215897,1.022159,0.8800613,-20.19318,-106.854065,-180.049,0.4487577,-0.60797226,18.583145,535000
|
| 9 |
+
1.0,1.0,0.02297491,2.297491,1.022975,1.5489773,-35.40843,-107.56136,-182.75642,0.83169043,-0.8705027,22.940176,540000
|
| 10 |
+
1.0,0.9999999,0.02196005,2.196005,1.0219599,1.2221813,-21.527563,-107.030334,-202.29256,0.19230473,-0.15571816,13.269623,545000
|
| 11 |
+
1.0,1.0,0.02354283,2.354283,1.0235429,1.5922931,-30.393694,-106.23435,-182.82527,0.3647646,-0.36432904,25.948217,550000
|
| 12 |
+
1.0,1.0,0.02536783,2.536783,1.0253679,2.0470092,-7.461494,-102.798416,-185.60269,0.35730273,-0.35765824,26.464296,555000
|
| 13 |
+
1.0,1.0,0.025287835,2.5287833,1.0252879,1.656799,-15.664715,-99.067535,-192.53185,0.3486125,-0.40872923,23.5306,560000
|
| 14 |
+
1.0,1.0,0.025409633,2.5409632,1.0254096,1.2570553,-3.1835854,-98.165215,-183.9281,0.20331134,-0.15948656,15.099241,565000
|
| 15 |
+
1.0,1.0,0.026977146,2.6977146,1.0269772,1.5246799,-5.377539,-93.98988,-203.5072,0.53823256,-0.32634777,19.555496,570000
|
| 16 |
+
1.0,1.0,0.027086522,2.7086523,1.0270865,1.4368721,-11.199528,-96.73852,-182.21834,0.24647173,-0.18685284,17.039223,575000
|
| 17 |
+
1.0,1.0,0.026504228,2.6504228,1.0265043,1.5081205,-8.48454,-98.8531,-191.9634,2.3308961,-1.850974,34.224102,580000
|
| 18 |
+
1.0,1.0,0.02576692,2.5766923,1.025767,1.8606566,-3.8789434,-98.45335,-190.37073,0.67826074,-0.6375243,28.902344,585000
|
| 19 |
+
1.0,1.0,0.026975406,2.6975408,1.0269754,1.959246,-5.51579,-95.957054,-182.71729,0.29508334,-0.49208122,21.159958,590000
|
| 20 |
+
1.0,1.0,0.026802046,2.6802046,1.0268021,1.4234171,0.15374969,-99.05247,-190.38115,0.29551995,-0.31371152,18.348816,595000
|
| 21 |
+
1.0,1.0,0.025772886,2.5772886,1.0257729,1.4451106,-7.3733506,-94.00695,-181.8485,0.3867184,-0.21249662,18.776222,600000
|
| 22 |
+
1.0,1.0,0.025315017,2.5315015,1.025315,1.5138313,-2.2273512,-96.4674,-185.30692,0.47865117,-0.48974037,25.880524,605000
|
| 23 |
+
1.0,1.0,0.0266723,2.6672301,1.0266722,2.1488817,-5.6067986,-96.552956,-183.28654,0.26760864,-0.2435858,24.558426,610000
|
| 24 |
+
1.0,0.9999829,0.025494866,2.5494866,1.0254778,1.0669516,0.91773045,-92.092155,-187.76794,0.21168384,-0.17381403,13.467963,615000
|
| 25 |
+
1.0,1.0,0.025314126,2.5314126,1.0253141,1.2720234,-2.675796,-92.4444,-183.03299,0.33386025,-0.3393581,19.480377,620000
|
| 26 |
+
1.0,1.0,0.027017578,2.701758,1.0270176,1.4993012,-6.6765513,-95.94484,-183.22258,0.2522036,-0.28925097,18.498175,625000
|
| 27 |
+
1.0,1.0,0.027048767,2.704877,1.0270488,1.5519892,-8.114893,-93.80342,-180.27388,0.2771563,-0.2918598,18.34594,630000
|
| 28 |
+
1.0,0.99987274,0.026558477,2.6558478,1.0264312,1.1272588,1.9102526,-91.50371,-178.6441,0.24042335,-0.2702937,14.406121,635000
|
| 29 |
+
1.0,1.0,0.028039351,2.8039353,1.0280393,1.7223685,-9.093226,-86.850395,-172.73402,0.7245283,-0.6399443,26.972328,640000
|
| 30 |
+
1.0,0.99999994,0.02888504,2.8885043,1.028885,2.878331,-8.063931,-90.840324,-196.6282,0.51324904,-0.6023001,33.034588,645000
|
| 31 |
+
1.0,1.0000001,0.027982622,2.7982624,1.0279827,1.1062393,-5.241204,-88.42275,-185.41507,0.18195322,-0.23971614,13.476558,650000
|
| 32 |
+
1.0,1.0,0.025657937,2.5657938,1.0256579,7.537431,-8.530247,-89.03199,-178.08403,1.7140052,-1.5738974,71.02468,655000
|
| 33 |
+
1.0,1.0000001,0.027786827,2.7786827,1.027787,1.5730733,-1.5423744,-90.65618,-186.25743,0.7338078,-0.7197376,21.952858,660000
|
| 34 |
+
1.0,1.0,0.027109401,2.7109401,1.0271094,1.2187889,-1.1917478,-89.2444,-177.62567,0.16974652,-0.18100452,14.306935,665000
|
| 35 |
+
1.0,1.0,0.03190776,3.1907763,1.0319078,2.7649481,-13.716895,-86.36326,-172.87323,0.5341985,-0.6053363,34.39742,670000
|
| 36 |
+
1.0,1.0,0.02943724,2.9437242,1.0294372,1.4414328,-3.073575,-89.84759,-189.76178,0.21206269,-0.13885272,14.759348,675000
|
| 37 |
+
1.0,1.0,0.028243726,2.8243728,1.0282438,2.535841,0.4118026,-89.66458,-196.55864,0.6208907,-0.88009065,35.95955,680000
|
| 38 |
+
1.0,0.99999994,0.028554594,2.8554595,1.0285546,1.8549168,-8.67231,-84.80662,-167.81204,0.28377447,-0.2502568,21.625198,685000
|
| 39 |
+
1.0,1.0,0.027132098,2.7132096,1.0271322,2.4195278,-1.9693551,-83.33007,-194.82904,0.703107,-0.90457225,32.69143,690000
|
| 40 |
+
1.0,0.99999994,0.030175608,3.017561,1.0301756,1.4010524,-4.020889,-83.97118,-194.78273,0.7693731,-0.7325906,21.567785,695000
|
| 41 |
+
1.0,1.0,0.028594166,2.859417,1.0285941,1.4510701,-4.5949674,-84.95441,-193.40576,0.41576916,-0.5511275,23.894108,700000
|
| 42 |
+
1.0,0.99999994,0.029518355,2.9518356,1.0295182,1.4867847,-4.1052775,-83.21893,-156.86475,0.23773536,-0.24819325,17.742817,705000
|
| 43 |
+
1.0,1.0,0.028720919,2.872092,1.028721,1.3276224,1.2356395,-83.917274,-165.66574,0.3606796,-0.5344254,22.902302,710000
|
| 44 |
+
1.0,0.99999994,0.029612493,2.9612494,1.0296124,1.3033727,-0.37460423,-85.26497,-171.70792,0.24477744,-0.28364277,17.124096,715000
|
| 45 |
+
1.0,1.0,0.02795872,2.7958722,1.0279588,1.2548304,-5.811518,-83.31936,-179.61902,0.22430286,-0.27280387,15.189444,720000
|
| 46 |
+
1.0,1.0,0.028944084,2.8944085,1.0289441,1.8260239,-6.10352,-82.67244,-156.14793,0.31743553,-0.29297668,22.943546,725000
|
| 47 |
+
1.0,0.99999994,0.030226102,3.0226102,1.030226,1.8917888,-3.0537846,-86.14532,-174.218,0.31276563,-0.30630544,26.6586,730000
|
| 48 |
+
1.0,1.0,0.029247759,2.924776,1.0292478,1.5075599,1.1659265,-86.93462,-176.46257,0.31568512,-0.44524336,22.60336,735000
|
| 49 |
+
1.0,0.9998121,0.029418273,2.9418273,1.0292304,1.3514868,3.301708,-85.77549,-194.05617,0.3139456,-0.3451441,19.779512,740000
|
| 50 |
+
1.0,1.0,0.029713437,2.9713438,1.0297134,1.2611574,-2.635559,-84.300125,-182.99535,0.39628285,-0.31582594,18.523548,745000
|
| 51 |
+
1.0,0.99999994,0.02751282,2.7512822,1.0275128,1.2267185,0.14573511,-79.48733,-192.9651,0.21637286,-0.22638719,15.386296,750000
|
| 52 |
+
1.0,1.0,0.028825622,2.8825624,1.0288256,2.1232147,-6.150314,-86.681595,-170.16281,0.8915199,-0.9380819,43.803474,755000
|
| 53 |
+
1.0,1.0,0.029262304,2.9262304,1.0292623,1.4965184,1.7977626,-82.80813,-173.2857,0.20536266,-0.2498822,18.22322,760000
|
| 54 |
+
1.0,1.0,0.028649982,2.8649983,1.0286499,1.5094092,-4.7082872,-81.4304,-182.23016,0.2892022,-0.18249023,20.20559,765000
|
| 55 |
+
1.0,0.9999999,0.026993526,2.6993525,1.0269934,1.2577406,-0.35468614,-82.48976,-161.12798,0.17738114,-0.20674208,16.092731,770000
|
| 56 |
+
1.0,1.0,0.028099157,2.809916,1.0280992,6.419037,-8.969891,-85.33965,-186.48456,1.0860205,-1.0640181,77.68452,775000
|
| 57 |
+
1.0,1.0,0.028319696,2.8319697,1.0283197,1.5179636,2.53469,-82.93361,-165.26172,0.19580814,-0.20031427,18.921488,780000
|
| 58 |
+
1.0,1.0,0.02886528,2.8865283,1.0288653,1.0883429,-1.8060315,-82.2486,-172.96414,0.43229896,-0.22924843,15.116756,785000
|
| 59 |
+
1.0,0.99999994,0.028379623,2.8379622,1.0283796,2.2870119,-1.7035887,-81.09949,-192.65506,0.4683863,-0.287018,25.77564,790000
|
| 60 |
+
1.0,0.9999958,0.029317245,2.9317248,1.0293131,1.7061099,2.1004124,-80.7593,-173.84407,0.22851695,-0.20628393,19.494522,795000
|
| 61 |
+
1.0,1.0,0.028401732,2.8401732,1.0284017,1.3343986,-3.9526892,-84.31293,-177.33226,0.37323084,-0.3827526,18.30392,800000
|
| 62 |
+
1.0,1.0,0.030219626,3.0219626,1.0302197,2.0977638,-5.8785744,-84.39987,-166.58086,0.8341387,-0.6651324,36.37857,805000
|
| 63 |
+
1.0,1.0000001,0.030042592,3.004259,1.0300428,1.0520374,3.8584266,-81.118614,-183.71269,0.10442688,-0.16104795,12.439722,810000
|
| 64 |
+
1.0,0.9999999,0.028126182,2.8126183,1.0281261,1.24166,-0.94159955,-82.13251,-166.59154,0.4749075,-0.5092092,16.773575,815000
|
| 65 |
+
1.0,1.0,0.029176682,2.9176683,1.0291767,1.543215,-2.3737683,-81.8475,-177.4524,0.29355282,-0.3481551,22.53749,820000
|
| 66 |
+
1.0,0.9999999,0.029865805,2.9865804,1.0298657,1.6252774,1.4570118,-80.51342,-173.79721,0.74526644,-0.27937415,22.777,825000
|
| 67 |
+
1.0,1.0,0.029597122,2.9597125,1.0295972,1.7556679,-2.286252,-79.58232,-162.34122,0.45968282,-0.31354663,23.754913,830000
|
| 68 |
+
1.0,1.0,0.02896733,2.896733,1.0289674,1.8895886,0.38186955,-78.493385,-192.15854,0.2997719,-0.30900258,23.367275,835000
|
| 69 |
+
1.0,1.0,0.0308696,3.0869598,1.0308696,1.4942139,0.1608458,-79.11062,-164.07074,0.2096849,-0.19404967,17.13427,840000
|
| 70 |
+
1.0,1.0,0.02735312,2.735312,1.0273532,1.3932456,-0.2903636,-82.79846,-181.54291,1.6530524,-1.5789057,40.98786,845000
|
| 71 |
+
1.0,1.0,0.027944218,2.794422,1.0279442,1.550975,1.3182546,-77.56123,-180.35826,0.45856073,-0.8199188,25.036987,850000
|
| 72 |
+
1.0,0.99999994,0.02796571,2.796571,1.0279657,1.4880016,0.29854482,-80.68373,-159.48862,0.34835768,-0.20721327,21.336185,855000
|
| 73 |
+
1.0,1.0,0.029235937,2.9235938,1.029236,1.9323953,-1.0218707,-77.69029,-182.01926,0.41750938,-1.3531325,28.433817,860000
|
| 74 |
+
1.0,1.0,0.027836239,2.783624,1.0278362,1.365343,-0.67144346,-79.012344,-167.63707,0.16706753,-0.48343503,18.832344,865000
|
| 75 |
+
1.0,1.0,0.028775904,2.8775904,1.0287759,9.034078,-0.71063036,-78.23907,-179.53859,4.3901296,-4.6447697,93.88536,870000
|
| 76 |
+
1.0,1.0,0.027554054,2.7554054,1.027554,1.3572859,0.57545125,-78.30064,-188.02393,0.18430167,-0.20863762,18.130116,875000
|
| 77 |
+
1.0,0.9999999,0.028011702,2.8011703,1.0280116,2.4466848,-3.098978,-77.63776,-167.76212,0.579199,-0.60090464,30.958942,880000
|
| 78 |
+
1.0,1.0000001,0.027840976,2.7840977,1.0278411,1.3382999,-3.9815316,-77.92391,-167.61919,0.18921937,-0.2882311,18.323992,885000
|
| 79 |
+
1.0,1.0,0.030590605,3.0590606,1.0305907,1.4504688,0.42903644,-80.802795,-173.10107,0.25774246,-0.24602164,16.73123,890000
|
| 80 |
+
1.0,1.0,0.03074963,3.074963,1.0307497,1.5019183,1.301219,-80.658775,-167.75356,0.20403384,-0.22687142,19.147058,895000
|
| 81 |
+
1.0,1.0000001,0.028131772,2.8131773,1.0281318,1.4104862,-0.9105861,-74.981606,-146.83203,0.39182857,-0.38005584,25.282368,900000
|
| 82 |
+
1.0,1.0,0.029539408,2.9539409,1.0295395,1.2440677,0.11218046,-76.71696,-175.00394,0.18053626,-0.34083503,16.08099,905000
|
| 83 |
+
1.0,1.0,0.030927394,3.0927396,1.0309274,1.4707477,-2.752386,-77.31771,-154.08267,1.2603273,-1.2217491,30.029121,910000
|
| 84 |
+
1.0,0.99999994,0.027832251,2.783225,1.0278322,1.6333259,-0.68634176,-75.63672,-147.8456,0.32320133,-0.23522042,19.498522,915000
|
| 85 |
+
1.0,0.99999994,0.031383,3.1383004,1.0313829,1.2917235,-0.32668298,-75.70513,-155.98402,0.16825162,-0.22967301,17.004498,920000
|
| 86 |
+
1.0,1.0000001,0.029208746,2.9208746,1.0292089,2.0999205,0.118010744,-77.31284,-192.49301,0.41868868,-0.2002792,23.024845,925000
|
| 87 |
+
1.0,1.0,0.03021834,3.021834,1.0302184,1.4082173,4.3368607,-74.09452,-157.00473,0.25990027,-0.5130353,22.147058,930000
|
| 88 |
+
1.0,1.0000001,0.030324666,3.0324664,1.0303248,1.3120235,-4.062712,-77.09051,-186.57077,0.35051495,-0.3217945,18.651766,935000
|
| 89 |
+
1.0,1.0,0.031158257,3.1158257,1.0311582,1.1614254,-0.22409798,-71.79646,-176.35176,0.15762524,-0.30571327,16.429932,940000
|
| 90 |
+
1.0,1.0,0.031283878,3.1283877,1.0312839,1.0423069,-3.849921,-77.490234,-143.36201,0.57466376,-0.5925511,15.984029,945000
|
| 91 |
+
1.0,1.0,0.02795937,2.795937,1.0279593,0.9363171,-2.9288266,-73.757774,-165.93112,0.21723905,-0.23706955,14.024564,950000
|
| 92 |
+
1.0,1.0,0.031464864,3.1464865,1.0314648,1.3048204,-1.6777456,-74.71749,-155.34308,0.22621632,-0.21026841,14.62136,955000
|
| 93 |
+
1.0,1.0,0.02959936,2.959936,1.0295993,1.2129326,0.5961497,-72.73693,-151.47598,0.159593,-0.24496,15.932545,960000
|
| 94 |
+
1.0,1.0,0.029690074,2.9690075,1.02969,1.1740359,-1.1010258,-73.72134,-144.22054,0.1407535,-0.27483875,14.891957,965000
|
| 95 |
+
1.0,1.0,0.032308772,3.2308774,1.0323088,1.5507258,-2.15166,-73.04394,-143.32477,0.40238875,-0.30739444,22.210897,970000
|
| 96 |
+
1.0,1.0,0.029195502,2.9195504,1.0291955,1.305962,4.7949643,-73.69378,-171.29778,0.38938087,-0.21890551,16.836071,975000
|
| 97 |
+
1.0,1.0000001,0.030809822,3.0809824,1.03081,1.7242422,1.1164567,-73.571625,-150.37857,0.8975912,-0.8414911,33.335632,980000
|
| 98 |
+
1.0,1.0,0.031096717,3.1096718,1.0310967,1.2215202,1.430079,-71.48467,-181.58261,0.51951766,-0.4130411,16.450691,985000
|
| 99 |
+
1.0,1.0,0.03090405,3.090405,1.030904,2.7367492,-0.5595513,-74.31366,-157.20044,0.56621003,-0.64196944,34.19162,990000
|
| 100 |
+
1.0,1.0,0.030094117,3.0094118,1.0300941,2.5589688,1.3449925,-67.347244,-165.45395,0.32833928,-0.30099905,20.168728,995000
|
| 101 |
+
1.0,1.0,0.03145179,3.1451793,1.0314518,1.3668126,1.1351964,-71.38733,-157.54648,0.42768312,-0.36670828,19.791334,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/action_std,actor/actor_loss,actor/bc_loss,actor/mse,actor/total_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
|
| 2 |
+
1.0,1.0,0.025410943,2.5410943,1.0254109,0.6865036,-24.974669,-102.93029,-179.41916,0.12654576,-0.10546045,9.12171,505000
|
| 3 |
+
1.0,1.0,0.025060683,2.5060682,1.0250607,0.782943,-21.23974,-102.35262,-175.97856,0.11903742,-0.2107001,11.693334,510000
|
| 4 |
+
1.0,0.99999994,0.022867696,2.2867696,1.0228677,0.71515316,-26.577238,-103.82975,-178.77844,0.18020111,-0.15395957,13.160402,515000
|
| 5 |
+
1.0,1.0000001,0.022416048,2.2416048,1.0224161,0.9619643,-18.120338,-105.88897,-191.63484,0.10565561,-0.15439466,9.745169,520000
|
| 6 |
+
1.0,1.0,0.023058593,2.3058596,1.0230587,0.80849755,-33.990444,-106.04723,-188.48236,0.0919208,-0.17733589,10.229068,525000
|
| 7 |
+
1.0,1.0,0.022428637,2.242864,1.0224286,0.88605195,-34.510475,-104.84872,-190.34796,0.26262304,-0.2718877,12.804092,530000
|
| 8 |
+
1.0,1.0,0.022158973,2.215897,1.022159,0.8800613,-20.19318,-106.854065,-180.049,0.4487577,-0.60797226,18.583145,535000
|
| 9 |
+
1.0,1.0,0.02297491,2.297491,1.022975,1.5489773,-35.40843,-107.56136,-182.75642,0.83169043,-0.8705027,22.940176,540000
|
| 10 |
+
1.0,0.9999999,0.02196005,2.196005,1.0219599,1.2221813,-21.527563,-107.030334,-202.29256,0.19230473,-0.15571816,13.269623,545000
|
| 11 |
+
1.0,1.0,0.02354283,2.354283,1.0235429,1.5922931,-30.393694,-106.23435,-182.82527,0.3647646,-0.36432904,25.948217,550000
|
| 12 |
+
1.0,1.0,0.02536783,2.536783,1.0253679,2.0470092,-7.461494,-102.798416,-185.60269,0.35730273,-0.35765824,26.464296,555000
|
| 13 |
+
1.0,1.0,0.025287835,2.5287833,1.0252879,1.656799,-15.664715,-99.067535,-192.53185,0.3486125,-0.40872923,23.5306,560000
|
| 14 |
+
1.0,1.0,0.025409633,2.5409632,1.0254096,1.2570553,-3.1835854,-98.165215,-183.9281,0.20331134,-0.15948656,15.099241,565000
|
| 15 |
+
1.0,1.0,0.026977146,2.6977146,1.0269772,1.5246799,-5.377539,-93.98988,-203.5072,0.53823256,-0.32634777,19.555496,570000
|
| 16 |
+
1.0,1.0,0.027086522,2.7086523,1.0270865,1.4368721,-11.199528,-96.73852,-182.21834,0.24647173,-0.18685284,17.039223,575000
|
| 17 |
+
1.0,1.0,0.026504228,2.6504228,1.0265043,1.5081205,-8.48454,-98.8531,-191.9634,2.3308961,-1.850974,34.224102,580000
|
| 18 |
+
1.0,1.0,0.02576692,2.5766923,1.025767,1.8606566,-3.8789434,-98.45335,-190.37073,0.67826074,-0.6375243,28.902344,585000
|
| 19 |
+
1.0,1.0,0.026975406,2.6975408,1.0269754,1.959246,-5.51579,-95.957054,-182.71729,0.29508334,-0.49208122,21.159958,590000
|
| 20 |
+
1.0,1.0,0.026802046,2.6802046,1.0268021,1.4234171,0.15374969,-99.05247,-190.38115,0.29551995,-0.31371152,18.348816,595000
|
| 21 |
+
1.0,1.0,0.025772886,2.5772886,1.0257729,1.4451106,-7.3733506,-94.00695,-181.8485,0.3867184,-0.21249662,18.776222,600000
|
| 22 |
+
1.0,1.0,0.025315017,2.5315015,1.025315,1.5138313,-2.2273512,-96.4674,-185.30692,0.47865117,-0.48974037,25.880524,605000
|
| 23 |
+
1.0,1.0,0.0266723,2.6672301,1.0266722,2.1488817,-5.6067986,-96.552956,-183.28654,0.26760864,-0.2435858,24.558426,610000
|
| 24 |
+
1.0,0.9999829,0.025494866,2.5494866,1.0254778,1.0669516,0.91773045,-92.092155,-187.76794,0.21168384,-0.17381403,13.467963,615000
|
| 25 |
+
1.0,1.0,0.025314126,2.5314126,1.0253141,1.2720234,-2.675796,-92.4444,-183.03299,0.33386025,-0.3393581,19.480377,620000
|
| 26 |
+
1.0,1.0,0.027017578,2.701758,1.0270176,1.4993012,-6.6765513,-95.94484,-183.22258,0.2522036,-0.28925097,18.498175,625000
|
| 27 |
+
1.0,1.0,0.027048767,2.704877,1.0270488,1.5519892,-8.114893,-93.80342,-180.27388,0.2771563,-0.2918598,18.34594,630000
|
| 28 |
+
1.0,0.99987274,0.026558477,2.6558478,1.0264312,1.1272588,1.9102526,-91.50371,-178.6441,0.24042335,-0.2702937,14.406121,635000
|
| 29 |
+
1.0,1.0,0.028039351,2.8039353,1.0280393,1.7223685,-9.093226,-86.850395,-172.73402,0.7245283,-0.6399443,26.972328,640000
|
| 30 |
+
1.0,0.99999994,0.02888504,2.8885043,1.028885,2.878331,-8.063931,-90.840324,-196.6282,0.51324904,-0.6023001,33.034588,645000
|
| 31 |
+
1.0,1.0000001,0.027982622,2.7982624,1.0279827,1.1062393,-5.241204,-88.42275,-185.41507,0.18195322,-0.23971614,13.476558,650000
|
| 32 |
+
1.0,1.0,0.025657937,2.5657938,1.0256579,7.537431,-8.530247,-89.03199,-178.08403,1.7140052,-1.5738974,71.02468,655000
|
| 33 |
+
1.0,1.0000001,0.027786827,2.7786827,1.027787,1.5730733,-1.5423744,-90.65618,-186.25743,0.7338078,-0.7197376,21.952858,660000
|
| 34 |
+
1.0,1.0,0.027109401,2.7109401,1.0271094,1.2187889,-1.1917478,-89.2444,-177.62567,0.16974652,-0.18100452,14.306935,665000
|
| 35 |
+
1.0,1.0,0.03190776,3.1907763,1.0319078,2.7649481,-13.716895,-86.36326,-172.87323,0.5341985,-0.6053363,34.39742,670000
|
| 36 |
+
1.0,1.0,0.02943724,2.9437242,1.0294372,1.4414328,-3.073575,-89.84759,-189.76178,0.21206269,-0.13885272,14.759348,675000
|
| 37 |
+
1.0,1.0,0.028243726,2.8243728,1.0282438,2.535841,0.4118026,-89.66458,-196.55864,0.6208907,-0.88009065,35.95955,680000
|
| 38 |
+
1.0,0.99999994,0.028554594,2.8554595,1.0285546,1.8549168,-8.67231,-84.80662,-167.81204,0.28377447,-0.2502568,21.625198,685000
|
| 39 |
+
1.0,1.0,0.027132098,2.7132096,1.0271322,2.4195278,-1.9693551,-83.33007,-194.82904,0.703107,-0.90457225,32.69143,690000
|
| 40 |
+
1.0,0.99999994,0.030175608,3.017561,1.0301756,1.4010524,-4.020889,-83.97118,-194.78273,0.7693731,-0.7325906,21.567785,695000
|
| 41 |
+
1.0,1.0,0.028594166,2.859417,1.0285941,1.4510701,-4.5949674,-84.95441,-193.40576,0.41576916,-0.5511275,23.894108,700000
|
| 42 |
+
1.0,0.99999994,0.029518355,2.9518356,1.0295182,1.4867847,-4.1052775,-83.21893,-156.86475,0.23773536,-0.24819325,17.742817,705000
|
| 43 |
+
1.0,1.0,0.028720919,2.872092,1.028721,1.3276224,1.2356395,-83.917274,-165.66574,0.3606796,-0.5344254,22.902302,710000
|
| 44 |
+
1.0,0.99999994,0.029612493,2.9612494,1.0296124,1.3033727,-0.37460423,-85.26497,-171.70792,0.24477744,-0.28364277,17.124096,715000
|
| 45 |
+
1.0,1.0,0.02795872,2.7958722,1.0279588,1.2548304,-5.811518,-83.31936,-179.61902,0.22430286,-0.27280387,15.189444,720000
|
| 46 |
+
1.0,1.0,0.028944084,2.8944085,1.0289441,1.8260239,-6.10352,-82.67244,-156.14793,0.31743553,-0.29297668,22.943546,725000
|
| 47 |
+
1.0,0.99999994,0.030226102,3.0226102,1.030226,1.8917888,-3.0537846,-86.14532,-174.218,0.31276563,-0.30630544,26.6586,730000
|
| 48 |
+
1.0,1.0,0.029247759,2.924776,1.0292478,1.5075599,1.1659265,-86.93462,-176.46257,0.31568512,-0.44524336,22.60336,735000
|
| 49 |
+
1.0,0.9998121,0.029418273,2.9418273,1.0292304,1.3514868,3.301708,-85.77549,-194.05617,0.3139456,-0.3451441,19.779512,740000
|
| 50 |
+
1.0,1.0,0.029713437,2.9713438,1.0297134,1.2611574,-2.635559,-84.300125,-182.99535,0.39628285,-0.31582594,18.523548,745000
|
| 51 |
+
1.0,0.99999994,0.02751282,2.7512822,1.0275128,1.2267185,0.14573511,-79.48733,-192.9651,0.21637286,-0.22638719,15.386296,750000
|
| 52 |
+
1.0,1.0,0.028825622,2.8825624,1.0288256,2.1232147,-6.150314,-86.681595,-170.16281,0.8915199,-0.9380819,43.803474,755000
|
| 53 |
+
1.0,1.0,0.029262304,2.9262304,1.0292623,1.4965184,1.7977626,-82.80813,-173.2857,0.20536266,-0.2498822,18.22322,760000
|
| 54 |
+
1.0,1.0,0.028649982,2.8649983,1.0286499,1.5094092,-4.7082872,-81.4304,-182.23016,0.2892022,-0.18249023,20.20559,765000
|
| 55 |
+
1.0,0.9999999,0.026993526,2.6993525,1.0269934,1.2577406,-0.35468614,-82.48976,-161.12798,0.17738114,-0.20674208,16.092731,770000
|
| 56 |
+
1.0,1.0,0.028099157,2.809916,1.0280992,6.419037,-8.969891,-85.33965,-186.48456,1.0860205,-1.0640181,77.68452,775000
|
| 57 |
+
1.0,1.0,0.028319696,2.8319697,1.0283197,1.5179636,2.53469,-82.93361,-165.26172,0.19580814,-0.20031427,18.921488,780000
|
| 58 |
+
1.0,1.0,0.02886528,2.8865283,1.0288653,1.0883429,-1.8060315,-82.2486,-172.96414,0.43229896,-0.22924843,15.116756,785000
|
| 59 |
+
1.0,0.99999994,0.028379623,2.8379622,1.0283796,2.2870119,-1.7035887,-81.09949,-192.65506,0.4683863,-0.287018,25.77564,790000
|
| 60 |
+
1.0,0.9999958,0.029317245,2.9317248,1.0293131,1.7061099,2.1004124,-80.7593,-173.84407,0.22851695,-0.20628393,19.494522,795000
|
| 61 |
+
1.0,1.0,0.028401732,2.8401732,1.0284017,1.3343986,-3.9526892,-84.31293,-177.33226,0.37323084,-0.3827526,18.30392,800000
|
| 62 |
+
1.0,1.0,0.030219626,3.0219626,1.0302197,2.0977638,-5.8785744,-84.39987,-166.58086,0.8341387,-0.6651324,36.37857,805000
|
| 63 |
+
1.0,1.0000001,0.030042592,3.004259,1.0300428,1.0520374,3.8584266,-81.118614,-183.71269,0.10442688,-0.16104795,12.439722,810000
|
| 64 |
+
1.0,0.9999999,0.028126182,2.8126183,1.0281261,1.24166,-0.94159955,-82.13251,-166.59154,0.4749075,-0.5092092,16.773575,815000
|
| 65 |
+
1.0,1.0,0.029176682,2.9176683,1.0291767,1.543215,-2.3737683,-81.8475,-177.4524,0.29355282,-0.3481551,22.53749,820000
|
| 66 |
+
1.0,0.9999999,0.029865805,2.9865804,1.0298657,1.6252774,1.4570118,-80.51342,-173.79721,0.74526644,-0.27937415,22.777,825000
|
| 67 |
+
1.0,1.0,0.029597122,2.9597125,1.0295972,1.7556679,-2.286252,-79.58232,-162.34122,0.45968282,-0.31354663,23.754913,830000
|
| 68 |
+
1.0,1.0,0.02896733,2.896733,1.0289674,1.8895886,0.38186955,-78.493385,-192.15854,0.2997719,-0.30900258,23.367275,835000
|
| 69 |
+
1.0,1.0,0.0308696,3.0869598,1.0308696,1.4942139,0.1608458,-79.11062,-164.07074,0.2096849,-0.19404967,17.13427,840000
|
| 70 |
+
1.0,1.0,0.02735312,2.735312,1.0273532,1.3932456,-0.2903636,-82.79846,-181.54291,1.6530524,-1.5789057,40.98786,845000
|
| 71 |
+
1.0,1.0,0.027944218,2.794422,1.0279442,1.550975,1.3182546,-77.56123,-180.35826,0.45856073,-0.8199188,25.036987,850000
|
| 72 |
+
1.0,0.99999994,0.02796571,2.796571,1.0279657,1.4880016,0.29854482,-80.68373,-159.48862,0.34835768,-0.20721327,21.336185,855000
|
| 73 |
+
1.0,1.0,0.029235937,2.9235938,1.029236,1.9323953,-1.0218707,-77.69029,-182.01926,0.41750938,-1.3531325,28.433817,860000
|
| 74 |
+
1.0,1.0,0.027836239,2.783624,1.0278362,1.365343,-0.67144346,-79.012344,-167.63707,0.16706753,-0.48343503,18.832344,865000
|
| 75 |
+
1.0,1.0,0.028775904,2.8775904,1.0287759,9.034078,-0.71063036,-78.23907,-179.53859,4.3901296,-4.6447697,93.88536,870000
|
| 76 |
+
1.0,1.0,0.027554054,2.7554054,1.027554,1.3572859,0.57545125,-78.30064,-188.02393,0.18430167,-0.20863762,18.130116,875000
|
| 77 |
+
1.0,0.9999999,0.028011702,2.8011703,1.0280116,2.4466848,-3.098978,-77.63776,-167.76212,0.579199,-0.60090464,30.958942,880000
|
| 78 |
+
1.0,1.0000001,0.027840976,2.7840977,1.0278411,1.3382999,-3.9815316,-77.92391,-167.61919,0.18921937,-0.2882311,18.323992,885000
|
| 79 |
+
1.0,1.0,0.030590605,3.0590606,1.0305907,1.4504688,0.42903644,-80.802795,-173.10107,0.25774246,-0.24602164,16.73123,890000
|
| 80 |
+
1.0,1.0,0.03074963,3.074963,1.0307497,1.5019183,1.301219,-80.658775,-167.75356,0.20403384,-0.22687142,19.147058,895000
|
| 81 |
+
1.0,1.0000001,0.028131772,2.8131773,1.0281318,1.4104862,-0.9105861,-74.981606,-146.83203,0.39182857,-0.38005584,25.282368,900000
|
| 82 |
+
1.0,1.0,0.029539408,2.9539409,1.0295395,1.2440677,0.11218046,-76.71696,-175.00394,0.18053626,-0.34083503,16.08099,905000
|
| 83 |
+
1.0,1.0,0.030927394,3.0927396,1.0309274,1.4707477,-2.752386,-77.31771,-154.08267,1.2603273,-1.2217491,30.029121,910000
|
| 84 |
+
1.0,0.99999994,0.027832251,2.783225,1.0278322,1.6333259,-0.68634176,-75.63672,-147.8456,0.32320133,-0.23522042,19.498522,915000
|
| 85 |
+
1.0,0.99999994,0.031383,3.1383004,1.0313829,1.2917235,-0.32668298,-75.70513,-155.98402,0.16825162,-0.22967301,17.004498,920000
|
| 86 |
+
1.0,1.0000001,0.029208746,2.9208746,1.0292089,2.0999205,0.118010744,-77.31284,-192.49301,0.41868868,-0.2002792,23.024845,925000
|
| 87 |
+
1.0,1.0,0.03021834,3.021834,1.0302184,1.4082173,4.3368607,-74.09452,-157.00473,0.25990027,-0.5130353,22.147058,930000
|
| 88 |
+
1.0,1.0000001,0.030324666,3.0324664,1.0303248,1.3120235,-4.062712,-77.09051,-186.57077,0.35051495,-0.3217945,18.651766,935000
|
| 89 |
+
1.0,1.0,0.031158257,3.1158257,1.0311582,1.1614254,-0.22409798,-71.79646,-176.35176,0.15762524,-0.30571327,16.429932,940000
|
| 90 |
+
1.0,1.0,0.031283878,3.1283877,1.0312839,1.0423069,-3.849921,-77.490234,-143.36201,0.57466376,-0.5925511,15.984029,945000
|
| 91 |
+
1.0,1.0,0.02795937,2.795937,1.0279593,0.9363171,-2.9288266,-73.757774,-165.93112,0.21723905,-0.23706955,14.024564,950000
|
| 92 |
+
1.0,1.0,0.031464864,3.1464865,1.0314648,1.3048204,-1.6777456,-74.71749,-155.34308,0.22621632,-0.21026841,14.62136,955000
|
| 93 |
+
1.0,1.0,0.02959936,2.959936,1.0295993,1.2129326,0.5961497,-72.73693,-151.47598,0.159593,-0.24496,15.932545,960000
|
| 94 |
+
1.0,1.0,0.029690074,2.9690075,1.02969,1.1740359,-1.1010258,-73.72134,-144.22054,0.1407535,-0.27483875,14.891957,965000
|
| 95 |
+
1.0,1.0,0.032308772,3.2308774,1.0323088,1.5507258,-2.15166,-73.04394,-143.32477,0.40238875,-0.30739444,22.210897,970000
|
| 96 |
+
1.0,1.0,0.029195502,2.9195504,1.0291955,1.305962,4.7949643,-73.69378,-171.29778,0.38938087,-0.21890551,16.836071,975000
|
| 97 |
+
1.0,1.0000001,0.030809822,3.0809824,1.03081,1.7242422,1.1164567,-73.571625,-150.37857,0.8975912,-0.8414911,33.335632,980000
|
| 98 |
+
1.0,1.0,0.031096717,3.1096718,1.0310967,1.2215202,1.430079,-71.48467,-181.58261,0.51951766,-0.4130411,16.450691,985000
|
| 99 |
+
1.0,1.0,0.03090405,3.090405,1.030904,2.7367492,-0.5595513,-74.31366,-157.20044,0.56621003,-0.64196944,34.19162,990000
|
| 100 |
+
1.0,1.0,0.030094117,3.0094118,1.0300941,2.5589688,1.3449925,-67.347244,-165.45395,0.32833928,-0.30099905,20.168728,995000
|
| 101 |
+
1.0,1.0,0.03145179,3.1451793,1.0314518,1.3668126,1.1351964,-71.38733,-157.54648,0.42768312,-0.36670828,19.791334,1000000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_1000000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:34f475892ddfa5f61b764f7ce9068313e75ab1e13390446f9abde13bb57c6ca5
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d27db992db54100d636548730a1a0b3e0e8ded770fba045fafba9cd456c799a8
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aca3149de1e37e16a8d5e3184efedefad8c70b3e2be0487dcc6a95c2c678ce5f
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:665d6aed4658ec71f66812bbb5693f4a458feb4a6fc14e57c3acf14ce88c8354
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8423c6130460ad747087e425cad1930d042719e94271868c119fcd2f1195e3e4
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_750000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75e846298a27f5e4aa22a4d8a4d41270baab108d5624f1dfdd395dffe57cf9d9
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_800000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8c3b3511d6ebb682317d4eca01602ad90b667b51aa77d7e08a6cd6c9614b56b
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_850000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a6f20b5a3cd74ff8c531ad0890c4342a1937f6d240f2d94756189be9dae46c5
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_900000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:17c5bb18c93d947c1c5aaa7b619916f9013cd62aafe8bc282ddb03f30491dce7
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/params_950000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dafd33fc29a9d619257e8d786318386fb037fd0ab789a899bcd2f465d5c35ed9
|
| 3 |
+
size 217655954
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/cube-double-play-singletask-task2-v0/rebrac/20260311_150935/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/eekwskuj
|