Upload folder using huggingface_hub
Browse files- .gitattributes +10 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/env.csv +0 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/env_sv.csv +0 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/eval.csv +11 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/eval_sv.csv +11 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/online_agent.csv +101 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/online_agent_sv.csv +101 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_250000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_300000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_350000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_400000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_450000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_500000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_550000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_600000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_650000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/params_700000.pkl +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/progress.tk +1 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/token.tk +1 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_250000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_300000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_350000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_400000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_450000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_500000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_550000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_600000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_650000.png +3 -0
- O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_700000.png +3 -0
.gitattributes
CHANGED
|
@@ -630,3 +630,13 @@ O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_450000.png filter=lfs diff=
|
|
| 630 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_500000.png filter=lfs diff=lfs merge=lfs -text
|
| 631 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
|
| 632 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_600000.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 630 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_500000.png filter=lfs diff=lfs merge=lfs -text
|
| 631 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
|
| 632 |
O2O-w-diff-ckpts/ifql/20260316_131424/visited_states_600000.png filter=lfs diff=lfs merge=lfs -text
|
| 633 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_250000.png filter=lfs diff=lfs merge=lfs -text
|
| 634 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_300000.png filter=lfs diff=lfs merge=lfs -text
|
| 635 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_350000.png filter=lfs diff=lfs merge=lfs -text
|
| 636 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_400000.png filter=lfs diff=lfs merge=lfs -text
|
| 637 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_450000.png filter=lfs diff=lfs merge=lfs -text
|
| 638 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_500000.png filter=lfs diff=lfs merge=lfs -text
|
| 639 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
|
| 640 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_600000.png filter=lfs diff=lfs merge=lfs -text
|
| 641 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_650000.png filter=lfs diff=lfs merge=lfs -text
|
| 642 |
+
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_700000.png filter=lfs diff=lfs merge=lfs -text
|
O2O-w-diff-ckpts/ifql/20260316_182227/env.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/ifql/20260316_182227/env_sv.csv
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
O2O-w-diff-ckpts/ifql/20260316_182227/eval.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,6.51424767603725,0.9100825324008239,0.04045872428369031,0.9129895451275379,0.04512074617838393,0.0,25500.0,-1.0,-1000.0,1000.0,1.8291082000732422,250000
|
| 3 |
+
0.0,0.0,15.67396506209857,2.1578120367600975,-0.043636517545263424,2.156660234021784,0.014543634120793824,0.0,77500.0,-1.0,-1000.0,1000.0,1.8158960294723512,300000
|
| 4 |
+
0.0,0.0,18.891472867585318,2.582006869383151,0.04342744170334991,2.585358420579039,0.02650152422861129,0.0,129500.0,-1.0,-1000.0,1000.0,1.8441482448577882,350000
|
| 5 |
+
0.0,0.0,20.895261473090045,2.8277794801435094,-0.0227559947051088,2.820924074710993,-0.11345823209519804,0.0,181500.0,-1.0,-1000.0,1000.0,1.819699821472168,400000
|
| 6 |
+
0.0,0.0,24.598291834908913,3.3094243868883266,-0.04475211499095904,3.305484194754799,-0.00993176341498391,0.0,233500.0,-1.0,-1000.0,1000.0,1.8244494009017944,450000
|
| 7 |
+
0.0,0.0,27.330782576888865,3.677012472985521,-0.006798123982638852,3.6789961419882116,0.04900321370583133,0.02,285452.96,-0.98,-998.86,998.88,1.8165232181549071,500000
|
| 8 |
+
0.0,0.0,29.26271985983331,3.9702510759026404,0.049703529858560094,3.9746835175179984,0.03794926367514683,0.0,337444.0,-1.0,-1000.0,1000.0,1.8270413589477539,550000
|
| 9 |
+
0.0,0.0,29.14351072490581,3.9847162006150345,0.04695028450368142,3.984327153907498,-0.03865418926901417,0.0,389444.0,-1.0,-1000.0,1000.0,1.821832628250122,600000
|
| 10 |
+
0.0,0.0,26.64425635460772,3.6154850853269798,-0.010348842511728084,3.618104467540578,0.05374188263387629,0.02,441410.34,-0.98,-998.96,998.98,1.8267197179794312,650000
|
| 11 |
+
0.0,0.0,30.619719582836296,4.159841613071046,0.03526678153816263,4.162219461295356,-0.0023022243635685033,0.0,493393.0,-1.0,-1000.0,1000.0,1.8226502227783203,700000
|
O2O-w-diff-ckpts/ifql/20260316_182227/eval_sv.csv
ADDED
|
@@ -0,0 +1,11 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
|
| 2 |
+
0.0,0.0,6.51424767603725,0.9100825324008239,0.04045872428369031,0.9129895451275379,0.04512074617838393,0.0,25500.0,-1.0,-1000.0,1000.0,1.8291082000732422,250000
|
| 3 |
+
0.0,0.0,15.67396506209857,2.1578120367600975,-0.043636517545263424,2.156660234021784,0.014543634120793824,0.0,77500.0,-1.0,-1000.0,1000.0,1.8158960294723512,300000
|
| 4 |
+
0.0,0.0,18.891472867585318,2.582006869383151,0.04342744170334991,2.585358420579039,0.02650152422861129,0.0,129500.0,-1.0,-1000.0,1000.0,1.8441482448577882,350000
|
| 5 |
+
0.0,0.0,20.895261473090045,2.8277794801435094,-0.0227559947051088,2.820924074710993,-0.11345823209519804,0.0,181500.0,-1.0,-1000.0,1000.0,1.819699821472168,400000
|
| 6 |
+
0.0,0.0,24.598291834908913,3.3094243868883266,-0.04475211499095904,3.305484194754799,-0.00993176341498391,0.0,233500.0,-1.0,-1000.0,1000.0,1.8244494009017944,450000
|
| 7 |
+
0.0,0.0,27.330782576888865,3.677012472985521,-0.006798123982638852,3.6789961419882116,0.04900321370583133,0.02,285452.96,-0.98,-998.86,998.88,1.8165232181549071,500000
|
| 8 |
+
0.0,0.0,29.26271985983331,3.9702510759026404,0.049703529858560094,3.9746835175179984,0.03794926367514683,0.0,337444.0,-1.0,-1000.0,1000.0,1.8270413589477539,550000
|
| 9 |
+
0.0,0.0,29.14351072490581,3.9847162006150345,0.04695028450368142,3.984327153907498,-0.03865418926901417,0.0,389444.0,-1.0,-1000.0,1000.0,1.821832628250122,600000
|
| 10 |
+
0.0,0.0,26.64425635460772,3.6154850853269798,-0.010348842511728084,3.618104467540578,0.05374188263387629,0.02,441410.34,-0.98,-998.96,998.98,1.8267197179794312,650000
|
| 11 |
+
0.0,0.0,30.619719582836296,4.159841613071046,0.03526678153816263,4.162219461295356,-0.0023022243635685033,0.0,493393.0,-1.0,-1000.0,1000.0,1.8226502227783203,700000
|
O2O-w-diff-ckpts/ifql/20260316_182227/online_agent.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,value/v_max,value/v_mean,value/v_min,value/value_loss,step
|
| 2 |
+
0.38895607,1.1459874,-8.023321,-154.16956,-285.7999,6.9051113,-5.7756853,86.15816,-6.027101,-153.93439,-286.19492,0.3381335,205000
|
| 3 |
+
0.36215258,1.4650327,-5.1131225,-151.47333,-191.80055,27.35391,-18.26819,182.8132,-1.8781186,-151.08327,-191.75737,0.54415095,210000
|
| 4 |
+
0.33249968,1.4592159,-22.344532,-156.4974,-274.36185,12.778899,-14.72248,115.60741,-20.704744,-156.32758,-274.74,0.23940316,215000
|
| 5 |
+
0.29745036,0.7721874,-16.394876,-156.21716,-231.54044,2.5777168,-4.015804,50.538147,-16.597677,-156.0427,-231.73213,0.30951485,220000
|
| 6 |
+
0.34066513,9.347129,0.0,-152.4719,-198.32065,34.30968,-41.245148,318.87253,-1.6165652,-152.42628,-198.3146,2.0894406,225000
|
| 7 |
+
0.3352921,1.0191942,0.0,-154.00574,-259.2318,3.6025524,-3.9891133,56.691288,-0.41851416,-153.818,-259.5941,0.22199002,230000
|
| 8 |
+
0.3894788,3.1622465,0.0,-153.44302,-216.03697,11.966342,-7.410068,139.7605,-2.1268525,-153.02217,-216.22205,0.7228104,235000
|
| 9 |
+
0.4020131,1.8590252,-0.97867864,-155.03091,-247.9232,9.626582,-7.603983,131.82523,-0.67672324,-154.63333,-248.20241,0.30800617,240000
|
| 10 |
+
0.34633887,3.6556194,-12.318881,-157.16595,-201.31711,38.705143,-26.337435,440.37723,-10.015143,-156.8692,-201.29709,3.6712856,245000
|
| 11 |
+
0.34088132,1.9215899,0.0,-155.91951,-238.0665,11.313725,-10.192516,125.95436,-0.6221231,-155.68518,-238.25192,0.41761965,250000
|
| 12 |
+
0.29637113,1.3830566,0.0,-154.72021,-209.41435,10.801954,-8.9390135,104.36485,-1.3456665,-154.51451,-209.46257,0.4007556,255000
|
| 13 |
+
0.33660156,2.195641,-31.182655,-157.98352,-228.10663,5.2380724,-3.9788046,84.18315,-30.638634,-157.82372,-228.27707,0.2778053,260000
|
| 14 |
+
0.34530523,1.567449,-27.80474,-159.6785,-206.74095,11.3519535,-15.081514,119.6877,-28.333115,-159.4159,-206.77808,0.39377737,265000
|
| 15 |
+
0.32150707,1.4123309,-12.283138,-159.51833,-199.82657,4.4248314,-6.09235,76.31562,-11.678349,-159.41756,-199.82484,0.24027306,270000
|
| 16 |
+
0.34712544,1.756699,0.0,-161.76465,-216.36948,56.528004,-63.03217,337.55145,-1.7867435,-161.60954,-216.52136,0.3661632,275000
|
| 17 |
+
0.32878333,1.0143584,-11.0198765,-157.32642,-206.30817,2.4421978,-2.3000662,50.786232,-11.479675,-157.20152,-206.3456,0.20833436,280000
|
| 18 |
+
0.30892116,3.4381764,-15.311848,-160.48894,-208.1654,4.5370684,-6.5582676,87.501755,-12.760204,-160.20673,-208.31268,0.41478372,285000
|
| 19 |
+
0.31111306,2.1020439,-14.430047,-157.25104,-205.50548,3.338995,-2.4156923,64.01194,-13.820369,-157.00842,-205.56886,0.35928196,290000
|
| 20 |
+
0.31951267,1.3935426,0.0,-155.28784,-207.25316,52.993294,-86.175125,480.73132,0.2337363,-155.1397,-207.29337,1.0627406,295000
|
| 21 |
+
0.36682346,1.3334281,-0.8696497,-158.38965,-204.91348,7.2202644,-8.783162,103.86866,-0.11175713,-158.03897,-204.93405,1.9945834,300000
|
| 22 |
+
0.28132486,1.4075319,-32.716873,-160.57619,-208.70454,7.032765,-9.227086,95.109116,-5.1515675,-160.32712,-208.7497,0.94384605,305000
|
| 23 |
+
0.28736496,2.1811128,-16.85251,-157.09885,-214.18866,28.59894,-16.320822,174.67766,-16.843748,-156.73636,-214.25465,0.8440038,310000
|
| 24 |
+
0.3269183,0.89288515,-5.521922,-164.34515,-209.6293,4.3263936,-1.9947473,42.941593,-8.973211,-164.25587,-209.67003,0.3278848,315000
|
| 25 |
+
0.3049274,0.8984165,-19.894953,-162.2039,-209.3276,3.4906392,-6.584749,57.89332,-21.19858,-162.04651,-209.34676,0.20530927,320000
|
| 26 |
+
0.3139879,1.1498607,-31.157488,-162.465,-207.81296,4.914736,-3.4530313,55.34141,-29.43744,-162.0824,-207.87419,0.4626484,325000
|
| 27 |
+
0.33991152,1.8374968,-13.520956,-161.37997,-223.85962,8.165795,-4.673163,82.14899,-11.942598,-161.33292,-223.94907,0.2554024,330000
|
| 28 |
+
0.32328776,0.5299954,-54.725677,-164.10078,-221.50966,2.432256,-1.8227676,38.498016,-55.188675,-164.02133,-221.61613,0.17324558,335000
|
| 29 |
+
0.27960515,3.149083,-44.430805,-164.26456,-195.25613,25.204416,-27.131033,328.94815,-45.102264,-164.01932,-194.96193,1.1670754,340000
|
| 30 |
+
0.34235728,2.9082284,-17.445591,-158.80972,-194.84793,4.443536,-4.220748,92.90235,-17.632383,-158.47888,-194.81995,0.2855368,345000
|
| 31 |
+
0.3542427,1.1398394,-22.204966,-164.1947,-210.45117,4.657018,-3.9662857,63.709785,-21.143444,-163.89432,-210.51944,0.24233939,350000
|
| 32 |
+
0.33068347,1.602668,-41.16954,-163.26572,-210.52132,6.3647256,-5.9017887,87.13621,-43.089485,-163.14706,-210.57414,0.15984413,355000
|
| 33 |
+
0.34408593,1.1893405,0.0,-161.13791,-259.33234,23.950937,-16.94721,152.44756,-2.039895,-160.79202,-259.4825,0.565673,360000
|
| 34 |
+
0.2971474,0.85874176,-31.694319,-163.82977,-262.84592,4.2994127,-4.278463,52.889168,-30.505825,-163.62332,-263.02362,0.21694891,365000
|
| 35 |
+
0.33193517,1.4576254,0.0,-162.58199,-267.6384,5.606421,-7.889426,85.06308,-1.7238935,-162.23354,-268.00766,0.32752073,370000
|
| 36 |
+
0.31724787,0.48442093,-17.645044,-162.95515,-206.4429,1.8124224,-4.8335605,36.711445,-17.796114,-162.80045,-206.46526,0.15575269,375000
|
| 37 |
+
0.35783023,0.85393155,-1.3888738,-157.42584,-196.27078,4.468623,-3.8017097,53.17748,-0.5375773,-157.28378,-196.33447,0.30301356,380000
|
| 38 |
+
0.3250208,1.1961311,-2.7587757,-168.04585,-296.81308,7.4914465,-7.9910717,96.49004,-1.5394409,-167.7751,-297.30142,0.25317836,385000
|
| 39 |
+
0.31779426,1.326642,-38.76303,-161.832,-254.54294,2.7115948,-2.8889415,50.192963,-37.74073,-161.80032,-254.12128,0.2169945,390000
|
| 40 |
+
0.3368278,1.9531378,0.0,-166.17987,-296.62292,11.2186985,-8.563757,149.46371,-0.68581486,-165.98233,-297.12573,0.3964759,395000
|
| 41 |
+
0.27688313,1.6085911,0.0,-163.33781,-316.69302,12.677133,-17.299305,134.92946,-1.957585,-163.17957,-317.29678,0.7034955,400000
|
| 42 |
+
0.3392071,2.0947864,-20.975494,-160.3159,-320.65546,13.002868,-9.862699,139.57529,-21.222694,-159.96794,-321.27563,0.73103,405000
|
| 43 |
+
0.31921342,1.5830249,-56.89881,-166.06804,-324.99362,12.741311,-18.889694,106.455956,-57.091404,-165.88998,-325.6126,0.7822569,410000
|
| 44 |
+
0.34916443,0.6443264,0.0,-166.82887,-328.03473,3.46265,-8.610422,56.986538,-1.3001894,-166.66017,-328.66873,0.23444399,415000
|
| 45 |
+
0.2742551,1.4154208,0.0,-164.5264,-195.05745,2.9955578,-4.584632,64.84445,-0.79503703,-164.30109,-194.83537,0.22610542,420000
|
| 46 |
+
0.30260652,11.519561,0.0,-162.93819,-204.51207,45.04081,-63.977177,677.8869,-3.0755403,-162.92915,-204.53726,1.0000472,425000
|
| 47 |
+
0.31381828,0.8722275,-27.249044,-165.61469,-332.82892,3.977785,-5.7812734,57.225952,-28.185555,-165.48116,-333.4888,0.21208745,430000
|
| 48 |
+
0.29664358,1.2883025,0.0,-166.509,-196.9382,22.328526,-21.439503,195.45477,-1.251343,-166.29152,-196.89722,0.5212945,435000
|
| 49 |
+
0.36794603,0.9283401,-49.883568,-167.9715,-324.6735,1.8218297,-3.2032888,32.12303,-46.605434,-167.75494,-325.30173,0.103006065,440000
|
| 50 |
+
0.31414664,0.62466013,-21.697168,-167.63898,-316.74188,2.658507,-3.6459646,38.396954,-21.240658,-167.47787,-317.32806,0.24739404,445000
|
| 51 |
+
0.31709355,2.6343892,-1.344412,-167.39488,-304.27902,8.16689,-23.61968,180.52046,-1.5650662,-167.18518,-304.80258,0.38253522,450000
|
| 52 |
+
0.29631633,1.6307936,-8.008329,-163.48132,-293.33066,4.900776,-6.06609,103.38715,-8.207723,-163.17993,-293.7938,0.36651504,455000
|
| 53 |
+
0.33467656,0.838174,0.0,-164.72476,-207.83809,29.256275,-17.112556,118.3013,-4.1014075,-164.53868,-207.8844,0.43167114,460000
|
| 54 |
+
0.3354962,2.2102783,-45.92118,-166.49905,-260.17664,8.429345,-9.106382,148.28467,-47.04769,-166.19815,-260.48288,0.45539448,465000
|
| 55 |
+
0.33365455,3.9369721,-33.60886,-166.81857,-201.07404,35.097122,-21.186289,163.0788,-24.056795,-166.68616,-201.07922,0.92746955,470000
|
| 56 |
+
0.3075456,2.6993976,-27.12052,-165.1843,-192.74408,55.228996,-29.351711,245.40945,-27.675026,-165.10712,-192.67128,0.20747319,475000
|
| 57 |
+
0.33489138,1.0662405,0.0,-165.79712,-225.34248,20.653532,-11.030676,100.93453,-0.39020994,-165.67117,-225.48457,0.17177568,480000
|
| 58 |
+
0.3035646,0.90801966,0.0,-165.00026,-217.73576,5.33033,-11.507295,68.63527,-2.4053178,-164.99167,-217.8222,0.31648037,485000
|
| 59 |
+
0.31576514,1.3779168,-65.260315,-169.01096,-209.59125,7.732828,-3.7773502,61.745796,-52.588364,-168.73344,-209.62344,0.113849655,490000
|
| 60 |
+
0.32793683,1.248122,0.0,-162.80319,-196.2775,17.551708,-10.005285,120.970535,-0.31515867,-162.64919,-195.69092,0.29435045,495000
|
| 61 |
+
0.33151644,1.0471356,-40.79141,-165.66174,-193.8259,12.866778,-15.063683,115.074936,-39.939087,-165.35336,-193.80556,0.7738043,500000
|
| 62 |
+
0.37147984,0.72172266,-42.54347,-168.72055,-192.70735,4.3883686,-9.2205715,63.867558,-43.300007,-168.43813,-192.72173,0.41922802,505000
|
| 63 |
+
0.37915933,1.5850228,-31.870083,-167.89365,-199.2474,16.797968,-7.6672926,102.197174,-32.19967,-167.73117,-199.2447,0.6831566,510000
|
| 64 |
+
0.32890296,1.5233608,0.0,-164.69806,-197.59203,26.174818,-25.746653,182.83327,-0.35970336,-164.54353,-197.5815,1.1941671,515000
|
| 65 |
+
0.31823406,2.3713872,0.0,-167.68686,-195.18323,49.21918,-40.258934,312.1187,-0.7960643,-167.52628,-195.21164,0.8261391,520000
|
| 66 |
+
0.29580554,0.7107603,0.0,-162.37268,-192.656,4.649644,-4.2159653,50.660294,-0.30978104,-162.2027,-192.64612,0.41186374,525000
|
| 67 |
+
0.34832484,0.64572495,-23.32416,-168.57043,-199.80988,3.859827,-3.4247546,46.277412,-23.337622,-168.39316,-199.77548,0.13144381,530000
|
| 68 |
+
0.3577447,0.697692,-40.05087,-167.02026,-196.32822,11.803898,-24.34915,125.192665,-40.252697,-166.81628,-196.29364,0.5943298,535000
|
| 69 |
+
0.29141188,1.3090307,-40.67306,-168.16304,-198.7884,18.334515,-21.223045,204.83475,-36.520737,-167.93692,-198.78621,1.0797882,540000
|
| 70 |
+
0.29723245,1.1128327,-28.492414,-166.50067,-196.06703,17.8489,-9.154214,83.13708,-28.265974,-166.4075,-196.044,0.11226815,545000
|
| 71 |
+
0.30156514,2.681776,0.0,-168.30428,-193.12506,15.571805,-13.323311,131.09087,0.17259726,-168.18144,-193.01129,0.45844054,550000
|
| 72 |
+
0.30897838,1.178192,0.0,-165.57057,-198.24547,28.271055,-19.062948,185.70546,-14.060973,-165.3876,-198.23524,0.9979206,555000
|
| 73 |
+
0.3162534,0.69694257,-21.844488,-171.37712,-193.4012,14.974806,-11.245555,75.36484,-22.18447,-171.25621,-193.39804,0.19295853,560000
|
| 74 |
+
0.33968997,0.7113215,0.0,-165.77255,-197.89648,7.004684,-2.2743316,46.029205,-0.5630647,-165.71501,-197.88681,0.22963773,565000
|
| 75 |
+
0.33673137,1.680258,0.0,-165.90195,-193.71498,7.4061418,-6.697023,106.39426,0.1733625,-165.7558,-193.7961,0.3502025,570000
|
| 76 |
+
0.311005,1.2769196,0.0,-167.97845,-193.19672,7.148731,-36.50681,133.99702,-2.8555057,-167.80649,-193.23582,0.46303502,575000
|
| 77 |
+
0.33223206,1.1673977,-20.061491,-165.82664,-201.05345,10.995876,-24.528624,118.478485,-3.2541842,-165.58612,-200.83994,0.8786078,580000
|
| 78 |
+
0.33257073,1.1369628,-13.738224,-164.28595,-193.88477,13.067301,-20.391504,113.58153,-12.177857,-164.15591,-193.83705,0.36243463,585000
|
| 79 |
+
0.32379478,2.3715608,0.0,-166.56343,-193.4658,14.997203,-12.515535,151.2957,-2.008237,-166.41112,-193.50688,0.30846536,590000
|
| 80 |
+
0.3053699,0.915586,-41.145164,-168.84724,-195.71164,9.670061,-2.708492,49.85286,-42.67387,-168.72302,-195.686,0.21927473,595000
|
| 81 |
+
0.31559962,0.8232129,0.0,-165.41684,-199.05682,10.704342,-11.7628355,95.36957,-2.7533376,-165.31293,-199.0625,0.4139821,600000
|
| 82 |
+
0.3137985,0.7270572,-2.8363066,-164.97598,-193.28616,2.5251644,-2.9365318,44.863556,-1.3407148,-164.76529,-193.22342,0.18168834,605000
|
| 83 |
+
0.3237008,0.96550035,-1.9611297,-167.44775,-204.61269,1.4508791,-1.2769916,30.497156,-0.73715216,-167.2378,-204.58197,0.11152761,610000
|
| 84 |
+
0.31229478,0.6406558,0.0,-168.38916,-193.1059,2.929795,-3.8814273,42.638084,-4.795566,-168.24586,-193.08887,0.20169741,615000
|
| 85 |
+
0.31122285,1.1240519,-63.179115,-167.97742,-192.9965,13.046176,-16.924713,71.24699,-61.19943,-167.8249,-192.94096,0.27457398,620000
|
| 86 |
+
0.28103897,1.2511885,-33.28489,-170.72006,-197.32668,7.61517,-5.689301,88.49733,-31.66739,-170.51366,-197.43138,0.32145423,625000
|
| 87 |
+
0.30640197,1.4723725,-24.261312,-169.55853,-203.96405,27.43543,-13.8335085,192.89427,-23.234894,-169.3597,-204.43097,0.3516716,630000
|
| 88 |
+
0.32929707,0.94865173,-42.764,-166.54575,-196.54904,3.2174742,-6.584887,53.14821,-41.686,-166.27032,-196.5294,0.44601178,635000
|
| 89 |
+
0.32530272,1.1241245,0.0,-168.6678,-204.76862,3.5176039,-3.1502583,38.476986,-0.5306785,-168.54587,-204.40709,0.110924006,640000
|
| 90 |
+
0.29812062,0.94458735,-15.676316,-166.35861,-197.01399,1.5570918,-4.1428113,40.311073,-18.145372,-166.25858,-197.59152,0.16234007,645000
|
| 91 |
+
0.3238843,1.1866889,0.0,-164.16629,-192.86014,8.556775,-3.6695302,51.584408,-1.3930733,-163.93639,-192.82365,0.1805183,650000
|
| 92 |
+
0.35843647,1.580457,0.0,-165.77618,-193.88995,30.560314,-40.582394,227.16661,-0.91016483,-165.69044,-193.8531,0.4290958,655000
|
| 93 |
+
0.3330047,0.9401051,-28.950167,-165.41246,-193.07246,10.120232,-8.942247,97.16916,-28.335173,-165.29257,-193.0362,0.28795868,660000
|
| 94 |
+
0.31550395,0.94973105,-43.76305,-166.23364,-193.497,2.1192453,-3.6861331,34.61426,-42.548832,-166.13368,-193.46303,0.21160078,665000
|
| 95 |
+
0.29294917,1.0058484,-17.105078,-167.08054,-199.64384,20.412062,-11.867359,153.87466,-17.32495,-166.98352,-199.65472,0.34358668,670000
|
| 96 |
+
0.32741487,1.5839185,-57.567215,-166.07144,-199.8275,16.335695,-23.112768,119.19072,-57.206467,-165.96265,-199.82352,0.39384335,675000
|
| 97 |
+
0.32899672,1.0323937,-1.6722463,-166.56206,-193.19281,2.8421085,-2.5704403,46.448418,-0.5282449,-166.34024,-193.16087,0.17767788,680000
|
| 98 |
+
0.302135,0.52715695,-38.98869,-170.28062,-194.18504,1.4831221,-2.7831054,24.04651,-36.952362,-170.16586,-194.1523,0.12589532,685000
|
| 99 |
+
0.3291425,1.1621746,-32.81954,-167.59277,-194.19301,11.590228,-8.08379,108.028015,-33.272026,-167.30682,-194.16447,0.329782,690000
|
| 100 |
+
0.3392719,0.85148984,-6.586831,-169.70679,-198.56432,11.076331,-15.265045,86.175674,-4.6702414,-169.69536,-198.50227,0.252811,695000
|
| 101 |
+
0.34683892,0.9906418,-31.186403,-169.56796,-195.82014,3.071503,-3.4121077,47.16716,-29.951797,-169.38358,-195.70915,0.16536215,700000
|
O2O-w-diff-ckpts/ifql/20260316_182227/online_agent_sv.csv
ADDED
|
@@ -0,0 +1,101 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,value/v_max,value/v_mean,value/v_min,value/value_loss,step
|
| 2 |
+
0.38895607,1.1459874,-8.023321,-154.16956,-285.7999,6.9051113,-5.7756853,86.15816,-6.027101,-153.93439,-286.19492,0.3381335,205000
|
| 3 |
+
0.36215258,1.4650327,-5.1131225,-151.47333,-191.80055,27.35391,-18.26819,182.8132,-1.8781186,-151.08327,-191.75737,0.54415095,210000
|
| 4 |
+
0.33249968,1.4592159,-22.344532,-156.4974,-274.36185,12.778899,-14.72248,115.60741,-20.704744,-156.32758,-274.74,0.23940316,215000
|
| 5 |
+
0.29745036,0.7721874,-16.394876,-156.21716,-231.54044,2.5777168,-4.015804,50.538147,-16.597677,-156.0427,-231.73213,0.30951485,220000
|
| 6 |
+
0.34066513,9.347129,0.0,-152.4719,-198.32065,34.30968,-41.245148,318.87253,-1.6165652,-152.42628,-198.3146,2.0894406,225000
|
| 7 |
+
0.3352921,1.0191942,0.0,-154.00574,-259.2318,3.6025524,-3.9891133,56.691288,-0.41851416,-153.818,-259.5941,0.22199002,230000
|
| 8 |
+
0.3894788,3.1622465,0.0,-153.44302,-216.03697,11.966342,-7.410068,139.7605,-2.1268525,-153.02217,-216.22205,0.7228104,235000
|
| 9 |
+
0.4020131,1.8590252,-0.97867864,-155.03091,-247.9232,9.626582,-7.603983,131.82523,-0.67672324,-154.63333,-248.20241,0.30800617,240000
|
| 10 |
+
0.34633887,3.6556194,-12.318881,-157.16595,-201.31711,38.705143,-26.337435,440.37723,-10.015143,-156.8692,-201.29709,3.6712856,245000
|
| 11 |
+
0.34088132,1.9215899,0.0,-155.91951,-238.0665,11.313725,-10.192516,125.95436,-0.6221231,-155.68518,-238.25192,0.41761965,250000
|
| 12 |
+
0.29637113,1.3830566,0.0,-154.72021,-209.41435,10.801954,-8.9390135,104.36485,-1.3456665,-154.51451,-209.46257,0.4007556,255000
|
| 13 |
+
0.33660156,2.195641,-31.182655,-157.98352,-228.10663,5.2380724,-3.9788046,84.18315,-30.638634,-157.82372,-228.27707,0.2778053,260000
|
| 14 |
+
0.34530523,1.567449,-27.80474,-159.6785,-206.74095,11.3519535,-15.081514,119.6877,-28.333115,-159.4159,-206.77808,0.39377737,265000
|
| 15 |
+
0.32150707,1.4123309,-12.283138,-159.51833,-199.82657,4.4248314,-6.09235,76.31562,-11.678349,-159.41756,-199.82484,0.24027306,270000
|
| 16 |
+
0.34712544,1.756699,0.0,-161.76465,-216.36948,56.528004,-63.03217,337.55145,-1.7867435,-161.60954,-216.52136,0.3661632,275000
|
| 17 |
+
0.32878333,1.0143584,-11.0198765,-157.32642,-206.30817,2.4421978,-2.3000662,50.786232,-11.479675,-157.20152,-206.3456,0.20833436,280000
|
| 18 |
+
0.30892116,3.4381764,-15.311848,-160.48894,-208.1654,4.5370684,-6.5582676,87.501755,-12.760204,-160.20673,-208.31268,0.41478372,285000
|
| 19 |
+
0.31111306,2.1020439,-14.430047,-157.25104,-205.50548,3.338995,-2.4156923,64.01194,-13.820369,-157.00842,-205.56886,0.35928196,290000
|
| 20 |
+
0.31951267,1.3935426,0.0,-155.28784,-207.25316,52.993294,-86.175125,480.73132,0.2337363,-155.1397,-207.29337,1.0627406,295000
|
| 21 |
+
0.36682346,1.3334281,-0.8696497,-158.38965,-204.91348,7.2202644,-8.783162,103.86866,-0.11175713,-158.03897,-204.93405,1.9945834,300000
|
| 22 |
+
0.28132486,1.4075319,-32.716873,-160.57619,-208.70454,7.032765,-9.227086,95.109116,-5.1515675,-160.32712,-208.7497,0.94384605,305000
|
| 23 |
+
0.28736496,2.1811128,-16.85251,-157.09885,-214.18866,28.59894,-16.320822,174.67766,-16.843748,-156.73636,-214.25465,0.8440038,310000
|
| 24 |
+
0.3269183,0.89288515,-5.521922,-164.34515,-209.6293,4.3263936,-1.9947473,42.941593,-8.973211,-164.25587,-209.67003,0.3278848,315000
|
| 25 |
+
0.3049274,0.8984165,-19.894953,-162.2039,-209.3276,3.4906392,-6.584749,57.89332,-21.19858,-162.04651,-209.34676,0.20530927,320000
|
| 26 |
+
0.3139879,1.1498607,-31.157488,-162.465,-207.81296,4.914736,-3.4530313,55.34141,-29.43744,-162.0824,-207.87419,0.4626484,325000
|
| 27 |
+
0.33991152,1.8374968,-13.520956,-161.37997,-223.85962,8.165795,-4.673163,82.14899,-11.942598,-161.33292,-223.94907,0.2554024,330000
|
| 28 |
+
0.32328776,0.5299954,-54.725677,-164.10078,-221.50966,2.432256,-1.8227676,38.498016,-55.188675,-164.02133,-221.61613,0.17324558,335000
|
| 29 |
+
0.27960515,3.149083,-44.430805,-164.26456,-195.25613,25.204416,-27.131033,328.94815,-45.102264,-164.01932,-194.96193,1.1670754,340000
|
| 30 |
+
0.34235728,2.9082284,-17.445591,-158.80972,-194.84793,4.443536,-4.220748,92.90235,-17.632383,-158.47888,-194.81995,0.2855368,345000
|
| 31 |
+
0.3542427,1.1398394,-22.204966,-164.1947,-210.45117,4.657018,-3.9662857,63.709785,-21.143444,-163.89432,-210.51944,0.24233939,350000
|
| 32 |
+
0.33068347,1.602668,-41.16954,-163.26572,-210.52132,6.3647256,-5.9017887,87.13621,-43.089485,-163.14706,-210.57414,0.15984413,355000
|
| 33 |
+
0.34408593,1.1893405,0.0,-161.13791,-259.33234,23.950937,-16.94721,152.44756,-2.039895,-160.79202,-259.4825,0.565673,360000
|
| 34 |
+
0.2971474,0.85874176,-31.694319,-163.82977,-262.84592,4.2994127,-4.278463,52.889168,-30.505825,-163.62332,-263.02362,0.21694891,365000
|
| 35 |
+
0.33193517,1.4576254,0.0,-162.58199,-267.6384,5.606421,-7.889426,85.06308,-1.7238935,-162.23354,-268.00766,0.32752073,370000
|
| 36 |
+
0.31724787,0.48442093,-17.645044,-162.95515,-206.4429,1.8124224,-4.8335605,36.711445,-17.796114,-162.80045,-206.46526,0.15575269,375000
|
| 37 |
+
0.35783023,0.85393155,-1.3888738,-157.42584,-196.27078,4.468623,-3.8017097,53.17748,-0.5375773,-157.28378,-196.33447,0.30301356,380000
|
| 38 |
+
0.3250208,1.1961311,-2.7587757,-168.04585,-296.81308,7.4914465,-7.9910717,96.49004,-1.5394409,-167.7751,-297.30142,0.25317836,385000
|
| 39 |
+
0.31779426,1.326642,-38.76303,-161.832,-254.54294,2.7115948,-2.8889415,50.192963,-37.74073,-161.80032,-254.12128,0.2169945,390000
|
| 40 |
+
0.3368278,1.9531378,0.0,-166.17987,-296.62292,11.2186985,-8.563757,149.46371,-0.68581486,-165.98233,-297.12573,0.3964759,395000
|
| 41 |
+
0.27688313,1.6085911,0.0,-163.33781,-316.69302,12.677133,-17.299305,134.92946,-1.957585,-163.17957,-317.29678,0.7034955,400000
|
| 42 |
+
0.3392071,2.0947864,-20.975494,-160.3159,-320.65546,13.002868,-9.862699,139.57529,-21.222694,-159.96794,-321.27563,0.73103,405000
|
| 43 |
+
0.31921342,1.5830249,-56.89881,-166.06804,-324.99362,12.741311,-18.889694,106.455956,-57.091404,-165.88998,-325.6126,0.7822569,410000
|
| 44 |
+
0.34916443,0.6443264,0.0,-166.82887,-328.03473,3.46265,-8.610422,56.986538,-1.3001894,-166.66017,-328.66873,0.23444399,415000
|
| 45 |
+
0.2742551,1.4154208,0.0,-164.5264,-195.05745,2.9955578,-4.584632,64.84445,-0.79503703,-164.30109,-194.83537,0.22610542,420000
|
| 46 |
+
0.30260652,11.519561,0.0,-162.93819,-204.51207,45.04081,-63.977177,677.8869,-3.0755403,-162.92915,-204.53726,1.0000472,425000
|
| 47 |
+
0.31381828,0.8722275,-27.249044,-165.61469,-332.82892,3.977785,-5.7812734,57.225952,-28.185555,-165.48116,-333.4888,0.21208745,430000
|
| 48 |
+
0.29664358,1.2883025,0.0,-166.509,-196.9382,22.328526,-21.439503,195.45477,-1.251343,-166.29152,-196.89722,0.5212945,435000
|
| 49 |
+
0.36794603,0.9283401,-49.883568,-167.9715,-324.6735,1.8218297,-3.2032888,32.12303,-46.605434,-167.75494,-325.30173,0.103006065,440000
|
| 50 |
+
0.31414664,0.62466013,-21.697168,-167.63898,-316.74188,2.658507,-3.6459646,38.396954,-21.240658,-167.47787,-317.32806,0.24739404,445000
|
| 51 |
+
0.31709355,2.6343892,-1.344412,-167.39488,-304.27902,8.16689,-23.61968,180.52046,-1.5650662,-167.18518,-304.80258,0.38253522,450000
|
| 52 |
+
0.29631633,1.6307936,-8.008329,-163.48132,-293.33066,4.900776,-6.06609,103.38715,-8.207723,-163.17993,-293.7938,0.36651504,455000
|
| 53 |
+
0.33467656,0.838174,0.0,-164.72476,-207.83809,29.256275,-17.112556,118.3013,-4.1014075,-164.53868,-207.8844,0.43167114,460000
|
| 54 |
+
0.3354962,2.2102783,-45.92118,-166.49905,-260.17664,8.429345,-9.106382,148.28467,-47.04769,-166.19815,-260.48288,0.45539448,465000
|
| 55 |
+
0.33365455,3.9369721,-33.60886,-166.81857,-201.07404,35.097122,-21.186289,163.0788,-24.056795,-166.68616,-201.07922,0.92746955,470000
|
| 56 |
+
0.3075456,2.6993976,-27.12052,-165.1843,-192.74408,55.228996,-29.351711,245.40945,-27.675026,-165.10712,-192.67128,0.20747319,475000
|
| 57 |
+
0.33489138,1.0662405,0.0,-165.79712,-225.34248,20.653532,-11.030676,100.93453,-0.39020994,-165.67117,-225.48457,0.17177568,480000
|
| 58 |
+
0.3035646,0.90801966,0.0,-165.00026,-217.73576,5.33033,-11.507295,68.63527,-2.4053178,-164.99167,-217.8222,0.31648037,485000
|
| 59 |
+
0.31576514,1.3779168,-65.260315,-169.01096,-209.59125,7.732828,-3.7773502,61.745796,-52.588364,-168.73344,-209.62344,0.113849655,490000
|
| 60 |
+
0.32793683,1.248122,0.0,-162.80319,-196.2775,17.551708,-10.005285,120.970535,-0.31515867,-162.64919,-195.69092,0.29435045,495000
|
| 61 |
+
0.33151644,1.0471356,-40.79141,-165.66174,-193.8259,12.866778,-15.063683,115.074936,-39.939087,-165.35336,-193.80556,0.7738043,500000
|
| 62 |
+
0.37147984,0.72172266,-42.54347,-168.72055,-192.70735,4.3883686,-9.2205715,63.867558,-43.300007,-168.43813,-192.72173,0.41922802,505000
|
| 63 |
+
0.37915933,1.5850228,-31.870083,-167.89365,-199.2474,16.797968,-7.6672926,102.197174,-32.19967,-167.73117,-199.2447,0.6831566,510000
|
| 64 |
+
0.32890296,1.5233608,0.0,-164.69806,-197.59203,26.174818,-25.746653,182.83327,-0.35970336,-164.54353,-197.5815,1.1941671,515000
|
| 65 |
+
0.31823406,2.3713872,0.0,-167.68686,-195.18323,49.21918,-40.258934,312.1187,-0.7960643,-167.52628,-195.21164,0.8261391,520000
|
| 66 |
+
0.29580554,0.7107603,0.0,-162.37268,-192.656,4.649644,-4.2159653,50.660294,-0.30978104,-162.2027,-192.64612,0.41186374,525000
|
| 67 |
+
0.34832484,0.64572495,-23.32416,-168.57043,-199.80988,3.859827,-3.4247546,46.277412,-23.337622,-168.39316,-199.77548,0.13144381,530000
|
| 68 |
+
0.3577447,0.697692,-40.05087,-167.02026,-196.32822,11.803898,-24.34915,125.192665,-40.252697,-166.81628,-196.29364,0.5943298,535000
|
| 69 |
+
0.29141188,1.3090307,-40.67306,-168.16304,-198.7884,18.334515,-21.223045,204.83475,-36.520737,-167.93692,-198.78621,1.0797882,540000
|
| 70 |
+
0.29723245,1.1128327,-28.492414,-166.50067,-196.06703,17.8489,-9.154214,83.13708,-28.265974,-166.4075,-196.044,0.11226815,545000
|
| 71 |
+
0.30156514,2.681776,0.0,-168.30428,-193.12506,15.571805,-13.323311,131.09087,0.17259726,-168.18144,-193.01129,0.45844054,550000
|
| 72 |
+
0.30897838,1.178192,0.0,-165.57057,-198.24547,28.271055,-19.062948,185.70546,-14.060973,-165.3876,-198.23524,0.9979206,555000
|
| 73 |
+
0.3162534,0.69694257,-21.844488,-171.37712,-193.4012,14.974806,-11.245555,75.36484,-22.18447,-171.25621,-193.39804,0.19295853,560000
|
| 74 |
+
0.33968997,0.7113215,0.0,-165.77255,-197.89648,7.004684,-2.2743316,46.029205,-0.5630647,-165.71501,-197.88681,0.22963773,565000
|
| 75 |
+
0.33673137,1.680258,0.0,-165.90195,-193.71498,7.4061418,-6.697023,106.39426,0.1733625,-165.7558,-193.7961,0.3502025,570000
|
| 76 |
+
0.311005,1.2769196,0.0,-167.97845,-193.19672,7.148731,-36.50681,133.99702,-2.8555057,-167.80649,-193.23582,0.46303502,575000
|
| 77 |
+
0.33223206,1.1673977,-20.061491,-165.82664,-201.05345,10.995876,-24.528624,118.478485,-3.2541842,-165.58612,-200.83994,0.8786078,580000
|
| 78 |
+
0.33257073,1.1369628,-13.738224,-164.28595,-193.88477,13.067301,-20.391504,113.58153,-12.177857,-164.15591,-193.83705,0.36243463,585000
|
| 79 |
+
0.32379478,2.3715608,0.0,-166.56343,-193.4658,14.997203,-12.515535,151.2957,-2.008237,-166.41112,-193.50688,0.30846536,590000
|
| 80 |
+
0.3053699,0.915586,-41.145164,-168.84724,-195.71164,9.670061,-2.708492,49.85286,-42.67387,-168.72302,-195.686,0.21927473,595000
|
| 81 |
+
0.31559962,0.8232129,0.0,-165.41684,-199.05682,10.704342,-11.7628355,95.36957,-2.7533376,-165.31293,-199.0625,0.4139821,600000
|
| 82 |
+
0.3137985,0.7270572,-2.8363066,-164.97598,-193.28616,2.5251644,-2.9365318,44.863556,-1.3407148,-164.76529,-193.22342,0.18168834,605000
|
| 83 |
+
0.3237008,0.96550035,-1.9611297,-167.44775,-204.61269,1.4508791,-1.2769916,30.497156,-0.73715216,-167.2378,-204.58197,0.11152761,610000
|
| 84 |
+
0.31229478,0.6406558,0.0,-168.38916,-193.1059,2.929795,-3.8814273,42.638084,-4.795566,-168.24586,-193.08887,0.20169741,615000
|
| 85 |
+
0.31122285,1.1240519,-63.179115,-167.97742,-192.9965,13.046176,-16.924713,71.24699,-61.19943,-167.8249,-192.94096,0.27457398,620000
|
| 86 |
+
0.28103897,1.2511885,-33.28489,-170.72006,-197.32668,7.61517,-5.689301,88.49733,-31.66739,-170.51366,-197.43138,0.32145423,625000
|
| 87 |
+
0.30640197,1.4723725,-24.261312,-169.55853,-203.96405,27.43543,-13.8335085,192.89427,-23.234894,-169.3597,-204.43097,0.3516716,630000
|
| 88 |
+
0.32929707,0.94865173,-42.764,-166.54575,-196.54904,3.2174742,-6.584887,53.14821,-41.686,-166.27032,-196.5294,0.44601178,635000
|
| 89 |
+
0.32530272,1.1241245,0.0,-168.6678,-204.76862,3.5176039,-3.1502583,38.476986,-0.5306785,-168.54587,-204.40709,0.110924006,640000
|
| 90 |
+
0.29812062,0.94458735,-15.676316,-166.35861,-197.01399,1.5570918,-4.1428113,40.311073,-18.145372,-166.25858,-197.59152,0.16234007,645000
|
| 91 |
+
0.3238843,1.1866889,0.0,-164.16629,-192.86014,8.556775,-3.6695302,51.584408,-1.3930733,-163.93639,-192.82365,0.1805183,650000
|
| 92 |
+
0.35843647,1.580457,0.0,-165.77618,-193.88995,30.560314,-40.582394,227.16661,-0.91016483,-165.69044,-193.8531,0.4290958,655000
|
| 93 |
+
0.3330047,0.9401051,-28.950167,-165.41246,-193.07246,10.120232,-8.942247,97.16916,-28.335173,-165.29257,-193.0362,0.28795868,660000
|
| 94 |
+
0.31550395,0.94973105,-43.76305,-166.23364,-193.497,2.1192453,-3.6861331,34.61426,-42.548832,-166.13368,-193.46303,0.21160078,665000
|
| 95 |
+
0.29294917,1.0058484,-17.105078,-167.08054,-199.64384,20.412062,-11.867359,153.87466,-17.32495,-166.98352,-199.65472,0.34358668,670000
|
| 96 |
+
0.32741487,1.5839185,-57.567215,-166.07144,-199.8275,16.335695,-23.112768,119.19072,-57.206467,-165.96265,-199.82352,0.39384335,675000
|
| 97 |
+
0.32899672,1.0323937,-1.6722463,-166.56206,-193.19281,2.8421085,-2.5704403,46.448418,-0.5282449,-166.34024,-193.16087,0.17767788,680000
|
| 98 |
+
0.302135,0.52715695,-38.98869,-170.28062,-194.18504,1.4831221,-2.7831054,24.04651,-36.952362,-170.16586,-194.1523,0.12589532,685000
|
| 99 |
+
0.3291425,1.1621746,-32.81954,-167.59277,-194.19301,11.590228,-8.08379,108.028015,-33.272026,-167.30682,-194.16447,0.329782,690000
|
| 100 |
+
0.3392719,0.85148984,-6.586831,-169.70679,-198.56432,11.076331,-15.265045,86.175674,-4.6702414,-169.69536,-198.50227,0.252811,695000
|
| 101 |
+
0.34683892,0.9906418,-31.186403,-169.56796,-195.82014,3.071503,-3.4121077,47.16716,-29.951797,-169.38358,-195.70915,0.16536215,700000
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_250000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3db253472732afbef9166fb741c1ed439561bdfc3a9f2d01ed2a190fd4f9bbf8
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_300000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eec895ff6ecf6efc151c2021ba508c9e1bd61fb6c17e40ca59424f99cd39c466
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_350000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e5cd97df598f7259e941fb63d0b0bfa59fecb1894b7e662b9f0885ba67805cb
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_400000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76cd05fc1deddd8c7a451a35a30ac7025330cdd94e9b8c77beab37dff632cdc5
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_450000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0a1551501658d53a20adbb8e29e269a06e8aa52471532c93c64eee6193bc26b
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_500000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d477588aec1f1701a38d72f24cb03c6f641f275149bd0ff318f3e29a191fbe4
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_550000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fe2aea587b77da6440e9bd393ea4260ceefd17a567eb7481107f8292273e4206
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_600000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d81da383864e11cabe656b1f9caa8a103d95cafb70a2a92f6e038a215286a520
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_650000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38b4fb8e48a34725c54bf6a5ac97d2efde6ce3b9631bf1d90af3e8ae2c9a0487
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/params_700000.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bad6e891f5a45b34956180be08a904c740979b2cea3ffaee862de42073510bbe
|
| 3 |
+
size 214338967
|
O2O-w-diff-ckpts/ifql/20260316_182227/progress.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
online,500000
|
O2O-w-diff-ckpts/ifql/20260316_182227/token.tk
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/y1zwzdjh
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_250000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_300000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_350000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_400000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_450000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_500000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_550000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_600000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_650000.png
ADDED
|
Git LFS Details
|
O2O-w-diff-ckpts/ifql/20260316_182227/visited_states_700000.png
ADDED
|
Git LFS Details
|