Tiredsheep commited on
Commit
7c61833
·
verified ·
1 Parent(s): d951c35

Upload folder using huggingface_hub

Browse files
Files changed (29) hide show
  1. .gitattributes +1 -0
  2. O2O-w-diff-ckpts/fawac/20260312_185155/env.csv +0 -0
  3. O2O-w-diff-ckpts/fawac/20260312_185155/env_sv.csv +0 -0
  4. O2O-w-diff-ckpts/fawac/20260312_185155/eval.csv +11 -0
  5. O2O-w-diff-ckpts/fawac/20260312_185155/eval_sv.csv +11 -0
  6. O2O-w-diff-ckpts/fawac/20260312_185155/online_agent.csv +101 -0
  7. O2O-w-diff-ckpts/fawac/20260312_185155/online_agent_sv.csv +101 -0
  8. O2O-w-diff-ckpts/fawac/20260312_185155/params_1000000.pkl +3 -0
  9. O2O-w-diff-ckpts/fawac/20260312_185155/params_550000.pkl +3 -0
  10. O2O-w-diff-ckpts/fawac/20260312_185155/params_600000.pkl +3 -0
  11. O2O-w-diff-ckpts/fawac/20260312_185155/params_650000.pkl +3 -0
  12. O2O-w-diff-ckpts/fawac/20260312_185155/params_700000.pkl +3 -0
  13. O2O-w-diff-ckpts/fawac/20260312_185155/params_750000.pkl +3 -0
  14. O2O-w-diff-ckpts/fawac/20260312_185155/params_800000.pkl +3 -0
  15. O2O-w-diff-ckpts/fawac/20260312_185155/params_850000.pkl +3 -0
  16. O2O-w-diff-ckpts/fawac/20260312_185155/params_900000.pkl +3 -0
  17. O2O-w-diff-ckpts/fawac/20260312_185155/params_950000.pkl +3 -0
  18. O2O-w-diff-ckpts/fawac/20260312_185155/progress.tk +1 -0
  19. O2O-w-diff-ckpts/fawac/20260312_185155/token.tk +1 -0
  20. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_1000000.png +0 -0
  21. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_550000.png +3 -0
  22. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_600000.png +0 -0
  23. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_650000.png +0 -0
  24. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_700000.png +0 -0
  25. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_750000.png +0 -0
  26. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_800000.png +0 -0
  27. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_850000.png +0 -0
  28. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_900000.png +0 -0
  29. O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_950000.png +0 -0
.gitattributes CHANGED
@@ -673,3 +673,4 @@ O2O-w-diff-ckpts/ifql/20260318_061136/visited_states_950000.png filter=lfs diff=
673
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1050000.png filter=lfs diff=lfs merge=lfs -text
674
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1450000.png filter=lfs diff=lfs merge=lfs -text
675
  O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_450000.png filter=lfs diff=lfs merge=lfs -text
 
 
673
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1050000.png filter=lfs diff=lfs merge=lfs -text
674
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1450000.png filter=lfs diff=lfs merge=lfs -text
675
  O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_450000.png filter=lfs diff=lfs merge=lfs -text
676
+ O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
O2O-w-diff-ckpts/fawac/20260312_185155/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_185155/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_185155/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.36216982450930785,0.12732165591699393,-0.047623372487005114,0.12607408164343736,-0.015010624143063525,0.0,25500.0,-1.0,-1000.0,1000.0,1.4391490077972413,550000
3
+ 0.0,0.0,0.6108238356622213,0.1453323123073722,-0.012463043140382225,0.142361391685736,0.013742637459695319,0.0,77500.0,-1.0,-1000.0,1000.0,1.450574550628662,600000
4
+ 0.0,0.0,0.31964080983416887,0.13969937293982185,-0.01248199148821474,0.13404586806154048,-0.06394957257876478,0.0,129500.0,-1.0,-1000.0,1000.0,1.442838387489319,650000
5
+ 0.0,0.0,0.09904387851607366,0.09708878767180994,0.04926490048852717,0.10095838704445553,0.03746707713110681,0.0,181500.0,-1.0,-1000.0,1000.0,1.4497653341293335,700000
6
+ 0.0,0.0,0.27267659136035866,0.13656151254853927,-0.012171958844611514,0.1349570667372138,0.0014705320565028554,0.0,233500.0,-1.0,-1000.0,1000.0,1.4371297407150267,750000
7
+ 0.0,0.0,0.19542935953027574,0.1186006840388546,0.007932439533471704,0.12192071223198711,0.06720339219065288,0.0,285500.0,-1.0,-1000.0,1000.0,1.428543210029602,800000
8
+ 0.0,0.0,0.28827444272609193,0.13277291461927976,0.05703652260908807,0.1331365361274492,-0.04384787066557095,0.0,337500.0,-1.0,-1000.0,1000.0,1.435564522743225,850000
9
+ 0.0,0.0,0.3281218188695677,0.1336135811723288,0.010138575163433349,0.13524391477479286,0.0028124011706425174,0.0,389500.0,-1.0,-1000.0,1000.0,1.4402158451080322,900000
10
+ 0.0,0.0,0.30038773061924773,0.11904720810826476,-0.01971492621355325,0.11744687775604298,-0.05317037026819348,0.0,441500.0,-1.0,-1000.0,1000.0,1.4512209463119508,950000
11
+ 0.0,0.0,0.3140470446030536,0.13700513715254886,-0.0006736590508636223,0.13568887135392482,0.01240116035784453,0.0,493500.0,-1.0,-1000.0,1000.0,1.4360474824905396,1000000
O2O-w-diff-ckpts/fawac/20260312_185155/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.36216982450930785,0.12732165591699393,-0.047623372487005114,0.12607408164343736,-0.015010624143063525,0.0,25500.0,-1.0,-1000.0,1000.0,1.4391490077972413,550000
3
+ 0.0,0.0,0.6108238356622213,0.1453323123073722,-0.012463043140382225,0.142361391685736,0.013742637459695319,0.0,77500.0,-1.0,-1000.0,1000.0,1.450574550628662,600000
4
+ 0.0,0.0,0.31964080983416887,0.13969937293982185,-0.01248199148821474,0.13404586806154048,-0.06394957257876478,0.0,129500.0,-1.0,-1000.0,1000.0,1.442838387489319,650000
5
+ 0.0,0.0,0.09904387851607366,0.09708878767180994,0.04926490048852717,0.10095838704445553,0.03746707713110681,0.0,181500.0,-1.0,-1000.0,1000.0,1.4497653341293335,700000
6
+ 0.0,0.0,0.27267659136035866,0.13656151254853927,-0.012171958844611514,0.1349570667372138,0.0014705320565028554,0.0,233500.0,-1.0,-1000.0,1000.0,1.4371297407150267,750000
7
+ 0.0,0.0,0.19542935953027574,0.1186006840388546,0.007932439533471704,0.12192071223198711,0.06720339219065288,0.0,285500.0,-1.0,-1000.0,1000.0,1.428543210029602,800000
8
+ 0.0,0.0,0.28827444272609193,0.13277291461927976,0.05703652260908807,0.1331365361274492,-0.04384787066557095,0.0,337500.0,-1.0,-1000.0,1000.0,1.435564522743225,850000
9
+ 0.0,0.0,0.3281218188695677,0.1336135811723288,0.010138575163433349,0.13524391477479286,0.0028124011706425174,0.0,389500.0,-1.0,-1000.0,1000.0,1.4402158451080322,900000
10
+ 0.0,0.0,0.30038773061924773,0.11904720810826476,-0.01971492621355325,0.11744687775604298,-0.05317037026819348,0.0,441500.0,-1.0,-1000.0,1000.0,1.4512209463119508,950000
11
+ 0.0,0.0,0.3140470446030536,0.13700513715254886,-0.0006736590508636223,0.13568887135392482,0.01240116035784453,0.0,493500.0,-1.0,-1000.0,1000.0,1.4360474824905396,1000000
O2O-w-diff-ckpts/fawac/20260312_185155/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 2.4244354,34.066395,-31.689217,-289.0415,-2093.174,20.747715,148.96803,-152.13306,2248.8672,505000
3
+ 3.154436,20.562046,3.7311661,-274.53854,-1925.8263,19.952526,138.51772,-65.64188,1711.7905,510000
4
+ 2.7377396,32.255142,-128.0372,-304.7328,-1799.3597,18.444693,234.19861,-246.42365,2824.6611,515000
5
+ 1.9113106,16.421225,-63.2349,-275.99356,-1639.946,11.222372,31.152702,-55.128437,968.43005,520000
6
+ 2.878191,20.263184,12.137194,-279.31616,-1603.329,46.577377,124.14535,-174.6888,2058.6182,525000
7
+ 2.0687253,27.224707,13.612643,-277.2856,-1396.9054,14.931119,184.29105,-152.39413,1560.9376,530000
8
+ 0.2773057,20.45525,15.805802,-260.15054,-660.4697,13.428065,41.286648,-42.279877,900.2613,535000
9
+ 1.4644815,20.613699,1.7737442,-260.7398,-1151.2748,9.25947,121.099014,-69.649635,1392.6447,540000
10
+ 1.4918554,10.253269,-102.75024,-266.10123,-1238.9578,10.900582,55.91637,-105.317604,827.983,545000
11
+ 2.5921984,104.18728,8.1618,-272.56946,-1053.2018,25.188164,331.2194,-347.89667,5204.404,550000
12
+ 0.8836267,35.5028,5.855666,-256.85892,-869.48755,30.06099,578.70355,-282.50986,4347.4204,555000
13
+ 0.82641464,6.8583026,-152.65044,-258.58292,-797.2144,10.176107,20.421158,-22.492805,460.5686,560000
14
+ 1.2126181,11.061674,15.371127,-256.89597,-653.0203,5.983558,70.101135,-42.848553,691.3043,565000
15
+ 2.8132753,22.302526,0.79405737,-254.90709,-652.09,14.040903,134.9049,-197.31987,1937.1003,570000
16
+ 1.0108776,33.369835,4.528782,-247.19551,-622.60657,9.542892,185.57864,-532.22565,3131.336,575000
17
+ 1.0342985,12.08472,-108.91883,-258.1373,-587.05096,35.194923,1155.1924,-641.74084,5551.2544,580000
18
+ 0.55120665,19.232313,-12.7023,-247.70976,-732.1279,7.689164,69.839165,-79.44663,1340.148,585000
19
+ 0.8878676,5.710751,79.51471,-246.3164,-468.8076,8.381824,60.375385,-72.84898,769.55133,590000
20
+ 1.150594,19.227757,94.85184,-242.93994,-406.36105,11.036214,313.9354,-887.843,6160.297,595000
21
+ 1.4154942,17.58228,38.009426,-243.49669,-382.99484,13.749748,147.43398,-137.48938,2120.2156,600000
22
+ 0.50155646,9.56272,-163.0257,-244.27432,-504.2677,22.01618,466.54602,-422.8931,4060.2231,605000
23
+ 1.0360343,9.209447,140.77,-239.7762,-381.5104,3.7445984,108.55809,-120.61259,1200.9456,610000
24
+ 1.3505833,11.358887,-62.52652,-246.85806,-1818.0457,11.024816,108.240974,-109.47001,1595.985,615000
25
+ 0.7747059,16.771873,-144.90244,-239.07109,-425.33633,3.447776,44.529873,-54.93949,759.79114,620000
26
+ 0.56680095,6.692421,180.84732,-237.78172,-467.94598,4.254449,13.455548,-25.124525,303.09277,625000
27
+ 0.8889389,2.765624,-134.58658,-235.77022,-460.50598,2.541764,7.846018,-8.321752,210.39026,630000
28
+ 0.45851547,2.3192124,184.72665,-233.24683,-340.61337,2.2097027,5.632436,-6.5189757,189.38112,635000
29
+ 1.3441608,15.276731,88.201126,-235.51538,-697.2078,2.5528805,230.0874,-290.5662,1912.5118,640000
30
+ 0.6254833,18.730938,180.7315,-229.7314,-442.18945,18.22501,252.32344,-283.9194,3013.9202,645000
31
+ 1.0761464,4.4240494,-12.031812,-233.44298,-412.33478,5.1185365,68.67597,-33.651306,485.19305,650000
32
+ 2.2045226,13.179873,171.54303,-235.02254,-567.95087,20.616232,206.08238,-274.73373,2289.3455,655000
33
+ 1.3604627,4.8948946,102.60794,-230.69518,-686.3281,5.5898376,80.530334,-30.171669,637.8364,660000
34
+ 1.0149509,3.056439,143.58861,-230.24425,-417.684,2.9206154,53.136364,-25.707249,451.18765,665000
35
+ 0.65839326,8.965962,6.7115493,-228.66035,-491.01553,5.2930913,79.03328,-75.73584,900.21655,670000
36
+ 0.6506411,44.325977,100.511185,-232.26555,-325.77072,6.3962116,191.88531,-103.46229,1076.4845,675000
37
+ 1.3791585,3.366574,119.78238,-229.89737,-468.21246,5.4854813,61.073116,-49.519493,598.28015,680000
38
+ 0.64692044,7.31274,97.47393,-229.9984,-442.22867,4.71875,51.621056,-31.727406,650.6891,685000
39
+ 1.1588438,10.266008,90.0483,-233.6798,-552.0056,6.0076814,124.68285,-116.59725,1363.3934,690000
40
+ 0.9360469,38.327023,72.81278,-226.78087,-356.36945,36.285667,723.3588,-1428.8917,8783.837,695000
41
+ 1.7954273,26.244139,27.811983,-230.99065,-656.1353,115.85872,7380.62,-3379.3677,32247.02,700000
42
+ 0.5052245,6.8472414,21.713127,-229.89294,-356.26956,4.8303003,28.139534,-23.56566,380.4233,705000
43
+ 0.8089874,1.6457018,-50.876263,-230.53267,-338.21838,1.9559716,6.9100027,-7.166821,156.54349,710000
44
+ 0.86306787,2.6814592,24.893322,-227.95293,-328.2368,2.6660957,44.834995,-23.802372,414.7096,715000
45
+ 0.836172,7.986829,0.7848544,-230.65031,-370.19888,4.526846,25.03372,-29.490154,535.3468,720000
46
+ 1.4389071,224.76323,18.844582,-230.89275,-733.4146,50.439472,379.50876,-269.54425,5855.299,725000
47
+ 1.6175463,7.913018,27.741642,-227.79459,-416.55963,7.750296,20.75352,-61.597385,556.7548,730000
48
+ 0.57947254,4.819057,8.4596405,-230.33305,-383.7503,27.145523,215.92786,-256.46115,2401.4346,735000
49
+ 0.68032885,3.1979606,32.975163,-233.49998,-454.50183,2.6909087,9.48593,-8.826355,263.66364,740000
50
+ 0.7836034,2.9480379,71.94968,-228.98946,-591.5606,3.0968144,16.565153,-21.566917,325.3697,745000
51
+ 0.64202803,77.61834,69.660065,-229.1847,-1493.0808,11.73619,176.82416,-96.69407,2410.633,750000
52
+ 1.1285186,13.221393,90.96754,-227.86865,-367.36835,8.670804,125.04965,-109.53611,1485.7352,755000
53
+ 1.3149235,2.7366085,2.3050678,-229.20909,-411.22226,2.0989695,13.573759,-31.25827,281.56226,760000
54
+ 0.45100084,21.797071,48.26931,-229.84517,-455.1903,18.163553,381.6307,-576.65625,3771.95,765000
55
+ 2.186359,3.972429,119.37052,-232.2884,-446.86407,11.569829,106.20259,-305.2968,1590.0333,770000
56
+ 0.9518004,2.3574028,138.15819,-230.09073,-504.21228,3.2234864,27.13816,-19.017075,381.97943,775000
57
+ 0.99165356,4.31193,126.806114,-229.03784,-385.07703,3.285827,18.957705,-20.380465,442.0017,780000
58
+ 0.68127686,7.883002,68.12752,-233.00053,-490.42123,4.647304,38.535095,-38.413322,633.28754,785000
59
+ 1.1116129,13.396228,200.852,-227.77324,-360.0627,7.4497695,43.88418,-44.492023,803.40875,790000
60
+ 1.3994932,19.614038,-5.0094695,-232.44014,-605.3646,25.45548,463.12646,-1104.4259,5897.712,795000
61
+ 0.8078401,6.1093087,262.78983,-235.44102,-1280.4304,4.4568887,20.69635,-16.250006,427.9293,800000
62
+ 0.72056514,5.328851,303.5859,-229.51013,-360.19095,3.497542,141.90974,-137.44156,1155.908,805000
63
+ 1.1902735,5.6185355,255.0818,-231.27184,-369.7986,5.2974763,31.63908,-23.430975,586.18066,810000
64
+ 1.4911637,7.3306727,418.8975,-229.52461,-413.12842,9.412299,106.22178,-80.17231,852.753,815000
65
+ 2.5965168,6.7842484,493.05118,-224.05382,-421.79483,10.6320095,82.94916,-67.510315,1324.2341,820000
66
+ 0.73411226,3.6079614,15.727756,-233.02696,-366.45676,6.297531,42.56216,-38.18004,607.20215,825000
67
+ 1.0660064,18.425219,688.70795,-229.85747,-441.42328,4.7147555,25.335623,-13.203459,607.52875,830000
68
+ 1.3862181,10.726526,764.7122,-229.12552,-776.9505,6.7104645,43.177994,-64.6414,1073.7869,835000
69
+ 0.87858784,4.6021814,865.05914,-225.30876,-577.84875,3.552171,22.460945,-23.127716,662.21655,840000
70
+ 0.6094191,6.4886546,286.08264,-231.3815,-370.82938,4.3450236,25.736755,-38.778313,599.41693,845000
71
+ 1.2559593,7.5640616,1076.6924,-227.5321,-443.77225,4.6102166,18.452019,-27.018509,861.88586,850000
72
+ 1.6086825,9.876964,7.4432893,-235.12901,-510.0606,11.913025,148.06369,-139.88493,1775.5105,855000
73
+ 1.4085124,35.071148,1498.3933,-206.94011,-450.6327,11.883016,137.7066,-560.2036,4543.922,860000
74
+ 1.9153533,25.53437,10.243878,-234.9578,-468.44235,15.212699,154.88177,-145.48207,1797.7317,865000
75
+ 0.72443825,8.052882,1684.8462,-230.73592,-479.11163,17.756815,2595.4412,-662.3124,11060.883,870000
76
+ 0.7823623,4.032703,977.91046,-229.66985,-460.3168,5.9263663,297.8329,-76.11848,1299.3182,875000
77
+ 1.0137551,5.4874697,919.6879,-232.54056,-425.18692,4.2002425,33.525562,-85.89885,772.3205,880000
78
+ 0.90664715,4.9174767,890.2819,-230.23643,-361.64844,4.0584826,43.10404,-12.929328,503.55676,885000
79
+ 1.1833644,12.052974,1763.9335,-214.18945,-370.2673,12.085031,102.040054,-268.39047,2428.8804,890000
80
+ 0.525958,4.572967,846.60736,-232.225,-337.95856,6.900969,12.669615,-54.16819,525.4686,895000
81
+ 0.48168787,7.326979,1849.3124,-225.86397,-454.66168,6.1314645,207.73549,-73.35199,1292.9838,900000
82
+ 0.92399395,10.662639,844.05273,-227.28392,-508.83737,5.8785963,80.105995,-74.01657,1012.3553,905000
83
+ 0.5723296,5.7675233,756.4527,-233.6031,-521.12775,5.3656344,26.67427,-22.662392,624.24896,910000
84
+ 0.8559362,6.2608194,731.80853,-234.87173,-512.5987,24.907103,267.6072,-293.01065,2386.046,915000
85
+ 0.5374327,5.189039,669.16724,-236.19507,-507.19498,4.6406746,18.707203,-15.9143095,368.93945,920000
86
+ 0.43339324,53.730427,632.8456,-234.20308,-1004.29834,57.429592,246.18661,-234.2071,3379.856,925000
87
+ 1.0217394,6.286325,96.079414,-235.79903,-685.1878,8.611224,228.5368,-211.61218,1732.1273,930000
88
+ 0.69466734,3.5787454,-12.149616,-233.95267,-661.63025,2.6260493,9.429834,-11.177242,220.12074,935000
89
+ 0.8094872,10.508997,9.311622,-234.87744,-465.66452,13.596173,105.181175,-159.46071,1178.5627,940000
90
+ 0.5014178,5.9925613,-29.080421,-236.06804,-548.91235,2.592869,8.743116,-14.9385195,310.00754,945000
91
+ 2.586247,11.856093,1559.2633,-221.16606,-441.44714,9.527763,107.62231,-448.33902,2251.5474,950000
92
+ 0.50648636,9.950772,1516.9225,-223.4692,-626.95984,99.89193,1340.5638,-756.67487,8461.43,955000
93
+ 0.62864506,4.6232486,38.080376,-233.24515,-488.67212,6.6844573,93.935356,-131.8441,963.8365,960000
94
+ 0.83935213,16.637936,519.626,-235.35489,-549.41504,20.2468,179.00655,-104.62547,1735.0574,965000
95
+ 0.84316075,5.468171,503.36105,-227.59949,-323.02704,3.7569993,100.40577,-243.04933,1161.21,970000
96
+ 0.5578735,10.578678,285.6624,-233.04308,-1106.2333,37.282875,205.96141,-279.20505,2089.3105,975000
97
+ 1.7573028,7.9197397,953.65,-226.31018,-433.12094,9.420655,45.680523,-78.82538,988.3764,980000
98
+ 0.77651536,5.4922895,185.01593,-233.9583,-626.95404,3.955719,87.76429,-27.795074,546.1645,985000
99
+ 0.934042,3.3675117,731.9833,-225.85208,-315.71994,3.446772,54.298237,-60.722942,748.7698,990000
100
+ 0.4659821,4.945886,629.1102,-228.90247,-479.24594,5.397013,42.473125,-39.95248,790.9956,995000
101
+ 0.48426354,18.828943,106.44166,-231.96231,-1055.2605,7.988038,24.616076,-21.495876,681.7528,1000000
O2O-w-diff-ckpts/fawac/20260312_185155/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 2.4244354,34.066395,-31.689217,-289.0415,-2093.174,20.747715,148.96803,-152.13306,2248.8672,505000
3
+ 3.154436,20.562046,3.7311661,-274.53854,-1925.8263,19.952526,138.51772,-65.64188,1711.7905,510000
4
+ 2.7377396,32.255142,-128.0372,-304.7328,-1799.3597,18.444693,234.19861,-246.42365,2824.6611,515000
5
+ 1.9113106,16.421225,-63.2349,-275.99356,-1639.946,11.222372,31.152702,-55.128437,968.43005,520000
6
+ 2.878191,20.263184,12.137194,-279.31616,-1603.329,46.577377,124.14535,-174.6888,2058.6182,525000
7
+ 2.0687253,27.224707,13.612643,-277.2856,-1396.9054,14.931119,184.29105,-152.39413,1560.9376,530000
8
+ 0.2773057,20.45525,15.805802,-260.15054,-660.4697,13.428065,41.286648,-42.279877,900.2613,535000
9
+ 1.4644815,20.613699,1.7737442,-260.7398,-1151.2748,9.25947,121.099014,-69.649635,1392.6447,540000
10
+ 1.4918554,10.253269,-102.75024,-266.10123,-1238.9578,10.900582,55.91637,-105.317604,827.983,545000
11
+ 2.5921984,104.18728,8.1618,-272.56946,-1053.2018,25.188164,331.2194,-347.89667,5204.404,550000
12
+ 0.8836267,35.5028,5.855666,-256.85892,-869.48755,30.06099,578.70355,-282.50986,4347.4204,555000
13
+ 0.82641464,6.8583026,-152.65044,-258.58292,-797.2144,10.176107,20.421158,-22.492805,460.5686,560000
14
+ 1.2126181,11.061674,15.371127,-256.89597,-653.0203,5.983558,70.101135,-42.848553,691.3043,565000
15
+ 2.8132753,22.302526,0.79405737,-254.90709,-652.09,14.040903,134.9049,-197.31987,1937.1003,570000
16
+ 1.0108776,33.369835,4.528782,-247.19551,-622.60657,9.542892,185.57864,-532.22565,3131.336,575000
17
+ 1.0342985,12.08472,-108.91883,-258.1373,-587.05096,35.194923,1155.1924,-641.74084,5551.2544,580000
18
+ 0.55120665,19.232313,-12.7023,-247.70976,-732.1279,7.689164,69.839165,-79.44663,1340.148,585000
19
+ 0.8878676,5.710751,79.51471,-246.3164,-468.8076,8.381824,60.375385,-72.84898,769.55133,590000
20
+ 1.150594,19.227757,94.85184,-242.93994,-406.36105,11.036214,313.9354,-887.843,6160.297,595000
21
+ 1.4154942,17.58228,38.009426,-243.49669,-382.99484,13.749748,147.43398,-137.48938,2120.2156,600000
22
+ 0.50155646,9.56272,-163.0257,-244.27432,-504.2677,22.01618,466.54602,-422.8931,4060.2231,605000
23
+ 1.0360343,9.209447,140.77,-239.7762,-381.5104,3.7445984,108.55809,-120.61259,1200.9456,610000
24
+ 1.3505833,11.358887,-62.52652,-246.85806,-1818.0457,11.024816,108.240974,-109.47001,1595.985,615000
25
+ 0.7747059,16.771873,-144.90244,-239.07109,-425.33633,3.447776,44.529873,-54.93949,759.79114,620000
26
+ 0.56680095,6.692421,180.84732,-237.78172,-467.94598,4.254449,13.455548,-25.124525,303.09277,625000
27
+ 0.8889389,2.765624,-134.58658,-235.77022,-460.50598,2.541764,7.846018,-8.321752,210.39026,630000
28
+ 0.45851547,2.3192124,184.72665,-233.24683,-340.61337,2.2097027,5.632436,-6.5189757,189.38112,635000
29
+ 1.3441608,15.276731,88.201126,-235.51538,-697.2078,2.5528805,230.0874,-290.5662,1912.5118,640000
30
+ 0.6254833,18.730938,180.7315,-229.7314,-442.18945,18.22501,252.32344,-283.9194,3013.9202,645000
31
+ 1.0761464,4.4240494,-12.031812,-233.44298,-412.33478,5.1185365,68.67597,-33.651306,485.19305,650000
32
+ 2.2045226,13.179873,171.54303,-235.02254,-567.95087,20.616232,206.08238,-274.73373,2289.3455,655000
33
+ 1.3604627,4.8948946,102.60794,-230.69518,-686.3281,5.5898376,80.530334,-30.171669,637.8364,660000
34
+ 1.0149509,3.056439,143.58861,-230.24425,-417.684,2.9206154,53.136364,-25.707249,451.18765,665000
35
+ 0.65839326,8.965962,6.7115493,-228.66035,-491.01553,5.2930913,79.03328,-75.73584,900.21655,670000
36
+ 0.6506411,44.325977,100.511185,-232.26555,-325.77072,6.3962116,191.88531,-103.46229,1076.4845,675000
37
+ 1.3791585,3.366574,119.78238,-229.89737,-468.21246,5.4854813,61.073116,-49.519493,598.28015,680000
38
+ 0.64692044,7.31274,97.47393,-229.9984,-442.22867,4.71875,51.621056,-31.727406,650.6891,685000
39
+ 1.1588438,10.266008,90.0483,-233.6798,-552.0056,6.0076814,124.68285,-116.59725,1363.3934,690000
40
+ 0.9360469,38.327023,72.81278,-226.78087,-356.36945,36.285667,723.3588,-1428.8917,8783.837,695000
41
+ 1.7954273,26.244139,27.811983,-230.99065,-656.1353,115.85872,7380.62,-3379.3677,32247.02,700000
42
+ 0.5052245,6.8472414,21.713127,-229.89294,-356.26956,4.8303003,28.139534,-23.56566,380.4233,705000
43
+ 0.8089874,1.6457018,-50.876263,-230.53267,-338.21838,1.9559716,6.9100027,-7.166821,156.54349,710000
44
+ 0.86306787,2.6814592,24.893322,-227.95293,-328.2368,2.6660957,44.834995,-23.802372,414.7096,715000
45
+ 0.836172,7.986829,0.7848544,-230.65031,-370.19888,4.526846,25.03372,-29.490154,535.3468,720000
46
+ 1.4389071,224.76323,18.844582,-230.89275,-733.4146,50.439472,379.50876,-269.54425,5855.299,725000
47
+ 1.6175463,7.913018,27.741642,-227.79459,-416.55963,7.750296,20.75352,-61.597385,556.7548,730000
48
+ 0.57947254,4.819057,8.4596405,-230.33305,-383.7503,27.145523,215.92786,-256.46115,2401.4346,735000
49
+ 0.68032885,3.1979606,32.975163,-233.49998,-454.50183,2.6909087,9.48593,-8.826355,263.66364,740000
50
+ 0.7836034,2.9480379,71.94968,-228.98946,-591.5606,3.0968144,16.565153,-21.566917,325.3697,745000
51
+ 0.64202803,77.61834,69.660065,-229.1847,-1493.0808,11.73619,176.82416,-96.69407,2410.633,750000
52
+ 1.1285186,13.221393,90.96754,-227.86865,-367.36835,8.670804,125.04965,-109.53611,1485.7352,755000
53
+ 1.3149235,2.7366085,2.3050678,-229.20909,-411.22226,2.0989695,13.573759,-31.25827,281.56226,760000
54
+ 0.45100084,21.797071,48.26931,-229.84517,-455.1903,18.163553,381.6307,-576.65625,3771.95,765000
55
+ 2.186359,3.972429,119.37052,-232.2884,-446.86407,11.569829,106.20259,-305.2968,1590.0333,770000
56
+ 0.9518004,2.3574028,138.15819,-230.09073,-504.21228,3.2234864,27.13816,-19.017075,381.97943,775000
57
+ 0.99165356,4.31193,126.806114,-229.03784,-385.07703,3.285827,18.957705,-20.380465,442.0017,780000
58
+ 0.68127686,7.883002,68.12752,-233.00053,-490.42123,4.647304,38.535095,-38.413322,633.28754,785000
59
+ 1.1116129,13.396228,200.852,-227.77324,-360.0627,7.4497695,43.88418,-44.492023,803.40875,790000
60
+ 1.3994932,19.614038,-5.0094695,-232.44014,-605.3646,25.45548,463.12646,-1104.4259,5897.712,795000
61
+ 0.8078401,6.1093087,262.78983,-235.44102,-1280.4304,4.4568887,20.69635,-16.250006,427.9293,800000
62
+ 0.72056514,5.328851,303.5859,-229.51013,-360.19095,3.497542,141.90974,-137.44156,1155.908,805000
63
+ 1.1902735,5.6185355,255.0818,-231.27184,-369.7986,5.2974763,31.63908,-23.430975,586.18066,810000
64
+ 1.4911637,7.3306727,418.8975,-229.52461,-413.12842,9.412299,106.22178,-80.17231,852.753,815000
65
+ 2.5965168,6.7842484,493.05118,-224.05382,-421.79483,10.6320095,82.94916,-67.510315,1324.2341,820000
66
+ 0.73411226,3.6079614,15.727756,-233.02696,-366.45676,6.297531,42.56216,-38.18004,607.20215,825000
67
+ 1.0660064,18.425219,688.70795,-229.85747,-441.42328,4.7147555,25.335623,-13.203459,607.52875,830000
68
+ 1.3862181,10.726526,764.7122,-229.12552,-776.9505,6.7104645,43.177994,-64.6414,1073.7869,835000
69
+ 0.87858784,4.6021814,865.05914,-225.30876,-577.84875,3.552171,22.460945,-23.127716,662.21655,840000
70
+ 0.6094191,6.4886546,286.08264,-231.3815,-370.82938,4.3450236,25.736755,-38.778313,599.41693,845000
71
+ 1.2559593,7.5640616,1076.6924,-227.5321,-443.77225,4.6102166,18.452019,-27.018509,861.88586,850000
72
+ 1.6086825,9.876964,7.4432893,-235.12901,-510.0606,11.913025,148.06369,-139.88493,1775.5105,855000
73
+ 1.4085124,35.071148,1498.3933,-206.94011,-450.6327,11.883016,137.7066,-560.2036,4543.922,860000
74
+ 1.9153533,25.53437,10.243878,-234.9578,-468.44235,15.212699,154.88177,-145.48207,1797.7317,865000
75
+ 0.72443825,8.052882,1684.8462,-230.73592,-479.11163,17.756815,2595.4412,-662.3124,11060.883,870000
76
+ 0.7823623,4.032703,977.91046,-229.66985,-460.3168,5.9263663,297.8329,-76.11848,1299.3182,875000
77
+ 1.0137551,5.4874697,919.6879,-232.54056,-425.18692,4.2002425,33.525562,-85.89885,772.3205,880000
78
+ 0.90664715,4.9174767,890.2819,-230.23643,-361.64844,4.0584826,43.10404,-12.929328,503.55676,885000
79
+ 1.1833644,12.052974,1763.9335,-214.18945,-370.2673,12.085031,102.040054,-268.39047,2428.8804,890000
80
+ 0.525958,4.572967,846.60736,-232.225,-337.95856,6.900969,12.669615,-54.16819,525.4686,895000
81
+ 0.48168787,7.326979,1849.3124,-225.86397,-454.66168,6.1314645,207.73549,-73.35199,1292.9838,900000
82
+ 0.92399395,10.662639,844.05273,-227.28392,-508.83737,5.8785963,80.105995,-74.01657,1012.3553,905000
83
+ 0.5723296,5.7675233,756.4527,-233.6031,-521.12775,5.3656344,26.67427,-22.662392,624.24896,910000
84
+ 0.8559362,6.2608194,731.80853,-234.87173,-512.5987,24.907103,267.6072,-293.01065,2386.046,915000
85
+ 0.5374327,5.189039,669.16724,-236.19507,-507.19498,4.6406746,18.707203,-15.9143095,368.93945,920000
86
+ 0.43339324,53.730427,632.8456,-234.20308,-1004.29834,57.429592,246.18661,-234.2071,3379.856,925000
87
+ 1.0217394,6.286325,96.079414,-235.79903,-685.1878,8.611224,228.5368,-211.61218,1732.1273,930000
88
+ 0.69466734,3.5787454,-12.149616,-233.95267,-661.63025,2.6260493,9.429834,-11.177242,220.12074,935000
89
+ 0.8094872,10.508997,9.311622,-234.87744,-465.66452,13.596173,105.181175,-159.46071,1178.5627,940000
90
+ 0.5014178,5.9925613,-29.080421,-236.06804,-548.91235,2.592869,8.743116,-14.9385195,310.00754,945000
91
+ 2.586247,11.856093,1559.2633,-221.16606,-441.44714,9.527763,107.62231,-448.33902,2251.5474,950000
92
+ 0.50648636,9.950772,1516.9225,-223.4692,-626.95984,99.89193,1340.5638,-756.67487,8461.43,955000
93
+ 0.62864506,4.6232486,38.080376,-233.24515,-488.67212,6.6844573,93.935356,-131.8441,963.8365,960000
94
+ 0.83935213,16.637936,519.626,-235.35489,-549.41504,20.2468,179.00655,-104.62547,1735.0574,965000
95
+ 0.84316075,5.468171,503.36105,-227.59949,-323.02704,3.7569993,100.40577,-243.04933,1161.21,970000
96
+ 0.5578735,10.578678,285.6624,-233.04308,-1106.2333,37.282875,205.96141,-279.20505,2089.3105,975000
97
+ 1.7573028,7.9197397,953.65,-226.31018,-433.12094,9.420655,45.680523,-78.82538,988.3764,980000
98
+ 0.77651536,5.4922895,185.01593,-233.9583,-626.95404,3.955719,87.76429,-27.795074,546.1645,985000
99
+ 0.934042,3.3675117,731.9833,-225.85208,-315.71994,3.446772,54.298237,-60.722942,748.7698,990000
100
+ 0.4659821,4.945886,629.1102,-228.90247,-479.24594,5.397013,42.473125,-39.95248,790.9956,995000
101
+ 0.48426354,18.828943,106.44166,-231.96231,-1055.2605,7.988038,24.616076,-21.495876,681.7528,1000000
O2O-w-diff-ckpts/fawac/20260312_185155/params_1000000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b84c4c4cd89dc096f5fdf55cbf7c6939559d5df5aef5befd7e86d2c52c9222
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35768223b347300a7141db8ea7078b10973b601bbd46ccb0a36c27b28e0ffcca
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0dd34b06de8a009a32f2fcf06e3de5c571d9aec45a28d26872d390b37ca6f23d
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18bee568670015381800ba576a1ba7a62f56084b565fbd9b4c995de20671f4c9
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:127d770eec132b4c024e52e8e1777a25845567dfefccb654f1c9fa55eb126471
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1db64d98537e4a1c5aaff86db41c2bb6d8bcf3590188deec4217df8016c447a
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d37f2a8c11e189287ef291fe661dc05f1a9ec676c9289d58c22f152f011a8a26
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69ba63f399e9ff46b360e7f49d9650c0ce4cb1fc8d9a4756f8e6599dd68d3e1b
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15a085a86877b4e2929f0fffbe687c506e7439c1bd5837dfde1d1ded7df7c968
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/params_950000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bfda9a417e98deedde956fcfd4321f5e23f875382f6380d4cf3164958df1389b
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_185155/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/fawac/20260312_185155/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/dcbnhsau
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_1000000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_550000.png ADDED

Git LFS Details

  • SHA256: f87baf1f5c2005df1ef0f1cfd31e07a1a8f0bd550cdc301d80a2e639210d77ca
  • Pointer size: 131 Bytes
  • Size of remote file: 223 kB
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_600000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_650000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_700000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_750000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_800000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_850000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_900000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_185155/visited_states_950000.png ADDED