Tiredsheep commited on
Commit
d951c35
·
verified ·
1 Parent(s): 5e326ee

Upload folder using huggingface_hub

Browse files
Files changed (29) hide show
  1. .gitattributes +1 -0
  2. O2O-w-diff-ckpts/fawac/20260312_174717/env.csv +0 -0
  3. O2O-w-diff-ckpts/fawac/20260312_174717/env_sv.csv +0 -0
  4. O2O-w-diff-ckpts/fawac/20260312_174717/eval.csv +11 -0
  5. O2O-w-diff-ckpts/fawac/20260312_174717/eval_sv.csv +11 -0
  6. O2O-w-diff-ckpts/fawac/20260312_174717/online_agent.csv +101 -0
  7. O2O-w-diff-ckpts/fawac/20260312_174717/online_agent_sv.csv +101 -0
  8. O2O-w-diff-ckpts/fawac/20260312_174717/params_450000.pkl +3 -0
  9. O2O-w-diff-ckpts/fawac/20260312_174717/params_500000.pkl +3 -0
  10. O2O-w-diff-ckpts/fawac/20260312_174717/params_550000.pkl +3 -0
  11. O2O-w-diff-ckpts/fawac/20260312_174717/params_600000.pkl +3 -0
  12. O2O-w-diff-ckpts/fawac/20260312_174717/params_650000.pkl +3 -0
  13. O2O-w-diff-ckpts/fawac/20260312_174717/params_700000.pkl +3 -0
  14. O2O-w-diff-ckpts/fawac/20260312_174717/params_750000.pkl +3 -0
  15. O2O-w-diff-ckpts/fawac/20260312_174717/params_800000.pkl +3 -0
  16. O2O-w-diff-ckpts/fawac/20260312_174717/params_850000.pkl +3 -0
  17. O2O-w-diff-ckpts/fawac/20260312_174717/params_900000.pkl +3 -0
  18. O2O-w-diff-ckpts/fawac/20260312_174717/progress.tk +1 -0
  19. O2O-w-diff-ckpts/fawac/20260312_174717/token.tk +1 -0
  20. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_450000.png +3 -0
  21. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_500000.png +0 -0
  22. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_550000.png +0 -0
  23. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_600000.png +0 -0
  24. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_650000.png +0 -0
  25. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_700000.png +0 -0
  26. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_750000.png +0 -0
  27. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_800000.png +0 -0
  28. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_850000.png +0 -0
  29. O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_900000.png +0 -0
.gitattributes CHANGED
@@ -672,3 +672,4 @@ O2O-w-diff-ckpts/ifql/20260318_061136/visited_states_1400000.png filter=lfs diff
672
  O2O-w-diff-ckpts/ifql/20260318_061136/visited_states_950000.png filter=lfs diff=lfs merge=lfs -text
673
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1050000.png filter=lfs diff=lfs merge=lfs -text
674
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1450000.png filter=lfs diff=lfs merge=lfs -text
 
 
672
  O2O-w-diff-ckpts/ifql/20260318_061136/visited_states_950000.png filter=lfs diff=lfs merge=lfs -text
673
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1050000.png filter=lfs diff=lfs merge=lfs -text
674
  O2O-w-diff-ckpts/ifql/20260318_111956/visited_states_1450000.png filter=lfs diff=lfs merge=lfs -text
675
+ O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_450000.png filter=lfs diff=lfs merge=lfs -text
O2O-w-diff-ckpts/fawac/20260312_174717/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_174717/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_174717/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.24801742147601563,0.09501245444158858,-0.010979530059841057,0.0977403361677636,0.03822815557159994,0.0,25500.0,-1.0,-1000.0,1000.0,1.3963294410705567,450000
3
+ 0.0,0.0,0.3029224021492154,0.1331543130808059,0.02966840953681909,0.13380492818810802,-0.006002054116355205,0.0,77500.0,-1.0,-1000.0,1000.0,1.3933022117614746,500000
4
+ 0.0,0.0,0.25943261770937404,0.13166527239472503,-0.006905957955890071,0.1284782713664867,-0.0479726409274728,0.0,129500.0,-1.0,-1000.0,1000.0,1.405892152786255,550000
5
+ 0.0,0.0,0.1864657065019923,0.11573948519301351,-0.011197527042046716,0.11415190585776736,0.009565246848864372,0.0,181500.0,-1.0,-1000.0,1000.0,1.4796000385284425,600000
6
+ 0.0,0.0,0.3418656911597497,0.1439851393486535,0.01187935910515455,0.14517064875780242,0.014911628301641663,0.0,233500.0,-1.0,-1000.0,1000.0,1.4595744800567627,650000
7
+ 0.0,0.0,0.006073572080551966,0.07660986308491506,0.002471767835575042,0.07702675492652636,0.0042452324040285405,0.0,285500.0,-1.0,-1000.0,1000.0,1.5490845012664796,700000
8
+ 0.0,0.0,0.3120050866920359,0.1300784207649073,-0.0651020424341609,0.12967535809775776,-0.01270296368091233,0.0,337500.0,-1.0,-1000.0,1000.0,1.3687645721435546,750000
9
+ 0.0,0.0,0.1727112415462143,0.11119253575282526,0.03355450288848489,0.11050834596513069,-0.01356851665711498,0.0,389500.0,-1.0,-1000.0,1000.0,1.429611358642578,800000
10
+ 0.0,0.0,0.2348015017107825,0.13096748491424054,0.03459426288773039,0.13156404360995305,-0.0216888583579918,0.0,441500.0,-1.0,-1000.0,1000.0,1.4623742055892945,850000
11
+ 0.0,0.0,0.17103846111725798,0.12232612905209898,-0.013234699410578987,0.12280830589655554,0.01326221806263311,0.0,493500.0,-1.0,-1000.0,1000.0,1.4546094274520873,900000
O2O-w-diff-ckpts/fawac/20260312_174717/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.24801742147601563,0.09501245444158858,-0.010979530059841057,0.0977403361677636,0.03822815557159994,0.0,25500.0,-1.0,-1000.0,1000.0,1.3963294410705567,450000
3
+ 0.0,0.0,0.3029224021492154,0.1331543130808059,0.02966840953681909,0.13380492818810802,-0.006002054116355205,0.0,77500.0,-1.0,-1000.0,1000.0,1.3933022117614746,500000
4
+ 0.0,0.0,0.25943261770937404,0.13166527239472503,-0.006905957955890071,0.1284782713664867,-0.0479726409274728,0.0,129500.0,-1.0,-1000.0,1000.0,1.405892152786255,550000
5
+ 0.0,0.0,0.1864657065019923,0.11573948519301351,-0.011197527042046716,0.11415190585776736,0.009565246848864372,0.0,181500.0,-1.0,-1000.0,1000.0,1.4796000385284425,600000
6
+ 0.0,0.0,0.3418656911597497,0.1439851393486535,0.01187935910515455,0.14517064875780242,0.014911628301641663,0.0,233500.0,-1.0,-1000.0,1000.0,1.4595744800567627,650000
7
+ 0.0,0.0,0.006073572080551966,0.07660986308491506,0.002471767835575042,0.07702675492652636,0.0042452324040285405,0.0,285500.0,-1.0,-1000.0,1000.0,1.5490845012664796,700000
8
+ 0.0,0.0,0.3120050866920359,0.1300784207649073,-0.0651020424341609,0.12967535809775776,-0.01270296368091233,0.0,337500.0,-1.0,-1000.0,1000.0,1.3687645721435546,750000
9
+ 0.0,0.0,0.1727112415462143,0.11119253575282526,0.03355450288848489,0.11050834596513069,-0.01356851665711498,0.0,389500.0,-1.0,-1000.0,1000.0,1.429611358642578,800000
10
+ 0.0,0.0,0.2348015017107825,0.13096748491424054,0.03459426288773039,0.13156404360995305,-0.0216888583579918,0.0,441500.0,-1.0,-1000.0,1000.0,1.4623742055892945,850000
11
+ 0.0,0.0,0.17103846111725798,0.12232612905209898,-0.013234699410578987,0.12280830589655554,0.01326221806263311,0.0,493500.0,-1.0,-1000.0,1000.0,1.4546094274520873,900000
O2O-w-diff-ckpts/fawac/20260312_174717/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 4.4662676,70.66207,-7.661806,-320.06268,-4945.9316,50.497265,421.3995,-447.27518,4827.7744,405000
3
+ 1.9251473,23.748615,1.681031,-294.81592,-5002.0244,27.988605,116.99065,-140.46909,2013.1014,410000
4
+ 2.6703537,41.540302,-135.20332,-380.5646,-5016.6294,32.797974,93.10898,-83.322075,2105.0269,415000
5
+ 2.3608665,33.98456,-142.05649,-316.92245,-5004.1523,28.293385,95.16309,-250.87956,2059.163,420000
6
+ 2.360067,77.6676,-2.475463,-324.4499,-5008.3945,158.74632,2761.1558,-4251.7515,25111.3,425000
7
+ 2.0706396,42.13426,9.441224,-338.39737,-4983.5195,36.169674,407.6437,-229.33011,2750.4937,430000
8
+ 1.4852369,83.31918,39.285675,-277.1876,-661.23096,22.093939,91.46239,-138.40251,2137.6843,435000
9
+ 2.434082,22.246557,1.4617324,-326.0509,-5024.9873,20.364231,67.176094,-110.25852,1433.1628,440000
10
+ 2.036507,28.666494,41.802696,-317.84534,-5022.6914,43.412872,514.25183,-410.70752,3879.9897,445000
11
+ 1.9188668,156.47021,2.1899948,-380.85538,-4980.919,68.53112,605.55176,-393.00766,9515.861,450000
12
+ 2.5730925,54.31077,0.7276381,-307.33453,-4887.247,87.96156,1000.76825,-1754.9308,13776.016,455000
13
+ 1.583828,42.173817,-119.02087,-323.22403,-4822.7407,26.292383,305.3202,-170.81592,2988.4722,460000
14
+ 2.2649367,45.080456,-93.788284,-298.95837,-879.1661,48.421074,462.54837,-272.82925,3439.6426,465000
15
+ 1.4618866,30.642197,-16.860039,-312.3545,-4562.2407,52.17538,276.93457,-705.3908,5387.389,470000
16
+ 2.876676,58.196327,13.298346,-316.30566,-4485.0996,46.54013,184.87578,-296.85693,3574.1106,475000
17
+ 1.9046676,37.34897,-117.19675,-349.14728,-4310.9336,54.963623,761.4507,-416.93805,4788.853,480000
18
+ 2.7546246,26.75739,-36.684387,-300.4809,-3408.2803,21.699492,167.46945,-178.73552,2719.3162,485000
19
+ 4.2801714,74.261826,-10.498431,-350.12723,-4007.9814,76.13753,405.93958,-444.89435,7091.83,490000
20
+ 5.2836757,46.102886,26.153572,-321.2647,-3849.3572,31.777578,431.7699,-311.134,3500.1604,495000
21
+ 2.65165,42.77255,-6.896263,-336.96387,-3635.5256,31.32884,489.23544,-299.81378,5067.16,500000
22
+ 2.0243697,24.882923,-200.34311,-319.6841,-3395.5896,83.85656,1460.0222,-1559.0061,10965.089,505000
23
+ 3.6971917,45.941643,-50.936005,-352.2982,-3202.5098,32.935078,635.2303,-1292.7697,8049.1763,510000
24
+ 3.7464664,47.60129,-27.713577,-314.2509,-3045.9236,55.16955,1266.6954,-1208.5592,8036.6655,515000
25
+ 2.0620341,41.222725,-168.20958,-296.4643,-2814.1194,20.518538,1034.5524,-689.94385,4626.8604,520000
26
+ 1.3082144,40.485123,-72.27203,-296.08658,-2634.067,23.194166,72.72102,-68.757576,1309.4968,525000
27
+ 1.7712398,10.308053,-122.85537,-295.33517,-2388.544,16.040121,584.1681,-328.4729,2510.8428,530000
28
+ 3.3131285,15.5299225,-63.638878,-292.86453,-2203.6877,8.861171,35.28946,-74.874054,981.3823,535000
29
+ 1.717349,7.8464046,-110.320946,-282.6497,-2016.1901,12.600331,41.92994,-57.50298,873.4033,540000
30
+ 3.1177168,22.246098,-48.362465,-308.87692,-2032.301,29.657232,260.52966,-175.28436,3176.4548,545000
31
+ 2.061579,14.918902,-163.43948,-280.8233,-1692.0394,15.59625,44.77542,-126.66382,1358.7324,550000
32
+ 1.477859,20.779766,-37.21306,-276.60635,-1563.559,22.379255,225.23096,-172.92258,2269.5198,555000
33
+ 2.2948785,10.645155,0.6945473,-271.94107,-1432.4725,6.860032,56.61361,-40.008743,700.13586,560000
34
+ 2.3014197,14.626869,-27.307095,-270.42844,-1310.515,12.132082,121.98134,-157.81744,1600.3982,565000
35
+ 2.3331711,17.479862,5.674675,-289.94028,-1223.2719,22.386005,347.24744,-237.56963,3004.6746,570000
36
+ 1.1114837,79.373405,-80.60028,-264.11594,-1091.2456,7.354017,146.46983,-55.6022,1032.0801,575000
37
+ 1.855611,8.109914,3.4185257,-258.7295,-1012.1166,9.175351,54.814106,-63.687706,1069.6364,580000
38
+ 0.9304005,10.399654,9.255396,-258.71613,-944.8369,5.6499147,59.72145,-30.683914,700.5602,585000
39
+ 1.7854236,6.661368,-31.479002,-258.3043,-936.6001,6.1531925,26.076162,-36.090866,619.0369,590000
40
+ 2.3753872,73.68874,29.266247,-253.59605,-794.43005,60.382824,907.3978,-1060.7778,7303.154,595000
41
+ 1.2719606,78.815,28.140682,-255.91463,-734.84607,48.603176,212.67545,-167.7103,2896.619,600000
42
+ 0.8842579,11.933133,-123.29658,-244.34166,-444.43784,11.971677,228.34885,-93.172844,1385.8367,605000
43
+ 0.6789751,8.091731,-126.28157,-250.16658,-616.1711,3.8766408,36.048794,-27.41568,390.18262,610000
44
+ 2.8148963,4.602666,17.029408,-247.3319,-564.63477,5.5308714,26.25508,-68.75469,642.5071,615000
45
+ 1.7003508,3.7583272,-0.0015941858,-240.69107,-521.9331,5.8494983,22.65949,-27.894436,480.36664,620000
46
+ 0.80279684,29.381088,107.7082,-243.86803,-717.711,15.443746,127.679596,-185.04683,2001.9042,625000
47
+ 1.0289263,6.037807,83.46259,-247.58243,-505.29376,4.440723,31.500559,-17.488207,400.1015,630000
48
+ 1.1686795,9.882148,128.56435,-237.3719,-436.70084,5.689525,91.49606,-68.1981,1286.8853,635000
49
+ 1.1527958,2.9552526,-194.89253,-242.39969,-659.7418,2.8399525,44.3979,-63.020924,316.70178,640000
50
+ 0.8517413,2.5789306,152.01219,-235.09033,-418.7422,2.3063905,26.580343,-14.224776,400.09814,645000
51
+ 0.7667899,5.298355,166.5329,-232.75053,-563.55164,7.2333617,74.48452,-76.40666,855.9071,650000
52
+ 2.4940095,16.84259,28.59451,-232.98564,-416.03015,8.854617,70.84202,-146.41342,1765.7888,655000
53
+ 0.41739637,4.2639217,7.4708385,-231.33853,-401.25143,8.193844,158.77562,-708.4156,2859.494,660000
54
+ 0.69776046,243.31895,87.8072,-234.41386,-327.54404,148.71397,1047.6675,-2679.6577,14889.493,665000
55
+ 0.7924217,2.936808,-143.68271,-234.0127,-377.64722,5.3032,38.526608,-57.98727,480.87805,670000
56
+ 0.68378484,2.053703,-156.41959,-230.5917,-663.5892,4.307565,187.10811,-65.7998,1071.6753,675000
57
+ 0.5925187,4.1055818,-7.75692,-229.5251,-494.37067,1.4179091,26.29938,-16.196106,266.05414,680000
58
+ 1.0080602,1.9553102,4.1149807,-233.26431,-691.086,2.1022692,16.378853,-26.63039,306.97333,685000
59
+ 1.3041475,4.1548524,151.29282,-226.02734,-324.36115,3.528402,87.87003,-47.879677,732.409,690000
60
+ 0.42329532,11.3934355,4.876248,-228.16808,-406.97406,17.031834,131.83891,-245.55708,2360.5884,695000
61
+ 0.6044845,2.84272,-90.901184,-227.21475,-664.6494,1.7353302,8.133621,-7.32504,222.70888,700000
62
+ 0.48717946,3.7711637,164.64355,-223.96245,-314.09534,1.2926091,26.423943,-16.445751,263.47296,705000
63
+ 0.4917208,1.569171,-127.985825,-226.20691,-361.0392,1.3362173,8.194722,-6.5942144,215.51707,710000
64
+ 0.9268609,4.419582,140.96904,-221.79727,-331.74063,4.873951,446.40866,-127.34708,1647.0844,715000
65
+ 1.4413913,4.8457794,20.44192,-223.22842,-322.06107,5.9278965,390.86234,-139.88219,2001.9523,720000
66
+ 0.87832594,1.7396338,109.19546,-221.79784,-318.61237,2.1540546,27.354836,-91.46683,466.0308,725000
67
+ 0.39666235,2.0213277,20.189232,-222.0349,-317.2845,1.3962171,18.961857,-6.3692074,216.38672,730000
68
+ 0.45646483,1.286457,81.87161,-222.15833,-426.95325,1.7975613,9.504781,-13.372507,213.67891,735000
69
+ 0.46040124,6.595671,-83.32864,-222.31519,-553.44916,2.0290852,96.184525,-93.06744,1037.3159,740000
70
+ 0.9292548,0.9994095,-85.417404,-221.80493,-297.62634,1.1807479,10.385268,-4.8498564,166.86996,745000
71
+ 0.4798066,2.3256104,30.747559,-218.84917,-319.57486,3.1551616,104.33824,-30.288761,589.90625,750000
72
+ 1.1410515,7.5363235,14.411462,-221.4688,-448.32468,4.980819,198.95753,-131.63199,1469.9354,755000
73
+ 0.70471436,3.8344667,-32.178303,-219.43599,-523.5603,4.197593,71.52052,-80.55274,809.45764,760000
74
+ 1.2963651,7.465114,12.538819,-221.85733,-427.31503,16.158056,301.52838,-301.31873,2430.5933,765000
75
+ 0.7566171,1.8194674,3.1555414,-221.75456,-467.68256,1.8717088,36.198578,-39.551617,391.1515,770000
76
+ 0.5522855,1.7646055,11.52543,-219.6888,-481.79276,1.1829304,8.736204,-14.069153,201.23976,775000
77
+ 0.45889878,14.676816,29.382341,-220.5355,-300.2527,4.2204432,131.37158,-141.8387,1664.568,780000
78
+ 0.66314495,3.163153,61.5119,-218.90479,-268.37207,2.3329966,101.02064,-17.99605,578.5614,785000
79
+ 0.88493997,2.055275,74.597786,-214.96333,-279.22617,2.456411,44.92651,-42.110233,543.6818,790000
80
+ 0.42377412,1.0927333,95.766136,-221.14722,-451.48557,1.6472536,12.622605,-23.150429,173.51955,795000
81
+ 0.5505823,4.348186,123.19546,-220.11406,-453.80255,2.6497378,59.946617,-28.692097,516.98914,800000
82
+ 0.8159154,2.6715038,153.60184,-218.23657,-527.11487,5.6886744,75.97491,-27.023266,655.20245,805000
83
+ 0.5270793,1.4577888,187.04753,-218.86784,-289.55682,1.2105764,19.39738,-9.437429,244.17633,810000
84
+ 0.6307365,4.2838664,213.97665,-219.97054,-321.6666,2.495225,23.89012,-24.635923,410.29178,815000
85
+ 0.4286133,2.1614892,238.8037,-219.87144,-516.6416,2.9773674,47.175987,-43.35445,486.6414,820000
86
+ 0.57002354,4.635358,276.7615,-217.37796,-426.51367,2.7358265,11.300769,-30.418213,349.78778,825000
87
+ 0.76265717,5.0959654,320.37473,-220.96378,-548.5687,8.637939,162.69864,-142.94072,1382.7644,830000
88
+ 0.54201484,3.788327,-146.43921,-222.1256,-550.74316,1.319394,7.664749,-10.27225,238.49838,835000
89
+ 0.81399125,72.81124,32.564827,-219.76152,-383.3534,69.19149,206.83556,-138.86075,2577.5322,840000
90
+ 0.47830427,1.9536752,463.64435,-218.20625,-313.0447,2.0115626,12.854819,-21.265059,269.51956,845000
91
+ 0.34188503,10.398839,522.94543,-211.65494,-345.98013,2.7106123,32.845795,-65.21416,750.21094,850000
92
+ 0.8965757,14.968289,590.1251,-212.37369,-567.58997,45.946472,1321.6267,-799.0439,7785.012,855000
93
+ 0.6214229,9.172577,646.41296,-216.93419,-329.57303,10.782523,19.59313,-24.793573,334.99625,860000
94
+ 0.53327006,7.6812973,-79.2179,-220.36421,-262.4437,11.295256,50.717564,-78.23236,1046.1855,865000
95
+ 0.7065997,1.959351,-117.360725,-220.46753,-292.95877,6.2291155,159.39935,-370.9934,2084.4595,870000
96
+ 0.82645583,19.506918,1061.1471,-211.53398,-411.45392,24.898335,56.88674,-92.829315,1587.9727,875000
97
+ 0.7350342,4.6899476,1183.5968,-191.86333,-330.00482,4.093171,48.66261,-108.76965,1257.1962,880000
98
+ 0.34763676,1.5509987,921.3322,-209.78809,-532.2286,1.1218677,38.319984,-32.479927,325.6854,885000
99
+ 0.44202155,3.693075,934.1501,-215.94205,-270.77213,31.76242,2260.9736,-1868.9363,14213.222,890000
100
+ 0.74969053,4.9884195,1735.8158,-210.04443,-433.23105,2.3736317,130.79951,-87.09507,778.43427,895000
101
+ 0.40706742,3.0118256,1927.4456,-204.00586,-534.20087,2.1530473,26.885925,-26.389694,814.10925,900000
O2O-w-diff-ckpts/fawac/20260312_174717/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 4.4662676,70.66207,-7.661806,-320.06268,-4945.9316,50.497265,421.3995,-447.27518,4827.7744,405000
3
+ 1.9251473,23.748615,1.681031,-294.81592,-5002.0244,27.988605,116.99065,-140.46909,2013.1014,410000
4
+ 2.6703537,41.540302,-135.20332,-380.5646,-5016.6294,32.797974,93.10898,-83.322075,2105.0269,415000
5
+ 2.3608665,33.98456,-142.05649,-316.92245,-5004.1523,28.293385,95.16309,-250.87956,2059.163,420000
6
+ 2.360067,77.6676,-2.475463,-324.4499,-5008.3945,158.74632,2761.1558,-4251.7515,25111.3,425000
7
+ 2.0706396,42.13426,9.441224,-338.39737,-4983.5195,36.169674,407.6437,-229.33011,2750.4937,430000
8
+ 1.4852369,83.31918,39.285675,-277.1876,-661.23096,22.093939,91.46239,-138.40251,2137.6843,435000
9
+ 2.434082,22.246557,1.4617324,-326.0509,-5024.9873,20.364231,67.176094,-110.25852,1433.1628,440000
10
+ 2.036507,28.666494,41.802696,-317.84534,-5022.6914,43.412872,514.25183,-410.70752,3879.9897,445000
11
+ 1.9188668,156.47021,2.1899948,-380.85538,-4980.919,68.53112,605.55176,-393.00766,9515.861,450000
12
+ 2.5730925,54.31077,0.7276381,-307.33453,-4887.247,87.96156,1000.76825,-1754.9308,13776.016,455000
13
+ 1.583828,42.173817,-119.02087,-323.22403,-4822.7407,26.292383,305.3202,-170.81592,2988.4722,460000
14
+ 2.2649367,45.080456,-93.788284,-298.95837,-879.1661,48.421074,462.54837,-272.82925,3439.6426,465000
15
+ 1.4618866,30.642197,-16.860039,-312.3545,-4562.2407,52.17538,276.93457,-705.3908,5387.389,470000
16
+ 2.876676,58.196327,13.298346,-316.30566,-4485.0996,46.54013,184.87578,-296.85693,3574.1106,475000
17
+ 1.9046676,37.34897,-117.19675,-349.14728,-4310.9336,54.963623,761.4507,-416.93805,4788.853,480000
18
+ 2.7546246,26.75739,-36.684387,-300.4809,-3408.2803,21.699492,167.46945,-178.73552,2719.3162,485000
19
+ 4.2801714,74.261826,-10.498431,-350.12723,-4007.9814,76.13753,405.93958,-444.89435,7091.83,490000
20
+ 5.2836757,46.102886,26.153572,-321.2647,-3849.3572,31.777578,431.7699,-311.134,3500.1604,495000
21
+ 2.65165,42.77255,-6.896263,-336.96387,-3635.5256,31.32884,489.23544,-299.81378,5067.16,500000
22
+ 2.0243697,24.882923,-200.34311,-319.6841,-3395.5896,83.85656,1460.0222,-1559.0061,10965.089,505000
23
+ 3.6971917,45.941643,-50.936005,-352.2982,-3202.5098,32.935078,635.2303,-1292.7697,8049.1763,510000
24
+ 3.7464664,47.60129,-27.713577,-314.2509,-3045.9236,55.16955,1266.6954,-1208.5592,8036.6655,515000
25
+ 2.0620341,41.222725,-168.20958,-296.4643,-2814.1194,20.518538,1034.5524,-689.94385,4626.8604,520000
26
+ 1.3082144,40.485123,-72.27203,-296.08658,-2634.067,23.194166,72.72102,-68.757576,1309.4968,525000
27
+ 1.7712398,10.308053,-122.85537,-295.33517,-2388.544,16.040121,584.1681,-328.4729,2510.8428,530000
28
+ 3.3131285,15.5299225,-63.638878,-292.86453,-2203.6877,8.861171,35.28946,-74.874054,981.3823,535000
29
+ 1.717349,7.8464046,-110.320946,-282.6497,-2016.1901,12.600331,41.92994,-57.50298,873.4033,540000
30
+ 3.1177168,22.246098,-48.362465,-308.87692,-2032.301,29.657232,260.52966,-175.28436,3176.4548,545000
31
+ 2.061579,14.918902,-163.43948,-280.8233,-1692.0394,15.59625,44.77542,-126.66382,1358.7324,550000
32
+ 1.477859,20.779766,-37.21306,-276.60635,-1563.559,22.379255,225.23096,-172.92258,2269.5198,555000
33
+ 2.2948785,10.645155,0.6945473,-271.94107,-1432.4725,6.860032,56.61361,-40.008743,700.13586,560000
34
+ 2.3014197,14.626869,-27.307095,-270.42844,-1310.515,12.132082,121.98134,-157.81744,1600.3982,565000
35
+ 2.3331711,17.479862,5.674675,-289.94028,-1223.2719,22.386005,347.24744,-237.56963,3004.6746,570000
36
+ 1.1114837,79.373405,-80.60028,-264.11594,-1091.2456,7.354017,146.46983,-55.6022,1032.0801,575000
37
+ 1.855611,8.109914,3.4185257,-258.7295,-1012.1166,9.175351,54.814106,-63.687706,1069.6364,580000
38
+ 0.9304005,10.399654,9.255396,-258.71613,-944.8369,5.6499147,59.72145,-30.683914,700.5602,585000
39
+ 1.7854236,6.661368,-31.479002,-258.3043,-936.6001,6.1531925,26.076162,-36.090866,619.0369,590000
40
+ 2.3753872,73.68874,29.266247,-253.59605,-794.43005,60.382824,907.3978,-1060.7778,7303.154,595000
41
+ 1.2719606,78.815,28.140682,-255.91463,-734.84607,48.603176,212.67545,-167.7103,2896.619,600000
42
+ 0.8842579,11.933133,-123.29658,-244.34166,-444.43784,11.971677,228.34885,-93.172844,1385.8367,605000
43
+ 0.6789751,8.091731,-126.28157,-250.16658,-616.1711,3.8766408,36.048794,-27.41568,390.18262,610000
44
+ 2.8148963,4.602666,17.029408,-247.3319,-564.63477,5.5308714,26.25508,-68.75469,642.5071,615000
45
+ 1.7003508,3.7583272,-0.0015941858,-240.69107,-521.9331,5.8494983,22.65949,-27.894436,480.36664,620000
46
+ 0.80279684,29.381088,107.7082,-243.86803,-717.711,15.443746,127.679596,-185.04683,2001.9042,625000
47
+ 1.0289263,6.037807,83.46259,-247.58243,-505.29376,4.440723,31.500559,-17.488207,400.1015,630000
48
+ 1.1686795,9.882148,128.56435,-237.3719,-436.70084,5.689525,91.49606,-68.1981,1286.8853,635000
49
+ 1.1527958,2.9552526,-194.89253,-242.39969,-659.7418,2.8399525,44.3979,-63.020924,316.70178,640000
50
+ 0.8517413,2.5789306,152.01219,-235.09033,-418.7422,2.3063905,26.580343,-14.224776,400.09814,645000
51
+ 0.7667899,5.298355,166.5329,-232.75053,-563.55164,7.2333617,74.48452,-76.40666,855.9071,650000
52
+ 2.4940095,16.84259,28.59451,-232.98564,-416.03015,8.854617,70.84202,-146.41342,1765.7888,655000
53
+ 0.41739637,4.2639217,7.4708385,-231.33853,-401.25143,8.193844,158.77562,-708.4156,2859.494,660000
54
+ 0.69776046,243.31895,87.8072,-234.41386,-327.54404,148.71397,1047.6675,-2679.6577,14889.493,665000
55
+ 0.7924217,2.936808,-143.68271,-234.0127,-377.64722,5.3032,38.526608,-57.98727,480.87805,670000
56
+ 0.68378484,2.053703,-156.41959,-230.5917,-663.5892,4.307565,187.10811,-65.7998,1071.6753,675000
57
+ 0.5925187,4.1055818,-7.75692,-229.5251,-494.37067,1.4179091,26.29938,-16.196106,266.05414,680000
58
+ 1.0080602,1.9553102,4.1149807,-233.26431,-691.086,2.1022692,16.378853,-26.63039,306.97333,685000
59
+ 1.3041475,4.1548524,151.29282,-226.02734,-324.36115,3.528402,87.87003,-47.879677,732.409,690000
60
+ 0.42329532,11.3934355,4.876248,-228.16808,-406.97406,17.031834,131.83891,-245.55708,2360.5884,695000
61
+ 0.6044845,2.84272,-90.901184,-227.21475,-664.6494,1.7353302,8.133621,-7.32504,222.70888,700000
62
+ 0.48717946,3.7711637,164.64355,-223.96245,-314.09534,1.2926091,26.423943,-16.445751,263.47296,705000
63
+ 0.4917208,1.569171,-127.985825,-226.20691,-361.0392,1.3362173,8.194722,-6.5942144,215.51707,710000
64
+ 0.9268609,4.419582,140.96904,-221.79727,-331.74063,4.873951,446.40866,-127.34708,1647.0844,715000
65
+ 1.4413913,4.8457794,20.44192,-223.22842,-322.06107,5.9278965,390.86234,-139.88219,2001.9523,720000
66
+ 0.87832594,1.7396338,109.19546,-221.79784,-318.61237,2.1540546,27.354836,-91.46683,466.0308,725000
67
+ 0.39666235,2.0213277,20.189232,-222.0349,-317.2845,1.3962171,18.961857,-6.3692074,216.38672,730000
68
+ 0.45646483,1.286457,81.87161,-222.15833,-426.95325,1.7975613,9.504781,-13.372507,213.67891,735000
69
+ 0.46040124,6.595671,-83.32864,-222.31519,-553.44916,2.0290852,96.184525,-93.06744,1037.3159,740000
70
+ 0.9292548,0.9994095,-85.417404,-221.80493,-297.62634,1.1807479,10.385268,-4.8498564,166.86996,745000
71
+ 0.4798066,2.3256104,30.747559,-218.84917,-319.57486,3.1551616,104.33824,-30.288761,589.90625,750000
72
+ 1.1410515,7.5363235,14.411462,-221.4688,-448.32468,4.980819,198.95753,-131.63199,1469.9354,755000
73
+ 0.70471436,3.8344667,-32.178303,-219.43599,-523.5603,4.197593,71.52052,-80.55274,809.45764,760000
74
+ 1.2963651,7.465114,12.538819,-221.85733,-427.31503,16.158056,301.52838,-301.31873,2430.5933,765000
75
+ 0.7566171,1.8194674,3.1555414,-221.75456,-467.68256,1.8717088,36.198578,-39.551617,391.1515,770000
76
+ 0.5522855,1.7646055,11.52543,-219.6888,-481.79276,1.1829304,8.736204,-14.069153,201.23976,775000
77
+ 0.45889878,14.676816,29.382341,-220.5355,-300.2527,4.2204432,131.37158,-141.8387,1664.568,780000
78
+ 0.66314495,3.163153,61.5119,-218.90479,-268.37207,2.3329966,101.02064,-17.99605,578.5614,785000
79
+ 0.88493997,2.055275,74.597786,-214.96333,-279.22617,2.456411,44.92651,-42.110233,543.6818,790000
80
+ 0.42377412,1.0927333,95.766136,-221.14722,-451.48557,1.6472536,12.622605,-23.150429,173.51955,795000
81
+ 0.5505823,4.348186,123.19546,-220.11406,-453.80255,2.6497378,59.946617,-28.692097,516.98914,800000
82
+ 0.8159154,2.6715038,153.60184,-218.23657,-527.11487,5.6886744,75.97491,-27.023266,655.20245,805000
83
+ 0.5270793,1.4577888,187.04753,-218.86784,-289.55682,1.2105764,19.39738,-9.437429,244.17633,810000
84
+ 0.6307365,4.2838664,213.97665,-219.97054,-321.6666,2.495225,23.89012,-24.635923,410.29178,815000
85
+ 0.4286133,2.1614892,238.8037,-219.87144,-516.6416,2.9773674,47.175987,-43.35445,486.6414,820000
86
+ 0.57002354,4.635358,276.7615,-217.37796,-426.51367,2.7358265,11.300769,-30.418213,349.78778,825000
87
+ 0.76265717,5.0959654,320.37473,-220.96378,-548.5687,8.637939,162.69864,-142.94072,1382.7644,830000
88
+ 0.54201484,3.788327,-146.43921,-222.1256,-550.74316,1.319394,7.664749,-10.27225,238.49838,835000
89
+ 0.81399125,72.81124,32.564827,-219.76152,-383.3534,69.19149,206.83556,-138.86075,2577.5322,840000
90
+ 0.47830427,1.9536752,463.64435,-218.20625,-313.0447,2.0115626,12.854819,-21.265059,269.51956,845000
91
+ 0.34188503,10.398839,522.94543,-211.65494,-345.98013,2.7106123,32.845795,-65.21416,750.21094,850000
92
+ 0.8965757,14.968289,590.1251,-212.37369,-567.58997,45.946472,1321.6267,-799.0439,7785.012,855000
93
+ 0.6214229,9.172577,646.41296,-216.93419,-329.57303,10.782523,19.59313,-24.793573,334.99625,860000
94
+ 0.53327006,7.6812973,-79.2179,-220.36421,-262.4437,11.295256,50.717564,-78.23236,1046.1855,865000
95
+ 0.7065997,1.959351,-117.360725,-220.46753,-292.95877,6.2291155,159.39935,-370.9934,2084.4595,870000
96
+ 0.82645583,19.506918,1061.1471,-211.53398,-411.45392,24.898335,56.88674,-92.829315,1587.9727,875000
97
+ 0.7350342,4.6899476,1183.5968,-191.86333,-330.00482,4.093171,48.66261,-108.76965,1257.1962,880000
98
+ 0.34763676,1.5509987,921.3322,-209.78809,-532.2286,1.1218677,38.319984,-32.479927,325.6854,885000
99
+ 0.44202155,3.693075,934.1501,-215.94205,-270.77213,31.76242,2260.9736,-1868.9363,14213.222,890000
100
+ 0.74969053,4.9884195,1735.8158,-210.04443,-433.23105,2.3736317,130.79951,-87.09507,778.43427,895000
101
+ 0.40706742,3.0118256,1927.4456,-204.00586,-534.20087,2.1530473,26.885925,-26.389694,814.10925,900000
O2O-w-diff-ckpts/fawac/20260312_174717/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b8e601c3e2be76530f1cdc01762fe8d21823ce690a62c5ab6b19ce7c7896cd3
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5576a42ee79b1f1410164025f38c43161a04c00c3ac7e5bd335458ba31486ee3
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:469cdc7f343d0d4278c09b229e92446a9560d2879141cc5b4d8ca6e0fa340835
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8bf66a38441f384cfff67012d8cfb4eb10a161bcc1cb8b3e6f17df4eb30812e
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb3599fdae65cc4216534c629876ccbe7a0a46577e484d00172907b6b6518520
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd4d3d73ccde9e18d688e9bfd0e2841a193b66c22f1af90747c1ae40adbeba0e
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02847894965c815ae5cb083fb6941c8a27f62685994e898e805b418c182163a4
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2b439a66acb843587a0d1ee43e10822dc90e67bf73f93ebd7f63592a4d36db4
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_850000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0717b4341ba5bc908693156a017ab12641fe19e60034d4124361cca2dbd4ec45
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/params_900000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2fc4b5316fa070465d3ca10787d87126eb51ca9ffa91182b779791797bf7327
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_174717/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/fawac/20260312_174717/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/tbn5gnrf
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_450000.png ADDED

Git LFS Details

  • SHA256: 6fa4013229042d1aff762f36f27d10afcb57c91d524dfcc8638881226b68f939
  • Pointer size: 131 Bytes
  • Size of remote file: 223 kB
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_500000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_550000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_600000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_650000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_700000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_750000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_800000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_850000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_174717/visited_states_900000.png ADDED