Tiredsheep commited on
Commit
4c04aa5
·
verified ·
1 Parent(s): 1980c9f

Upload folder using huggingface_hub

Browse files
Files changed (29) hide show
  1. .gitattributes +10 -0
  2. O2O-w-diff-ckpts/cgql/20260318_085240/env.csv +0 -0
  3. O2O-w-diff-ckpts/cgql/20260318_085240/env_sv.csv +0 -0
  4. O2O-w-diff-ckpts/cgql/20260318_085240/eval.csv +11 -0
  5. O2O-w-diff-ckpts/cgql/20260318_085240/eval_sv.csv +11 -0
  6. O2O-w-diff-ckpts/cgql/20260318_085240/online_agent.csv +101 -0
  7. O2O-w-diff-ckpts/cgql/20260318_085240/online_agent_sv.csv +101 -0
  8. O2O-w-diff-ckpts/cgql/20260318_085240/params_1050000.pkl +3 -0
  9. O2O-w-diff-ckpts/cgql/20260318_085240/params_1100000.pkl +3 -0
  10. O2O-w-diff-ckpts/cgql/20260318_085240/params_1150000.pkl +3 -0
  11. O2O-w-diff-ckpts/cgql/20260318_085240/params_1200000.pkl +3 -0
  12. O2O-w-diff-ckpts/cgql/20260318_085240/params_1250000.pkl +3 -0
  13. O2O-w-diff-ckpts/cgql/20260318_085240/params_1300000.pkl +3 -0
  14. O2O-w-diff-ckpts/cgql/20260318_085240/params_1350000.pkl +3 -0
  15. O2O-w-diff-ckpts/cgql/20260318_085240/params_1400000.pkl +3 -0
  16. O2O-w-diff-ckpts/cgql/20260318_085240/params_1450000.pkl +3 -0
  17. O2O-w-diff-ckpts/cgql/20260318_085240/params_1500000.pkl +3 -0
  18. O2O-w-diff-ckpts/cgql/20260318_085240/progress.tk +1 -0
  19. O2O-w-diff-ckpts/cgql/20260318_085240/token.tk +1 -0
  20. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1050000.png +3 -0
  21. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1100000.png +3 -0
  22. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1150000.png +3 -0
  23. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1200000.png +3 -0
  24. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1250000.png +3 -0
  25. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1300000.png +3 -0
  26. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1350000.png +3 -0
  27. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1400000.png +3 -0
  28. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1450000.png +3 -0
  29. O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1500000.png +3 -0
.gitattributes CHANGED
@@ -583,3 +583,13 @@ O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_800000.png filter=lfs diff=
583
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_850000.png filter=lfs diff=lfs merge=lfs -text
584
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_900000.png filter=lfs diff=lfs merge=lfs -text
585
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_950000.png filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
583
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_850000.png filter=lfs diff=lfs merge=lfs -text
584
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_900000.png filter=lfs diff=lfs merge=lfs -text
585
  O2O-w-diff-ckpts/dsrl/20260317_155656/visited_states_950000.png filter=lfs diff=lfs merge=lfs -text
586
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1050000.png filter=lfs diff=lfs merge=lfs -text
587
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1100000.png filter=lfs diff=lfs merge=lfs -text
588
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1150000.png filter=lfs diff=lfs merge=lfs -text
589
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1200000.png filter=lfs diff=lfs merge=lfs -text
590
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1250000.png filter=lfs diff=lfs merge=lfs -text
591
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1300000.png filter=lfs diff=lfs merge=lfs -text
592
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1350000.png filter=lfs diff=lfs merge=lfs -text
593
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1400000.png filter=lfs diff=lfs merge=lfs -text
594
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1450000.png filter=lfs diff=lfs merge=lfs -text
595
+ O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1500000.png filter=lfs diff=lfs merge=lfs -text
O2O-w-diff-ckpts/cgql/20260318_085240/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cgql/20260318_085240/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cgql/20260318_085240/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,38.38247454883598,5.171139095097944,0.15976387477258874,5.183597331543548,0.10325478506434722,0.58,24057.52,-0.42,-938.7,939.28,3.5520128488540648,1050000
3
+ 0.0,0.0,40.692213272261434,5.508577032713585,0.10992244723542377,5.515768979324023,0.06611384558057717,0.88,70288.04,-0.12,-841.4,842.28,3.1640005016326906,1100000
4
+ 0.0,0.0,43.52899975367977,5.906993033056206,0.11028972750728233,5.916032293204412,0.04388338765405391,0.98,112902.9,-0.02,-812.3,813.28,3.0516812658309935,1150000
5
+ 0.0,0.0,41.8931935547074,5.690273559902828,0.12273554749234178,5.6960513089568305,0.01883011223328981,0.92,155421.7,-0.08,-813.64,814.56,3.120081076622009,1200000
6
+ 0.0,0.0,39.17500528493351,5.333382847406074,0.11169004245523502,5.34408239471848,0.13699482601927898,0.86,197717.12,-0.14,-803.14,804.0,3.0215666484832764,1250000
7
+ 0.0,0.0,37.649126868850665,5.122581318151405,0.0825834211175545,5.127111602570162,0.03100550254260232,0.78,240035.1,-0.22,-824.78,825.56,3.1110984086990356,1300000
8
+ 0.0,0.0,40.88798959123815,5.567981928949924,0.16741566055344126,5.5773569662621645,0.06770433437156881,0.9,281789.3,-0.1,-779.76,780.66,2.9400390863418577,1350000
9
+ 0.0,0.0,41.88675059002228,5.702727119481999,0.11123914821194361,5.712009182318023,0.07020653220134179,0.94,321935.9,-0.06,-759.4,760.34,2.8330482816696168,1400000
10
+ 0.0,0.0,41.30021325164909,5.615055521347297,0.16953987357656636,5.62617954285235,0.10423677404961162,0.92,361179.76,-0.08,-762.32,763.24,2.8554001331329344,1450000
11
+ 0.0,0.0,43.14065925765695,5.864655880647949,0.18728403052974565,5.881732594382712,0.14329193547862812,0.98,400919.8,-0.02,-753.86,754.84,2.8403921270370485,1500000
O2O-w-diff-ckpts/cgql/20260318_085240/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,38.38247454883598,5.171139095097944,0.15976387477258874,5.183597331543548,0.10325478506434722,0.58,24057.52,-0.42,-938.7,939.28,3.5520128488540648,1050000
3
+ 0.0,0.0,40.692213272261434,5.508577032713585,0.10992244723542377,5.515768979324023,0.06611384558057717,0.88,70288.04,-0.12,-841.4,842.28,3.1640005016326906,1100000
4
+ 0.0,0.0,43.52899975367977,5.906993033056206,0.11028972750728233,5.916032293204412,0.04388338765405391,0.98,112902.9,-0.02,-812.3,813.28,3.0516812658309935,1150000
5
+ 0.0,0.0,41.8931935547074,5.690273559902828,0.12273554749234178,5.6960513089568305,0.01883011223328981,0.92,155421.7,-0.08,-813.64,814.56,3.120081076622009,1200000
6
+ 0.0,0.0,39.17500528493351,5.333382847406074,0.11169004245523502,5.34408239471848,0.13699482601927898,0.86,197717.12,-0.14,-803.14,804.0,3.0215666484832764,1250000
7
+ 0.0,0.0,37.649126868850665,5.122581318151405,0.0825834211175545,5.127111602570162,0.03100550254260232,0.78,240035.1,-0.22,-824.78,825.56,3.1110984086990356,1300000
8
+ 0.0,0.0,40.88798959123815,5.567981928949924,0.16741566055344126,5.5773569662621645,0.06770433437156881,0.9,281789.3,-0.1,-779.76,780.66,2.9400390863418577,1350000
9
+ 0.0,0.0,41.88675059002228,5.702727119481999,0.11123914821194361,5.712009182318023,0.07020653220134179,0.94,321935.9,-0.06,-759.4,760.34,2.8330482816696168,1400000
10
+ 0.0,0.0,41.30021325164909,5.615055521347297,0.16953987357656636,5.62617954285235,0.10423677404961162,0.92,361179.76,-0.08,-762.32,763.24,2.8554001331329344,1450000
11
+ 0.0,0.0,43.14065925765695,5.864655880647949,0.18728403052974565,5.881732594382712,0.14329193547862812,0.98,400919.8,-0.02,-753.86,754.84,2.8403921270370485,1500000
O2O-w-diff-ckpts/cgql/20260318_085240/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 0.2757188,0.24932995,-6.8187165,-165.42313,-207.07358,1.8819021,-1.3926582,20.145782,1005000
3
+ 0.2760018,0.21493101,-9.2512245,-162.49748,-207.23335,0.9292645,-0.70847756,14.132397,1010000
4
+ 0.33784002,0.19599095,-7.9655237,-168.53392,-210.53554,1.5933404,-1.3339407,20.430855,1015000
5
+ 0.28946513,0.1973801,-16.520441,-167.69127,-210.79283,2.2282674,-1.0988592,18.936653,1020000
6
+ 0.32244524,0.29068375,0.6815015,-164.14494,-208.78056,1.2239302,-2.056798,20.88412,1025000
7
+ 0.2985832,0.23440278,0.22156614,-165.44121,-207.56883,1.8933871,-1.2535281,23.142057,1030000
8
+ 0.34479713,0.26367125,0.7046306,-165.69205,-210.05121,0.9502883,-0.8874404,12.817882,1035000
9
+ 0.2659489,0.21686211,-5.302234,-166.06555,-208.91759,0.7011474,-0.5798365,11.238279,1040000
10
+ 0.29671824,0.18447462,-7.164996,-168.96754,-210.15215,0.98086727,-1.1010232,13.318889,1045000
11
+ 0.3264516,0.19373505,-0.18919751,-167.38072,-209.75993,0.9883155,-1.0529616,13.934447,1050000
12
+ 0.30630913,0.29738888,0.5781903,-165.90025,-208.47466,3.6445055,-2.0637152,32.69731,1055000
13
+ 0.3179896,0.41146556,-35.50542,-169.26372,-210.55418,5.4979143,-3.1708727,51.025135,1060000
14
+ 0.31734282,0.19671059,-14.70156,-171.97401,-208.34811,1.1138767,-0.98405445,11.745972,1065000
15
+ 0.33754677,0.31145015,-15.22413,-170.71786,-207.20561,1.2412467,-0.66516656,16.314077,1070000
16
+ 0.34544784,0.21571355,-0.625108,-173.57611,-208.8821,1.4509645,-1.4436914,14.250902,1075000
17
+ 0.3122379,0.25971636,-10.2958765,-171.55644,-208.79274,2.2034543,-1.3349702,20.375252,1080000
18
+ 0.3107438,0.23192611,-2.3382616,-172.31285,-209.26189,1.238916,-1.4038097,18.350445,1085000
19
+ 0.31990325,0.24880557,-21.489634,-170.76738,-205.59915,1.9215748,-1.1911794,24.59683,1090000
20
+ 0.32549107,0.33916765,1.0627165,-167.86266,-210.63419,2.0496094,-5.991201,28.726086,1095000
21
+ 0.34198725,0.28441092,-4.451391,-169.08882,-208.01923,1.5877584,-4.6173515,27.94935,1100000
22
+ 0.34661198,0.231984,-18.072277,-174.30815,-209.09564,1.5940168,-0.7613491,15.167725,1105000
23
+ 0.28375602,0.38956836,-9.08734,-168.40854,-206.44206,6.6517606,-3.1021032,46.97253,1110000
24
+ 0.27820566,0.22815077,-12.068341,-177.59526,-211.2477,2.1324356,-4.032596,22.616138,1115000
25
+ 0.3000974,0.25438926,-16.421686,-175.10979,-208.38048,2.3837645,-2.3341627,21.153574,1120000
26
+ 0.3384323,0.20761871,-29.929466,-173.89174,-208.95714,1.3426074,-2.9419026,25.11412,1125000
27
+ 0.32486337,0.27664217,-2.9415262,-173.67775,-210.5966,5.1061707,-2.0217373,42.054184,1130000
28
+ 0.32326627,0.31508225,-21.449486,-174.26347,-208.0543,1.1577034,-2.794912,30.116,1135000
29
+ 0.28463912,0.22224343,-2.6781504,-177.30148,-208.75496,1.9896535,-2.0948584,20.863121,1140000
30
+ 0.32209194,0.3628674,-0.9853225,-172.27908,-209.69112,1.289222,-1.011419,19.656982,1145000
31
+ 0.29820883,0.2910201,-5.9008236,-173.62675,-205.8894,1.0923891,-3.0454667,21.47339,1150000
32
+ 0.34587193,0.25058126,-22.564342,-176.77672,-211.67288,1.8917799,-1.2384688,22.005611,1155000
33
+ 0.3306436,0.28733265,-0.008759052,-171.40054,-209.95845,2.2319405,-1.2105981,19.242952,1160000
34
+ 0.3038727,0.27019557,-0.44718117,-172.83907,-210.72928,1.9149158,-3.1697342,29.167042,1165000
35
+ 0.3184435,0.42158747,-5.088914,-175.12268,-205.81375,2.250281,-5.807274,51.67089,1170000
36
+ 0.27705854,0.3140284,-3.9108706,-173.54205,-205.98456,1.5262377,-6.0506916,29.757318,1175000
37
+ 0.33508718,0.46609163,-10.996679,-168.70897,-210.62883,7.058089,-5.2374387,47.21183,1180000
38
+ 0.32788384,0.31979927,-4.354794,-175.12955,-211.72884,4.447243,-3.224459,37.386776,1185000
39
+ 0.2901316,0.37663147,-23.872646,-172.01094,-208.28085,1.9917805,-2.9520433,24.353111,1190000
40
+ 0.3266046,0.2421191,0.59748113,-173.62062,-208.35193,2.2680314,-2.0244613,21.934841,1195000
41
+ 0.30432594,0.43180153,-0.3792128,-173.94724,-210.77887,9.63074,-4.379065,41.307846,1200000
42
+ 0.30495727,0.23759785,0.2949415,-174.15775,-210.47527,2.611272,-1.1877639,25.21822,1205000
43
+ 0.31813878,0.22998965,-22.229528,-174.9042,-211.25743,1.2839835,-2.3713105,20.132933,1210000
44
+ 0.35736448,0.25256297,0.5424722,-177.13216,-207.68945,3.4127574,-1.824238,24.766125,1215000
45
+ 0.33365768,0.30726433,1.2008957,-176.03351,-208.53789,1.8199736,-0.8126318,18.278666,1220000
46
+ 0.34726083,0.27114415,0.38107455,-173.43645,-208.1267,1.827003,-2.998451,28.532932,1225000
47
+ 0.31818265,0.19714473,-24.474335,-174.88457,-209.28133,1.9051831,-0.9254932,17.51853,1230000
48
+ 0.3339692,0.17657356,1.157182,-172.68256,-211.33621,2.6633165,-1.1234536,20.79651,1235000
49
+ 0.35620224,0.30714548,-7.6532264,-175.15855,-208.0124,2.5599728,-3.558061,33.995075,1240000
50
+ 0.29963267,0.25066218,-9.517758,-176.86563,-206.59764,9.271787,-3.2502992,44.902725,1245000
51
+ 0.34050953,0.19367762,-8.024555,-175.88008,-208.14624,1.549048,-2.5850475,17.090252,1250000
52
+ 0.31681243,0.24897937,-7.9410048,-172.66429,-212.77795,1.754152,-2.996387,20.16333,1255000
53
+ 0.33587503,0.18466607,-5.986287,-175.27129,-210.45618,0.7894888,-1.82602,15.022686,1260000
54
+ 0.32183242,0.20087826,-44.139164,-175.12698,-206.98456,1.3295665,-0.99035126,18.217644,1265000
55
+ 0.28769225,0.22170062,1.3067496,-171.3184,-209.93423,2.326919,-2.6747673,23.980394,1270000
56
+ 0.3579524,0.24253237,-24.944084,-175.0437,-208.92442,3.6421816,-1.6412889,32.596085,1275000
57
+ 0.33497506,0.2382245,-27.950277,-177.54558,-209.01514,0.5650568,-1.2856289,13.877261,1280000
58
+ 0.31808454,0.23024622,0.3122547,-174.10121,-211.13219,1.043861,-2.9725218,21.624636,1285000
59
+ 0.3340639,0.23772728,-17.21012,-176.2216,-209.29663,1.0030725,-1.7579044,17.300688,1290000
60
+ 0.345569,0.25850397,0.37161842,-174.59741,-207.63466,2.5169365,-1.4414942,17.773191,1295000
61
+ 0.31242302,0.3101208,0.5859927,-167.12527,-208.36514,4.1169233,-8.986571,51.979317,1300000
62
+ 0.32691294,0.16847879,-12.164048,-178.18335,-209.2295,1.4999298,-4.1554656,25.127398,1305000
63
+ 0.29528567,0.25289875,-29.71897,-177.77576,-210.28311,1.3453357,-1.8376803,17.807457,1310000
64
+ 0.3134706,0.28663462,-10.771253,-174.87244,-209.55722,1.4147252,-4.2212996,27.019472,1315000
65
+ 0.2885564,0.27548638,-4.361427,-173.16838,-211.28406,1.6036518,-3.8186724,33.213177,1320000
66
+ 0.2993699,0.2619768,-25.045916,-169.52098,-207.69113,2.1804695,-3.4657607,28.741035,1325000
67
+ 0.35167164,0.24203096,-0.2812243,-172.41405,-209.29605,2.015914,-0.80745584,16.960442,1330000
68
+ 0.35601145,0.19610444,-0.38415796,-173.0946,-206.76767,3.058426,-3.6487336,20.69127,1335000
69
+ 0.35490596,0.26272544,-0.6527226,-174.3726,-210.17825,1.0483685,-3.7110727,20.810596,1340000
70
+ 0.31075746,0.18086961,-9.941097,-171.90695,-209.41084,2.0055559,-3.1242118,24.956886,1345000
71
+ 0.29875192,0.19375512,0.7290647,-177.95598,-209.2717,2.685913,-1.1279624,20.30267,1350000
72
+ 0.34002843,0.17782305,-2.2366226,-173.96179,-214.04611,1.2476163,-3.0839224,21.653326,1355000
73
+ 0.32268864,0.2050664,-13.978692,-175.36278,-209.60675,1.687528,-0.9733945,21.121975,1360000
74
+ 0.3108366,0.18846826,1.4044397,-170.08142,-210.74133,6.8925543,-1.7002981,22.264019,1365000
75
+ 0.31075856,0.20978947,-0.012289256,-169.7186,-208.87276,3.4453468,-1.229059,20.179756,1370000
76
+ 0.34957048,0.19346754,0.034294426,-173.03296,-210.07033,1.840577,-1.3997387,16.943684,1375000
77
+ 0.29060757,0.19010943,-22.992502,-175.87144,-209.58601,0.5979893,-0.8401629,11.492025,1380000
78
+ 0.3213159,0.25996086,-4.518206,-174.37047,-210.32393,5.728197,-4.1025944,30.293808,1385000
79
+ 0.28306842,0.18548606,0.06517631,-172.17032,-208.042,1.0475593,-1.9797263,12.891127,1390000
80
+ 0.28841954,0.20012324,-11.147811,-176.2608,-208.56169,2.3070347,-3.6770234,32.04782,1395000
81
+ 0.3152499,0.2769482,-5.436821,-174.28181,-209.73172,0.9768799,-3.2481093,20.810658,1400000
82
+ 0.2996897,0.25619206,1.4182858,-171.79457,-209.9404,1.6570246,-4.1730714,27.477118,1405000
83
+ 0.2902141,0.26286003,1.9721766,-170.18579,-213.0455,3.0937645,-2.5694015,23.11458,1410000
84
+ 0.32340336,0.16917105,1.0639307,-173.01677,-208.77853,6.2469873,-1.6785847,28.895126,1415000
85
+ 0.27745906,0.22282758,-0.003654331,-174.66797,-208.82022,1.8537624,-0.9870671,14.822664,1420000
86
+ 0.31876862,0.3683122,-5.9014473,-170.95502,-209.09962,3.2132168,-8.824225,64.01779,1425000
87
+ 0.27260897,0.2652837,0.4653568,-174.60051,-210.36707,3.9112225,-1.6007953,23.142263,1430000
88
+ 0.32218593,0.14168833,-19.830225,-175.87816,-209.71062,0.7838106,-2.4201431,13.649482,1435000
89
+ 0.31622356,0.27788752,0.12834772,-169.72728,-208.31636,1.975498,-8.182283,38.574516,1440000
90
+ 0.29374158,0.21572988,0.3443664,-169.3239,-211.08206,3.781481,-1.7505573,23.746313,1445000
91
+ 0.30797577,0.34440026,-3.3944955,-174.0339,-210.6821,4.3264995,-11.672228,70.791916,1450000
92
+ 0.29958183,0.22189818,-2.2084093,-173.27614,-210.43747,2.339195,-5.5099936,31.835087,1455000
93
+ 0.32394266,0.24494305,-26.646233,-174.7663,-209.61377,1.1589122,-2.891561,20.891005,1460000
94
+ 0.31300658,0.18685304,1.5753105,-175.53307,-210.30103,2.4256487,-1.8366312,15.810375,1465000
95
+ 0.29461515,0.21054588,-6.401142,-171.90637,-213.85115,4.699739,-2.5199964,30.541653,1470000
96
+ 0.31592125,0.24333493,-0.2696118,-170.56255,-210.01682,8.273656,-6.3631325,40.868706,1475000
97
+ 0.30293,0.18857543,0.39104083,-169.99632,-207.96129,1.5812516,-1.1756179,16.683361,1480000
98
+ 0.3058651,0.36042482,-4.4109974,-171.79497,-208.51372,7.020408,-2.0338693,36.8777,1485000
99
+ 0.32242835,0.16679369,-22.974165,-176.52124,-208.96,1.4182116,-0.73235065,14.795292,1490000
100
+ 0.2878495,0.331925,-7.612011,-172.21532,-209.8881,1.4417126,-2.6542237,17.377619,1495000
101
+ 0.33937836,0.23022942,-12.739137,-172.23099,-208.64297,1.2110947,-1.3549339,16.363499,1500000
O2O-w-diff-ckpts/cgql/20260318_085240/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/flow_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 0.2757188,0.24932995,-6.8187165,-165.42313,-207.07358,1.8819021,-1.3926582,20.145782,1005000
3
+ 0.2760018,0.21493101,-9.2512245,-162.49748,-207.23335,0.9292645,-0.70847756,14.132397,1010000
4
+ 0.33784002,0.19599095,-7.9655237,-168.53392,-210.53554,1.5933404,-1.3339407,20.430855,1015000
5
+ 0.28946513,0.1973801,-16.520441,-167.69127,-210.79283,2.2282674,-1.0988592,18.936653,1020000
6
+ 0.32244524,0.29068375,0.6815015,-164.14494,-208.78056,1.2239302,-2.056798,20.88412,1025000
7
+ 0.2985832,0.23440278,0.22156614,-165.44121,-207.56883,1.8933871,-1.2535281,23.142057,1030000
8
+ 0.34479713,0.26367125,0.7046306,-165.69205,-210.05121,0.9502883,-0.8874404,12.817882,1035000
9
+ 0.2659489,0.21686211,-5.302234,-166.06555,-208.91759,0.7011474,-0.5798365,11.238279,1040000
10
+ 0.29671824,0.18447462,-7.164996,-168.96754,-210.15215,0.98086727,-1.1010232,13.318889,1045000
11
+ 0.3264516,0.19373505,-0.18919751,-167.38072,-209.75993,0.9883155,-1.0529616,13.934447,1050000
12
+ 0.30630913,0.29738888,0.5781903,-165.90025,-208.47466,3.6445055,-2.0637152,32.69731,1055000
13
+ 0.3179896,0.41146556,-35.50542,-169.26372,-210.55418,5.4979143,-3.1708727,51.025135,1060000
14
+ 0.31734282,0.19671059,-14.70156,-171.97401,-208.34811,1.1138767,-0.98405445,11.745972,1065000
15
+ 0.33754677,0.31145015,-15.22413,-170.71786,-207.20561,1.2412467,-0.66516656,16.314077,1070000
16
+ 0.34544784,0.21571355,-0.625108,-173.57611,-208.8821,1.4509645,-1.4436914,14.250902,1075000
17
+ 0.3122379,0.25971636,-10.2958765,-171.55644,-208.79274,2.2034543,-1.3349702,20.375252,1080000
18
+ 0.3107438,0.23192611,-2.3382616,-172.31285,-209.26189,1.238916,-1.4038097,18.350445,1085000
19
+ 0.31990325,0.24880557,-21.489634,-170.76738,-205.59915,1.9215748,-1.1911794,24.59683,1090000
20
+ 0.32549107,0.33916765,1.0627165,-167.86266,-210.63419,2.0496094,-5.991201,28.726086,1095000
21
+ 0.34198725,0.28441092,-4.451391,-169.08882,-208.01923,1.5877584,-4.6173515,27.94935,1100000
22
+ 0.34661198,0.231984,-18.072277,-174.30815,-209.09564,1.5940168,-0.7613491,15.167725,1105000
23
+ 0.28375602,0.38956836,-9.08734,-168.40854,-206.44206,6.6517606,-3.1021032,46.97253,1110000
24
+ 0.27820566,0.22815077,-12.068341,-177.59526,-211.2477,2.1324356,-4.032596,22.616138,1115000
25
+ 0.3000974,0.25438926,-16.421686,-175.10979,-208.38048,2.3837645,-2.3341627,21.153574,1120000
26
+ 0.3384323,0.20761871,-29.929466,-173.89174,-208.95714,1.3426074,-2.9419026,25.11412,1125000
27
+ 0.32486337,0.27664217,-2.9415262,-173.67775,-210.5966,5.1061707,-2.0217373,42.054184,1130000
28
+ 0.32326627,0.31508225,-21.449486,-174.26347,-208.0543,1.1577034,-2.794912,30.116,1135000
29
+ 0.28463912,0.22224343,-2.6781504,-177.30148,-208.75496,1.9896535,-2.0948584,20.863121,1140000
30
+ 0.32209194,0.3628674,-0.9853225,-172.27908,-209.69112,1.289222,-1.011419,19.656982,1145000
31
+ 0.29820883,0.2910201,-5.9008236,-173.62675,-205.8894,1.0923891,-3.0454667,21.47339,1150000
32
+ 0.34587193,0.25058126,-22.564342,-176.77672,-211.67288,1.8917799,-1.2384688,22.005611,1155000
33
+ 0.3306436,0.28733265,-0.008759052,-171.40054,-209.95845,2.2319405,-1.2105981,19.242952,1160000
34
+ 0.3038727,0.27019557,-0.44718117,-172.83907,-210.72928,1.9149158,-3.1697342,29.167042,1165000
35
+ 0.3184435,0.42158747,-5.088914,-175.12268,-205.81375,2.250281,-5.807274,51.67089,1170000
36
+ 0.27705854,0.3140284,-3.9108706,-173.54205,-205.98456,1.5262377,-6.0506916,29.757318,1175000
37
+ 0.33508718,0.46609163,-10.996679,-168.70897,-210.62883,7.058089,-5.2374387,47.21183,1180000
38
+ 0.32788384,0.31979927,-4.354794,-175.12955,-211.72884,4.447243,-3.224459,37.386776,1185000
39
+ 0.2901316,0.37663147,-23.872646,-172.01094,-208.28085,1.9917805,-2.9520433,24.353111,1190000
40
+ 0.3266046,0.2421191,0.59748113,-173.62062,-208.35193,2.2680314,-2.0244613,21.934841,1195000
41
+ 0.30432594,0.43180153,-0.3792128,-173.94724,-210.77887,9.63074,-4.379065,41.307846,1200000
42
+ 0.30495727,0.23759785,0.2949415,-174.15775,-210.47527,2.611272,-1.1877639,25.21822,1205000
43
+ 0.31813878,0.22998965,-22.229528,-174.9042,-211.25743,1.2839835,-2.3713105,20.132933,1210000
44
+ 0.35736448,0.25256297,0.5424722,-177.13216,-207.68945,3.4127574,-1.824238,24.766125,1215000
45
+ 0.33365768,0.30726433,1.2008957,-176.03351,-208.53789,1.8199736,-0.8126318,18.278666,1220000
46
+ 0.34726083,0.27114415,0.38107455,-173.43645,-208.1267,1.827003,-2.998451,28.532932,1225000
47
+ 0.31818265,0.19714473,-24.474335,-174.88457,-209.28133,1.9051831,-0.9254932,17.51853,1230000
48
+ 0.3339692,0.17657356,1.157182,-172.68256,-211.33621,2.6633165,-1.1234536,20.79651,1235000
49
+ 0.35620224,0.30714548,-7.6532264,-175.15855,-208.0124,2.5599728,-3.558061,33.995075,1240000
50
+ 0.29963267,0.25066218,-9.517758,-176.86563,-206.59764,9.271787,-3.2502992,44.902725,1245000
51
+ 0.34050953,0.19367762,-8.024555,-175.88008,-208.14624,1.549048,-2.5850475,17.090252,1250000
52
+ 0.31681243,0.24897937,-7.9410048,-172.66429,-212.77795,1.754152,-2.996387,20.16333,1255000
53
+ 0.33587503,0.18466607,-5.986287,-175.27129,-210.45618,0.7894888,-1.82602,15.022686,1260000
54
+ 0.32183242,0.20087826,-44.139164,-175.12698,-206.98456,1.3295665,-0.99035126,18.217644,1265000
55
+ 0.28769225,0.22170062,1.3067496,-171.3184,-209.93423,2.326919,-2.6747673,23.980394,1270000
56
+ 0.3579524,0.24253237,-24.944084,-175.0437,-208.92442,3.6421816,-1.6412889,32.596085,1275000
57
+ 0.33497506,0.2382245,-27.950277,-177.54558,-209.01514,0.5650568,-1.2856289,13.877261,1280000
58
+ 0.31808454,0.23024622,0.3122547,-174.10121,-211.13219,1.043861,-2.9725218,21.624636,1285000
59
+ 0.3340639,0.23772728,-17.21012,-176.2216,-209.29663,1.0030725,-1.7579044,17.300688,1290000
60
+ 0.345569,0.25850397,0.37161842,-174.59741,-207.63466,2.5169365,-1.4414942,17.773191,1295000
61
+ 0.31242302,0.3101208,0.5859927,-167.12527,-208.36514,4.1169233,-8.986571,51.979317,1300000
62
+ 0.32691294,0.16847879,-12.164048,-178.18335,-209.2295,1.4999298,-4.1554656,25.127398,1305000
63
+ 0.29528567,0.25289875,-29.71897,-177.77576,-210.28311,1.3453357,-1.8376803,17.807457,1310000
64
+ 0.3134706,0.28663462,-10.771253,-174.87244,-209.55722,1.4147252,-4.2212996,27.019472,1315000
65
+ 0.2885564,0.27548638,-4.361427,-173.16838,-211.28406,1.6036518,-3.8186724,33.213177,1320000
66
+ 0.2993699,0.2619768,-25.045916,-169.52098,-207.69113,2.1804695,-3.4657607,28.741035,1325000
67
+ 0.35167164,0.24203096,-0.2812243,-172.41405,-209.29605,2.015914,-0.80745584,16.960442,1330000
68
+ 0.35601145,0.19610444,-0.38415796,-173.0946,-206.76767,3.058426,-3.6487336,20.69127,1335000
69
+ 0.35490596,0.26272544,-0.6527226,-174.3726,-210.17825,1.0483685,-3.7110727,20.810596,1340000
70
+ 0.31075746,0.18086961,-9.941097,-171.90695,-209.41084,2.0055559,-3.1242118,24.956886,1345000
71
+ 0.29875192,0.19375512,0.7290647,-177.95598,-209.2717,2.685913,-1.1279624,20.30267,1350000
72
+ 0.34002843,0.17782305,-2.2366226,-173.96179,-214.04611,1.2476163,-3.0839224,21.653326,1355000
73
+ 0.32268864,0.2050664,-13.978692,-175.36278,-209.60675,1.687528,-0.9733945,21.121975,1360000
74
+ 0.3108366,0.18846826,1.4044397,-170.08142,-210.74133,6.8925543,-1.7002981,22.264019,1365000
75
+ 0.31075856,0.20978947,-0.012289256,-169.7186,-208.87276,3.4453468,-1.229059,20.179756,1370000
76
+ 0.34957048,0.19346754,0.034294426,-173.03296,-210.07033,1.840577,-1.3997387,16.943684,1375000
77
+ 0.29060757,0.19010943,-22.992502,-175.87144,-209.58601,0.5979893,-0.8401629,11.492025,1380000
78
+ 0.3213159,0.25996086,-4.518206,-174.37047,-210.32393,5.728197,-4.1025944,30.293808,1385000
79
+ 0.28306842,0.18548606,0.06517631,-172.17032,-208.042,1.0475593,-1.9797263,12.891127,1390000
80
+ 0.28841954,0.20012324,-11.147811,-176.2608,-208.56169,2.3070347,-3.6770234,32.04782,1395000
81
+ 0.3152499,0.2769482,-5.436821,-174.28181,-209.73172,0.9768799,-3.2481093,20.810658,1400000
82
+ 0.2996897,0.25619206,1.4182858,-171.79457,-209.9404,1.6570246,-4.1730714,27.477118,1405000
83
+ 0.2902141,0.26286003,1.9721766,-170.18579,-213.0455,3.0937645,-2.5694015,23.11458,1410000
84
+ 0.32340336,0.16917105,1.0639307,-173.01677,-208.77853,6.2469873,-1.6785847,28.895126,1415000
85
+ 0.27745906,0.22282758,-0.003654331,-174.66797,-208.82022,1.8537624,-0.9870671,14.822664,1420000
86
+ 0.31876862,0.3683122,-5.9014473,-170.95502,-209.09962,3.2132168,-8.824225,64.01779,1425000
87
+ 0.27260897,0.2652837,0.4653568,-174.60051,-210.36707,3.9112225,-1.6007953,23.142263,1430000
88
+ 0.32218593,0.14168833,-19.830225,-175.87816,-209.71062,0.7838106,-2.4201431,13.649482,1435000
89
+ 0.31622356,0.27788752,0.12834772,-169.72728,-208.31636,1.975498,-8.182283,38.574516,1440000
90
+ 0.29374158,0.21572988,0.3443664,-169.3239,-211.08206,3.781481,-1.7505573,23.746313,1445000
91
+ 0.30797577,0.34440026,-3.3944955,-174.0339,-210.6821,4.3264995,-11.672228,70.791916,1450000
92
+ 0.29958183,0.22189818,-2.2084093,-173.27614,-210.43747,2.339195,-5.5099936,31.835087,1455000
93
+ 0.32394266,0.24494305,-26.646233,-174.7663,-209.61377,1.1589122,-2.891561,20.891005,1460000
94
+ 0.31300658,0.18685304,1.5753105,-175.53307,-210.30103,2.4256487,-1.8366312,15.810375,1465000
95
+ 0.29461515,0.21054588,-6.401142,-171.90637,-213.85115,4.699739,-2.5199964,30.541653,1470000
96
+ 0.31592125,0.24333493,-0.2696118,-170.56255,-210.01682,8.273656,-6.3631325,40.868706,1475000
97
+ 0.30293,0.18857543,0.39104083,-169.99632,-207.96129,1.5812516,-1.1756179,16.683361,1480000
98
+ 0.3058651,0.36042482,-4.4109974,-171.79497,-208.51372,7.020408,-2.0338693,36.8777,1485000
99
+ 0.32242835,0.16679369,-22.974165,-176.52124,-208.96,1.4182116,-0.73235065,14.795292,1490000
100
+ 0.2878495,0.331925,-7.612011,-172.21532,-209.8881,1.4417126,-2.6542237,17.377619,1495000
101
+ 0.33937836,0.23022942,-12.739137,-172.23099,-208.64297,1.2110947,-1.3549339,16.363499,1500000
O2O-w-diff-ckpts/cgql/20260318_085240/params_1050000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7ce6771a62c93dd3c4d48771e7d519ab8873f303a9dfa6012d28ce8b3711606
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1100000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:353a69a5f3b0c2a46fa4d4ddfcd0a20d71f19ce1cade3cbdf289a9b6f05d9c2d
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1150000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92341dad52a03a63ced5e5277afca17dfa35618d43998cf9d807234d32fb37a1
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1200000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b066783ba10fea377e48704f53d4791537bc75b4a6cc63e9f85058714691885a
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aee205e568ec44e66e06f015113a11479d1835e63d10b8b0a3b01dc1c48c0925
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f89bc3028c3a9e64b1f37d82d0b50f0cd7be931e49a3535f4b9aed1d25b64f9
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c87d6be497a8f6ee58ea114eb8a19ec0960648ccdd489b6b99c7955b7e3bb33e
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab7ebe90ebaf3963691a609d6560edb1cb96fe979eb85d2822755239e28532bb
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e31293e85f571a08698929bfdabf71c92b7c844607e23e5800fb73b9d11f511f
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/params_1500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14ae5bae5199d2f51f43b6f88dfaee23b36e2c71ab456b4e2ddf2577a60ee7e0
3
+ size 214509745
O2O-w-diff-ckpts/cgql/20260318_085240/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cgql/20260318_085240/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/0yyn39om
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1050000.png ADDED

Git LFS Details

  • SHA256: 45d650dc1006ce61e1812f2fe25f3263771e9e4ab72bcc4848d558dd8d54f59b
  • Pointer size: 131 Bytes
  • Size of remote file: 224 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1100000.png ADDED

Git LFS Details

  • SHA256: 66c468f0b1aeaf339c786249687bcfa750ff2182a18285b0716f9f0329c2e046
  • Pointer size: 131 Bytes
  • Size of remote file: 158 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1150000.png ADDED

Git LFS Details

  • SHA256: 93ce941418737bf2f79210d7dfd6ef6969250390e156187f0482ba19ffa14e6c
  • Pointer size: 131 Bytes
  • Size of remote file: 178 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1200000.png ADDED

Git LFS Details

  • SHA256: db6433db292231bcf3be7c8af92cfeaf9ca8e453e59b4696ec6c9cffac21f5cb
  • Pointer size: 131 Bytes
  • Size of remote file: 169 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1250000.png ADDED

Git LFS Details

  • SHA256: 4446710c32b029369bd83544e97ff34ab376b093866dbf4c9548ab64e8d819b3
  • Pointer size: 131 Bytes
  • Size of remote file: 181 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1300000.png ADDED

Git LFS Details

  • SHA256: b346656a84cc6498bc07e39e5cf89bda711a01f414a544e2d0915944bc3caae1
  • Pointer size: 131 Bytes
  • Size of remote file: 152 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1350000.png ADDED

Git LFS Details

  • SHA256: b70095d700fb425e94e12494c4a84b1d0492a3d2318b61d2ebe50dcb6da5fd1f
  • Pointer size: 131 Bytes
  • Size of remote file: 144 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1400000.png ADDED

Git LFS Details

  • SHA256: 7df1c8e2a906d4c5a5e58f1cb82754f9986570c2c40a87232d6bd70997812a93
  • Pointer size: 131 Bytes
  • Size of remote file: 118 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1450000.png ADDED

Git LFS Details

  • SHA256: 4791abc880412c10dcff013c0db6e5b835d9f4c18d0dcb8d3de95c82a47618ae
  • Pointer size: 131 Bytes
  • Size of remote file: 133 kB
O2O-w-diff-ckpts/cgql/20260318_085240/visited_states_1500000.png ADDED

Git LFS Details

  • SHA256: 2bb51bc8e845a420f6dad99615a63f10c17b1b260a6696b3f4fff972e07647a6
  • Pointer size: 131 Bytes
  • Size of remote file: 117 kB