Tiredsheep commited on
Commit
7de2bc5
·
verified ·
1 Parent(s): 65fb79a

Upload folder using huggingface_hub

Browse files
Files changed (29) hide show
  1. .gitattributes +1 -0
  2. O2O-w-diff-ckpts/fawac/20260312_164229/env.csv +0 -0
  3. O2O-w-diff-ckpts/fawac/20260312_164229/env_sv.csv +0 -0
  4. O2O-w-diff-ckpts/fawac/20260312_164229/eval.csv +11 -0
  5. O2O-w-diff-ckpts/fawac/20260312_164229/eval_sv.csv +11 -0
  6. O2O-w-diff-ckpts/fawac/20260312_164229/online_agent.csv +101 -0
  7. O2O-w-diff-ckpts/fawac/20260312_164229/online_agent_sv.csv +101 -0
  8. O2O-w-diff-ckpts/fawac/20260312_164229/params_350000.pkl +3 -0
  9. O2O-w-diff-ckpts/fawac/20260312_164229/params_400000.pkl +3 -0
  10. O2O-w-diff-ckpts/fawac/20260312_164229/params_450000.pkl +3 -0
  11. O2O-w-diff-ckpts/fawac/20260312_164229/params_500000.pkl +3 -0
  12. O2O-w-diff-ckpts/fawac/20260312_164229/params_550000.pkl +3 -0
  13. O2O-w-diff-ckpts/fawac/20260312_164229/params_600000.pkl +3 -0
  14. O2O-w-diff-ckpts/fawac/20260312_164229/params_650000.pkl +3 -0
  15. O2O-w-diff-ckpts/fawac/20260312_164229/params_700000.pkl +3 -0
  16. O2O-w-diff-ckpts/fawac/20260312_164229/params_750000.pkl +3 -0
  17. O2O-w-diff-ckpts/fawac/20260312_164229/params_800000.pkl +3 -0
  18. O2O-w-diff-ckpts/fawac/20260312_164229/progress.tk +1 -0
  19. O2O-w-diff-ckpts/fawac/20260312_164229/token.tk +1 -0
  20. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_350000.png +3 -0
  21. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_400000.png +0 -0
  22. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_450000.png +0 -0
  23. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_500000.png +0 -0
  24. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_550000.png +0 -0
  25. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_600000.png +0 -0
  26. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_650000.png +0 -0
  27. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_700000.png +0 -0
  28. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_750000.png +0 -0
  29. O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_800000.png +0 -0
.gitattributes CHANGED
@@ -440,3 +440,4 @@ O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_450000.png filter=lfs diff=
440
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_500000.png filter=lfs diff=lfs merge=lfs -text
441
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
442
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_600000.png filter=lfs diff=lfs merge=lfs -text
 
 
440
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_500000.png filter=lfs diff=lfs merge=lfs -text
441
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_550000.png filter=lfs diff=lfs merge=lfs -text
442
  O2O-w-diff-ckpts/cgql/20260316_104602/visited_states_600000.png filter=lfs diff=lfs merge=lfs -text
443
+ O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_350000.png filter=lfs diff=lfs merge=lfs -text
O2O-w-diff-ckpts/fawac/20260312_164229/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_164229/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/fawac/20260312_164229/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.055821211831607445,0.08870086915838063,-0.014231007197341583,0.08807371104647203,0.02264522833425847,0.0,25500.0,-1.0,-1000.0,1000.0,1.3912513494491576,350000
3
+ 0.0,0.0,0.10373505003278603,0.090797241673365,-0.05703317043923572,0.08815061387918517,0.010009521893273778,0.0,77500.0,-1.0,-1000.0,1000.0,1.3732549333572388,400000
4
+ 0.0,0.0,0.32940458253365756,0.13840650439416177,-0.02167030574976476,0.14034547008761183,0.046853186033816385,0.0,129500.0,-1.0,-1000.0,1000.0,1.4079357719421386,450000
5
+ 0.0,0.0,0.20227240135190197,0.12877865368325836,-0.007074772516377989,0.12639127945269027,-0.05337273485285993,0.0,181500.0,-1.0,-1000.0,1000.0,1.3722185945510865,500000
6
+ 0.0,0.0,0.2936721933870499,0.12147093700929534,-0.014576549789946856,0.12187137432380238,0.009916160423846033,0.0,233500.0,-1.0,-1000.0,1000.0,1.3767066717147827,550000
7
+ 0.0,0.0,0.28541582759683387,0.13666264522958324,0.00016726384680637552,0.135809447079527,-0.05642993192389434,0.0,285500.0,-1.0,-1000.0,1000.0,1.377379388809204,600000
8
+ 0.0,0.0,0.18418295974727916,0.10999549769545577,0.057997270937228965,0.11633801233356943,-0.003735033942393393,0.0,337500.0,-1.0,-1000.0,1000.0,1.4149243450164795,650000
9
+ 0.0,0.0,0.39153704168794257,0.15111804620538033,0.027823890167315457,0.15224932911922323,-0.021974226781092863,0.0,389500.0,-1.0,-1000.0,1000.0,1.3776173973083496,700000
10
+ 0.0,0.0,0.2551992687465706,0.13887284764702643,0.049675761067279466,0.1431259979309876,0.05726103343095599,0.0,441500.0,-1.0,-1000.0,1000.0,1.3668574285507202,750000
11
+ 0.0,0.0,0.20644126308826116,0.13321079231444635,-0.020691965185202,0.13344559417582288,-0.012624841889568096,0.0,493500.0,-1.0,-1000.0,1000.0,1.3756241130828857,800000
O2O-w-diff-ckpts/fawac/20260312_164229/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,xy,prev_qpos,prev_qvel,qpos,qvel,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,0.055821211831607445,0.08870086915838063,-0.014231007197341583,0.08807371104647203,0.02264522833425847,0.0,25500.0,-1.0,-1000.0,1000.0,1.3912513494491576,350000
3
+ 0.0,0.0,0.10373505003278603,0.090797241673365,-0.05703317043923572,0.08815061387918517,0.010009521893273778,0.0,77500.0,-1.0,-1000.0,1000.0,1.3732549333572388,400000
4
+ 0.0,0.0,0.32940458253365756,0.13840650439416177,-0.02167030574976476,0.14034547008761183,0.046853186033816385,0.0,129500.0,-1.0,-1000.0,1000.0,1.4079357719421386,450000
5
+ 0.0,0.0,0.20227240135190197,0.12877865368325836,-0.007074772516377989,0.12639127945269027,-0.05337273485285993,0.0,181500.0,-1.0,-1000.0,1000.0,1.3722185945510865,500000
6
+ 0.0,0.0,0.2936721933870499,0.12147093700929534,-0.014576549789946856,0.12187137432380238,0.009916160423846033,0.0,233500.0,-1.0,-1000.0,1000.0,1.3767066717147827,550000
7
+ 0.0,0.0,0.28541582759683387,0.13666264522958324,0.00016726384680637552,0.135809447079527,-0.05642993192389434,0.0,285500.0,-1.0,-1000.0,1000.0,1.377379388809204,600000
8
+ 0.0,0.0,0.18418295974727916,0.10999549769545577,0.057997270937228965,0.11633801233356943,-0.003735033942393393,0.0,337500.0,-1.0,-1000.0,1000.0,1.4149243450164795,650000
9
+ 0.0,0.0,0.39153704168794257,0.15111804620538033,0.027823890167315457,0.15224932911922323,-0.021974226781092863,0.0,389500.0,-1.0,-1000.0,1000.0,1.3776173973083496,700000
10
+ 0.0,0.0,0.2551992687465706,0.13887284764702643,0.049675761067279466,0.1431259979309876,0.05726103343095599,0.0,441500.0,-1.0,-1000.0,1000.0,1.3668574285507202,750000
11
+ 0.0,0.0,0.20644126308826116,0.13321079231444635,-0.020691965185202,0.13344559417582288,-0.012624841889568096,0.0,493500.0,-1.0,-1000.0,1000.0,1.3756241130828857,800000
O2O-w-diff-ckpts/fawac/20260312_164229/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 3.0724192,28.853388,-64.10254,-291.25757,-4195.3145,37.190884,394.32852,-196.76825,3560.2659,305000
3
+ 1.9049425,13.861748,2.0077853,-270.90445,-4224.1,18.780363,92.70291,-108.78323,1500.6975,310000
4
+ 2.0489347,50.994625,-132.59724,-344.40915,-4327.265,40.221485,1402.6056,-1196.7886,9155.292,315000
5
+ 1.5704203,8.975355,-107.966934,-291.03134,-4357.113,12.451352,97.59747,-60.019917,1201.9462,320000
6
+ 2.383957,36.824585,2.9195695,-301.81186,-4374.57,31.943378,412.43753,-457.79947,4706.2686,325000
7
+ 2.4921937,18.60326,6.6528635,-312.8418,-4497.61,26.142975,137.33421,-159.79778,2459.9487,330000
8
+ 1.9647443,30.518452,8.417838,-261.68283,-529.6105,10.798523,55.09262,-90.889565,945.256,335000
9
+ 0.97249216,10.125047,10.562922,-307.70505,-4620.1543,46.941853,2816.7651,-1644.4738,14109.326,340000
10
+ 4.2062535,19.131577,-157.6187,-301.29694,-4692.8115,39.381664,573.8346,-246.98935,5019.6665,345000
11
+ 4.1368794,35.84744,0.93865573,-357.94333,-4763.4995,108.224815,2954.6318,-2664.2717,21105.426,350000
12
+ 2.4000802,71.660286,0.16125178,-290.2402,-4858.2725,37.581356,328.09692,-377.86243,5074.9785,355000
13
+ 1.8086841,25.419834,-156.94998,-309.1628,-4921.1724,39.430756,219.49716,-301.18307,3303.2305,360000
14
+ 2.7003863,37.504078,-140.74776,-283.87167,-780.9405,22.656372,108.03701,-197.57843,1877.7871,365000
15
+ 2.7999592,30.23728,-28.052958,-299.703,-5051.565,23.598867,66.134,-147.70883,1843.2386,370000
16
+ 3.6310494,1119.2177,0.42828536,-309.8705,-5164.621,61.62904,14036.805,-26199.443,117942.34,375000
17
+ 1.990941,30.966543,-92.47216,-345.69946,-5135.36,51.96128,339.50858,-469.51694,4402.824,380000
18
+ 1.1582367,22.591528,-7.4739985,-291.23874,-3742.876,29.582712,204.85165,-538.44696,4943.919,385000
19
+ 1.5863371,23.595133,-20.354387,-361.86172,-5277.9272,32.196575,261.26816,-235.63075,2969.3252,390000
20
+ 9.020733,52.361694,14.172217,-326.35983,-5235.8765,71.590515,1089.7745,-1181.9592,13080.764,395000
21
+ 1.9393828,54.556408,3.509084,-358.92892,-5296.5864,47.420174,371.84418,-392.41132,4859.6016,400000
22
+ 2.3511395,26.889494,-124.384415,-339.67584,-5313.4976,115.12974,1812.394,-1647.6195,15137.527,405000
23
+ 3.4524179,107.96703,42.395744,-399.7547,-5286.988,54.558804,5835.556,-2007.5858,26970.225,410000
24
+ 2.6358693,94.354355,49.783073,-339.447,-5425.719,68.85476,1358.2966,-1542.2489,13510.835,415000
25
+ 1.6282191,41.197704,-135.24889,-316.49692,-5411.7554,18.7451,286.8793,-177.88956,2486.0132,420000
26
+ 2.414199,54.397804,81.40069,-327.56723,-5466.605,25.699757,61.030483,-99.11007,1827.5181,425000
27
+ 2.680674,26.300108,-122.88219,-340.42746,-5417.1494,21.88915,409.70285,-286.27744,3531.6787,430000
28
+ 2.0484715,37.05497,-118.1281,-345.4403,-5417.0366,18.609041,60.540066,-49.63749,1339.0278,435000
29
+ 2.390277,20.765934,-186.84521,-313.55762,-5425.125,115.78002,4293.722,-5822.1587,32719.537,440000
30
+ 2.01143,41.49717,-24.000643,-412.05893,-5447.8647,36.633007,749.38336,-999.3201,6599.4688,445000
31
+ 6.645431,30.522858,-169.61674,-329.10626,-5431.2544,25.625513,68.04997,-133.9401,1999.7358,450000
32
+ 2.4731438,31.901386,-98.54256,-325.4305,-5308.6885,37.51501,430.61758,-594.941,4472.5083,455000
33
+ 2.0417156,27.160166,1.7956934,-341.8524,-5425.2397,29.672052,233.71536,-772.0416,3811.3887,460000
34
+ 3.3225865,32.260796,-89.05922,-342.53867,-5278.8564,28.474821,169.89375,-121.434616,2558.595,465000
35
+ 3.682244,42.40713,4.093942,-430.8591,-5216.7666,57.5813,276.4356,-267.3195,4579.415,470000
36
+ 2.681997,1545.6311,-69.50013,-314.72876,-5346.9653,31.021046,621.98004,-485.20834,4105.4116,475000
37
+ 3.1450548,28.806736,8.504672,-319.89655,-5195.0996,32.374226,184.32103,-184.2575,2208.2134,480000
38
+ 2.3404636,29.957764,-7.344728,-328.49445,-5162.1104,30.940847,166.84976,-124.96478,2342.8875,485000
39
+ 2.3757463,34.80151,-184.3915,-328.7568,-4988.714,31.748499,198.89374,-274.27997,3618.1882,490000
40
+ 1.9428611,117.71804,12.366931,-326.7394,-4995.714,55.14297,304.05377,-510.72284,5424.498,495000
41
+ 2.3985567,96.923584,-1.5382284,-347.89737,-4845.391,42.91702,475.77982,-440.5117,7145.1216,500000
42
+ 2.2434301,43.687893,-97.573814,-282.33932,-732.3912,33.124363,433.71375,-270.93008,3528.1077,505000
43
+ 3.8680506,56.202026,-93.746414,-335.36914,-4536.6333,22.575386,870.2557,-861.5129,6222.9297,510000
44
+ 4.403643,55.712933,8.344434,-338.40637,-4313.52,64.11207,652.30414,-346.80008,5736.825,515000
45
+ 4.495682,19.803898,10.351732,-293.71313,-3992.7117,24.544584,96.16512,-87.642975,1664.5162,520000
46
+ 1.177802,327.15582,9.572893,-329.05746,-3762.8665,49.79028,522.43463,-354.41275,6126.1753,525000
47
+ 4.68739,60.12393,-150.3197,-370.96814,-3568.643,50.580482,253.45778,-297.17407,3711.1885,530000
48
+ 1.2357244,35.48663,-16.443241,-286.83942,-829.70215,23.766327,121.13034,-157.49362,2321.9497,535000
49
+ 1.8492974,53.132,-158.94824,-306.7764,-3272.7024,38.743927,714.3499,-769.5646,3736.086,540000
50
+ 2.2273207,28.717825,-3.5442886,-295.95694,-3115.5852,21.653193,52.763733,-94.31953,1659.5061,545000
51
+ 3.1692815,91.3625,1.3015159,-296.89478,-3142.9963,24.20879,4483.22,-3236.718,27358.277,550000
52
+ 2.8306227,52.651527,-5.3350835,-293.5327,-2701.29,51.713978,294.1131,-642.61554,3840.992,555000
53
+ 2.1859338,11.84352,-4.318362,-270.59818,-579.50366,11.636602,56.72118,-153.3956,1119.4432,560000
54
+ 2.7128437,81.69998,-93.47127,-304.9894,-2365.8633,63.65748,464.18808,-509.6458,7096.732,565000
55
+ 5.8644776,30.510595,-98.527985,-296.20532,-2144.339,26.862934,76.19816,-156.70076,2287.142,570000
56
+ 2.349844,13.814765,-191.7505,-284.31827,-1974.8229,13.590738,134.7916,-258.314,1531.7339,575000
57
+ 2.5328217,21.040165,-12.116355,-293.96954,-1841.1993,10.868491,91.96259,-160.91786,1331.5706,580000
58
+ 1.5872049,15.233002,4.251298,-287.33444,-1898.3589,15.134847,73.051575,-56.808624,1160.7261,585000
59
+ 1.2495148,40.771126,13.422203,-283.7643,-1549.2372,22.102808,329.479,-244.47658,3860.1318,590000
60
+ 2.0987175,114.23284,-7.867107,-268.57077,-1389.79,26.286987,2521.4387,-3463.519,18807.059,595000
61
+ 1.2263623,30.237776,-5.6970015,-264.89694,-1442.2177,7.7829485,79.56176,-30.245977,818.1054,600000
62
+ 1.1765696,7.386603,95.59022,-262.14868,-1155.0436,6.7006416,106.0197,-86.1208,880.65906,605000
63
+ 2.0606823,14.80757,-29.192322,-264.42123,-1055.427,14.700244,80.516556,-104.35957,1227.0259,610000
64
+ 2.534268,10.557302,143.78879,-264.6402,-975.42206,37.822155,647.4618,-784.61945,5471.43,615000
65
+ 1.3396587,18.640884,25.86977,-252.90076,-886.26074,15.014426,506.96692,-346.6431,4958.466,620000
66
+ 0.89485323,6.6219134,144.17639,-245.84305,-466.39136,5.8003783,29.824064,-22.482819,501.51935,625000
67
+ 0.667052,5.600968,173.72859,-249.01396,-753.3973,4.4600954,36.828503,-21.510496,435.2979,630000
68
+ 1.167455,6.419121,195.91408,-248.354,-725.6343,5.3050966,57.326023,-38.46311,558.6924,635000
69
+ 0.53435725,10.853772,-163.63722,-249.16797,-621.0299,13.526349,491.93256,-257.2282,3830.3887,640000
70
+ 0.89611495,5.3923163,-110.839325,-244.23872,-724.00653,3.8903635,19.462809,-44.301247,484.14072,645000
71
+ 0.4726736,23.08859,196.6264,-240.30737,-533.9427,14.577834,96.96658,-202.77838,1442.2572,650000
72
+ 0.7292604,9.962557,202.81223,-236.01964,-475.8442,7.689728,66.80654,-125.79416,1102.4596,655000
73
+ 0.6146381,12.208339,-57.09894,-244.80687,-839.2387,4.336592,40.902153,-47.61926,843.44806,660000
74
+ 0.79024196,12.013214,232.90376,-234.98619,-516.4873,10.992798,262.70572,-300.5507,2618.1167,665000
75
+ 1.9509494,5.222488,7.8358173,-238.87633,-748.4458,3.7628236,51.322247,-70.12841,869.9226,670000
76
+ 0.54000187,7.695395,233.36139,-233.61324,-829.4259,2.6908746,129.93555,-71.52551,1177.7944,675000
77
+ 0.7752655,6.2482677,-101.15601,-234.42094,-436.0518,4.5157523,93.03273,-123.84792,901.95935,680000
78
+ 1.0704676,2.783041,225.66322,-229.70952,-306.6221,2.1045935,103.033806,-34.68658,534.2055,685000
79
+ 1.2886419,3.173209,7.6123734,-229.15665,-348.95663,3.350335,10.768478,-11.160885,362.61816,690000
80
+ 0.7177242,2.3417413,-128.35207,-236.69719,-758.30176,2.4837625,8.52648,-9.482983,273.4023,695000
81
+ 0.93391883,13.10721,194.72163,-230.8501,-563.3073,7.7045627,134.9856,-116.14877,1814.1138,700000
82
+ 0.6700295,5.0846505,173.01703,-227.87158,-692.9177,5.942475,95.41499,-170.39388,1074.9591,705000
83
+ 0.7258336,2.168888,-7.367796,-228.07857,-312.5033,2.2661068,10.215625,-27.226582,349.08374,710000
84
+ 0.8284698,2.9294057,150.11023,-229.09673,-386.00372,4.6967716,46.887196,-48.876038,451.85486,715000
85
+ 0.8425602,10.520807,62.483162,-230.89522,-709.6983,2.729966,33.47929,-46.550285,770.15424,720000
86
+ 1.1181772,7.7206955,66.98042,-226.98103,-444.3971,5.020517,39.58668,-26.437141,690.2864,725000
87
+ 0.5300191,9.922309,131.61388,-227.36221,-482.87833,4.7337804,48.943905,-41.47088,612.7118,730000
88
+ 0.69137836,3.7302933,123.16838,-225.45625,-605.81,3.476748,64.999886,-95.0128,834.52155,735000
89
+ 0.40671182,4.3227344,10.65114,-224.70317,-309.7027,19.962156,447.3151,-844.1555,5250.071,740000
90
+ 0.5785327,2.4287405,89.92214,-224.33482,-393.6905,1.6270055,13.635025,-28.56815,275.10724,745000
91
+ 0.5083012,3.3350685,42.76849,-221.86563,-451.83176,2.5315318,33.743736,-58.91578,473.8685,750000
92
+ 0.9794934,13.261325,-6.695782,-223.83397,-478.55292,36.85165,590.7986,-445.57574,4710.0776,755000
93
+ 0.45802692,5.6177707,2.619739,-222.72823,-389.9202,4.2706494,246.85703,-378.6352,1714.1416,760000
94
+ 0.4464779,4.382383,28.48358,-223.44844,-298.7713,2.4667377,16.315712,-16.630625,382.31885,765000
95
+ 0.6720967,3.8505628,-81.385185,-223.73328,-337.26822,1.9110807,63.62299,-68.781006,870.7342,770000
96
+ 0.5963525,3.1206462,-2.8234482,-221.86638,-357.0033,2.8962398,7.6513186,-4.7000656,166.87633,775000
97
+ 0.4359156,4.303551,5.7509365,-219.83284,-357.24005,2.7385128,107.12455,-62.450817,743.068,780000
98
+ 0.5868622,3.9273896,-54.560688,-223.02184,-565.99884,3.8858361,44.141064,-38.938732,619.89087,785000
99
+ 0.4132011,17.758692,-48.496796,-220.54105,-297.2123,5.8229175,392.3505,-156.08209,2502.1729,790000
100
+ 0.46987176,2.0352945,-42.970062,-222.35661,-672.8579,1.5770744,13.722035,-41.261726,340.7335,795000
101
+ 0.42185268,1.9688648,-44.55104,-219.09822,-383.7801,1.6085072,10.362793,-5.7097154,161.3391,800000
O2O-w-diff-ckpts/fawac/20260312_164229/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,critic/value_loss,grad/max,grad/min,grad/norm,step
2
+ 3.0724192,28.853388,-64.10254,-291.25757,-4195.3145,37.190884,394.32852,-196.76825,3560.2659,305000
3
+ 1.9049425,13.861748,2.0077853,-270.90445,-4224.1,18.780363,92.70291,-108.78323,1500.6975,310000
4
+ 2.0489347,50.994625,-132.59724,-344.40915,-4327.265,40.221485,1402.6056,-1196.7886,9155.292,315000
5
+ 1.5704203,8.975355,-107.966934,-291.03134,-4357.113,12.451352,97.59747,-60.019917,1201.9462,320000
6
+ 2.383957,36.824585,2.9195695,-301.81186,-4374.57,31.943378,412.43753,-457.79947,4706.2686,325000
7
+ 2.4921937,18.60326,6.6528635,-312.8418,-4497.61,26.142975,137.33421,-159.79778,2459.9487,330000
8
+ 1.9647443,30.518452,8.417838,-261.68283,-529.6105,10.798523,55.09262,-90.889565,945.256,335000
9
+ 0.97249216,10.125047,10.562922,-307.70505,-4620.1543,46.941853,2816.7651,-1644.4738,14109.326,340000
10
+ 4.2062535,19.131577,-157.6187,-301.29694,-4692.8115,39.381664,573.8346,-246.98935,5019.6665,345000
11
+ 4.1368794,35.84744,0.93865573,-357.94333,-4763.4995,108.224815,2954.6318,-2664.2717,21105.426,350000
12
+ 2.4000802,71.660286,0.16125178,-290.2402,-4858.2725,37.581356,328.09692,-377.86243,5074.9785,355000
13
+ 1.8086841,25.419834,-156.94998,-309.1628,-4921.1724,39.430756,219.49716,-301.18307,3303.2305,360000
14
+ 2.7003863,37.504078,-140.74776,-283.87167,-780.9405,22.656372,108.03701,-197.57843,1877.7871,365000
15
+ 2.7999592,30.23728,-28.052958,-299.703,-5051.565,23.598867,66.134,-147.70883,1843.2386,370000
16
+ 3.6310494,1119.2177,0.42828536,-309.8705,-5164.621,61.62904,14036.805,-26199.443,117942.34,375000
17
+ 1.990941,30.966543,-92.47216,-345.69946,-5135.36,51.96128,339.50858,-469.51694,4402.824,380000
18
+ 1.1582367,22.591528,-7.4739985,-291.23874,-3742.876,29.582712,204.85165,-538.44696,4943.919,385000
19
+ 1.5863371,23.595133,-20.354387,-361.86172,-5277.9272,32.196575,261.26816,-235.63075,2969.3252,390000
20
+ 9.020733,52.361694,14.172217,-326.35983,-5235.8765,71.590515,1089.7745,-1181.9592,13080.764,395000
21
+ 1.9393828,54.556408,3.509084,-358.92892,-5296.5864,47.420174,371.84418,-392.41132,4859.6016,400000
22
+ 2.3511395,26.889494,-124.384415,-339.67584,-5313.4976,115.12974,1812.394,-1647.6195,15137.527,405000
23
+ 3.4524179,107.96703,42.395744,-399.7547,-5286.988,54.558804,5835.556,-2007.5858,26970.225,410000
24
+ 2.6358693,94.354355,49.783073,-339.447,-5425.719,68.85476,1358.2966,-1542.2489,13510.835,415000
25
+ 1.6282191,41.197704,-135.24889,-316.49692,-5411.7554,18.7451,286.8793,-177.88956,2486.0132,420000
26
+ 2.414199,54.397804,81.40069,-327.56723,-5466.605,25.699757,61.030483,-99.11007,1827.5181,425000
27
+ 2.680674,26.300108,-122.88219,-340.42746,-5417.1494,21.88915,409.70285,-286.27744,3531.6787,430000
28
+ 2.0484715,37.05497,-118.1281,-345.4403,-5417.0366,18.609041,60.540066,-49.63749,1339.0278,435000
29
+ 2.390277,20.765934,-186.84521,-313.55762,-5425.125,115.78002,4293.722,-5822.1587,32719.537,440000
30
+ 2.01143,41.49717,-24.000643,-412.05893,-5447.8647,36.633007,749.38336,-999.3201,6599.4688,445000
31
+ 6.645431,30.522858,-169.61674,-329.10626,-5431.2544,25.625513,68.04997,-133.9401,1999.7358,450000
32
+ 2.4731438,31.901386,-98.54256,-325.4305,-5308.6885,37.51501,430.61758,-594.941,4472.5083,455000
33
+ 2.0417156,27.160166,1.7956934,-341.8524,-5425.2397,29.672052,233.71536,-772.0416,3811.3887,460000
34
+ 3.3225865,32.260796,-89.05922,-342.53867,-5278.8564,28.474821,169.89375,-121.434616,2558.595,465000
35
+ 3.682244,42.40713,4.093942,-430.8591,-5216.7666,57.5813,276.4356,-267.3195,4579.415,470000
36
+ 2.681997,1545.6311,-69.50013,-314.72876,-5346.9653,31.021046,621.98004,-485.20834,4105.4116,475000
37
+ 3.1450548,28.806736,8.504672,-319.89655,-5195.0996,32.374226,184.32103,-184.2575,2208.2134,480000
38
+ 2.3404636,29.957764,-7.344728,-328.49445,-5162.1104,30.940847,166.84976,-124.96478,2342.8875,485000
39
+ 2.3757463,34.80151,-184.3915,-328.7568,-4988.714,31.748499,198.89374,-274.27997,3618.1882,490000
40
+ 1.9428611,117.71804,12.366931,-326.7394,-4995.714,55.14297,304.05377,-510.72284,5424.498,495000
41
+ 2.3985567,96.923584,-1.5382284,-347.89737,-4845.391,42.91702,475.77982,-440.5117,7145.1216,500000
42
+ 2.2434301,43.687893,-97.573814,-282.33932,-732.3912,33.124363,433.71375,-270.93008,3528.1077,505000
43
+ 3.8680506,56.202026,-93.746414,-335.36914,-4536.6333,22.575386,870.2557,-861.5129,6222.9297,510000
44
+ 4.403643,55.712933,8.344434,-338.40637,-4313.52,64.11207,652.30414,-346.80008,5736.825,515000
45
+ 4.495682,19.803898,10.351732,-293.71313,-3992.7117,24.544584,96.16512,-87.642975,1664.5162,520000
46
+ 1.177802,327.15582,9.572893,-329.05746,-3762.8665,49.79028,522.43463,-354.41275,6126.1753,525000
47
+ 4.68739,60.12393,-150.3197,-370.96814,-3568.643,50.580482,253.45778,-297.17407,3711.1885,530000
48
+ 1.2357244,35.48663,-16.443241,-286.83942,-829.70215,23.766327,121.13034,-157.49362,2321.9497,535000
49
+ 1.8492974,53.132,-158.94824,-306.7764,-3272.7024,38.743927,714.3499,-769.5646,3736.086,540000
50
+ 2.2273207,28.717825,-3.5442886,-295.95694,-3115.5852,21.653193,52.763733,-94.31953,1659.5061,545000
51
+ 3.1692815,91.3625,1.3015159,-296.89478,-3142.9963,24.20879,4483.22,-3236.718,27358.277,550000
52
+ 2.8306227,52.651527,-5.3350835,-293.5327,-2701.29,51.713978,294.1131,-642.61554,3840.992,555000
53
+ 2.1859338,11.84352,-4.318362,-270.59818,-579.50366,11.636602,56.72118,-153.3956,1119.4432,560000
54
+ 2.7128437,81.69998,-93.47127,-304.9894,-2365.8633,63.65748,464.18808,-509.6458,7096.732,565000
55
+ 5.8644776,30.510595,-98.527985,-296.20532,-2144.339,26.862934,76.19816,-156.70076,2287.142,570000
56
+ 2.349844,13.814765,-191.7505,-284.31827,-1974.8229,13.590738,134.7916,-258.314,1531.7339,575000
57
+ 2.5328217,21.040165,-12.116355,-293.96954,-1841.1993,10.868491,91.96259,-160.91786,1331.5706,580000
58
+ 1.5872049,15.233002,4.251298,-287.33444,-1898.3589,15.134847,73.051575,-56.808624,1160.7261,585000
59
+ 1.2495148,40.771126,13.422203,-283.7643,-1549.2372,22.102808,329.479,-244.47658,3860.1318,590000
60
+ 2.0987175,114.23284,-7.867107,-268.57077,-1389.79,26.286987,2521.4387,-3463.519,18807.059,595000
61
+ 1.2263623,30.237776,-5.6970015,-264.89694,-1442.2177,7.7829485,79.56176,-30.245977,818.1054,600000
62
+ 1.1765696,7.386603,95.59022,-262.14868,-1155.0436,6.7006416,106.0197,-86.1208,880.65906,605000
63
+ 2.0606823,14.80757,-29.192322,-264.42123,-1055.427,14.700244,80.516556,-104.35957,1227.0259,610000
64
+ 2.534268,10.557302,143.78879,-264.6402,-975.42206,37.822155,647.4618,-784.61945,5471.43,615000
65
+ 1.3396587,18.640884,25.86977,-252.90076,-886.26074,15.014426,506.96692,-346.6431,4958.466,620000
66
+ 0.89485323,6.6219134,144.17639,-245.84305,-466.39136,5.8003783,29.824064,-22.482819,501.51935,625000
67
+ 0.667052,5.600968,173.72859,-249.01396,-753.3973,4.4600954,36.828503,-21.510496,435.2979,630000
68
+ 1.167455,6.419121,195.91408,-248.354,-725.6343,5.3050966,57.326023,-38.46311,558.6924,635000
69
+ 0.53435725,10.853772,-163.63722,-249.16797,-621.0299,13.526349,491.93256,-257.2282,3830.3887,640000
70
+ 0.89611495,5.3923163,-110.839325,-244.23872,-724.00653,3.8903635,19.462809,-44.301247,484.14072,645000
71
+ 0.4726736,23.08859,196.6264,-240.30737,-533.9427,14.577834,96.96658,-202.77838,1442.2572,650000
72
+ 0.7292604,9.962557,202.81223,-236.01964,-475.8442,7.689728,66.80654,-125.79416,1102.4596,655000
73
+ 0.6146381,12.208339,-57.09894,-244.80687,-839.2387,4.336592,40.902153,-47.61926,843.44806,660000
74
+ 0.79024196,12.013214,232.90376,-234.98619,-516.4873,10.992798,262.70572,-300.5507,2618.1167,665000
75
+ 1.9509494,5.222488,7.8358173,-238.87633,-748.4458,3.7628236,51.322247,-70.12841,869.9226,670000
76
+ 0.54000187,7.695395,233.36139,-233.61324,-829.4259,2.6908746,129.93555,-71.52551,1177.7944,675000
77
+ 0.7752655,6.2482677,-101.15601,-234.42094,-436.0518,4.5157523,93.03273,-123.84792,901.95935,680000
78
+ 1.0704676,2.783041,225.66322,-229.70952,-306.6221,2.1045935,103.033806,-34.68658,534.2055,685000
79
+ 1.2886419,3.173209,7.6123734,-229.15665,-348.95663,3.350335,10.768478,-11.160885,362.61816,690000
80
+ 0.7177242,2.3417413,-128.35207,-236.69719,-758.30176,2.4837625,8.52648,-9.482983,273.4023,695000
81
+ 0.93391883,13.10721,194.72163,-230.8501,-563.3073,7.7045627,134.9856,-116.14877,1814.1138,700000
82
+ 0.6700295,5.0846505,173.01703,-227.87158,-692.9177,5.942475,95.41499,-170.39388,1074.9591,705000
83
+ 0.7258336,2.168888,-7.367796,-228.07857,-312.5033,2.2661068,10.215625,-27.226582,349.08374,710000
84
+ 0.8284698,2.9294057,150.11023,-229.09673,-386.00372,4.6967716,46.887196,-48.876038,451.85486,715000
85
+ 0.8425602,10.520807,62.483162,-230.89522,-709.6983,2.729966,33.47929,-46.550285,770.15424,720000
86
+ 1.1181772,7.7206955,66.98042,-226.98103,-444.3971,5.020517,39.58668,-26.437141,690.2864,725000
87
+ 0.5300191,9.922309,131.61388,-227.36221,-482.87833,4.7337804,48.943905,-41.47088,612.7118,730000
88
+ 0.69137836,3.7302933,123.16838,-225.45625,-605.81,3.476748,64.999886,-95.0128,834.52155,735000
89
+ 0.40671182,4.3227344,10.65114,-224.70317,-309.7027,19.962156,447.3151,-844.1555,5250.071,740000
90
+ 0.5785327,2.4287405,89.92214,-224.33482,-393.6905,1.6270055,13.635025,-28.56815,275.10724,745000
91
+ 0.5083012,3.3350685,42.76849,-221.86563,-451.83176,2.5315318,33.743736,-58.91578,473.8685,750000
92
+ 0.9794934,13.261325,-6.695782,-223.83397,-478.55292,36.85165,590.7986,-445.57574,4710.0776,755000
93
+ 0.45802692,5.6177707,2.619739,-222.72823,-389.9202,4.2706494,246.85703,-378.6352,1714.1416,760000
94
+ 0.4464779,4.382383,28.48358,-223.44844,-298.7713,2.4667377,16.315712,-16.630625,382.31885,765000
95
+ 0.6720967,3.8505628,-81.385185,-223.73328,-337.26822,1.9110807,63.62299,-68.781006,870.7342,770000
96
+ 0.5963525,3.1206462,-2.8234482,-221.86638,-357.0033,2.8962398,7.6513186,-4.7000656,166.87633,775000
97
+ 0.4359156,4.303551,5.7509365,-219.83284,-357.24005,2.7385128,107.12455,-62.450817,743.068,780000
98
+ 0.5868622,3.9273896,-54.560688,-223.02184,-565.99884,3.8858361,44.141064,-38.938732,619.89087,785000
99
+ 0.4132011,17.758692,-48.496796,-220.54105,-297.2123,5.8229175,392.3505,-156.08209,2502.1729,790000
100
+ 0.46987176,2.0352945,-42.970062,-222.35661,-672.8579,1.5770744,13.722035,-41.261726,340.7335,795000
101
+ 0.42185268,1.9688648,-44.55104,-219.09822,-383.7801,1.6085072,10.362793,-5.7097154,161.3391,800000
O2O-w-diff-ckpts/fawac/20260312_164229/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7cc6ca51582ae2de8dc6eafedc3400c16e19c1bff3fd36f958c902f7f5e4f78
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4554824db0fe1bb20cb3b8f3435aac9db002ed938f54f15d731595832b5a81e1
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59af6f9a28722703b0420fe7b2c95ed9f83880c32b40bc462960c03ffc77219e
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97487c8f1e903fc4bd58427450801e646f3d36e160963cae2b48ef264f069d67
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b4669661aae14fa4178ac0e350e85151621bccd15d5304da4088412f101157c
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0153294e15f05a5b0077c8bf0e84a643e08f83abb24060e12f903b9df9a35bf
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30bb2ec1441c42bc4eb07c04e25f877fbf59ddeecea69575f4c0d8d3abcdb000
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c95b89bc7321c37e87dbc4b16ff7b069e624a979a8e59791b0c3cf343fd2f27
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_750000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c7c8cff85fb302c5108c183745ba7a5018bc473873bf4b5a6a374bfd40a14ed
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/params_800000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fbfa77d9bf83973645826ac98f8d9e9f9c89e877ba3ffef13121094875f16f04
3
+ size 214338962
O2O-w-diff-ckpts/fawac/20260312_164229/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/fawac/20260312_164229/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/wi92il5v
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_350000.png ADDED

Git LFS Details

  • SHA256: 91f7025d34ffe4fa6c7a3dc566c61c475cf0f06c10e3555b104e969874872add
  • Pointer size: 131 Bytes
  • Size of remote file: 222 kB
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_400000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_450000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_500000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_550000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_600000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_650000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_700000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_750000.png ADDED
O2O-w-diff-ckpts/fawac/20260312_164229/visited_states_800000.png ADDED