Tiredsheep commited on
Commit
5a661f5
·
verified ·
1 Parent(s): 133e83c

Upload folder using huggingface_hub

Browse files
Files changed (18) hide show
  1. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/env.csv +0 -0
  2. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/env_sv.csv +0 -0
  3. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/eval.csv +11 -0
  4. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/eval_sv.csv +11 -0
  5. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/online_agent.csv +101 -0
  6. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/online_agent_sv.csv +101 -0
  7. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_250000.pkl +3 -0
  8. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_300000.pkl +3 -0
  9. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_350000.pkl +3 -0
  10. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_400000.pkl +3 -0
  11. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_450000.pkl +3 -0
  12. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_500000.pkl +3 -0
  13. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_550000.pkl +3 -0
  14. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_600000.pkl +3 -0
  15. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_650000.pkl +3 -0
  16. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_700000.pkl +3 -0
  17. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/progress.tk +1 -0
  18. O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/token.tk +1 -0
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/env.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/env_sv.csv ADDED
The diff for this file is too large to render. See raw diff
 
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/eval.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.06827226495902013,-0.008270483732810627,-0.06850788989289236,-0.0054545975683608135,25.799119923197598,32.08800000000923,0.4,15650.86,-0.7,-701.46,639.76,1.948512439727783,250000
3
+ 0.0,0.0,-0.0649848062021535,-0.002979128625781262,-0.0654282032323827,-0.00438245465846301,33.724632941339244,6.494000000000779,0.94,35655.7,-0.06,-126.94,127.88,0.416212739944458,300000
4
+ 0.0,0.0,-0.06353080179571594,0.022373950866092097,-0.063624130975412,0.016674640971283308,35.51184772553676,1.9909999999999837,1.0,39526.12,0.0,-36.82,37.82,0.13653002738952635,350000
5
+ 0.0,0.0,-0.05455612147489755,0.039001288546105115,-0.05413264082046722,0.031602646429769315,35.60103296156913,2.16099999999999,1.0,41556.34,0.0,-40.22,41.22,0.13938138484954835,400000
6
+ 0.0,0.0,-0.04954069332613532,0.05574190901942404,-0.0483794709970935,0.04313020622621451,35.62191646729197,1.5709999999999917,1.0,43408.38,0.0,-28.42,29.42,0.10305714130401611,450000
7
+ 0.0,0.0,-0.05487944334120831,0.03401224146089007,-0.053736182170661326,0.03443747290871041,35.62007274146856,2.2999999999999123,1.0,45424.76,0.0,-48.12,44.0,0.1478364372253418,500000
8
+ 0.0,0.0,-0.048828844022103315,0.04536582710064226,-0.04789715974582748,0.05815729247899938,35.621971254741304,1.400999999999995,1.0,47105.24,0.0,-25.02,26.02,0.09387188911437988,550000
9
+ 0.0,0.0,-0.039545247412944524,0.054417573293236446,-0.03816428838451643,0.057081410779470536,35.63557709950459,1.4979999999999891,1.0,48534.08,0.0,-26.96,27.96,0.09801967144012451,600000
10
+ 0.0,0.0,-0.03985716488308867,0.052804839446260514,-0.03841438215034561,0.05405879648638668,35.67286165483984,1.464999999999989,1.0,49927.6,0.0,-26.3,27.3,0.09475958824157715,650000
11
+ 0.0,0.0,-0.04248144094607098,0.042375429991493505,-0.040990000344788,0.03758644889364695,35.617805724978176,1.498999999999986,1.0,51439.46,0.0,-26.98,27.98,0.09995078563690185,700000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/eval_sv.csv ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ avg_gripper_contact_length,num_gripper_contacts,prev_qpos,prev_qvel,qpos,qvel,control,time,success,total.timesteps,episode.final_reward,episode.return,episode.length,episode.duration,step
2
+ 0.0,0.0,-0.06827226495902013,-0.008270483732810627,-0.06850788989289236,-0.0054545975683608135,25.799119923197598,32.08800000000923,0.4,15650.86,-0.7,-701.46,639.76,1.948512439727783,250000
3
+ 0.0,0.0,-0.0649848062021535,-0.002979128625781262,-0.0654282032323827,-0.00438245465846301,33.724632941339244,6.494000000000779,0.94,35655.7,-0.06,-126.94,127.88,0.416212739944458,300000
4
+ 0.0,0.0,-0.06353080179571594,0.022373950866092097,-0.063624130975412,0.016674640971283308,35.51184772553676,1.9909999999999837,1.0,39526.12,0.0,-36.82,37.82,0.13653002738952635,350000
5
+ 0.0,0.0,-0.05455612147489755,0.039001288546105115,-0.05413264082046722,0.031602646429769315,35.60103296156913,2.16099999999999,1.0,41556.34,0.0,-40.22,41.22,0.13938138484954835,400000
6
+ 0.0,0.0,-0.04954069332613532,0.05574190901942404,-0.0483794709970935,0.04313020622621451,35.62191646729197,1.5709999999999917,1.0,43408.38,0.0,-28.42,29.42,0.10305714130401611,450000
7
+ 0.0,0.0,-0.05487944334120831,0.03401224146089007,-0.053736182170661326,0.03443747290871041,35.62007274146856,2.2999999999999123,1.0,45424.76,0.0,-48.12,44.0,0.1478364372253418,500000
8
+ 0.0,0.0,-0.048828844022103315,0.04536582710064226,-0.04789715974582748,0.05815729247899938,35.621971254741304,1.400999999999995,1.0,47105.24,0.0,-25.02,26.02,0.09387188911437988,550000
9
+ 0.0,0.0,-0.039545247412944524,0.054417573293236446,-0.03816428838451643,0.057081410779470536,35.63557709950459,1.4979999999999891,1.0,48534.08,0.0,-26.96,27.96,0.09801967144012451,600000
10
+ 0.0,0.0,-0.03985716488308867,0.052804839446260514,-0.03841438215034561,0.05405879648638668,35.67286165483984,1.464999999999989,1.0,49927.6,0.0,-26.3,27.3,0.09475958824157715,650000
11
+ 0.0,0.0,-0.04248144094607098,0.042375429991493505,-0.040990000344788,0.03758644889364695,35.617805724978176,1.498999999999986,1.0,51439.46,0.0,-26.98,27.98,0.09995078563690185,700000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/online_agent.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 229.99387,0.20546067,0.064432025,4.521254,-123.716446,-231.6585,-306.21896,3.0049622,-1.420109,76.4441,205000
3
+ 229.786,0.2008268,0.06391222,3.5432186,-138.85098,-231.39542,-307.54248,0.48056704,-0.57844526,50.36886,210000
4
+ 225.52559,0.18713269,0.063060485,3.0819838,-104.986404,-227.24522,-307.4983,0.6636756,-0.7107446,50.731144,215000
5
+ 230.6403,0.20210609,0.065148436,5.145928,-133.7058,-232.38428,-308.0072,0.73949695,-0.85796446,55.668808,220000
6
+ 229.24782,0.22591175,0.06640024,4.2421265,-97.32618,-231.17027,-306.45306,0.9117506,-0.9657963,61.48246,225000
7
+ 230.32205,0.19965804,0.060996044,4.025768,3.86628,-231.72252,-305.5695,0.68873787,-0.65995556,53.372063,230000
8
+ 228.82492,0.20429522,0.070745654,2.9461792,-102.05428,-231.16905,-304.9562,0.59371555,-0.39766145,43.843853,235000
9
+ 224.3375,0.2230684,0.068730384,3.6309707,-84.695206,-226.24988,-306.90604,0.757256,-0.6101829,57.61514,240000
10
+ 224.96548,0.19392641,0.0667506,3.5233674,-75.456024,-226.3835,-303.47437,0.7572098,-0.73540086,49.887905,245000
11
+ 221.75766,0.2113069,0.06953649,4.68061,-81.34745,-223.39464,-306.99866,0.52460366,-0.81988734,55.741257,250000
12
+ 220.07765,0.17340969,0.064609915,3.8876915,-66.66511,-222.0485,-305.34488,0.324301,-0.37279812,47.258,255000
13
+ 220.95226,0.21385977,0.06987731,3.91267,-83.68362,-222.89775,-305.93857,0.5234973,-0.86106604,58.351524,260000
14
+ 220.06004,0.2035194,0.06705677,4.3098264,-42.02828,-221.95206,-307.3661,0.98776424,-0.975501,59.166492,265000
15
+ 214.45157,0.1844413,0.07207954,6.05608,-20.36413,-216.46342,-306.26685,1.3140109,-1.1524626,65.53386,270000
16
+ 210.71794,0.21564004,0.074813016,5.8640237,-28.573849,-213.29732,-303.19684,1.4658701,-1.1115123,88.4949,275000
17
+ 213.3268,0.21030709,0.07319261,3.6999567,-52.383736,-215.33476,-307.27164,0.50084364,-0.89926845,61.565594,280000
18
+ 213.38744,0.19698995,0.07668313,5.40085,-10.444582,-215.86168,-307.69583,0.6504888,-1.0966094,67.3107,285000
19
+ 212.01276,0.19039321,0.08199356,4.288975,-8.59039,-214.52193,-302.2282,1.0388391,-1.3862166,68.77907,290000
20
+ 214.48227,0.20089388,0.07582543,3.4345596,-31.43196,-216.58781,-305.9466,1.2533089,-0.9574178,62.301655,295000
21
+ 209.98975,0.21097751,0.07212036,3.8215852,-47.222725,-212.1632,-305.21115,1.1222849,-1.4591407,57.325005,300000
22
+ 216.32033,0.1694046,0.071111016,3.815556,-31.462996,-218.63399,-306.71823,1.1374149,-0.74457383,54.72073,305000
23
+ 215.41556,0.20178379,0.07288871,4.4924846,-41.95584,-217.51102,-306.88544,1.2936108,-0.8964029,67.31162,310000
24
+ 208.03917,0.16589507,0.071990155,3.9883974,-21.091324,-210.59952,-298.17374,0.605711,-0.78964293,56.878536,315000
25
+ 208.72069,0.18351032,0.06960488,3.8603432,-39.466347,-210.97945,-305.1061,1.2527066,-0.8420794,70.27368,320000
26
+ 213.27507,0.19754486,0.07084101,4.007862,-35.300846,-215.82007,-306.88977,0.8532208,-0.59185725,56.780113,325000
27
+ 209.19255,0.21218029,0.07617179,3.6750534,-17.860748,-211.57063,-306.71362,0.49134493,-0.6045281,47.74208,330000
28
+ 207.96687,0.18622053,0.07819722,4.600363,-29.705994,-210.72803,-305.455,0.57042533,-1.2416697,64.86892,335000
29
+ 207.65561,0.18104595,0.0734249,3.3990617,-43.524113,-210.03496,-306.86682,1.4769707,-0.3090221,50.31021,340000
30
+ 202.37839,0.20195325,0.070477776,3.8979046,-14.573616,-204.51125,-304.59442,0.57729155,-0.9228122,50.73804,345000
31
+ 206.73032,0.19582865,0.072400175,5.37341,-38.730747,-209.04903,-304.76123,1.1782974,-0.9246913,69.22534,350000
32
+ 206.61987,0.18956624,0.07462577,3.7124174,-8.171364,-208.8623,-306.20667,0.5263605,-0.6660281,51.303757,355000
33
+ 201.97484,0.22218552,0.07465827,4.771917,-18.289434,-204.21678,-303.6892,0.7245151,-0.9660625,63.267048,360000
34
+ 203.27168,0.18701422,0.08061549,4.441507,-4.97724,-205.94096,-305.54135,1.3686001,-0.5247526,57.379974,365000
35
+ 198.37569,0.18443808,0.07802537,4.616852,-4.1712646,-200.68123,-306.0253,1.7052293,-2.0018685,72.56833,370000
36
+ 200.8123,0.21245006,0.07991041,3.8293595,-3.1963885,-203.29509,-301.9587,0.81514895,-0.7659005,55.962677,375000
37
+ 198.40634,0.19270569,0.07579912,3.50154,-18.697384,-200.75935,-301.6916,0.5238628,-1.0673181,51.7697,380000
38
+ 197.07118,0.18501681,0.07066394,3.8824983,-6.114997,-199.28723,-305.50195,0.5627531,-0.9655336,46.679024,385000
39
+ 197.49933,0.18322244,0.07418336,4.2768397,-8.502601,-199.90302,-303.4367,0.47615954,-0.4587711,51.410973,390000
40
+ 200.59944,0.19193754,0.07570805,5.2629104,-7.159084,-202.9506,-307.09537,0.96392214,-0.63910186,54.630096,395000
41
+ 195.20967,0.18776149,0.08233004,4.1065135,-16.747885,-197.89708,-304.75415,0.96125126,-0.6945939,52.724976,400000
42
+ 193.81885,0.20596635,0.07696968,4.1222796,-8.752255,-196.40721,-306.44916,1.174021,-1.283145,72.18397,405000
43
+ 198.86903,0.17093413,0.07431771,3.6004562,-3.3332832,-201.49248,-302.3186,0.46471328,-0.51947135,44.99168,410000
44
+ 195.0907,0.22467287,0.080097176,4.8223653,-8.400207,-197.21135,-306.27316,1.4234669,-0.9405937,81.96872,415000
45
+ 198.41772,0.17390552,0.07775659,4.25893,-5.518412,-200.90433,-306.6232,0.48052785,-1.0339053,54.42254,420000
46
+ 201.52289,0.20455709,0.08081303,4.570183,-6.440452,-203.93622,-305.59747,0.81797445,-0.7939724,61.604233,425000
47
+ 200.91856,0.20449333,0.07711245,3.6066551,-9.979294,-203.43958,-303.4986,0.89185226,-0.61430347,49.003036,430000
48
+ 202.11694,0.19675669,0.07317677,3.0376604,-11.555157,-204.2796,-305.25674,0.7188722,-1.0174208,44.337646,435000
49
+ 199.16333,0.2210662,0.07605782,3.799174,-9.32201,-201.36618,-299.89407,0.90860945,-2.4887686,71.12215,440000
50
+ 194.70111,0.20274709,0.07913547,5.271301,1.1395278,-197.0312,-303.73514,1.4481344,-1.2342988,71.98244,445000
51
+ 204.89276,0.17509855,0.07683371,4.3277164,-2.6283216,-207.49983,-304.37695,0.8192203,-0.6310431,51.416687,450000
52
+ 198.71594,0.1784454,0.07055347,3.426962,-1.4933423,-201.16043,-304.30484,0.4547193,-1.045078,49.077374,455000
53
+ 198.96869,0.22437312,0.06863469,4.482888,-4.47317,-201.16446,-304.62622,0.5342024,-1.0154036,63.30857,460000
54
+ 197.11507,0.17443252,0.07497052,3.1936195,-11.627894,-199.33902,-305.67386,0.62704945,-0.9786635,46.67102,465000
55
+ 198.93338,0.20348373,0.07436135,3.234471,-10.340691,-201.33452,-295.34088,1.3291477,-0.49843156,47.615856,470000
56
+ 197.76105,0.19966432,0.07580799,3.1272428,-4.7512484,-199.84581,-307.4728,1.772891,-2.1412969,58.622917,475000
57
+ 196.74985,0.2044077,0.06857388,3.4084759,-4.9090242,-199.02942,-300.6575,0.41014266,-0.83004,43.49308,480000
58
+ 198.0944,0.16156706,0.071600385,3.0156019,-5.559214,-200.51678,-301.8476,2.5247593,-0.8134826,45.149086,485000
59
+ 192.88524,0.18778643,0.07319867,2.9939203,-8.159991,-195.18947,-305.3073,0.467852,-0.97517,51.481853,490000
60
+ 202.15372,0.19715169,0.07405125,4.553123,-9.207069,-204.30501,-303.8401,1.0759686,-0.9059949,53.033222,495000
61
+ 198.44527,0.18220054,0.07573603,3.1669743,-8.60617,-200.80292,-306.24277,0.44113588,-0.34547913,41.644325,500000
62
+ 194.93619,0.20489313,0.072815895,4.383677,-1.2075025,-197.10631,-303.58267,1.4680177,-0.65563005,57.417404,505000
63
+ 192.5097,0.2207219,0.07631655,3.2991104,-3.5175838,-194.93094,-305.75,0.8179101,-0.6716564,45.072502,510000
64
+ 189.94356,0.19556472,0.07648427,3.8567193,-1.7617314,-192.60034,-304.16785,1.1560137,-0.47146085,49.482224,515000
65
+ 183.95659,0.1856674,0.071459465,4.506075,-2.6227055,-186.26147,-300.7474,0.9770409,-0.38175288,47.48589,520000
66
+ 197.35347,0.1712931,0.074659646,3.3609369,-7.0136704,-200.06075,-305.6883,0.5266571,-2.1591735,53.551895,525000
67
+ 192.63692,0.19618389,0.0690897,4.4414096,-8.167323,-195.06165,-304.55646,0.78240705,-0.76925766,53.57838,530000
68
+ 189.58418,0.21989235,0.06935962,3.946402,-1.9826052,-191.68668,-299.42813,1.2367336,-0.48539662,47.692097,535000
69
+ 199.93497,0.17984095,0.067125596,2.6158798,2.321385,-201.88379,-305.66766,0.46220744,-0.5664075,36.733562,540000
70
+ 198.31706,0.21289438,0.073054165,3.0497844,-6.9768586,-200.64867,-305.26788,0.64357674,-0.72835314,42.28832,545000
71
+ 190.98741,0.17357363,0.066256955,2.912258,-2.681069,-193.34993,-306.77756,0.9892359,-0.6683556,47.97386,550000
72
+ 195.34637,0.20555954,0.0754378,3.7977078,-4.5893164,-197.98262,-305.4031,0.3705391,-0.49195355,43.504787,555000
73
+ 190.56961,0.18812984,0.07805291,6.812043,-8.352745,-193.1668,-304.586,3.3506444,-3.5134842,146.43439,560000
74
+ 200.08794,0.1989243,0.07023758,2.723625,-3.9908392,-202.06459,-306.23987,0.29121923,-0.9049493,39.087204,565000
75
+ 184.29893,0.18406045,0.06906479,3.3828523,-0.7969015,-186.71387,-304.40137,1.691789,-0.8740783,62.294437,570000
76
+ 192.83667,0.21041976,0.07325685,3.7337246,-2.070329,-195.20583,-300.0803,0.588382,-1.5156701,61.212883,575000
77
+ 192.86058,0.1706584,0.073898315,3.0686882,-11.876755,-195.37436,-305.3514,0.5417867,-0.7317611,42.457623,580000
78
+ 191.96896,0.17565742,0.073124506,3.0366106,-0.269903,-194.37457,-303.61472,0.35570574,-0.5394885,39.492928,585000
79
+ 188.96555,0.1803146,0.07190576,2.7235205,-2.714522,-191.27855,-299.39636,1.1326996,-0.3697896,44.54649,590000
80
+ 194.89777,0.19185041,0.06787133,3.3212304,-6.137928,-197.15819,-304.7881,2.0268564,-1.0057173,55.180595,595000
81
+ 187.94057,0.18417539,0.07275171,2.9904556,-6.9144344,-190.23119,-304.40118,0.39158425,-1.3089579,41.682346,600000
82
+ 190.27808,0.20892411,0.073447704,2.5795157,-4.4733825,-192.38602,-299.7684,0.8835082,-0.2540486,37.590298,605000
83
+ 193.3964,0.19827595,0.07145168,2.9726667,-5.7761526,-195.71695,-305.6084,0.7112915,-1.572984,49.39122,610000
84
+ 184.25684,0.17534252,0.06772201,3.3251755,-6.4500604,-186.35693,-304.24088,0.80120015,-0.55461323,44.237446,615000
85
+ 192.23343,0.1744388,0.07613548,2.5403988,-0.59162825,-194.71964,-296.97342,0.6640805,-2.2758825,51.37629,620000
86
+ 192.83339,0.18111266,0.061813373,3.9436085,-3.4594328,-194.84483,-300.35004,0.5823705,-1.1344548,48.32788,625000
87
+ 189.841,0.17017087,0.071032494,3.3055508,-5.1747303,-192.34322,-304.05643,0.97171086,-1.1722553,52.97595,630000
88
+ 188.17764,0.17977285,0.072257586,3.0120323,-3.420364,-190.6363,-304.42093,1.4909089,-0.4197499,54.543816,635000
89
+ 185.10193,0.18825206,0.0787183,3.989956,-2.9212341,-187.7725,-299.91382,1.0832964,-0.75481105,56.73751,640000
90
+ 181.9468,0.17849003,0.072138,3.3373935,-1.760951,-184.199,-304.9745,0.41790938,-0.60877806,40.894363,645000
91
+ 184.81647,0.20408845,0.07369916,3.158472,-1.9148054,-187.58855,-304.48532,1.3896173,-0.45232537,45.679188,650000
92
+ 191.14542,0.21876991,0.06819723,2.8304093,-3.4837048,-193.08963,-305.22385,1.3706298,-0.61861384,44.77105,655000
93
+ 177.42125,0.20275906,0.06743956,2.5111182,-4.993872,-179.40558,-305.59033,0.48327848,-1.0057598,42.827766,660000
94
+ 184.54839,0.18571696,0.06617538,3.0177636,-7.7068353,-186.74838,-301.75653,1.4452455,-0.82931525,50.3909,665000
95
+ 186.59593,0.19343287,0.07060431,3.3127403,-4.0476227,-188.77814,-304.63675,0.44773144,-0.9971028,42.240627,670000
96
+ 183.11311,0.19359244,0.06674534,2.8096364,-4.46571,-185.44962,-306.4961,0.7369728,-1.1323128,43.102768,675000
97
+ 194.19693,0.19033714,0.0713588,2.795015,-6.453324,-196.60686,-303.3389,0.78815424,-0.6395461,43.260445,680000
98
+ 192.73866,0.17964822,0.06548831,2.2481499,-4.4019823,-194.92473,-300.87012,1.4535326,-1.0122968,40.979992,685000
99
+ 181.40593,0.18718214,0.06859675,2.602405,-2.667825,-183.79482,-304.0094,1.284225,-0.7455632,42.068123,690000
100
+ 184.08386,0.21367773,0.06741838,2.734102,-3.4923685,-186.36589,-303.96527,1.1331127,-0.40957534,41.311066,695000
101
+ 189.89156,0.20577219,0.07177734,2.807512,-5.6322002,-192.30077,-307.39035,0.71439075,-0.7045894,45.23936,700000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/online_agent_sv.csv ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ actor/actor_loss,actor/bc_flow_loss,actor/distill_loss,critic/critic_loss,critic/q_max,critic/q_mean,critic/q_min,grad/max,grad/min,grad/norm,step
2
+ 229.99387,0.20546067,0.064432025,4.521254,-123.716446,-231.6585,-306.21896,3.0049622,-1.420109,76.4441,205000
3
+ 229.786,0.2008268,0.06391222,3.5432186,-138.85098,-231.39542,-307.54248,0.48056704,-0.57844526,50.36886,210000
4
+ 225.52559,0.18713269,0.063060485,3.0819838,-104.986404,-227.24522,-307.4983,0.6636756,-0.7107446,50.731144,215000
5
+ 230.6403,0.20210609,0.065148436,5.145928,-133.7058,-232.38428,-308.0072,0.73949695,-0.85796446,55.668808,220000
6
+ 229.24782,0.22591175,0.06640024,4.2421265,-97.32618,-231.17027,-306.45306,0.9117506,-0.9657963,61.48246,225000
7
+ 230.32205,0.19965804,0.060996044,4.025768,3.86628,-231.72252,-305.5695,0.68873787,-0.65995556,53.372063,230000
8
+ 228.82492,0.20429522,0.070745654,2.9461792,-102.05428,-231.16905,-304.9562,0.59371555,-0.39766145,43.843853,235000
9
+ 224.3375,0.2230684,0.068730384,3.6309707,-84.695206,-226.24988,-306.90604,0.757256,-0.6101829,57.61514,240000
10
+ 224.96548,0.19392641,0.0667506,3.5233674,-75.456024,-226.3835,-303.47437,0.7572098,-0.73540086,49.887905,245000
11
+ 221.75766,0.2113069,0.06953649,4.68061,-81.34745,-223.39464,-306.99866,0.52460366,-0.81988734,55.741257,250000
12
+ 220.07765,0.17340969,0.064609915,3.8876915,-66.66511,-222.0485,-305.34488,0.324301,-0.37279812,47.258,255000
13
+ 220.95226,0.21385977,0.06987731,3.91267,-83.68362,-222.89775,-305.93857,0.5234973,-0.86106604,58.351524,260000
14
+ 220.06004,0.2035194,0.06705677,4.3098264,-42.02828,-221.95206,-307.3661,0.98776424,-0.975501,59.166492,265000
15
+ 214.45157,0.1844413,0.07207954,6.05608,-20.36413,-216.46342,-306.26685,1.3140109,-1.1524626,65.53386,270000
16
+ 210.71794,0.21564004,0.074813016,5.8640237,-28.573849,-213.29732,-303.19684,1.4658701,-1.1115123,88.4949,275000
17
+ 213.3268,0.21030709,0.07319261,3.6999567,-52.383736,-215.33476,-307.27164,0.50084364,-0.89926845,61.565594,280000
18
+ 213.38744,0.19698995,0.07668313,5.40085,-10.444582,-215.86168,-307.69583,0.6504888,-1.0966094,67.3107,285000
19
+ 212.01276,0.19039321,0.08199356,4.288975,-8.59039,-214.52193,-302.2282,1.0388391,-1.3862166,68.77907,290000
20
+ 214.48227,0.20089388,0.07582543,3.4345596,-31.43196,-216.58781,-305.9466,1.2533089,-0.9574178,62.301655,295000
21
+ 209.98975,0.21097751,0.07212036,3.8215852,-47.222725,-212.1632,-305.21115,1.1222849,-1.4591407,57.325005,300000
22
+ 216.32033,0.1694046,0.071111016,3.815556,-31.462996,-218.63399,-306.71823,1.1374149,-0.74457383,54.72073,305000
23
+ 215.41556,0.20178379,0.07288871,4.4924846,-41.95584,-217.51102,-306.88544,1.2936108,-0.8964029,67.31162,310000
24
+ 208.03917,0.16589507,0.071990155,3.9883974,-21.091324,-210.59952,-298.17374,0.605711,-0.78964293,56.878536,315000
25
+ 208.72069,0.18351032,0.06960488,3.8603432,-39.466347,-210.97945,-305.1061,1.2527066,-0.8420794,70.27368,320000
26
+ 213.27507,0.19754486,0.07084101,4.007862,-35.300846,-215.82007,-306.88977,0.8532208,-0.59185725,56.780113,325000
27
+ 209.19255,0.21218029,0.07617179,3.6750534,-17.860748,-211.57063,-306.71362,0.49134493,-0.6045281,47.74208,330000
28
+ 207.96687,0.18622053,0.07819722,4.600363,-29.705994,-210.72803,-305.455,0.57042533,-1.2416697,64.86892,335000
29
+ 207.65561,0.18104595,0.0734249,3.3990617,-43.524113,-210.03496,-306.86682,1.4769707,-0.3090221,50.31021,340000
30
+ 202.37839,0.20195325,0.070477776,3.8979046,-14.573616,-204.51125,-304.59442,0.57729155,-0.9228122,50.73804,345000
31
+ 206.73032,0.19582865,0.072400175,5.37341,-38.730747,-209.04903,-304.76123,1.1782974,-0.9246913,69.22534,350000
32
+ 206.61987,0.18956624,0.07462577,3.7124174,-8.171364,-208.8623,-306.20667,0.5263605,-0.6660281,51.303757,355000
33
+ 201.97484,0.22218552,0.07465827,4.771917,-18.289434,-204.21678,-303.6892,0.7245151,-0.9660625,63.267048,360000
34
+ 203.27168,0.18701422,0.08061549,4.441507,-4.97724,-205.94096,-305.54135,1.3686001,-0.5247526,57.379974,365000
35
+ 198.37569,0.18443808,0.07802537,4.616852,-4.1712646,-200.68123,-306.0253,1.7052293,-2.0018685,72.56833,370000
36
+ 200.8123,0.21245006,0.07991041,3.8293595,-3.1963885,-203.29509,-301.9587,0.81514895,-0.7659005,55.962677,375000
37
+ 198.40634,0.19270569,0.07579912,3.50154,-18.697384,-200.75935,-301.6916,0.5238628,-1.0673181,51.7697,380000
38
+ 197.07118,0.18501681,0.07066394,3.8824983,-6.114997,-199.28723,-305.50195,0.5627531,-0.9655336,46.679024,385000
39
+ 197.49933,0.18322244,0.07418336,4.2768397,-8.502601,-199.90302,-303.4367,0.47615954,-0.4587711,51.410973,390000
40
+ 200.59944,0.19193754,0.07570805,5.2629104,-7.159084,-202.9506,-307.09537,0.96392214,-0.63910186,54.630096,395000
41
+ 195.20967,0.18776149,0.08233004,4.1065135,-16.747885,-197.89708,-304.75415,0.96125126,-0.6945939,52.724976,400000
42
+ 193.81885,0.20596635,0.07696968,4.1222796,-8.752255,-196.40721,-306.44916,1.174021,-1.283145,72.18397,405000
43
+ 198.86903,0.17093413,0.07431771,3.6004562,-3.3332832,-201.49248,-302.3186,0.46471328,-0.51947135,44.99168,410000
44
+ 195.0907,0.22467287,0.080097176,4.8223653,-8.400207,-197.21135,-306.27316,1.4234669,-0.9405937,81.96872,415000
45
+ 198.41772,0.17390552,0.07775659,4.25893,-5.518412,-200.90433,-306.6232,0.48052785,-1.0339053,54.42254,420000
46
+ 201.52289,0.20455709,0.08081303,4.570183,-6.440452,-203.93622,-305.59747,0.81797445,-0.7939724,61.604233,425000
47
+ 200.91856,0.20449333,0.07711245,3.6066551,-9.979294,-203.43958,-303.4986,0.89185226,-0.61430347,49.003036,430000
48
+ 202.11694,0.19675669,0.07317677,3.0376604,-11.555157,-204.2796,-305.25674,0.7188722,-1.0174208,44.337646,435000
49
+ 199.16333,0.2210662,0.07605782,3.799174,-9.32201,-201.36618,-299.89407,0.90860945,-2.4887686,71.12215,440000
50
+ 194.70111,0.20274709,0.07913547,5.271301,1.1395278,-197.0312,-303.73514,1.4481344,-1.2342988,71.98244,445000
51
+ 204.89276,0.17509855,0.07683371,4.3277164,-2.6283216,-207.49983,-304.37695,0.8192203,-0.6310431,51.416687,450000
52
+ 198.71594,0.1784454,0.07055347,3.426962,-1.4933423,-201.16043,-304.30484,0.4547193,-1.045078,49.077374,455000
53
+ 198.96869,0.22437312,0.06863469,4.482888,-4.47317,-201.16446,-304.62622,0.5342024,-1.0154036,63.30857,460000
54
+ 197.11507,0.17443252,0.07497052,3.1936195,-11.627894,-199.33902,-305.67386,0.62704945,-0.9786635,46.67102,465000
55
+ 198.93338,0.20348373,0.07436135,3.234471,-10.340691,-201.33452,-295.34088,1.3291477,-0.49843156,47.615856,470000
56
+ 197.76105,0.19966432,0.07580799,3.1272428,-4.7512484,-199.84581,-307.4728,1.772891,-2.1412969,58.622917,475000
57
+ 196.74985,0.2044077,0.06857388,3.4084759,-4.9090242,-199.02942,-300.6575,0.41014266,-0.83004,43.49308,480000
58
+ 198.0944,0.16156706,0.071600385,3.0156019,-5.559214,-200.51678,-301.8476,2.5247593,-0.8134826,45.149086,485000
59
+ 192.88524,0.18778643,0.07319867,2.9939203,-8.159991,-195.18947,-305.3073,0.467852,-0.97517,51.481853,490000
60
+ 202.15372,0.19715169,0.07405125,4.553123,-9.207069,-204.30501,-303.8401,1.0759686,-0.9059949,53.033222,495000
61
+ 198.44527,0.18220054,0.07573603,3.1669743,-8.60617,-200.80292,-306.24277,0.44113588,-0.34547913,41.644325,500000
62
+ 194.93619,0.20489313,0.072815895,4.383677,-1.2075025,-197.10631,-303.58267,1.4680177,-0.65563005,57.417404,505000
63
+ 192.5097,0.2207219,0.07631655,3.2991104,-3.5175838,-194.93094,-305.75,0.8179101,-0.6716564,45.072502,510000
64
+ 189.94356,0.19556472,0.07648427,3.8567193,-1.7617314,-192.60034,-304.16785,1.1560137,-0.47146085,49.482224,515000
65
+ 183.95659,0.1856674,0.071459465,4.506075,-2.6227055,-186.26147,-300.7474,0.9770409,-0.38175288,47.48589,520000
66
+ 197.35347,0.1712931,0.074659646,3.3609369,-7.0136704,-200.06075,-305.6883,0.5266571,-2.1591735,53.551895,525000
67
+ 192.63692,0.19618389,0.0690897,4.4414096,-8.167323,-195.06165,-304.55646,0.78240705,-0.76925766,53.57838,530000
68
+ 189.58418,0.21989235,0.06935962,3.946402,-1.9826052,-191.68668,-299.42813,1.2367336,-0.48539662,47.692097,535000
69
+ 199.93497,0.17984095,0.067125596,2.6158798,2.321385,-201.88379,-305.66766,0.46220744,-0.5664075,36.733562,540000
70
+ 198.31706,0.21289438,0.073054165,3.0497844,-6.9768586,-200.64867,-305.26788,0.64357674,-0.72835314,42.28832,545000
71
+ 190.98741,0.17357363,0.066256955,2.912258,-2.681069,-193.34993,-306.77756,0.9892359,-0.6683556,47.97386,550000
72
+ 195.34637,0.20555954,0.0754378,3.7977078,-4.5893164,-197.98262,-305.4031,0.3705391,-0.49195355,43.504787,555000
73
+ 190.56961,0.18812984,0.07805291,6.812043,-8.352745,-193.1668,-304.586,3.3506444,-3.5134842,146.43439,560000
74
+ 200.08794,0.1989243,0.07023758,2.723625,-3.9908392,-202.06459,-306.23987,0.29121923,-0.9049493,39.087204,565000
75
+ 184.29893,0.18406045,0.06906479,3.3828523,-0.7969015,-186.71387,-304.40137,1.691789,-0.8740783,62.294437,570000
76
+ 192.83667,0.21041976,0.07325685,3.7337246,-2.070329,-195.20583,-300.0803,0.588382,-1.5156701,61.212883,575000
77
+ 192.86058,0.1706584,0.073898315,3.0686882,-11.876755,-195.37436,-305.3514,0.5417867,-0.7317611,42.457623,580000
78
+ 191.96896,0.17565742,0.073124506,3.0366106,-0.269903,-194.37457,-303.61472,0.35570574,-0.5394885,39.492928,585000
79
+ 188.96555,0.1803146,0.07190576,2.7235205,-2.714522,-191.27855,-299.39636,1.1326996,-0.3697896,44.54649,590000
80
+ 194.89777,0.19185041,0.06787133,3.3212304,-6.137928,-197.15819,-304.7881,2.0268564,-1.0057173,55.180595,595000
81
+ 187.94057,0.18417539,0.07275171,2.9904556,-6.9144344,-190.23119,-304.40118,0.39158425,-1.3089579,41.682346,600000
82
+ 190.27808,0.20892411,0.073447704,2.5795157,-4.4733825,-192.38602,-299.7684,0.8835082,-0.2540486,37.590298,605000
83
+ 193.3964,0.19827595,0.07145168,2.9726667,-5.7761526,-195.71695,-305.6084,0.7112915,-1.572984,49.39122,610000
84
+ 184.25684,0.17534252,0.06772201,3.3251755,-6.4500604,-186.35693,-304.24088,0.80120015,-0.55461323,44.237446,615000
85
+ 192.23343,0.1744388,0.07613548,2.5403988,-0.59162825,-194.71964,-296.97342,0.6640805,-2.2758825,51.37629,620000
86
+ 192.83339,0.18111266,0.061813373,3.9436085,-3.4594328,-194.84483,-300.35004,0.5823705,-1.1344548,48.32788,625000
87
+ 189.841,0.17017087,0.071032494,3.3055508,-5.1747303,-192.34322,-304.05643,0.97171086,-1.1722553,52.97595,630000
88
+ 188.17764,0.17977285,0.072257586,3.0120323,-3.420364,-190.6363,-304.42093,1.4909089,-0.4197499,54.543816,635000
89
+ 185.10193,0.18825206,0.0787183,3.989956,-2.9212341,-187.7725,-299.91382,1.0832964,-0.75481105,56.73751,640000
90
+ 181.9468,0.17849003,0.072138,3.3373935,-1.760951,-184.199,-304.9745,0.41790938,-0.60877806,40.894363,645000
91
+ 184.81647,0.20408845,0.07369916,3.158472,-1.9148054,-187.58855,-304.48532,1.3896173,-0.45232537,45.679188,650000
92
+ 191.14542,0.21876991,0.06819723,2.8304093,-3.4837048,-193.08963,-305.22385,1.3706298,-0.61861384,44.77105,655000
93
+ 177.42125,0.20275906,0.06743956,2.5111182,-4.993872,-179.40558,-305.59033,0.48327848,-1.0057598,42.827766,660000
94
+ 184.54839,0.18571696,0.06617538,3.0177636,-7.7068353,-186.74838,-301.75653,1.4452455,-0.82931525,50.3909,665000
95
+ 186.59593,0.19343287,0.07060431,3.3127403,-4.0476227,-188.77814,-304.63675,0.44773144,-0.9971028,42.240627,670000
96
+ 183.11311,0.19359244,0.06674534,2.8096364,-4.46571,-185.44962,-306.4961,0.7369728,-1.1323128,43.102768,675000
97
+ 194.19693,0.19033714,0.0713588,2.795015,-6.453324,-196.60686,-303.3389,0.78815424,-0.6395461,43.260445,680000
98
+ 192.73866,0.17964822,0.06548831,2.2481499,-4.4019823,-194.92473,-300.87012,1.4535326,-1.0122968,40.979992,685000
99
+ 181.40593,0.18718214,0.06859675,2.602405,-2.667825,-183.79482,-304.0094,1.284225,-0.7455632,42.068123,690000
100
+ 184.08386,0.21367773,0.06741838,2.734102,-3.4923685,-186.36589,-303.96527,1.1331127,-0.40957534,41.311066,695000
101
+ 189.89156,0.20577219,0.07177734,2.807512,-5.6322002,-192.30077,-307.39035,0.71439075,-0.7045894,45.23936,700000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_250000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:203377fc57f5da9044355e291530c798b5e09d5b02d8a7b68489bef61d15bf55
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_300000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34f6e5aa51c1426ae949861bd6bd442b5fff95d86b5f081f38adb878cd045999
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_350000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c13f6930e34ad2b683cbc3f2af4fd7ecc7defc88b8db306cda207dd86c922ae
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_400000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c537cc19e35c27faf822ac73fe57dfb63d6f7252ae16af4f1bc450a46eae3a98
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_450000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e79c9e4c4110075b8ddc026bb92d9dbb60e1ba0e01d35a542429d12983e12b0
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_500000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4587f81bcad15943b91a623612b124299a7a2acf5e01b821c0cd5d63acc4cac
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_550000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c36c131f073d9daebba80dba0e1e6ea76ba6dfb36fd0d20469261fc88f5352ee
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_600000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81fa489bf231b288cdd211d5280ecc634eef1c7fa88b1f700c1f3cd2482d9ad
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_650000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bf29a35475c93becbf31dafe7ebaeadad634cc6173887a9cd3a487b8df74c32
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/params_700000.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:126d54c35c8476143689a9f1c4d01d1581d830ca4de6474613b88e2156fc8b77
3
+ size 219185966
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/progress.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ online,500000
O2O-w-diff-ckpts/cube-triple-play-singletask-task1-v0/fql/20260324_204545/token.tk ADDED
@@ -0,0 +1 @@
 
 
1
+ https://wandb.ai/tiredsheep-national-taiwan-university/qam-finetune-OfflineRL/runs/ctcpurxq