amirali1985 commited on
Commit
cbf1406
·
verified ·
1 Parent(s): acc34eb

Upload queue_status.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. queue_status.json +40 -40
queue_status.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "timestamp": "2026-04-15 12:30:07",
3
  "total": 59,
4
  "pending": 26,
5
  "running": 6,
@@ -15,7 +15,7 @@
15
  "gpu": 0,
16
  "status": "done",
17
  "elapsed": 19215,
18
- "idle_time": 34135,
19
  "exit_code": 0,
20
  "retries": 0,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs20_K1_100K_2L1H128d_gpu0.log"
@@ -27,7 +27,7 @@
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 17962,
30
- "idle_time": 35388,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs20_K1_100K_1L2H256d_gpu1.log"
@@ -39,7 +39,7 @@
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 20071,
42
- "idle_time": 33279,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs20_K1_100K_1L3H510d_gpu2.log"
@@ -51,7 +51,7 @@
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 19232,
54
- "idle_time": 34118,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs1_K1_100K_2L1H128d_gpu0.log"
@@ -63,7 +63,7 @@
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 17980,
66
- "idle_time": 35370,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs1_K1_100K_1L2H256d_gpu1.log"
@@ -75,7 +75,7 @@
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 20071,
78
- "idle_time": 33279,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs1_K1_100K_1L3H510d_gpu2.log"
@@ -87,7 +87,7 @@
87
  "gpu": 2,
88
  "status": "done",
89
  "elapsed": 17731,
90
- "idle_time": 11147,
91
  "exit_code": 0,
92
  "retries": 0,
93
  "log_file": "/tmp/gpu_queue/job_006_as_sorl_abs2_K1_100K_2L1H128d_gpu2.log"
@@ -99,7 +99,7 @@
99
  "gpu": 1,
100
  "status": "done",
101
  "elapsed": 14745,
102
- "idle_time": 4222,
103
  "exit_code": 0,
104
  "retries": 0,
105
  "log_file": "/tmp/gpu_queue/job_007_as_sorl_abs2_K1_100K_1L2H256d_gpu1.log"
@@ -123,7 +123,7 @@
123
  "gpu": 1,
124
  "status": "done",
125
  "elapsed": 15057,
126
- "idle_time": 20311,
127
  "exit_code": 0,
128
  "retries": 0,
129
  "log_file": "/tmp/gpu_queue/job_009_as_sorl_abs5_K1_100K_2L1H128d_gpu1.log"
@@ -134,8 +134,8 @@
134
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 1 --num",
135
  "gpu": 0,
136
  "status": "running",
137
- "elapsed": 3919,
138
- "idle_time": 25,
139
  "exit_code": -1,
140
  "retries": 0,
141
  "log_file": "/tmp/gpu_queue/job_010_as_sorl_abs5_K1_100K_1L2H256d_gpu0.log"
@@ -146,8 +146,8 @@
146
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 1 --num",
147
  "gpu": 0,
148
  "status": "running",
149
- "elapsed": 16125,
150
- "idle_time": 22,
151
  "exit_code": -1,
152
  "retries": 0,
153
  "log_file": "/tmp/gpu_queue/job_011_as_sorl_abs5_K1_100K_1L3H510d_gpu0.log"
@@ -159,7 +159,7 @@
159
  "gpu": 2,
160
  "status": "done",
161
  "elapsed": 15640,
162
- "idle_time": 1012,
163
  "exit_code": 0,
164
  "retries": 0,
165
  "log_file": "/tmp/gpu_queue/job_012_as_sorl_abs50_K1_100K_2L1H128d_gpu2.log"
@@ -195,7 +195,7 @@
195
  "gpu": 2,
196
  "status": "done",
197
  "elapsed": 1366,
198
- "idle_time": 1880,
199
  "exit_code": 0,
200
  "retries": 0,
201
  "log_file": "/tmp/gpu_queue/job_015_as_baseline_10K_2L1H128d_gpu2.log"
@@ -207,7 +207,7 @@
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 1347,
210
- "idle_time": 24366,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_baseline_10K_1L2H256d_gpu1.log"
@@ -219,7 +219,7 @@
219
  "gpu": 1,
220
  "status": "done",
221
  "elapsed": 1337,
222
- "idle_time": 18970,
223
  "exit_code": 0,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_baseline_10K_1L3H510d_gpu1.log"
@@ -231,7 +231,7 @@
231
  "gpu": 1,
232
  "status": "done",
233
  "elapsed": 6071,
234
- "idle_time": 11266,
235
  "exit_code": 0,
236
  "retries": 0,
237
  "log_file": "/tmp/gpu_queue/job_018_as_sorl_abs30_K1_10K_2L1H128d_gpu1.log"
@@ -254,8 +254,8 @@
254
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 30 --K 1 --num",
255
  "gpu": 2,
256
  "status": "running",
257
- "elapsed": 1009,
258
- "idle_time": 122,
259
  "exit_code": -1,
260
  "retries": 0,
261
  "log_file": "/tmp/gpu_queue/job_020_as_sorl_abs30_K1_10K_1L3H510d_gpu2.log"
@@ -267,7 +267,7 @@
267
  "gpu": 1,
268
  "status": "done",
269
  "elapsed": 1517,
270
- "idle_time": 25716,
271
  "exit_code": 0,
272
  "retries": 0,
273
  "log_file": "/tmp/gpu_queue/job_021_as_baseline_25K_2L1H128d_gpu1.log"
@@ -279,7 +279,7 @@
279
  "gpu": 1,
280
  "status": "done",
281
  "elapsed": 1506,
282
- "idle_time": 2715,
283
  "exit_code": 0,
284
  "retries": 0,
285
  "log_file": "/tmp/gpu_queue/job_022_as_baseline_25K_1L2H256d_gpu1.log"
@@ -290,8 +290,8 @@
290
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --n_la",
291
  "gpu": 2,
292
  "status": "running",
293
- "elapsed": 239,
294
- "idle_time": 16,
295
  "exit_code": -1,
296
  "retries": 0,
297
  "log_file": "/tmp/gpu_queue/job_023_as_baseline_25K_1L3H510d_gpu2.log"
@@ -303,7 +303,7 @@
303
  "gpu": 2,
304
  "status": "done",
305
  "elapsed": 7897,
306
- "idle_time": 3249,
307
  "exit_code": 0,
308
  "retries": 0,
309
  "log_file": "/tmp/gpu_queue/job_024_as_sorl_abs30_K1_25K_2L1H128d_gpu2.log"
@@ -315,7 +315,7 @@
315
  "gpu": 1,
316
  "status": "done",
317
  "elapsed": 7025,
318
- "idle_time": 17338,
319
  "exit_code": 0,
320
  "retries": 0,
321
  "log_file": "/tmp/gpu_queue/job_025_as_sorl_abs30_K1_25K_1L2H256d_gpu1.log"
@@ -327,7 +327,7 @@
327
  "gpu": 1,
328
  "status": "done",
329
  "elapsed": 8147,
330
- "idle_time": 27237,
331
  "exit_code": 0,
332
  "retries": 0,
333
  "log_file": "/tmp/gpu_queue/job_026_as_sorl_abs30_K1_25K_1L3H510d_gpu1.log"
@@ -339,7 +339,7 @@
339
  "gpu": 1,
340
  "status": "done",
341
  "elapsed": 1789,
342
- "idle_time": 9472,
343
  "exit_code": 0,
344
  "retries": 0,
345
  "log_file": "/tmp/gpu_queue/job_027_as_baseline_50K_2L1H128d_gpu1.log"
@@ -351,7 +351,7 @@
351
  "gpu": 2,
352
  "status": "done",
353
  "elapsed": 1633,
354
- "idle_time": 243,
355
  "exit_code": 0,
356
  "retries": 0,
357
  "log_file": "/tmp/gpu_queue/job_028_as_baseline_50K_1L2H256d_gpu2.log"
@@ -363,7 +363,7 @@
363
  "gpu": 2,
364
  "status": "done",
365
  "elapsed": 2052,
366
- "idle_time": 28881,
367
  "exit_code": 0,
368
  "retries": 0,
369
  "log_file": "/tmp/gpu_queue/job_029_as_baseline_50K_1L3H510d_gpu2.log"
@@ -375,7 +375,7 @@
375
  "gpu": 0,
376
  "status": "done",
377
  "elapsed": 11753,
378
- "idle_time": 22381,
379
  "exit_code": 0,
380
  "retries": 0,
381
  "log_file": "/tmp/gpu_queue/job_030_as_sorl_abs30_K1_50K_2L1H128d_gpu0.log"
@@ -398,8 +398,8 @@
398
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 1 --num",
399
  "gpu": 1,
400
  "status": "running",
401
- "elapsed": 9469,
402
- "idle_time": 15,
403
  "exit_code": -1,
404
  "retries": 0,
405
  "log_file": "/tmp/gpu_queue/job_032_as_sorl_abs30_K1_50K_1L3H510d_gpu1.log"
@@ -411,7 +411,7 @@
411
  "gpu": 2,
412
  "status": "done",
413
  "elapsed": 2343,
414
- "idle_time": 30935,
415
  "exit_code": 0,
416
  "retries": 0,
417
  "log_file": "/tmp/gpu_queue/job_033_as_baseline_100K_2L1H128d_gpu2.log"
@@ -434,8 +434,8 @@
434
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --n_l",
435
  "gpu": 1,
436
  "status": "running",
437
- "elapsed": 2709,
438
- "idle_time": 121,
439
  "exit_code": -1,
440
  "retries": 0,
441
  "log_file": "/tmp/gpu_queue/job_035_as_baseline_100K_1L3H510d_gpu1.log"
@@ -447,7 +447,7 @@
447
  "gpu": 0,
448
  "status": "done",
449
  "elapsed": 18453,
450
- "idle_time": 3924,
451
  "exit_code": 0,
452
  "retries": 0,
453
  "log_file": "/tmp/gpu_queue/job_036_as_sorl_abs30_K1_100K_2L1H128d_gpu0.log"
@@ -459,7 +459,7 @@
459
  "gpu": 2,
460
  "status": "done",
461
  "elapsed": 16622,
462
- "idle_time": 16657,
463
  "exit_code": 0,
464
  "retries": 0,
465
  "log_file": "/tmp/gpu_queue/job_037_as_sorl_abs30_K1_100K_1L2H256d_gpu2.log"
@@ -471,7 +471,7 @@
471
  "gpu": 0,
472
  "status": "done",
473
  "elapsed": 17990,
474
- "idle_time": 16129,
475
  "exit_code": 0,
476
  "retries": 0,
477
  "log_file": "/tmp/gpu_queue/job_038_as_sorl_abs30_K1_100K_1L3H510d_gpu0.log"
 
1
  {
2
+ "timestamp": "2026-04-15 12:30:38",
3
  "total": 59,
4
  "pending": 26,
5
  "running": 6,
 
15
  "gpu": 0,
16
  "status": "done",
17
  "elapsed": 19215,
18
+ "idle_time": 34165,
19
  "exit_code": 0,
20
  "retries": 0,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs20_K1_100K_2L1H128d_gpu0.log"
 
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 17962,
30
+ "idle_time": 35418,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs20_K1_100K_1L2H256d_gpu1.log"
 
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 20071,
42
+ "idle_time": 33310,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs20_K1_100K_1L3H510d_gpu2.log"
 
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 19232,
54
+ "idle_time": 34149,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs1_K1_100K_2L1H128d_gpu0.log"
 
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 17980,
66
+ "idle_time": 35401,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs1_K1_100K_1L2H256d_gpu1.log"
 
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 20071,
78
+ "idle_time": 33310,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs1_K1_100K_1L3H510d_gpu2.log"
 
87
  "gpu": 2,
88
  "status": "done",
89
  "elapsed": 17731,
90
+ "idle_time": 11177,
91
  "exit_code": 0,
92
  "retries": 0,
93
  "log_file": "/tmp/gpu_queue/job_006_as_sorl_abs2_K1_100K_2L1H128d_gpu2.log"
 
99
  "gpu": 1,
100
  "status": "done",
101
  "elapsed": 14745,
102
+ "idle_time": 4252,
103
  "exit_code": 0,
104
  "retries": 0,
105
  "log_file": "/tmp/gpu_queue/job_007_as_sorl_abs2_K1_100K_1L2H256d_gpu1.log"
 
123
  "gpu": 1,
124
  "status": "done",
125
  "elapsed": 15057,
126
+ "idle_time": 20342,
127
  "exit_code": 0,
128
  "retries": 0,
129
  "log_file": "/tmp/gpu_queue/job_009_as_sorl_abs5_K1_100K_2L1H128d_gpu1.log"
 
134
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 1 --num",
135
  "gpu": 0,
136
  "status": "running",
137
+ "elapsed": 3950,
138
+ "idle_time": 6,
139
  "exit_code": -1,
140
  "retries": 0,
141
  "log_file": "/tmp/gpu_queue/job_010_as_sorl_abs5_K1_100K_1L2H256d_gpu0.log"
 
146
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 1 --num",
147
  "gpu": 0,
148
  "status": "running",
149
+ "elapsed": 16155,
150
+ "idle_time": 26,
151
  "exit_code": -1,
152
  "retries": 0,
153
  "log_file": "/tmp/gpu_queue/job_011_as_sorl_abs5_K1_100K_1L3H510d_gpu0.log"
 
159
  "gpu": 2,
160
  "status": "done",
161
  "elapsed": 15640,
162
+ "idle_time": 1043,
163
  "exit_code": 0,
164
  "retries": 0,
165
  "log_file": "/tmp/gpu_queue/job_012_as_sorl_abs50_K1_100K_2L1H128d_gpu2.log"
 
195
  "gpu": 2,
196
  "status": "done",
197
  "elapsed": 1366,
198
+ "idle_time": 1910,
199
  "exit_code": 0,
200
  "retries": 0,
201
  "log_file": "/tmp/gpu_queue/job_015_as_baseline_10K_2L1H128d_gpu2.log"
 
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 1347,
210
+ "idle_time": 24396,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_baseline_10K_1L2H256d_gpu1.log"
 
219
  "gpu": 1,
220
  "status": "done",
221
  "elapsed": 1337,
222
+ "idle_time": 19000,
223
  "exit_code": 0,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_baseline_10K_1L3H510d_gpu1.log"
 
231
  "gpu": 1,
232
  "status": "done",
233
  "elapsed": 6071,
234
+ "idle_time": 11296,
235
  "exit_code": 0,
236
  "retries": 0,
237
  "log_file": "/tmp/gpu_queue/job_018_as_sorl_abs30_K1_10K_2L1H128d_gpu1.log"
 
254
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 30 --K 1 --num",
255
  "gpu": 2,
256
  "status": "running",
257
+ "elapsed": 1039,
258
+ "idle_time": 5,
259
  "exit_code": -1,
260
  "retries": 0,
261
  "log_file": "/tmp/gpu_queue/job_020_as_sorl_abs30_K1_10K_1L3H510d_gpu2.log"
 
267
  "gpu": 1,
268
  "status": "done",
269
  "elapsed": 1517,
270
+ "idle_time": 25747,
271
  "exit_code": 0,
272
  "retries": 0,
273
  "log_file": "/tmp/gpu_queue/job_021_as_baseline_25K_2L1H128d_gpu1.log"
 
279
  "gpu": 1,
280
  "status": "done",
281
  "elapsed": 1506,
282
+ "idle_time": 2746,
283
  "exit_code": 0,
284
  "retries": 0,
285
  "log_file": "/tmp/gpu_queue/job_022_as_baseline_25K_1L2H256d_gpu1.log"
 
290
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --n_la",
291
  "gpu": 2,
292
  "status": "running",
293
+ "elapsed": 269,
294
+ "idle_time": 47,
295
  "exit_code": -1,
296
  "retries": 0,
297
  "log_file": "/tmp/gpu_queue/job_023_as_baseline_25K_1L3H510d_gpu2.log"
 
303
  "gpu": 2,
304
  "status": "done",
305
  "elapsed": 7897,
306
+ "idle_time": 3280,
307
  "exit_code": 0,
308
  "retries": 0,
309
  "log_file": "/tmp/gpu_queue/job_024_as_sorl_abs30_K1_25K_2L1H128d_gpu2.log"
 
315
  "gpu": 1,
316
  "status": "done",
317
  "elapsed": 7025,
318
+ "idle_time": 17368,
319
  "exit_code": 0,
320
  "retries": 0,
321
  "log_file": "/tmp/gpu_queue/job_025_as_sorl_abs30_K1_25K_1L2H256d_gpu1.log"
 
327
  "gpu": 1,
328
  "status": "done",
329
  "elapsed": 8147,
330
+ "idle_time": 27267,
331
  "exit_code": 0,
332
  "retries": 0,
333
  "log_file": "/tmp/gpu_queue/job_026_as_sorl_abs30_K1_25K_1L3H510d_gpu1.log"
 
339
  "gpu": 1,
340
  "status": "done",
341
  "elapsed": 1789,
342
+ "idle_time": 9503,
343
  "exit_code": 0,
344
  "retries": 0,
345
  "log_file": "/tmp/gpu_queue/job_027_as_baseline_50K_2L1H128d_gpu1.log"
 
351
  "gpu": 2,
352
  "status": "done",
353
  "elapsed": 1633,
354
+ "idle_time": 273,
355
  "exit_code": 0,
356
  "retries": 0,
357
  "log_file": "/tmp/gpu_queue/job_028_as_baseline_50K_1L2H256d_gpu2.log"
 
363
  "gpu": 2,
364
  "status": "done",
365
  "elapsed": 2052,
366
+ "idle_time": 28912,
367
  "exit_code": 0,
368
  "retries": 0,
369
  "log_file": "/tmp/gpu_queue/job_029_as_baseline_50K_1L3H510d_gpu2.log"
 
375
  "gpu": 0,
376
  "status": "done",
377
  "elapsed": 11753,
378
+ "idle_time": 22411,
379
  "exit_code": 0,
380
  "retries": 0,
381
  "log_file": "/tmp/gpu_queue/job_030_as_sorl_abs30_K1_50K_2L1H128d_gpu0.log"
 
398
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 1 --num",
399
  "gpu": 1,
400
  "status": "running",
401
+ "elapsed": 9500,
402
+ "idle_time": 28,
403
  "exit_code": -1,
404
  "retries": 0,
405
  "log_file": "/tmp/gpu_queue/job_032_as_sorl_abs30_K1_50K_1L3H510d_gpu1.log"
 
411
  "gpu": 2,
412
  "status": "done",
413
  "elapsed": 2343,
414
+ "idle_time": 30966,
415
  "exit_code": 0,
416
  "retries": 0,
417
  "log_file": "/tmp/gpu_queue/job_033_as_baseline_100K_2L1H128d_gpu2.log"
 
434
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --n_l",
435
  "gpu": 1,
436
  "status": "running",
437
+ "elapsed": 2739,
438
+ "idle_time": 0,
439
  "exit_code": -1,
440
  "retries": 0,
441
  "log_file": "/tmp/gpu_queue/job_035_as_baseline_100K_1L3H510d_gpu1.log"
 
447
  "gpu": 0,
448
  "status": "done",
449
  "elapsed": 18453,
450
+ "idle_time": 3955,
451
  "exit_code": 0,
452
  "retries": 0,
453
  "log_file": "/tmp/gpu_queue/job_036_as_sorl_abs30_K1_100K_2L1H128d_gpu0.log"
 
459
  "gpu": 2,
460
  "status": "done",
461
  "elapsed": 16622,
462
+ "idle_time": 16687,
463
  "exit_code": 0,
464
  "retries": 0,
465
  "log_file": "/tmp/gpu_queue/job_037_as_sorl_abs30_K1_100K_1L2H256d_gpu2.log"
 
471
  "gpu": 0,
472
  "status": "done",
473
  "elapsed": 17990,
474
+ "idle_time": 16159,
475
  "exit_code": 0,
476
  "retries": 0,
477
  "log_file": "/tmp/gpu_queue/job_038_as_sorl_abs30_K1_100K_1L3H510d_gpu0.log"