amirali1985 committed on
Commit
bd32447
·
verified ·
1 Parent(s): 7929035

Upload queue_status.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. queue_status.json +24 -24
queue_status.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "timestamp": "2026-04-15 07:13:04",
3
  "total": 59,
4
  "pending": 40,
5
  "running": 6,
@@ -15,7 +15,7 @@
15
  "gpu": 0,
16
  "status": "done",
17
  "elapsed": 19215,
18
- "idle_time": 15111,
19
  "exit_code": 0,
20
  "retries": 0,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs20_K1_100K_2L1H128d_gpu0.log"
@@ -27,7 +27,7 @@
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 17962,
30
- "idle_time": 16364,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs20_K1_100K_1L2H256d_gpu1.log"
@@ -39,7 +39,7 @@
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 20071,
42
- "idle_time": 14255,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs20_K1_100K_1L3H510d_gpu2.log"
@@ -51,7 +51,7 @@
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 19232,
54
- "idle_time": 15095,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs1_K1_100K_2L1H128d_gpu0.log"
@@ -63,7 +63,7 @@
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 17980,
66
- "idle_time": 16346,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs1_K1_100K_1L2H256d_gpu1.log"
@@ -75,7 +75,7 @@
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 20071,
78
- "idle_time": 14255,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs1_K1_100K_1L3H510d_gpu2.log"
@@ -86,7 +86,7 @@
86
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 2 --K 1 --num",
87
  "gpu": 2,
88
  "status": "running",
89
- "elapsed": 9852,
90
  "idle_time": 7,
91
  "exit_code": -1,
92
  "retries": 0,
@@ -123,7 +123,7 @@
123
  "gpu": 1,
124
  "status": "done",
125
  "elapsed": 15057,
126
- "idle_time": 1287,
127
  "exit_code": 0,
128
  "retries": 0,
129
  "log_file": "/tmp/gpu_queue/job_009_as_sorl_abs5_K1_100K_2L1H128d_gpu1.log"
@@ -207,7 +207,7 @@
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 1347,
210
- "idle_time": 5342,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_baseline_10K_1L2H256d_gpu1.log"
@@ -218,8 +218,8 @@
218
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 10000 --num_epochs 20 --n_la",
219
  "gpu": 1,
220
  "status": "running",
221
- "elapsed": 1282,
222
- "idle_time": 86,
223
  "exit_code": -1,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_baseline_10K_1L3H510d_gpu1.log"
@@ -267,7 +267,7 @@
267
  "gpu": 1,
268
  "status": "done",
269
  "elapsed": 1517,
270
- "idle_time": 6692,
271
  "exit_code": 0,
272
  "retries": 0,
273
  "log_file": "/tmp/gpu_queue/job_021_as_baseline_25K_2L1H128d_gpu1.log"
@@ -314,7 +314,7 @@
314
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 30 --K 1 --num",
315
  "gpu": 1,
316
  "status": "running",
317
- "elapsed": 5337,
318
  "idle_time": 10,
319
  "exit_code": -1,
320
  "retries": 0,
@@ -327,7 +327,7 @@
327
  "gpu": 1,
328
  "status": "done",
329
  "elapsed": 8147,
330
- "idle_time": 8213,
331
  "exit_code": 0,
332
  "retries": 0,
333
  "log_file": "/tmp/gpu_queue/job_026_as_sorl_abs30_K1_25K_1L3H510d_gpu1.log"
@@ -363,7 +363,7 @@
363
  "gpu": 2,
364
  "status": "done",
365
  "elapsed": 2052,
366
- "idle_time": 9857,
367
  "exit_code": 0,
368
  "retries": 0,
369
  "log_file": "/tmp/gpu_queue/job_029_as_baseline_50K_1L3H510d_gpu2.log"
@@ -375,7 +375,7 @@
375
  "gpu": 0,
376
  "status": "done",
377
  "elapsed": 11753,
378
- "idle_time": 3357,
379
  "exit_code": 0,
380
  "retries": 0,
381
  "log_file": "/tmp/gpu_queue/job_030_as_sorl_abs30_K1_50K_2L1H128d_gpu0.log"
@@ -411,7 +411,7 @@
411
  "gpu": 2,
412
  "status": "done",
413
  "elapsed": 2343,
414
- "idle_time": 11912,
415
  "exit_code": 0,
416
  "retries": 0,
417
  "log_file": "/tmp/gpu_queue/job_033_as_baseline_100K_2L1H128d_gpu2.log"
@@ -446,8 +446,8 @@
446
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
447
  "gpu": 0,
448
  "status": "running",
449
- "elapsed": 3352,
450
- "idle_time": 23,
451
  "exit_code": -1,
452
  "retries": 0,
453
  "log_file": "/tmp/gpu_queue/job_036_as_sorl_abs30_K1_100K_2L1H128d_gpu0.log"
@@ -458,8 +458,8 @@
458
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
459
  "gpu": 2,
460
  "status": "running",
461
- "elapsed": 14252,
462
- "idle_time": 131,
463
  "exit_code": -1,
464
  "retries": 0,
465
  "log_file": "/tmp/gpu_queue/job_037_as_sorl_abs30_K1_100K_1L2H256d_gpu2.log"
@@ -470,8 +470,8 @@
470
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
471
  "gpu": 0,
472
  "status": "running",
473
- "elapsed": 15093,
474
- "idle_time": 18,
475
  "exit_code": -1,
476
  "retries": 0,
477
  "log_file": "/tmp/gpu_queue/job_038_as_sorl_abs30_K1_100K_1L3H510d_gpu0.log"
 
1
  {
2
+ "timestamp": "2026-04-15 07:13:34",
3
  "total": 59,
4
  "pending": 40,
5
  "running": 6,
 
15
  "gpu": 0,
16
  "status": "done",
17
  "elapsed": 19215,
18
+ "idle_time": 15141,
19
  "exit_code": 0,
20
  "retries": 0,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs20_K1_100K_2L1H128d_gpu0.log"
 
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 17962,
30
+ "idle_time": 16395,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs20_K1_100K_1L2H256d_gpu1.log"
 
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 20071,
42
+ "idle_time": 14286,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs20_K1_100K_1L3H510d_gpu2.log"
 
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 19232,
54
+ "idle_time": 15125,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs1_K1_100K_2L1H128d_gpu0.log"
 
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 17980,
66
+ "idle_time": 16377,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs1_K1_100K_1L2H256d_gpu1.log"
 
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 20071,
78
+ "idle_time": 14286,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs1_K1_100K_1L3H510d_gpu2.log"
 
86
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 2 --K 1 --num",
87
  "gpu": 2,
88
  "status": "running",
89
+ "elapsed": 9883,
90
  "idle_time": 7,
91
  "exit_code": -1,
92
  "retries": 0,
 
123
  "gpu": 1,
124
  "status": "done",
125
  "elapsed": 15057,
126
+ "idle_time": 1318,
127
  "exit_code": 0,
128
  "retries": 0,
129
  "log_file": "/tmp/gpu_queue/job_009_as_sorl_abs5_K1_100K_2L1H128d_gpu1.log"
 
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 1347,
210
+ "idle_time": 5373,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_baseline_10K_1L2H256d_gpu1.log"
 
218
  "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 10000 --num_epochs 20 --n_la",
219
  "gpu": 1,
220
  "status": "running",
221
+ "elapsed": 1312,
222
+ "idle_time": 117,
223
  "exit_code": -1,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_baseline_10K_1L3H510d_gpu1.log"
 
267
  "gpu": 1,
268
  "status": "done",
269
  "elapsed": 1517,
270
+ "idle_time": 6723,
271
  "exit_code": 0,
272
  "retries": 0,
273
  "log_file": "/tmp/gpu_queue/job_021_as_baseline_25K_2L1H128d_gpu1.log"
 
314
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 30 --K 1 --num",
315
  "gpu": 1,
316
  "status": "running",
317
+ "elapsed": 5367,
318
  "idle_time": 10,
319
  "exit_code": -1,
320
  "retries": 0,
 
327
  "gpu": 1,
328
  "status": "done",
329
  "elapsed": 8147,
330
+ "idle_time": 8243,
331
  "exit_code": 0,
332
  "retries": 0,
333
  "log_file": "/tmp/gpu_queue/job_026_as_sorl_abs30_K1_25K_1L3H510d_gpu1.log"
 
363
  "gpu": 2,
364
  "status": "done",
365
  "elapsed": 2052,
366
+ "idle_time": 9888,
367
  "exit_code": 0,
368
  "retries": 0,
369
  "log_file": "/tmp/gpu_queue/job_029_as_baseline_50K_1L3H510d_gpu2.log"
 
375
  "gpu": 0,
376
  "status": "done",
377
  "elapsed": 11753,
378
+ "idle_time": 3388,
379
  "exit_code": 0,
380
  "retries": 0,
381
  "log_file": "/tmp/gpu_queue/job_030_as_sorl_abs30_K1_50K_2L1H128d_gpu0.log"
 
411
  "gpu": 2,
412
  "status": "done",
413
  "elapsed": 2343,
414
+ "idle_time": 11942,
415
  "exit_code": 0,
416
  "retries": 0,
417
  "log_file": "/tmp/gpu_queue/job_033_as_baseline_100K_2L1H128d_gpu2.log"
 
446
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
447
  "gpu": 0,
448
  "status": "running",
449
+ "elapsed": 3382,
450
+ "idle_time": 4,
451
  "exit_code": -1,
452
  "retries": 0,
453
  "log_file": "/tmp/gpu_queue/job_036_as_sorl_abs30_K1_100K_2L1H128d_gpu0.log"
 
458
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
459
  "gpu": 2,
460
  "status": "running",
461
+ "elapsed": 14283,
462
+ "idle_time": 162,
463
  "exit_code": -1,
464
  "retries": 0,
465
  "log_file": "/tmp/gpu_queue/job_037_as_sorl_abs30_K1_100K_1L2H256d_gpu2.log"
 
470
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu",
471
  "gpu": 0,
472
  "status": "running",
473
+ "elapsed": 15123,
474
+ "idle_time": 23,
475
  "exit_code": -1,
476
  "retries": 0,
477
  "log_file": "/tmp/gpu_queue/job_038_as_sorl_abs30_K1_100K_1L3H510d_gpu0.log"