amirali1985 commited on
Commit
8efdd7d
·
verified ·
1 Parent(s): 295fd9c

Upload queue_status.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. queue_status.json +28 -28
queue_status.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "timestamp": "2026-04-16 05:37:17",
3
  "total": 20,
4
  "pending": 2,
5
- "running": 6,
6
- "done": 11,
7
  "failed": 1,
8
  "stale": 0,
9
  "retrying": 0,
@@ -15,7 +15,7 @@
15
  "gpu": 0,
16
  "status": "failed",
17
  "elapsed": 7,
18
- "idle_time": 16019,
19
  "exit_code": 2,
20
  "retries": 1,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs30_K1_100K_emlr5_2L_gpu0.log"
@@ -27,7 +27,7 @@
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 10909,
30
- "idle_time": 5128,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs30_K1_50K_ig1_2L1H1_gpu1.log"
@@ -39,7 +39,7 @@
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 10932,
42
- "idle_time": 5105,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs30_K1_50K_ig1_1L3H5_gpu2.log"
@@ -51,7 +51,7 @@
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 9082,
54
- "idle_time": 6955,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs30_K1_50K_ig5_2L1H1_gpu0.log"
@@ -63,7 +63,7 @@
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 10997,
66
- "idle_time": 5040,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs30_K1_50K_ig5_1L3H5_gpu1.log"
@@ -75,7 +75,7 @@
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 10836,
78
- "idle_time": 5201,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs30_K1_50K_abs05_2L1_gpu2.log"
@@ -110,8 +110,8 @@
110
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 1 --num",
111
  "gpu": 1,
112
  "status": "running",
113
- "elapsed": 59,
114
- "idle_time": 16,
115
  "exit_code": -1,
116
  "retries": 0,
117
  "log_file": "/tmp/gpu_queue/job_008_as_sorl_abs30_K1_50K_abs001_1L_gpu1.log"
@@ -122,7 +122,7 @@
122
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
123
  "gpu": 0,
124
  "status": "running",
125
- "elapsed": 1419,
126
  "idle_time": 9,
127
  "exit_code": -1,
128
  "retries": 0,
@@ -134,8 +134,8 @@
134
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
135
  "gpu": 2,
136
  "status": "running",
137
- "elapsed": 109,
138
- "idle_time": 9,
139
  "exit_code": -1,
140
  "retries": 0,
141
  "log_file": "/tmp/gpu_queue/job_010_as_sorl_abs30_K4_100K_1L2H256d_gpu2.log"
@@ -146,8 +146,8 @@
146
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
147
  "gpu": 0,
148
  "status": "running",
149
- "elapsed": 3589,
150
- "idle_time": 53,
151
  "exit_code": -1,
152
  "retries": 0,
153
  "log_file": "/tmp/gpu_queue/job_011_as_sorl_abs30_K4_100K_1L3H510d_gpu0.log"
@@ -159,7 +159,7 @@
159
  "gpu": 0,
160
  "status": "done",
161
  "elapsed": 1450,
162
- "idle_time": 14567,
163
  "exit_code": 0,
164
  "retries": 0,
165
  "log_file": "/tmp/gpu_queue/job_012_as_baseline_10K_2L3H510d_gpu0.log"
@@ -169,10 +169,10 @@
169
  "name": "as_sorl_abs1_K1_10K_2L3H510d",
170
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 1 --K 1 --num_",
171
  "gpu": 2,
172
- "status": "running",
173
- "elapsed": 5099,
174
- "idle_time": 368,
175
- "exit_code": -1,
176
  "retries": 0,
177
  "log_file": "/tmp/gpu_queue/job_013_as_sorl_abs1_K1_10K_2L3H510d_gpu2.log"
178
  },
@@ -182,8 +182,8 @@
182
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 2 --K 1 --num_",
183
  "gpu": 1,
184
  "status": "running",
185
- "elapsed": 5034,
186
- "idle_time": 324,
187
  "exit_code": -1,
188
  "retries": 0,
189
  "log_file": "/tmp/gpu_queue/job_014_as_sorl_abs2_K1_10K_2L3H510d_gpu1.log"
@@ -195,7 +195,7 @@
195
  "gpu": 0,
196
  "status": "done",
197
  "elapsed": 5222,
198
- "idle_time": 3595,
199
  "exit_code": 0,
200
  "retries": 0,
201
  "log_file": "/tmp/gpu_queue/job_015_as_sorl_abs5_K1_10K_2L3H510d_gpu0.log"
@@ -207,7 +207,7 @@
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 5062,
210
- "idle_time": 64,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_sorl_abs10_K1_10K_2L3H510d_gpu1.log"
@@ -219,7 +219,7 @@
219
  "gpu": 2,
220
  "status": "done",
221
  "elapsed": 5089,
222
- "idle_time": 112,
223
  "exit_code": 0,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_sorl_abs20_K1_10K_2L3H510d_gpu2.log"
@@ -231,7 +231,7 @@
231
  "gpu": 0,
232
  "status": "done",
233
  "elapsed": 5528,
234
- "idle_time": 1424,
235
  "exit_code": 0,
236
  "retries": 0,
237
  "log_file": "/tmp/gpu_queue/job_018_as_sorl_abs30_K1_10K_2L3H510d_gpu0.log"
@@ -243,7 +243,7 @@
243
  "gpu": 0,
244
  "status": "done",
245
  "elapsed": 5747,
246
- "idle_time": 8819,
247
  "exit_code": 0,
248
  "retries": 0,
249
  "log_file": "/tmp/gpu_queue/job_019_as_sorl_abs50_K1_10K_2L3H510d_gpu0.log"
 
1
  {
2
+ "timestamp": "2026-04-16 05:37:35",
3
  "total": 20,
4
  "pending": 2,
5
+ "running": 5,
6
+ "done": 12,
7
  "failed": 1,
8
  "stale": 0,
9
  "retrying": 0,
 
15
  "gpu": 0,
16
  "status": "failed",
17
  "elapsed": 7,
18
+ "idle_time": 16038,
19
  "exit_code": 2,
20
  "retries": 1,
21
  "log_file": "/tmp/gpu_queue/job_000_as_sorl_abs30_K1_100K_emlr5_2L_gpu0.log"
 
27
  "gpu": 1,
28
  "status": "done",
29
  "elapsed": 10909,
30
+ "idle_time": 5147,
31
  "exit_code": 0,
32
  "retries": 0,
33
  "log_file": "/tmp/gpu_queue/job_001_as_sorl_abs30_K1_50K_ig1_2L1H1_gpu1.log"
 
39
  "gpu": 2,
40
  "status": "done",
41
  "elapsed": 10932,
42
+ "idle_time": 5123,
43
  "exit_code": 0,
44
  "retries": 0,
45
  "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs30_K1_50K_ig1_1L3H5_gpu2.log"
 
51
  "gpu": 0,
52
  "status": "done",
53
  "elapsed": 9082,
54
+ "idle_time": 6974,
55
  "exit_code": 0,
56
  "retries": 0,
57
  "log_file": "/tmp/gpu_queue/job_003_as_sorl_abs30_K1_50K_ig5_2L1H1_gpu0.log"
 
63
  "gpu": 1,
64
  "status": "done",
65
  "elapsed": 10997,
66
+ "idle_time": 5059,
67
  "exit_code": 0,
68
  "retries": 0,
69
  "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs30_K1_50K_ig5_1L3H5_gpu1.log"
 
75
  "gpu": 2,
76
  "status": "done",
77
  "elapsed": 10836,
78
+ "idle_time": 5220,
79
  "exit_code": 0,
80
  "retries": 0,
81
  "log_file": "/tmp/gpu_queue/job_005_as_sorl_abs30_K1_50K_abs05_2L1_gpu2.log"
 
110
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 1 --num",
111
  "gpu": 1,
112
  "status": "running",
113
+ "elapsed": 77,
114
+ "idle_time": 1,
115
  "exit_code": -1,
116
  "retries": 0,
117
  "log_file": "/tmp/gpu_queue/job_008_as_sorl_abs30_K1_50K_abs001_1L_gpu1.log"
 
122
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
123
  "gpu": 0,
124
  "status": "running",
125
+ "elapsed": 1438,
126
  "idle_time": 9,
127
  "exit_code": -1,
128
  "retries": 0,
 
134
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
135
  "gpu": 2,
136
  "status": "running",
137
+ "elapsed": 127,
138
+ "idle_time": 2,
139
  "exit_code": -1,
140
  "retries": 0,
141
  "log_file": "/tmp/gpu_queue/job_010_as_sorl_abs30_K4_100K_1L2H256d_gpu2.log"
 
146
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu",
147
  "gpu": 0,
148
  "status": "running",
149
+ "elapsed": 3608,
150
+ "idle_time": 71,
151
  "exit_code": -1,
152
  "retries": 0,
153
  "log_file": "/tmp/gpu_queue/job_011_as_sorl_abs30_K4_100K_1L3H510d_gpu0.log"
 
159
  "gpu": 0,
160
  "status": "done",
161
  "elapsed": 1450,
162
+ "idle_time": 14586,
163
  "exit_code": 0,
164
  "retries": 0,
165
  "log_file": "/tmp/gpu_queue/job_012_as_baseline_10K_2L3H510d_gpu0.log"
 
169
  "name": "as_sorl_abs1_K1_10K_2L3H510d",
170
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 1 --K 1 --num_",
171
  "gpu": 2,
172
+ "status": "done",
173
+ "elapsed": 5118,
174
+ "idle_time": 2,
175
+ "exit_code": 0,
176
  "retries": 0,
177
  "log_file": "/tmp/gpu_queue/job_013_as_sorl_abs1_K1_10K_2L3H510d_gpu2.log"
178
  },
 
182
  "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 2 --K 1 --num_",
183
  "gpu": 1,
184
  "status": "running",
185
+ "elapsed": 5053,
186
+ "idle_time": 343,
187
  "exit_code": -1,
188
  "retries": 0,
189
  "log_file": "/tmp/gpu_queue/job_014_as_sorl_abs2_K1_10K_2L3H510d_gpu1.log"
 
195
  "gpu": 0,
196
  "status": "done",
197
  "elapsed": 5222,
198
+ "idle_time": 3614,
199
  "exit_code": 0,
200
  "retries": 0,
201
  "log_file": "/tmp/gpu_queue/job_015_as_sorl_abs5_K1_10K_2L3H510d_gpu0.log"
 
207
  "gpu": 1,
208
  "status": "done",
209
  "elapsed": 5062,
210
+ "idle_time": 83,
211
  "exit_code": 0,
212
  "retries": 0,
213
  "log_file": "/tmp/gpu_queue/job_016_as_sorl_abs10_K1_10K_2L3H510d_gpu1.log"
 
219
  "gpu": 2,
220
  "status": "done",
221
  "elapsed": 5089,
222
+ "idle_time": 131,
223
  "exit_code": 0,
224
  "retries": 0,
225
  "log_file": "/tmp/gpu_queue/job_017_as_sorl_abs20_K1_10K_2L3H510d_gpu2.log"
 
231
  "gpu": 0,
232
  "status": "done",
233
  "elapsed": 5528,
234
+ "idle_time": 1443,
235
  "exit_code": 0,
236
  "retries": 0,
237
  "log_file": "/tmp/gpu_queue/job_018_as_sorl_abs30_K1_10K_2L3H510d_gpu0.log"
 
243
  "gpu": 0,
244
  "status": "done",
245
  "elapsed": 5747,
246
+ "idle_time": 8838,
247
  "exit_code": 0,
248
  "retries": 0,
249
  "log_file": "/tmp/gpu_queue/job_019_as_sorl_abs50_K1_10K_2L3H510d_gpu0.log"