{ "timestamp": "2026-04-12 08:11:05", "total": 120, "pending": 0, "running": 0, "done": 15, "failed": 105, "stale": 0, "retrying": 0, "jobs": [ { "job_id": 0, "name": "add_sub_baseline_10K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 10000 --num_epochs 20 --push", "gpu": 0, "status": "done", "elapsed": 1786, "idle_time": 20603, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_000_add_sub_baseline_10K_gpu0.log" }, { "job_id": 1, "name": "add_sub_baseline_25K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --push", "gpu": 1, "status": "done", "elapsed": 2101, "idle_time": 20288, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_001_add_sub_baseline_25K_gpu1.log" }, { "job_id": 2, "name": "as_sorl_abs10_K1_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 10 --K 1 --num", "gpu": 2, "status": "done", "elapsed": 4753, "idle_time": 17636, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_002_as_sorl_abs10_K1_25K_gpu2.log" }, { "job_id": 3, "name": "add_sub_baseline_50K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 50000 --num_epochs 20 --push", "gpu": 0, "status": "done", "elapsed": 2366, "idle_time": 20022, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_003_add_sub_baseline_50K_gpu0.log" }, { "job_id": 4, "name": "as_sorl_abs10_K1_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 10 --K 1 --num", "gpu": 1, "status": "done", "elapsed": 6727, "idle_time": 15662, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_004_as_sorl_abs10_K1_50K_gpu1.log" }, { "job_id": 5, "name": "add_sub_baseline_100K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --pus", "gpu": 2, "status": "done", "elapsed": 3112, "idle_time": 19276, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_005_add_sub_baseline_100K_gpu2.log" }, { "job_id": 6, "name": "as_sorl_abs10_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --nu", "gpu": 0, "status": "done", "elapsed": 8856, "idle_time": 11743, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_006_as_sorl_abs10_K1_100K_gpu0.log" }, { "job_id": 7, "name": "add_sub_baseline_250K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 250000 --num_epochs 20 --pus", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 45, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_007_add_sub_baseline_250K_gpu0.log" }, { "job_id": 8, "name": "as_sorl_abs10_K1_250K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 10 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 75, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_008_as_sorl_abs10_K1_250K_gpu0.log" }, { "job_id": 9, "name": "add_sub_baseline_500K", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 500000 --num_epochs 20 --pus", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 110, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_009_add_sub_baseline_500K_gpu1.log" }, { "job_id": 10, "name": "as_sorl_abs10_K1_10K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 10 --K 1 --num", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 159, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_010_as_sorl_abs10_K1_10K_gpu2.log" }, { "job_id": 11, "name": "as_sorl_abs2_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 2 --K 4 --num", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 215, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_011_as_sorl_abs2_K4_500K_gpu2.log" }, { "job_id": 12, "name": "as_sorl_abs5_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 5 --K 4 --num", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 175, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_012_as_sorl_abs5_K4_500K_gpu1.log" }, { "job_id": 13, "name": "as_sorl_abs10_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 4 --nu", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 1249, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_013_as_sorl_abs10_K4_500K_gpu0.log" }, { "job_id": 14, "name": "as_sorl_abs16_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 16 --K 4 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 140, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_014_as_sorl_abs16_K4_500K_gpu0.log" }, { "job_id": 15, "name": "as_sorl_abs20_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 20 --K 4 --nu", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 110, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_015_as_sorl_abs20_K4_500K_gpu2.log" }, { "job_id": 16, "name": "as_sorl_abs50_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 50 --K 4 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 145, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_016_as_sorl_abs50_K4_500K_gpu1.log" }, { "job_id": 17, "name": "as_sorl_abs70_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 70 --K 4 --nu", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 145, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_017_as_sorl_abs70_K4_500K_gpu2.log" }, { "job_id": 18, "name": "as_sorl_abs100_K4_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 4 --n", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 205, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_018_as_sorl_abs100_K4_500K_gpu2.log" }, { "job_id": 19, "name": "as_sorl_abs2_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 2 --K 1 --num", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 90, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_019_as_sorl_abs2_K1_500K_gpu1.log" }, { "job_id": 20, "name": "as_sorl_abs5_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 5 --K 1 --num", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 90, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_020_as_sorl_abs5_K1_500K_gpu1.log" }, { "job_id": 21, "name": "as_sorl_abs10_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 154, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_021_as_sorl_abs10_K1_500K_gpu0.log" }, { "job_id": 22, "name": "as_sorl_abs16_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 16 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 90, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_022_as_sorl_abs16_K1_500K_gpu0.log" }, { "job_id": 23, "name": "as_sorl_abs20_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 20 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 75, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_023_as_sorl_abs20_K1_500K_gpu1.log" }, { "job_id": 24, "name": "as_sorl_abs50_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 50 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 4, "idle_time": 136, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_024_as_sorl_abs50_K1_500K_gpu1.log" }, { "job_id": 25, "name": "as_sorl_abs70_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 70 --K 1 --nu", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 145, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_025_as_sorl_abs70_K1_500K_gpu2.log" }, { "job_id": 26, "name": "as_sorl_abs100_K1_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 1 --n", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 120, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_026_as_sorl_abs100_K1_500K_gpu1.log" }, { "job_id": 27, "name": "as_sorl_abs5_K1_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 5 --K 1 --num_", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 220, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_027_as_sorl_abs5_K1_25K_gpu0.log" }, { "job_id": 28, "name": "as_sorl_abs30_K1_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 30 --K 1 --num", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 154, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_028_as_sorl_abs30_K1_25K_gpu1.log" }, { "job_id": 29, "name": "as_sorl_abs50_K1_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 50 --K 1 --num", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 85, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_029_as_sorl_abs50_K1_25K_gpu0.log" }, { "job_id": 30, "name": "as_sorl_abs5_K1_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 5 --K 1 --num_", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 95, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_030_as_sorl_abs5_K1_50K_gpu2.log" }, { "job_id": 31, "name": "as_sorl_abs30_K1_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 1 --num", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 200, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_031_as_sorl_abs30_K1_50K_gpu2.log" }, { "job_id": 32, "name": "as_sorl_abs50_K1_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 50 --K 1 --num", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 119, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_032_as_sorl_abs50_K1_50K_gpu0.log" }, { "job_id": 33, "name": "as_sorl_abs5_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 1 --num", "gpu": 2, "status": "failed", "elapsed": 7, "idle_time": 159, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_033_as_sorl_abs5_K1_100K_gpu2.log" }, { "job_id": 34, "name": "as_sorl_abs30_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 184, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_034_as_sorl_abs30_K1_100K_gpu0.log" }, { "job_id": 35, "name": "as_sorl_abs50_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 50 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 200, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_035_as_sorl_abs50_K1_100K_gpu1.log" }, { "job_id": 36, "name": "as_sorl_abs5_K4_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 5 --K 4 --num_", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 95, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_036_as_sorl_abs5_K4_25K_gpu2.log" }, { "job_id": 37, "name": "as_sorl_abs10_K4_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 10 --K 4 --num", "gpu": 0, "status": "done", "elapsed": 4510, "idle_time": 15508, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_037_as_sorl_abs10_K4_25K_gpu0.log" }, { "job_id": 38, "name": "as_sorl_abs30_K4_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 30 --K 4 --num", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 184, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_038_as_sorl_abs30_K4_25K_gpu1.log" }, { "job_id": 39, "name": "as_sorl_abs50_K4_25K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 50 --K 4 --num", "gpu": 2, "status": "failed", "elapsed": 4, "idle_time": 135, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_039_as_sorl_abs50_K4_25K_gpu2.log" }, { "job_id": 40, "name": "as_sorl_abs5_K4_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 5 --K 4 --num_", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 70, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_040_as_sorl_abs5_K4_50K_gpu2.log" }, { "job_id": 41, "name": "as_sorl_abs10_K4_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 10 --K 4 --num", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 220, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_041_as_sorl_abs10_K4_50K_gpu2.log" }, { "job_id": 42, "name": "as_sorl_abs30_K4_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 30 --K 4 --num", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 60, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_042_as_sorl_abs30_K4_50K_gpu0.log" }, { "job_id": 43, "name": "as_sorl_abs50_K4_50K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 50 --K 4 --num", "gpu": 0, "status": "done", "elapsed": 5510, "idle_time": 9994, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_043_as_sorl_abs50_K4_50K_gpu0.log" }, { "job_id": 44, "name": "as_sorl_abs5_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 5 --K 4 --num", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 125, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_044_as_sorl_abs5_K4_100K_gpu2.log" }, { "job_id": 45, "name": "as_sorl_abs10_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 4 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 205, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_045_as_sorl_abs10_K4_100K_gpu0.log" }, { "job_id": 46, "name": "as_sorl_abs30_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 30 --K 4 --nu", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 190, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_046_as_sorl_abs30_K4_100K_gpu2.log" }, { "job_id": 47, "name": "as_sorl_abs50_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 50 --K 4 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 169, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_047_as_sorl_abs50_K4_100K_gpu0.log" }, { "job_id": 48, "name": "as_sorl_abs10_K1_zipf2.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --al", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 80, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_048_as_sorl_abs10_K1_zipf2.0_500K_gpu0.log" }, { "job_id": 49, "name": "as_sorl_abs10_K1_zipf5.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --al", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 50, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_049_as_sorl_abs10_K1_zipf5.0_500K_gpu1.log" }, { "job_id": 50, "name": "as_sorl_abs10_K1_zipf10.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --al", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 226, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_050_as_sorl_abs10_K1_zipf10.0_500K_gpu2.log" }, { "job_id": 51, "name": "as_sorl_abs10_K4_zipf2.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 4 --al", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 45, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_051_as_sorl_abs10_K4_zipf2.0_500K_gpu0.log" }, { "job_id": 52, "name": "as_sorl_abs10_K4_zipf5.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 4 --al", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 185, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_052_as_sorl_abs10_K4_zipf5.0_500K_gpu0.log" }, { "job_id": 53, "name": "as_sorl_abs10_K4_zipf10.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 4 --al", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 13672, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_053_as_sorl_abs10_K4_zipf10.0_500K_gpu1.log" }, { "job_id": 54, "name": "as_sorl_abs100_K1_zipf2.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 1 --a", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 169, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_054_as_sorl_abs100_K1_zipf2.0_500K_gpu0.log" }, { "job_id": 55, "name": "as_sorl_abs100_K1_zipf5.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 1 --a", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 6372, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_055_as_sorl_abs100_K1_zipf5.0_500K_gpu0.log" }, { "job_id": 56, "name": "as_sorl_abs100_K1_zipf10.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 1 --a", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 80, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_056_as_sorl_abs100_K1_zipf10.0_500_gpu2.log" }, { "job_id": 57, "name": "as_sorl_abs100_K4_zipf2.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 4 --a", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 175, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_057_as_sorl_abs100_K4_zipf2.0_500K_gpu2.log" }, { "job_id": 58, "name": "as_sorl_abs100_K4_zipf5.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 4 --a", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 205, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_058_as_sorl_abs100_K4_zipf5.0_500K_gpu1.log" }, { "job_id": 59, "name": "as_sorl_abs100_K4_zipf10.0_500K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 100 --K 4 --a", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 169, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_059_as_sorl_abs100_K4_zipf10.0_500_gpu1.log" }, { "job_id": 60, "name": "as_baseline_25K_1L3H510d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --n_la", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 120, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_060_as_baseline_25K_1L3H510d_gpu2.log" }, { "job_id": 61, "name": "as_sorl_abs10_K1_25K_1L3H510d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 10 --K 1 --num", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 65, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_061_as_sorl_abs10_K1_25K_1L3H510d_gpu2.log" }, { "job_id": 62, "name": "as_baseline_50K_1L3H510d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 50000 --num_epochs 20 --n_la", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 215, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_062_as_baseline_50K_1L3H510d_gpu0.log" }, { "job_id": 63, "name": "as_sorl_abs10_K1_50K_1L3H510d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 10 --K 1 --num", "gpu": 0, "status": "done", "elapsed": 5352, "idle_time": 6386, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_063_as_sorl_abs10_K1_50K_1L3H510d_gpu0.log" }, { "job_id": 64, "name": "as_baseline_100K_1L3H510d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --n_l", "gpu": 1, "status": "failed", "elapsed": 4, "idle_time": 236, "exit_code": -15, "retries": 1, "log_file": "/tmp/gpu_queue/job_064_as_baseline_100K_1L3H510d_gpu1.log" }, { "job_id": 65, "name": "as_sorl_abs10_K1_100K_1L3H510d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 226, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_065_as_sorl_abs10_K1_100K_1L3H510d_gpu0.log" }, { "job_id": 66, "name": "as_baseline_250K_1L3H510d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 250000 --num_epochs 20 --n_l", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 200, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_066_as_baseline_250K_1L3H510d_gpu0.log" }, { "job_id": 67, "name": "as_sorl_abs10_K1_250K_1L3H510d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 10 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 125, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_067_as_sorl_abs10_K1_250K_1L3H510d_gpu1.log" }, { "job_id": 68, "name": "as_baseline_500K_1L3H510d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 500000 --num_epochs 20 --n_l", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 105, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_068_as_baseline_500K_1L3H510d_gpu1.log" }, { "job_id": 69, "name": "as_sorl_abs10_K1_500K_1L3H510d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --nu", "gpu": 2, "status": "failed", "elapsed": 2, "idle_time": 234, "exit_code": -15, "retries": 1, "log_file": "/tmp/gpu_queue/job_069_as_sorl_abs10_K1_500K_1L3H510d_gpu2.log" }, { "job_id": 70, "name": "as_baseline_25K_1L2H256d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --n_la", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 226, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_070_as_baseline_25K_1L2H256d_gpu1.log" }, { "job_id": 71, "name": "as_sorl_abs10_K1_25K_1L2H256d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 10 --K 1 --num", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 190, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_071_as_sorl_abs10_K1_25K_1L2H256d_gpu0.log" }, { "job_id": 72, "name": "as_baseline_50K_1L2H256d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 50000 --num_epochs 20 --n_la", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 55, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_072_as_baseline_50K_1L2H256d_gpu2.log" }, { "job_id": 73, "name": "as_sorl_abs10_K1_50K_1L2H256d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 10 --K 1 --num", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 75, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_073_as_sorl_abs10_K1_50K_1L2H256d_gpu1.log" }, { "job_id": 74, "name": "as_baseline_100K_1L2H256d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --n_l", "gpu": 2, "status": "done", "elapsed": 2797, "idle_time": 14836, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_074_as_baseline_100K_1L2H256d_gpu2.log" }, { "job_id": 75, "name": "as_sorl_abs10_K1_100K_1L2H256d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 220, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_075_as_sorl_abs10_K1_100K_1L2H256d_gpu1.log" }, { "job_id": 76, "name": "as_baseline_250K_1L2H256d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 250000 --num_epochs 20 --n_l", "gpu": 0, "status": "done", "elapsed": 4832, "idle_time": 1682, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_076_as_baseline_250K_1L2H256d_gpu0.log" }, { "job_id": 77, "name": "as_sorl_abs10_K1_250K_1L2H256d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 10 --K 1 --nu", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 49, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_077_as_sorl_abs10_K1_250K_1L2H256d_gpu2.log" }, { "job_id": 78, "name": "as_baseline_500K_1L2H256d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 500000 --num_epochs 20 --n_l", "gpu": 2, "status": "done", "elapsed": 7064, "idle_time": 12209, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_078_as_baseline_500K_1L2H256d_gpu2.log" }, { "job_id": 79, "name": "as_sorl_abs10_K1_500K_1L2H256d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --nu", "gpu": 2, "status": "failed", "elapsed": 4, "idle_time": 136, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_079_as_sorl_abs10_K1_500K_1L2H256d_gpu2.log" }, { "job_id": 80, "name": "as_baseline_25K_2L1H128d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 25000 --num_epochs 20 --n_la", "gpu": 1, "status": "done", "elapsed": 1971, "idle_time": 13688, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_080_as_baseline_25K_2L1H128d_gpu1.log" }, { "job_id": 81, "name": "as_sorl_abs10_K1_25K_2L1H128d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 25000 --abs_vocab 10 --K 1 --num", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 175, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_081_as_sorl_abs10_K1_25K_2L1H128d_gpu2.log" }, { "job_id": 82, "name": "as_baseline_50K_2L1H128d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 50000 --num_epochs 20 --n_la", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 155, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_082_as_baseline_50K_2L1H128d_gpu0.log" }, { "job_id": 83, "name": "as_sorl_abs10_K1_50K_2L1H128d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 50000 --abs_vocab 10 --K 1 --num", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 60, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_083_as_sorl_abs10_K1_50K_2L1H128d_gpu0.log" }, { "job_id": 84, "name": "as_baseline_100K_2L1H128d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 100000 --num_epochs 20 --n_l", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 125, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_084_as_baseline_100K_2L1H128d_gpu0.log" }, { "job_id": 85, "name": "as_sorl_abs10_K1_100K_2L1H128d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 105, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_085_as_sorl_abs10_K1_100K_2L1H128d_gpu0.log" }, { "job_id": 86, "name": "as_baseline_250K_2L1H128d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 250000 --num_epochs 20 --n_l", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 140, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_086_as_baseline_250K_2L1H128d_gpu1.log" }, { "job_id": 87, "name": "as_sorl_abs10_K1_250K_2L1H128d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 10 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 241, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_087_as_sorl_abs10_K1_250K_2L1H128d_gpu1.log" }, { "job_id": 88, "name": "as_baseline_500K_2L1H128d", "cmd": "python -m arithmetic.train --mode baseline --ops add_sub --dataset_size 500000 --num_epochs 20 --n_l", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 60, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_088_as_baseline_500K_2L1H128d_gpu1.log" }, { "job_id": 89, "name": "as_sorl_abs10_K1_500K_2L1H128d", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 500000 --abs_vocab 10 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 241, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_089_as_sorl_abs10_K1_500K_2L1H128d_gpu1.log" }, { "job_id": 90, "name": "as_sorl_abs5_K4_10K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 5 --K 4 --num_", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 65, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_090_as_sorl_abs5_K4_10K_gpu0.log" }, { "job_id": 91, "name": "as_sorl_abs10_K4_10K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 10 --K 4 --num", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 140, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_091_as_sorl_abs10_K4_10K_gpu0.log" }, { "job_id": 92, "name": "as_sorl_abs30_K4_10K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 30 --K 4 --num", "gpu": 0, "status": "done", "elapsed": 3477, "idle_time": 6517, "exit_code": 0, "retries": 0, "log_file": "/tmp/gpu_queue/job_092_as_sorl_abs30_K4_10K_gpu0.log" }, { "job_id": 93, "name": "as_sorl_abs50_K4_10K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 10000 --abs_vocab 50 --K 4 --num", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 159, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_093_as_sorl_abs50_K4_10K_gpu1.log" }, { "job_id": 94, "name": "as_sorl_abs5_K4_250K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 5 --K 4 --num", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 100, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_094_as_sorl_abs5_K4_250K_gpu0.log" }, { "job_id": 95, "name": "as_sorl_abs10_K4_250K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 10 --K 4 --nu", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 237, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_095_as_sorl_abs10_K4_250K_gpu2.log" }, { "job_id": 96, "name": "as_sorl_abs30_K4_250K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 30 --K 4 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 104, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_096_as_sorl_abs30_K4_250K_gpu1.log" }, { "job_id": 97, "name": "as_sorl_abs50_K4_250K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 250000 --abs_vocab 50 --K 4 --nu", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 190, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_097_as_sorl_abs50_K4_250K_gpu1.log" }, { "job_id": 98, "name": "as_sorl_abs2_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 2 --K 1 --num", "gpu": 1, "status": "failed", "elapsed": 3, "idle_time": 235, "exit_code": -15, "retries": 1, "log_file": "/tmp/gpu_queue/job_098_as_sorl_abs2_K1_100K_gpu1.log" }, { "job_id": 99, "name": "as_sorl_abs2_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 2 --K 4 --num", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 215, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_099_as_sorl_abs2_K4_100K_gpu1.log" }, { "job_id": 100, "name": "as_sorl_abs16_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 16 --K 1 --nu", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 114, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_100_as_sorl_abs16_K1_100K_gpu0.log" }, { "job_id": 101, "name": "as_sorl_abs16_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 16 --K 4 --nu", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 0, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_101_as_sorl_abs16_K4_100K_gpu1.log" }, { "job_id": 102, "name": "as_sorl_abs20_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 20 --K 1 --nu", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 40, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_102_as_sorl_abs20_K1_100K_gpu2.log" }, { "job_id": 103, "name": "as_sorl_abs20_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 20 --K 4 --nu", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 0, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_103_as_sorl_abs20_K4_100K_gpu0.log" }, { "job_id": 104, "name": "as_sorl_abs70_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 70 --K 1 --nu", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 30, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_104_as_sorl_abs70_K1_100K_gpu1.log" }, { "job_id": 105, "name": "as_sorl_abs70_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 70 --K 4 --nu", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 35, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_105_as_sorl_abs70_K4_100K_gpu2.log" }, { "job_id": 106, "name": "as_sorl_abs100_K1_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 1 --n", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 15, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_106_as_sorl_abs100_K1_100K_gpu1.log" }, { "job_id": 107, "name": "as_sorl_abs100_K4_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 4 --n", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 24, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_107_as_sorl_abs100_K4_100K_gpu0.log" }, { "job_id": 108, "name": "as_sorl_abs10_K1_zipf2.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --al", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 10, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_108_as_sorl_abs10_K1_zipf2.0_100K_gpu0.log" }, { "job_id": 109, "name": "as_sorl_abs10_K4_zipf2.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 4 --al", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 30, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_109_as_sorl_abs10_K4_zipf2.0_100K_gpu1.log" }, { "job_id": 110, "name": "as_sorl_abs10_K1_zipf5.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --al", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 24, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_110_as_sorl_abs10_K1_zipf5.0_100K_gpu1.log" }, { "job_id": 111, "name": "as_sorl_abs10_K4_zipf5.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 4 --al", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 5, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_111_as_sorl_abs10_K4_zipf5.0_100K_gpu2.log" }, { "job_id": 112, "name": "as_sorl_abs10_K1_zipf10.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 1 --al", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 14, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_112_as_sorl_abs10_K1_zipf10.0_100K_gpu2.log" }, { "job_id": 113, "name": "as_sorl_abs10_K4_zipf10.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 10 --K 4 --al", "gpu": 1, "status": "failed", "elapsed": 6, "idle_time": 10, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_113_as_sorl_abs10_K4_zipf10.0_100K_gpu1.log" }, { "job_id": 114, "name": "as_sorl_abs100_K1_zipf2.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 1 --a", "gpu": 2, "status": "failed", "elapsed": 6, "idle_time": 19, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_114_as_sorl_abs100_K1_zipf2.0_100K_gpu2.log" }, { "job_id": 115, "name": "as_sorl_abs100_K4_zipf2.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 4 --a", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 14, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_115_as_sorl_abs100_K4_zipf2.0_100K_gpu0.log" }, { "job_id": 116, "name": "as_sorl_abs100_K1_zipf5.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 1 --a", "gpu": 2, "status": "failed", "elapsed": 5, "idle_time": 0, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_116_as_sorl_abs100_K1_zipf5.0_100K_gpu2.log" }, { "job_id": 117, "name": "as_sorl_abs100_K4_zipf5.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 4 --a", "gpu": 1, "status": "failed", "elapsed": 5, "idle_time": 44, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_117_as_sorl_abs100_K4_zipf5.0_100K_gpu1.log" }, { "job_id": 118, "name": "as_sorl_abs100_K1_zipf10.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 1 --a", "gpu": 0, "status": "failed", "elapsed": 5, "idle_time": 36, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_118_as_sorl_abs100_K1_zipf10.0_100_gpu0.log" }, { "job_id": 119, "name": "as_sorl_abs100_K4_zipf10.0_100K", "cmd": "python -m arithmetic.train --mode sorl --ops add_sub --dataset_size 100000 --abs_vocab 100 --K 4 --a", "gpu": 0, "status": "failed", "elapsed": 6, "idle_time": 30, "exit_code": -9, "retries": 1, "log_file": "/tmp/gpu_queue/job_119_as_sorl_abs100_K4_zipf10.0_100_gpu0.log" } ] }