| [{"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 25, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num25_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num25_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 25, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num25_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num25_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 75, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num75_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num75_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 75, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num75_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num75_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 128, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num128_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num128_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 128, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num128_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num128_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 180, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num180_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num180_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 180, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num180_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num180_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 230, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num230_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num230_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "target_num": 230, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/pernumber/intensity_num230_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_num230_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 25, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num25_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num25_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 25, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num25_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num25_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 75, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num75_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num75_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 75, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num75_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num75_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 128, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num128_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num128_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 128, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num128_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num128_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 180, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num180_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num180_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 180, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num180_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num180_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 230, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num230_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num230_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "target_num": 230, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/pernumber/intensity_num230_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_num230_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 25, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num25_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num25_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 25, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num25_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num25_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 75, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num75_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num75_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 75, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num75_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num75_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 128, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num128_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num128_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 128, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num128_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num128_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 180, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num180_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num180_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 180, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num180_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num180_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 230, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num230_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num230_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "target_num": 230, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/pernumber/intensity_num230_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_num230_L1"}] |