llm-sort / outputs /task_files /perloc_gpu2.json
gatmiry's picture
Upload folder using huggingface_hub
beda614 verified
[{"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 1, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos1_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos1_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 1, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos1_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos1_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 4, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos4_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos4_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 4, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos4_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos4_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 7, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos7_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos7_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 7, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos7_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos7_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 10, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos10_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos10_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 10, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos10_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos10_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 13, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos13_layer0.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos13_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1337__final.pt", "folder_name": "plots_N256_B16_ds1337_is1337_final", "sorted_pos": 13, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1337_final/perlocation/intensity_pos13_layer1.npz", "itr": 100000, "dseed": "1337", "iseed": "1337", "name": "plots_N256_B16_ds1337_is1337_final_pos13_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 1, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos1_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos1_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 1, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos1_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos1_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 4, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos4_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos4_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 4, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos4_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos4_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 7, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos7_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos7_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 7, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos7_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos7_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 10, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos10_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos10_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 10, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos10_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos10_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 13, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos13_layer0.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos13_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1337_iseed1340__ckpt80000.pt", "folder_name": "plots_N256_B16_ds1337_is1340_ckpt80000", "sorted_pos": 13, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1337_is1340_ckpt80000/perlocation/intensity_pos13_layer1.npz", "itr": 80000, "dseed": "1337", "iseed": "1340", "name": "plots_N256_B16_ds1337_is1340_ckpt80000_pos13_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 1, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos1_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos1_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 1, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos1_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos1_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 4, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos4_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos4_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 4, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos4_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos4_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 7, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos7_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos7_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 7, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos7_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos7_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 10, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos10_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos10_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 10, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos10_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos10_L1"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 13, "layer": 0, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos13_layer0.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos13_L0"}, {"ckpt_path": "/mnt/task_runtime/sort-llm/100k-checkpoints/final_models/sortgpt_k16_methfixed_mlp1_L2_N256_E64_pos0_fln1_wd0p0_lr0p01_dseed1338_iseed1339__ckpt60000.pt", "folder_name": "plots_N256_B16_ds1338_is1339_ckpt60000", "sorted_pos": 13, "layer": 1, "out": "/mnt/task_runtime/sort-llm/100k-checkpoints/outputs/tmp_results/plots_N256_B16_ds1338_is1339_ckpt60000/perlocation/intensity_pos13_layer1.npz", "itr": 60000, "dseed": "1338", "iseed": "1339", "name": "plots_N256_B16_ds1338_is1339_ckpt60000_pos13_L1"}]