{ "top_heads": [ { "rank": 1, "layer": 19, "head": 5, "aie": -0.024941083043813705, "abs_aie": 0.024941083043813705 }, { "rank": 2, "layer": 19, "head": 3, "aie": -0.02465316466987133, "abs_aie": 0.02465316466987133 }, { "rank": 3, "layer": 23, "head": 1, "aie": 0.020055249333381653, "abs_aie": 0.020055249333381653 }, { "rank": 4, "layer": 17, "head": 7, "aie": -0.013633356429636478, "abs_aie": 0.013633356429636478 }, { "rank": 5, "layer": 25, "head": 4, "aie": -0.012786902487277985, "abs_aie": 0.012786902487277985 }, { "rank": 6, "layer": 20, "head": 0, "aie": -0.01222932618111372, "abs_aie": 0.01222932618111372 }, { "rank": 7, "layer": 24, "head": 8, "aie": -0.011511072516441345, "abs_aie": 0.011511072516441345 }, { "rank": 8, "layer": 19, "head": 6, "aie": -0.010977868922054768, "abs_aie": 0.010977868922054768 }, { "rank": 9, "layer": 23, "head": 0, "aie": -0.010334699414670467, "abs_aie": 0.010334699414670467 }, { "rank": 10, "layer": 15, "head": 7, "aie": -0.010305065661668777, "abs_aie": 0.010305065661668777 } ], "function_vector_path": "/root/SafeGenAI/work/cache/fv/part3_function_vector.pt", "default_layer": 9, "steering_layers": [ 9 ], "heatmap_path": "/root/SafeGenAI/work/plots/part3_aie_heatmap.png", "top_tokens": [ { "token_id": 358, "token": " I", "probability": 0.7904141545295715 }, { "token_id": 35946, "token": "我", "probability": 0.028790833428502083 }, { "token_id": 40, "token": "I", "probability": 0.016404522582888603 }, { "token_id": 10168, "token": "“I", "probability": 0.00994984619319439 }, { "token_id": 64395, "token": " }},\n", "probability": 0.005669251084327698 }, { "token_id": 28492, "token": " winds", "probability": 0.003896415466442704 }, { "token_id": 34957, "token": " lenses", "probability": 0.003230242058634758 }, { "token_id": 5318, "token": "_i", "probability": 0.003034531371667981 }, { "token_id": 66769, "token": "dataTable", "probability": 0.003034531371667981 }, { "token_id": 79592, "token": "ASA", "probability": 0.0028506785165518522 }, { "token_id": 7959, "token": "_I", "probability": 0.0026779647450894117 }, { "token_id": 9956, "token": " wind", "probability": 0.0026779647450894117 }, { "token_id": 111734, "token": "中国队", "probability": 0.002363295527175069 }, { "token_id": 125153, "token": "мы", "probability": 0.002363295527175069 }, { "token_id": 36828, "token": "},{\"", "probability": 0.0020856009796261787 }, { "token_id": 48700, "token": " Credits", "probability": 0.0020856009796261787 }, { "token_id": 82979, "token": "},\r\n\r\n", "probability": 0.0018405363662168384 }, { "token_id": 112898, "token": "我当时", "probability": 0.0017290239920839667 }, { "token_id": 25230, "token": " Wolf", "probability": 0.0017290239920839667 }, { "token_id": 7044, "token": "\"I", "probability": 0.0017290239920839667 } ] }