Add precomputed results for p=3
Browse files- .gitattributes +6 -0
- precomputed_results/p_003/p003_dft_heatmap_in.png +0 -0
- precomputed_results/p_003/p003_dft_heatmap_out.png +0 -0
- precomputed_results/p_003/p003_lineplot_in.png +3 -0
- precomputed_results/p_003/p003_lineplot_out.png +3 -0
- precomputed_results/p_003/p003_logits_interactive.json +1 -0
- precomputed_results/p_003/p003_lottery_beta_contour.png +0 -0
- precomputed_results/p_003/p003_lottery_mech_magnitude.png +0 -0
- precomputed_results/p_003/p003_lottery_mech_phase.png +0 -0
- precomputed_results/p_003/p003_magnitude_distribution.png +0 -0
- precomputed_results/p_003/p003_metadata.json +82 -0
- precomputed_results/p_003/p003_neuron_spectra.json +1 -0
- precomputed_results/p_003/p003_output_logits.png +0 -0
- precomputed_results/p_003/p003_overview.json +1 -0
- precomputed_results/p_003/p003_overview_loss_ipr.png +0 -0
- precomputed_results/p_003/p003_overview_phase_scatter.png +0 -0
- precomputed_results/p_003/p003_phase_align_approx1.png +3 -0
- precomputed_results/p_003/p003_phase_align_approx2.png +3 -0
- precomputed_results/p_003/p003_phase_align_quad.png +0 -0
- precomputed_results/p_003/p003_phase_align_relu.png +0 -0
- precomputed_results/p_003/p003_phase_distribution.png +0 -0
- precomputed_results/p_003/p003_phase_relationship.png +0 -0
- precomputed_results/p_003/p003_single_freq_quad.png +3 -0
- precomputed_results/p_003/p003_single_freq_relu.png +3 -0
- precomputed_results/p_003/p003_training_log.json +0 -0
.gitattributes
CHANGED
|
@@ -167,3 +167,9 @@ precomputed_results/p_067/p067_phase_align_approx2.png filter=lfs diff=lfs merge
|
|
| 167 |
precomputed_results/p_067/p067_phase_align_quad.png filter=lfs diff=lfs merge=lfs -text
|
| 168 |
precomputed_results/p_067/p067_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
|
| 169 |
precomputed_results/p_067/p067_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 167 |
precomputed_results/p_067/p067_phase_align_quad.png filter=lfs diff=lfs merge=lfs -text
|
| 168 |
precomputed_results/p_067/p067_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
|
| 169 |
precomputed_results/p_067/p067_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
|
| 170 |
+
precomputed_results/p_003/p003_lineplot_in.png filter=lfs diff=lfs merge=lfs -text
|
| 171 |
+
precomputed_results/p_003/p003_lineplot_out.png filter=lfs diff=lfs merge=lfs -text
|
| 172 |
+
precomputed_results/p_003/p003_phase_align_approx1.png filter=lfs diff=lfs merge=lfs -text
|
| 173 |
+
precomputed_results/p_003/p003_phase_align_approx2.png filter=lfs diff=lfs merge=lfs -text
|
| 174 |
+
precomputed_results/p_003/p003_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
|
| 175 |
+
precomputed_results/p_003/p003_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
|
precomputed_results/p_003/p003_dft_heatmap_in.png
ADDED
|
precomputed_results/p_003/p003_dft_heatmap_out.png
ADDED
|
precomputed_results/p_003/p003_lineplot_in.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_lineplot_out.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_logits_interactive.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"pairs": [[0, 0], [1, 0], [2, 0]], "correct_answers": [0, 1, 2], "logits": [[4.3912763595581055, -3.80269718170166, -3.5643606185913086], [-2.968888282775879, 5.465089797973633, -2.4930355548858643], [-2.4251582622528076, -2.766524314880371, 5.376070976257324]], "output_classes": [0, 1, 2]}
|
precomputed_results/p_003/p003_lottery_beta_contour.png
ADDED
|
precomputed_results/p_003/p003_lottery_mech_magnitude.png
ADDED
|
precomputed_results/p_003/p003_lottery_mech_phase.png
ADDED
|
precomputed_results/p_003/p003_magnitude_distribution.png
ADDED
|
precomputed_results/p_003/p003_metadata.json
ADDED
|
@@ -0,0 +1,82 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"prime": 3,
|
| 3 |
+
"d_mlp": 512,
|
| 4 |
+
"training_runs": {
|
| 5 |
+
"standard": {
|
| 6 |
+
"act_type": "ReLU",
|
| 7 |
+
"lr": 5e-05,
|
| 8 |
+
"weight_decay": 0,
|
| 9 |
+
"num_epochs": 5000,
|
| 10 |
+
"frac_train": 1.0,
|
| 11 |
+
"init_type": "random",
|
| 12 |
+
"init_scale": 0.1,
|
| 13 |
+
"optimizer": "AdamW"
|
| 14 |
+
},
|
| 15 |
+
"grokking": {
|
| 16 |
+
"act_type": "ReLU",
|
| 17 |
+
"lr": 0.0001,
|
| 18 |
+
"weight_decay": 2.0,
|
| 19 |
+
"num_epochs": 50000,
|
| 20 |
+
"frac_train": 0.75,
|
| 21 |
+
"init_type": "random",
|
| 22 |
+
"init_scale": 0.1,
|
| 23 |
+
"optimizer": "AdamW"
|
| 24 |
+
},
|
| 25 |
+
"quad_random": {
|
| 26 |
+
"act_type": "Quad",
|
| 27 |
+
"lr": 5e-05,
|
| 28 |
+
"weight_decay": 0,
|
| 29 |
+
"num_epochs": 5000,
|
| 30 |
+
"frac_train": 1.0,
|
| 31 |
+
"init_type": "random",
|
| 32 |
+
"init_scale": 0.1,
|
| 33 |
+
"optimizer": "AdamW"
|
| 34 |
+
},
|
| 35 |
+
"quad_single_freq": {
|
| 36 |
+
"act_type": "Quad",
|
| 37 |
+
"lr": 0.1,
|
| 38 |
+
"weight_decay": 0,
|
| 39 |
+
"num_epochs": 10000,
|
| 40 |
+
"frac_train": 1.0,
|
| 41 |
+
"init_type": "single-freq",
|
| 42 |
+
"init_scale": 0.02,
|
| 43 |
+
"optimizer": "SGD"
|
| 44 |
+
},
|
| 45 |
+
"relu_single_freq": {
|
| 46 |
+
"act_type": "ReLU",
|
| 47 |
+
"lr": 0.01,
|
| 48 |
+
"weight_decay": 0,
|
| 49 |
+
"num_epochs": 10000,
|
| 50 |
+
"frac_train": 1.0,
|
| 51 |
+
"init_type": "single-freq",
|
| 52 |
+
"init_scale": 0.002,
|
| 53 |
+
"optimizer": "SGD"
|
| 54 |
+
}
|
| 55 |
+
},
|
| 56 |
+
"final_metrics": {
|
| 57 |
+
"standard": {
|
| 58 |
+
"train_acc": 1.0,
|
| 59 |
+
"test_acc": 1.0,
|
| 60 |
+
"train_loss": 0.000652323302347213,
|
| 61 |
+
"test_loss": 0.000652323302347213
|
| 62 |
+
},
|
| 63 |
+
"quad_random": {
|
| 64 |
+
"train_acc": 1.0,
|
| 65 |
+
"test_acc": 1.0,
|
| 66 |
+
"train_loss": 2.1325192847143626e-06,
|
| 67 |
+
"test_loss": 2.1325192847143626e-06
|
| 68 |
+
},
|
| 69 |
+
"quad_single_freq": {
|
| 70 |
+
"train_acc": 1.0,
|
| 71 |
+
"test_acc": 1.0,
|
| 72 |
+
"train_loss": 0.00011593083763727918,
|
| 73 |
+
"test_loss": 0.00011593083763727918
|
| 74 |
+
},
|
| 75 |
+
"relu_single_freq": {
|
| 76 |
+
"train_acc": 1.0,
|
| 77 |
+
"test_acc": 1.0,
|
| 78 |
+
"train_loss": 0.010676158592104912,
|
| 79 |
+
"test_loss": 0.010676158592104912
|
| 80 |
+
}
|
| 81 |
+
}
|
| 82 |
+
}
|
precomputed_results/p_003/p003_neuron_spectra.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"fourier_basis_names": ["Const", "cos 1", "sin 1"], "neurons": {"neuron_0": {"global_index": 103, "dominant_freq": 1, "fourier_magnitudes_in": [0.1533791720867157, 0.4337967336177826, 5.208070433582179e-06], "fourier_magnitudes_out": [0.08648745715618134, 0.4276861846446991, 0.02207593433558941]}, "neuron_1": {"global_index": 378, "dominant_freq": 1, "fourier_magnitudes_in": [4.64054483018117e-06, 4.665445885621011e-06, 0.4044943153858185], "fourier_magnitudes_out": [0.17398148775100708, 0.4107496738433838, 0.030531879514455795]}, "neuron_2": {"global_index": 391, "dominant_freq": 1, "fourier_magnitudes_in": [0.13995108008384705, 0.3958445191383362, 5.925997356825974e-06], "fourier_magnitudes_out": [0.14620955288410187, 0.38962724804878235, 0.03937247395515442]}, "neuron_3": {"global_index": 233, "dominant_freq": 1, "fourier_magnitudes_in": [0.15963488817214966, 0.2257595956325531, 0.3910297155380249], "fourier_magnitudes_out": [0.08809392154216766, 0.2753666937351227, 0.3857313394546509]}, "neuron_4": {"global_index": 154, "dominant_freq": 1, "fourier_magnitudes_in": [0.13708585500717163, 0.38772234320640564, 1.113968551180733e-06], "fourier_magnitudes_out": [0.06758829206228256, 0.4502902328968048, 0.051096681505441666]}, "neuron_5": {"global_index": 510, "dominant_freq": 1, "fourier_magnitudes_in": [7.893670044722967e-06, 1.8176755474996753e-05, 0.38303306698799133], "fourier_magnitudes_out": [0.04921259358525276, 0.38618966937065125, 0.08766306936740875]}, "neuron_6": {"global_index": 96, "dominant_freq": 1, "fourier_magnitudes_in": [0.13497814536094666, 0.38177254796028137, 1.6130212543430389e-06], "fourier_magnitudes_out": [0.26065441966056824, 0.40997833013534546, 0.007034400478005409]}, "neuron_7": {"global_index": 43, "dominant_freq": 1, "fourier_magnitudes_in": [0.13383585214614868, 0.37854236364364624, 1.4905696161804372e-06], "fourier_magnitudes_out": [0.1364678144454956, 0.43534204363822937, 0.06277579069137573]}, "neuron_8": {"global_index": 390, "dominant_freq": 1, "fourier_magnitudes_in": [0.13247808814048767, 0.3747110366821289, 8.8494389274274e-06], "fourier_magnitudes_out": [0.24026153981685638, 0.557335615158081, 0.004272053483873606]}, "neuron_9": {"global_index": 62, "dominant_freq": 1, "fourier_magnitudes_in": [0.13209901750087738, 0.3736351430416107, 1.8117368654202437e-06], "fourier_magnitudes_out": [0.12142280489206314, 0.4252035915851593, 0.036476437002420425]}, "neuron_10": {"global_index": 186, "dominant_freq": 1, "fourier_magnitudes_in": [0.13167119026184082, 0.3724355101585388, 1.934191914187977e-06], "fourier_magnitudes_out": [0.0953248143196106, 0.3960951566696167, 0.006950821727514267]}, "neuron_11": {"global_index": 440, "dominant_freq": 1, "fourier_magnitudes_in": [0.13059888780117035, 0.36938971281051636, 1.577009101083604e-08], "fourier_magnitudes_out": [0.18008223176002502, 0.45487624406814575, 0.0012096347054466605]}, "neuron_12": {"global_index": 204, "dominant_freq": 1, "fourier_magnitudes_in": [1.0441669473948423e-05, 1.7463373296777718e-05, 0.3687886893749237], "fourier_magnitudes_out": [0.24216553568840027, 0.5107343792915344, 0.030801700428128242]}, "neuron_13": {"global_index": 152, "dominant_freq": 1, "fourier_magnitudes_in": [0.1296875923871994, 0.36682939529418945, 3.893473149219062e-06], "fourier_magnitudes_out": [0.15559691190719604, 0.4267895817756653, 0.004331708420068026]}, "neuron_14": {"global_index": 291, "dominant_freq": 1, "fourier_magnitudes_in": [0.1292923092842102, 0.3656914234161377, 2.285550635861e-06], "fourier_magnitudes_out": [0.23610876500606537, 0.426614910364151, 0.010882842354476452]}, "neuron_15": {"global_index": 479, "dominant_freq": 1, "fourier_magnitudes_in": [2.439726131342468e-06, 1.6284006960631814e-06, 0.36531955003738403], "fourier_magnitudes_out": [0.22035831212997437, 0.4314888119697571, 0.005853819660842419]}, "neuron_16": {"global_index": 312, "dominant_freq": 1, "fourier_magnitudes_in": [0.1287197470664978, 0.3640706241130829, 2.744055564107839e-06], "fourier_magnitudes_out": [0.18508373200893402, 0.3727245330810547, 0.01098876353353262]}, "neuron_17": {"global_index": 507, "dominant_freq": 1, "fourier_magnitudes_in": [0.12828592956066132, 0.36283373832702637, 2.710246178594389e-07], "fourier_magnitudes_out": [0.07814954966306686, 0.38358065485954285, 0.018465369939804077]}, "neuron_18": {"global_index": 83, "dominant_freq": 1, "fourier_magnitudes_in": [0.12704670429229736, 0.35935837030410767, 9.542891348246485e-06], "fourier_magnitudes_out": [0.17191722989082336, 0.4832451343536377, 0.043526772409677505]}, "neuron_19": {"global_index": 458, "dominant_freq": 1, "fourier_magnitudes_in": [0.1466502845287323, 0.2073993682861328, 0.3592132329940796], "fourier_magnitudes_out": [0.1300494223833084, 0.19639000296592712, 0.3800045847892761]}}}
|
precomputed_results/p_003/p003_output_logits.png
ADDED
|
precomputed_results/p_003/p003_overview.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"std_epochs": [0, 200, 400, 600, 800, 1000, 1200, 1400, 1600, 1800, 2000, 2200, 2400, 2600, 2800, 3000, 3200, 3400, 3600, 3800, 4000, 4200, 4400, 4600, 4800], "std_ipr": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "std_train_loss": [1.1109483242034912, 1.0304484367370605, 0.947655439376831, 0.8612433671951294, 0.7710723876953125, 0.6785023212432861, 0.5850968360900879, 0.4940829277038574, 0.4079987108707428, 0.32920774817466736, 0.2594999074935913, 0.19986817240715027, 0.15040792524814606, 0.11062172055244446, 0.07959280908107758, 0.05608634278178215, 0.038758277893066406, 0.026288457214832306, 0.017514534294605255, 0.011475162580609322, 0.007394743617624044, 0.004688998684287071, 0.002927658148109913, 0.0018001209245994687, 0.0010903897928074002]}
|
precomputed_results/p_003/p003_overview_loss_ipr.png
ADDED
|
precomputed_results/p_003/p003_overview_phase_scatter.png
ADDED
|
precomputed_results/p_003/p003_phase_align_approx1.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_phase_align_approx2.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_phase_align_quad.png
ADDED
|
precomputed_results/p_003/p003_phase_align_relu.png
ADDED
|
precomputed_results/p_003/p003_phase_distribution.png
ADDED
|
precomputed_results/p_003/p003_phase_relationship.png
ADDED
|
precomputed_results/p_003/p003_single_freq_quad.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_single_freq_relu.png
ADDED
|
Git LFS Details
|
precomputed_results/p_003/p003_training_log.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|