zhuoranyang committed on
Commit
5a1ae71
·
verified ·
1 Parent(s): c178e48

Add precomputed results for p=3

Browse files
.gitattributes CHANGED
@@ -167,3 +167,9 @@ precomputed_results/p_067/p067_phase_align_approx2.png filter=lfs diff=lfs merge
167
  precomputed_results/p_067/p067_phase_align_quad.png filter=lfs diff=lfs merge=lfs -text
168
  precomputed_results/p_067/p067_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
169
  precomputed_results/p_067/p067_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
167
  precomputed_results/p_067/p067_phase_align_quad.png filter=lfs diff=lfs merge=lfs -text
168
  precomputed_results/p_067/p067_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
169
  precomputed_results/p_067/p067_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
170
+ precomputed_results/p_003/p003_lineplot_in.png filter=lfs diff=lfs merge=lfs -text
171
+ precomputed_results/p_003/p003_lineplot_out.png filter=lfs diff=lfs merge=lfs -text
172
+ precomputed_results/p_003/p003_phase_align_approx1.png filter=lfs diff=lfs merge=lfs -text
173
+ precomputed_results/p_003/p003_phase_align_approx2.png filter=lfs diff=lfs merge=lfs -text
174
+ precomputed_results/p_003/p003_single_freq_quad.png filter=lfs diff=lfs merge=lfs -text
175
+ precomputed_results/p_003/p003_single_freq_relu.png filter=lfs diff=lfs merge=lfs -text
precomputed_results/p_003/p003_dft_heatmap_in.png ADDED
precomputed_results/p_003/p003_dft_heatmap_out.png ADDED
precomputed_results/p_003/p003_lineplot_in.png ADDED

Git LFS Details

  • SHA256: 8571a0b38d847678a6f64c282309e13e581309677abbb0f4f44467344f6353a0
  • Pointer size: 131 Bytes
  • Size of remote file: 103 kB
precomputed_results/p_003/p003_lineplot_out.png ADDED

Git LFS Details

  • SHA256: 9e7132b123200e598c279f1b263179de52e4ad91f25f350b6b477e6cf72b85fd
  • Pointer size: 131 Bytes
  • Size of remote file: 118 kB
precomputed_results/p_003/p003_logits_interactive.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"pairs": [[0, 0], [1, 0], [2, 0]], "correct_answers": [0, 1, 2], "logits": [[4.3912763595581055, -3.80269718170166, -3.5643606185913086], [-2.968888282775879, 5.465089797973633, -2.4930355548858643], [-2.4251582622528076, -2.766524314880371, 5.376070976257324]], "output_classes": [0, 1, 2]}
precomputed_results/p_003/p003_lottery_beta_contour.png ADDED
precomputed_results/p_003/p003_lottery_mech_magnitude.png ADDED
precomputed_results/p_003/p003_lottery_mech_phase.png ADDED
precomputed_results/p_003/p003_magnitude_distribution.png ADDED
precomputed_results/p_003/p003_metadata.json ADDED
@@ -0,0 +1,82 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "prime": 3,
3
+ "d_mlp": 512,
4
+ "training_runs": {
5
+ "standard": {
6
+ "act_type": "ReLU",
7
+ "lr": 5e-05,
8
+ "weight_decay": 0,
9
+ "num_epochs": 5000,
10
+ "frac_train": 1.0,
11
+ "init_type": "random",
12
+ "init_scale": 0.1,
13
+ "optimizer": "AdamW"
14
+ },
15
+ "grokking": {
16
+ "act_type": "ReLU",
17
+ "lr": 0.0001,
18
+ "weight_decay": 2.0,
19
+ "num_epochs": 50000,
20
+ "frac_train": 0.75,
21
+ "init_type": "random",
22
+ "init_scale": 0.1,
23
+ "optimizer": "AdamW"
24
+ },
25
+ "quad_random": {
26
+ "act_type": "Quad",
27
+ "lr": 5e-05,
28
+ "weight_decay": 0,
29
+ "num_epochs": 5000,
30
+ "frac_train": 1.0,
31
+ "init_type": "random",
32
+ "init_scale": 0.1,
33
+ "optimizer": "AdamW"
34
+ },
35
+ "quad_single_freq": {
36
+ "act_type": "Quad",
37
+ "lr": 0.1,
38
+ "weight_decay": 0,
39
+ "num_epochs": 10000,
40
+ "frac_train": 1.0,
41
+ "init_type": "single-freq",
42
+ "init_scale": 0.02,
43
+ "optimizer": "SGD"
44
+ },
45
+ "relu_single_freq": {
46
+ "act_type": "ReLU",
47
+ "lr": 0.01,
48
+ "weight_decay": 0,
49
+ "num_epochs": 10000,
50
+ "frac_train": 1.0,
51
+ "init_type": "single-freq",
52
+ "init_scale": 0.002,
53
+ "optimizer": "SGD"
54
+ }
55
+ },
56
+ "final_metrics": {
57
+ "standard": {
58
+ "train_acc": 1.0,
59
+ "test_acc": 1.0,
60
+ "train_loss": 0.000652323302347213,
61
+ "test_loss": 0.000652323302347213
62
+ },
63
+ "quad_random": {
64
+ "train_acc": 1.0,
65
+ "test_acc": 1.0,
66
+ "train_loss": 2.1325192847143626e-06,
67
+ "test_loss": 2.1325192847143626e-06
68
+ },
69
+ "quad_single_freq": {
70
+ "train_acc": 1.0,
71
+ "test_acc": 1.0,
72
+ "train_loss": 0.00011593083763727918,
73
+ "test_loss": 0.00011593083763727918
74
+ },
75
+ "relu_single_freq": {
76
+ "train_acc": 1.0,
77
+ "test_acc": 1.0,
78
+ "train_loss": 0.010676158592104912,
79
+ "test_loss": 0.010676158592104912
80
+ }
81
+ }
82
+ }
precomputed_results/p_003/p003_neuron_spectra.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"fourier_basis_names": ["Const", "cos 1", "sin 1"], "neurons": {"neuron_0": {"global_index": 103, "dominant_freq": 1, "fourier_magnitudes_in": [0.1533791720867157, 0.4337967336177826, 5.208070433582179e-06], "fourier_magnitudes_out": [0.08648745715618134, 0.4276861846446991, 0.02207593433558941]}, "neuron_1": {"global_index": 378, "dominant_freq": 1, "fourier_magnitudes_in": [4.64054483018117e-06, 4.665445885621011e-06, 0.4044943153858185], "fourier_magnitudes_out": [0.17398148775100708, 0.4107496738433838, 0.030531879514455795]}, "neuron_2": {"global_index": 391, "dominant_freq": 1, "fourier_magnitudes_in": [0.13995108008384705, 0.3958445191383362, 5.925997356825974e-06], "fourier_magnitudes_out": [0.14620955288410187, 0.38962724804878235, 0.03937247395515442]}, "neuron_3": {"global_index": 233, "dominant_freq": 1, "fourier_magnitudes_in": [0.15963488817214966, 0.2257595956325531, 0.3910297155380249], "fourier_magnitudes_out": [0.08809392154216766, 0.2753666937351227, 0.3857313394546509]}, "neuron_4": {"global_index": 154, "dominant_freq": 1, "fourier_magnitudes_in": [0.13708585500717163, 0.38772234320640564, 1.113968551180733e-06], "fourier_magnitudes_out": [0.06758829206228256, 0.4502902328968048, 0.051096681505441666]}, "neuron_5": {"global_index": 510, "dominant_freq": 1, "fourier_magnitudes_in": [7.893670044722967e-06, 1.8176755474996753e-05, 0.38303306698799133], "fourier_magnitudes_out": [0.04921259358525276, 0.38618966937065125, 0.08766306936740875]}, "neuron_6": {"global_index": 96, "dominant_freq": 1, "fourier_magnitudes_in": [0.13497814536094666, 0.38177254796028137, 1.6130212543430389e-06], "fourier_magnitudes_out": [0.26065441966056824, 0.40997833013534546, 0.007034400478005409]}, "neuron_7": {"global_index": 43, "dominant_freq": 1, "fourier_magnitudes_in": [0.13383585214614868, 0.37854236364364624, 1.4905696161804372e-06], "fourier_magnitudes_out": [0.1364678144454956, 0.43534204363822937, 0.06277579069137573]}, "neuron_8": {"global_index": 390, 
"dominant_freq": 1, "fourier_magnitudes_in": [0.13247808814048767, 0.3747110366821289, 8.8494389274274e-06], "fourier_magnitudes_out": [0.24026153981685638, 0.557335615158081, 0.004272053483873606]}, "neuron_9": {"global_index": 62, "dominant_freq": 1, "fourier_magnitudes_in": [0.13209901750087738, 0.3736351430416107, 1.8117368654202437e-06], "fourier_magnitudes_out": [0.12142280489206314, 0.4252035915851593, 0.036476437002420425]}, "neuron_10": {"global_index": 186, "dominant_freq": 1, "fourier_magnitudes_in": [0.13167119026184082, 0.3724355101585388, 1.934191914187977e-06], "fourier_magnitudes_out": [0.0953248143196106, 0.3960951566696167, 0.006950821727514267]}, "neuron_11": {"global_index": 440, "dominant_freq": 1, "fourier_magnitudes_in": [0.13059888780117035, 0.36938971281051636, 1.577009101083604e-08], "fourier_magnitudes_out": [0.18008223176002502, 0.45487624406814575, 0.0012096347054466605]}, "neuron_12": {"global_index": 204, "dominant_freq": 1, "fourier_magnitudes_in": [1.0441669473948423e-05, 1.7463373296777718e-05, 0.3687886893749237], "fourier_magnitudes_out": [0.24216553568840027, 0.5107343792915344, 0.030801700428128242]}, "neuron_13": {"global_index": 152, "dominant_freq": 1, "fourier_magnitudes_in": [0.1296875923871994, 0.36682939529418945, 3.893473149219062e-06], "fourier_magnitudes_out": [0.15559691190719604, 0.4267895817756653, 0.004331708420068026]}, "neuron_14": {"global_index": 291, "dominant_freq": 1, "fourier_magnitudes_in": [0.1292923092842102, 0.3656914234161377, 2.285550635861e-06], "fourier_magnitudes_out": [0.23610876500606537, 0.426614910364151, 0.010882842354476452]}, "neuron_15": {"global_index": 479, "dominant_freq": 1, "fourier_magnitudes_in": [2.439726131342468e-06, 1.6284006960631814e-06, 0.36531955003738403], "fourier_magnitudes_out": [0.22035831212997437, 0.4314888119697571, 0.005853819660842419]}, "neuron_16": {"global_index": 312, "dominant_freq": 1, "fourier_magnitudes_in": [0.1287197470664978, 0.3640706241130829, 
2.744055564107839e-06], "fourier_magnitudes_out": [0.18508373200893402, 0.3727245330810547, 0.01098876353353262]}, "neuron_17": {"global_index": 507, "dominant_freq": 1, "fourier_magnitudes_in": [0.12828592956066132, 0.36283373832702637, 2.710246178594389e-07], "fourier_magnitudes_out": [0.07814954966306686, 0.38358065485954285, 0.018465369939804077]}, "neuron_18": {"global_index": 83, "dominant_freq": 1, "fourier_magnitudes_in": [0.12704670429229736, 0.35935837030410767, 9.542891348246485e-06], "fourier_magnitudes_out": [0.17191722989082336, 0.4832451343536377, 0.043526772409677505]}, "neuron_19": {"global_index": 458, "dominant_freq": 1, "fourier_magnitudes_in": [0.1466502845287323, 0.2073993682861328, 0.3592132329940796], "fourier_magnitudes_out": [0.1300494223833084, 0.19639000296592712, 0.3800045847892761]}}}
precomputed_results/p_003/p003_output_logits.png ADDED
precomputed_results/p_003/p003_overview.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"std_epochs": [0, 200, 400, 600, 800, 1000, 1200, 1400, 1600, 1800, 2000, 2200, 2400, 2600, 2800, 3000, 3200, 3400, 3600, 3800, 4000, 4200, 4400, 4600, 4800], "std_ipr": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "std_train_loss": [1.1109483242034912, 1.0304484367370605, 0.947655439376831, 0.8612433671951294, 0.7710723876953125, 0.6785023212432861, 0.5850968360900879, 0.4940829277038574, 0.4079987108707428, 0.32920774817466736, 0.2594999074935913, 0.19986817240715027, 0.15040792524814606, 0.11062172055244446, 0.07959280908107758, 0.05608634278178215, 0.038758277893066406, 0.026288457214832306, 0.017514534294605255, 0.011475162580609322, 0.007394743617624044, 0.004688998684287071, 0.002927658148109913, 0.0018001209245994687, 0.0010903897928074002]}
precomputed_results/p_003/p003_overview_loss_ipr.png ADDED
precomputed_results/p_003/p003_overview_phase_scatter.png ADDED
precomputed_results/p_003/p003_phase_align_approx1.png ADDED

Git LFS Details

  • SHA256: dfafb96a5386ddd82c6af654ecf4be21025cee227434fd89cd1f3b699b499d89
  • Pointer size: 131 Bytes
  • Size of remote file: 128 kB
precomputed_results/p_003/p003_phase_align_approx2.png ADDED

Git LFS Details

  • SHA256: 6c6c5d8f3140e49c49558ee706e22512abde2c7db31e306d133704775e34542f
  • Pointer size: 131 Bytes
  • Size of remote file: 136 kB
precomputed_results/p_003/p003_phase_align_quad.png ADDED
precomputed_results/p_003/p003_phase_align_relu.png ADDED
precomputed_results/p_003/p003_phase_distribution.png ADDED
precomputed_results/p_003/p003_phase_relationship.png ADDED
precomputed_results/p_003/p003_single_freq_quad.png ADDED

Git LFS Details

  • SHA256: 01e712d04004dfbb8a97b1046746c25546ea70a7deb3d26a13362f09fe14b47d
  • Pointer size: 131 Bytes
  • Size of remote file: 128 kB
precomputed_results/p_003/p003_single_freq_relu.png ADDED

Git LFS Details

  • SHA256: 1e43df8e5f1bde24115c378bb7089d996b9ee911af065b75febd06c6c7f4de87
  • Pointer size: 131 Bytes
  • Size of remote file: 139 kB
precomputed_results/p_003/p003_training_log.json ADDED
The diff for this file is too large to render. See raw diff