LisaMegaWatts committed on
Commit
22300e2
·
verified ·
1 Parent(s): db000de

Compression metadata and results

Browse files
Files changed (1) hide show
  1. compression_metadata.json +59 -0
compression_metadata.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "method": "downscaling_projection",
3
+ "source_model": "LisaMegaWatts/JuliaSLM",
4
+ "source_params": 5037312,
5
+ "source_loss": 3.552281068317482,
6
+ "best_config": "A-3M",
7
+ "finetune_steps": 2000,
8
+ "finetune_lr": 0.0006,
9
+ "configs": {
10
+ "A-3M": {
11
+ "config": {
12
+ "d_model": 192,
13
+ "n_layers": 6,
14
+ "n_heads": 3,
15
+ "head_dim": 64,
16
+ "ffn_inner": 480,
17
+ "context_length": 256,
18
+ "vocab_size": 2000
19
+ },
20
+ "params": 2930112,
21
+ "reduction": 0.41831834121055034,
22
+ "pre_finetune_loss": 6.9663840472007115,
23
+ "post_finetune_loss": 3.9081690383949335,
24
+ "post_finetune_ppl": 49.8076724983192
25
+ },
26
+ "B-2.5M": {
27
+ "config": {
28
+ "d_model": 192,
29
+ "n_layers": 5,
30
+ "n_heads": 3,
31
+ "head_dim": 64,
32
+ "ffn_inner": 480,
33
+ "context_length": 256,
34
+ "vocab_size": 2000
35
+ },
36
+ "params": 2505792,
37
+ "reduction": 0.5025537429486202,
38
+ "pre_finetune_loss": 7.5051396219378885,
39
+ "post_finetune_loss": 3.9149324556950593,
40
+ "post_finetune_ppl": 50.14568434125149
41
+ },
42
+ "C-2M": {
43
+ "config": {
44
+ "d_model": 192,
45
+ "n_layers": 4,
46
+ "n_heads": 3,
47
+ "head_dim": 64,
48
+ "ffn_inner": 480,
49
+ "context_length": 256,
50
+ "vocab_size": 2000
51
+ },
52
+ "params": 2081472,
53
+ "reduction": 0.58678914468669,
54
+ "pre_finetune_loss": 8.09140216928519,
55
+ "post_finetune_loss": 3.9662209947702864,
56
+ "post_finetune_ppl": 52.78467987729236
57
+ }
58
+ }
59
+ }