File size: 383 Bytes
1a4b406
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
{
  "model_type": "sprog",
  "architecture": "seq2seq-transformer",
  "framework": "mlx",
  "d": 304,
  "n_heads": 4,
  "n_layers": 4,
  "ff": 608,
  "max_src": 220,
  "max_tgt": 64,
  "src_vocab_size": 6000,
  "tgt_vocab_size": 79,
  "n_params": 9370000,
  "task": "gsm8k-math-word-problems",
  "inference": "self-consistency (96 samples) + symbolic verifier",
  "license": "mit"
}