File size: 981 Bytes
efd2986
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
{
  "description": "FRANKENSTALLM 3B v2 sampling/generation parameters (ORPO eval grid best)",
  "default": {
    "max_new_tokens": 512,
    "temperature": 0.8,
    "top_p": 0.9,
    "do_sample": true,
    "repetition_penalty": 1.05
  },
  "recommended": {
    "comment": "ORPO repetition grid best: t0.7_rep1.2 (0% 3-gram rep, 100% EOS)",
    "temperature": 0.7,
    "repetition_penalty": 1.2,
    "top_p": 0.9,
    "max_new_tokens": 512,
    "do_sample": true
  },
  "greedy": {
    "temperature": 0.0,
    "repetition_penalty": 1.0,
    "do_sample": false,
    "max_new_tokens": 256
  },
  "ollama": {
    "comment": "Ollama Modelfile PARAMETERS or runtime options",
    "temperature": 0.7,
    "repeat_penalty": 1.2,
    "top_p": 0.9,
    "num_predict": 512
  },
  "grid_best": {
    "name": "t0.7_rep1.2",
    "temperature": 0.70,
    "repetition_penalty": 1.20,
    "top_p": 0.9,
    "3gram_rep": 0.0,
    "4gram_rep": 0.0,
    "eos_rate": 1.0,
    "avg_tokens": 189.2
  }
}