ThingsAI committed on
Commit
2dfe12b
·
verified ·
1 Parent(s): f115d8d

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +11 -16
config.json CHANGED
@@ -1,8 +1,10 @@
1
  {
2
  "model_type": "quark",
3
- "architectures": [
4
- "QuarkForCausalLM"
5
- ],
 
 
6
  "vocab_size": 65537,
7
  "d_model": 576,
8
  "n_heads": 9,
@@ -12,23 +14,16 @@
12
  "head_dim": 64,
13
  "max_seq_len": 2048,
14
  "rope_theta": 10000.0,
15
- "rms_eps": 1e-05,
16
  "qkv_bias": true,
17
  "dropout": 0.0,
18
  "torch_dtype": "bfloat16",
 
19
  "sft_dataset": "MBZUAI/Bactrian-X (it+en)",
20
  "sft_steps": 4000,
21
- "sft_loss": 1.8805,
22
- "base_pretrain": "step_0030000 (15.7B tokens bilingual IT+EN)",
23
  "tokenizer": "ThingAI/QuarkTokenizer",
24
- "languages": [
25
- "it",
26
- "en"
27
- ],
28
- "special_tokens": [
29
- "<|user|>",
30
- "<|assistant|>",
31
- "<|end|>"
32
- ],
33
- "tie_word_embeddings": true
34
  }
 
1
  {
2
  "model_type": "quark",
3
+ "architectures": ["QuarkForCausalLM"],
4
+ "auto_map": {
5
+ "AutoConfig": "configuration_quark.QuarkConfig",
6
+ "AutoModelForCausalLM": "modeling_quark.QuarkForCausalLM"
7
+ },
8
  "vocab_size": 65537,
9
  "d_model": 576,
10
  "n_heads": 9,
 
14
  "head_dim": 64,
15
  "max_seq_len": 2048,
16
  "rope_theta": 10000.0,
17
+ "rms_eps": 1e-5,
18
  "qkv_bias": true,
19
  "dropout": 0.0,
20
  "torch_dtype": "bfloat16",
21
+ "tie_word_embeddings": true,
22
  "sft_dataset": "MBZUAI/Bactrian-X (it+en)",
23
  "sft_steps": 4000,
24
+ "sft_loss": 1.9,
25
+ "base_pretrain": "15.7B tokens bilingual IT+EN",
26
  "tokenizer": "ThingAI/QuarkTokenizer",
27
+ "languages": ["it", "en"],
28
+ "special_tokens": ["<|user|>", "<|assistant|>", "<|end|>"]
 
 
 
 
 
 
 
 
29
  }