LilPhat23 committed on
Commit
7af71be
·
verified ·
1 Parent(s): 6b714f9

Delete config.json

Browse files
Files changed (1) hide show
  1. config.json +0 -51
config.json DELETED
@@ -1,51 +0,0 @@
1
- {
2
- "architectures": [
3
- "MPTForCausalLM"
4
- ],
5
- "attn_config": {
6
- "alibi": true,
7
- "alibi_bias_max": 8,
8
- "attn_impl": "torch",
9
- "attn_pdrop": 0.0,
10
- "attn_type": "multihead_attention",
11
- "attn_uses_sequence_id": false,
12
- "clip_qkv": null,
13
- "prefix_lm": false,
14
- "qk_ln": false,
15
- "softmax_scale": null
16
- },
17
- "auto_map": {
18
- "AutoConfig": "configuration_mpt.MPTConfig",
19
- "AutoModelForCausalLM": "modeling_mpt.MPTForCausalLM"
20
- },
21
- "d_model": 3072,
22
- "emb_pdrop": 0.0,
23
- "embedding_fraction": 1.0,
24
- "expansion_ratio": 4,
25
- "init_config": {
26
- "emb_init_std": null,
27
- "emb_init_uniform_lim": null,
28
- "fan_mode": "fan_in",
29
- "init_div_is_residual": true,
30
- "init_gain": 0.0,
31
- "init_nonlinearity": "relu",
32
- "init_std": null,
33
- "name": "kaiming_normal_",
34
- "verbose": 0
35
- },
36
- "init_device": "cpu",
37
- "learned_pos_emb": true,
38
- "logit_scale": null,
39
- "max_seq_len": 8192,
40
- "model_type": "phogpt",
41
- "n_heads": 24,
42
- "n_layers": 32,
43
- "no_bias": false,
44
- "norm_type": "low_precision_layernorm",
45
- "resid_pdrop": 0.0,
46
- "torch_dtype": "bfloat16",
47
- "transformers_version": "4.30.2",
48
- "use_cache": false,
49
- "verbose": 0,
50
- "vocab_size": 20480
51
- }