wygbb committed
Commit 9bca9c6 · verified · 1 Parent(s): 9ceab5a

Delete configuration_baichuan.py

Files changed (1)
  1. configuration_baichuan.py +0 -46
configuration_baichuan.py DELETED
@@ -1,46 +0,0 @@
- # Copyright (c) 2023, Baichuan Intelligent Technology. All rights reserved.
-
- from transformers.configuration_utils import PretrainedConfig
-
- class BaichuanConfig(PretrainedConfig):
-     model_type = "baichuan"
-     keys_to_ignore_at_inference = ["past_key_values"]
-
-     def __init__(
-         self,
-         vocab_size=64000,
-         hidden_size=5120,
-         intermediate_size=13696,
-         num_hidden_layers=40,
-         num_attention_heads=40,
-         hidden_act="silu",
-         model_max_length=4096,
-         initializer_range=0.02,
-         rms_norm_eps=1e-6,
-         use_cache=True,
-         pad_token_id=0,
-         bos_token_id=1,
-         eos_token_id=2,
-         tie_word_embeddings=False,
-         gradient_checkpointing=False,
-         **kwargs,
-     ):
-         self.vocab_size = vocab_size
-         self.model_max_length = model_max_length
-         self.hidden_size = hidden_size
-         self.intermediate_size = intermediate_size
-         self.num_hidden_layers = num_hidden_layers
-         self.num_attention_heads = num_attention_heads
-         self.hidden_act = hidden_act
-         self.initializer_range = initializer_range
-         self.rms_norm_eps = rms_norm_eps
-         self.use_cache = use_cache
-         self.gradient_checkpointing = gradient_checkpointing,
-         super().__init__(
-             pad_token_id=pad_token_id,
-             bos_token_id=bos_token_id,
-             eos_token_id=eos_token_id,
-             tie_word_embeddings=tie_word_embeddings,
-             **kwargs,
-         )
-
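For reference, the deleted file defines the kind of custom configuration class that transformers imports from a model repository when loading with trust_remote_code=True. Below is a minimal usage sketch of that pattern, not part of this commit; the repository id is an assumption chosen only for illustration (any repo that still ships configuration_baichuan.py and references it from its config.json would behave the same way).

from transformers import AutoConfig

# Hypothetical example repo; substitute one that still ships configuration_baichuan.py.
config = AutoConfig.from_pretrained(
    "baichuan-inc/Baichuan-13B-Chat",
    trust_remote_code=True,  # allows transformers to import the custom BaichuanConfig class
)
print(config.model_type)   # expected: "baichuan"
print(config.hidden_size)  # 5120 with the defaults shown in the deleted file above

After this deletion, loading from this repository with trust_remote_code would no longer find the custom class here, so the configuration has to come from whatever replaces it (for example a built-in transformers config or another remote-code file).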