PyTorch
English
delulu
custom_code
massabaali committed on
Commit
4c3bfb9
·
verified ·
1 Parent(s): a4a60fd

Upload config.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.json +32 -10
config.json CHANGED
@@ -1,13 +1,39 @@
1
  {
2
  "model_type": "delulu",
3
- "architectures": ["DELULUModel"],
 
 
4
  "auto_map": {
5
  "AutoConfig": "configuration_delulu.DELULUConfig",
6
  "AutoModel": "modeling_delulu.DELULUModel"
7
  },
8
- "conv_dim": [512, 512, 512, 512, 512, 512, 512],
9
- "conv_kernel": [10, 3, 3, 3, 3, 2, 2],
10
- "conv_stride": [4, 2, 2, 2, 2, 2, 2],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  "conv_bias": false,
12
  "extractor_mode": "group_norm",
13
  "hidden_size": 768,
@@ -18,7 +44,7 @@
18
  "attention_dropout": 0.1,
19
  "final_dropout": 0.1,
20
  "feat_proj_dropout": 0.1,
21
- "layer_norm_eps": 1e-5,
22
  "layer_drop": 0.05,
23
  "num_conv_pos_embeddings": 128,
24
  "num_conv_pos_embedding_groups": 16,
@@ -27,9 +53,5 @@
27
  "num_clusters": 256,
28
  "feature_type": "redimnet",
29
  "num_feat_extract_layers": 7,
30
- "pad_token_id": 0,
31
- "bos_token_id": 1,
32
- "eos_token_id": 2,
33
- "transformers_version": "4.36.0",
34
  "torch_dtype": "float32"
35
- }
 
1
  {
2
  "model_type": "delulu",
3
+ "architectures": [
4
+ "DELULUModel"
5
+ ],
6
  "auto_map": {
7
  "AutoConfig": "configuration_delulu.DELULUConfig",
8
  "AutoModel": "modeling_delulu.DELULUModel"
9
  },
10
+ "conv_dim": [
11
+ 512,
12
+ 512,
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512
18
+ ],
19
+ "conv_kernel": [
20
+ 10,
21
+ 3,
22
+ 3,
23
+ 3,
24
+ 3,
25
+ 2,
26
+ 2
27
+ ],
28
+ "conv_stride": [
29
+ 4,
30
+ 2,
31
+ 2,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2
36
+ ],
37
  "conv_bias": false,
38
  "extractor_mode": "group_norm",
39
  "hidden_size": 768,
 
44
  "attention_dropout": 0.1,
45
  "final_dropout": 0.1,
46
  "feat_proj_dropout": 0.1,
47
+ "layer_norm_eps": 1e-05,
48
  "layer_drop": 0.05,
49
  "num_conv_pos_embeddings": 128,
50
  "num_conv_pos_embedding_groups": 16,
 
53
  "num_clusters": 256,
54
  "feature_type": "redimnet",
55
  "num_feat_extract_layers": 7,
 
 
 
 
56
  "torch_dtype": "float32"
57
+ }