pelossof committed on
Commit
32bfe2a
·
1 Parent(s): cc05f28

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,25 +1,25 @@
1
  {
2
- "_name_or_path": "microsoft/deberta-v3-xsmall",
3
  "architectures": [
4
  "DebertaV2ForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
- "hidden_size": 384,
10
  "initializer_range": 0.02,
11
- "intermediate_size": 1536,
12
  "layer_norm_eps": 1e-07,
13
  "max_position_embeddings": 512,
14
  "max_relative_positions": -1,
15
  "model_type": "deberta-v2",
16
  "norm_rel_ebd": "layer_norm",
17
- "num_attention_heads": 6,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
20
  "pooler_dropout": 0,
21
  "pooler_hidden_act": "gelu",
22
- "pooler_hidden_size": 384,
23
  "pos_att_type": [
24
  "p2c",
25
  "c2p"
 
1
  {
2
+ "_name_or_path": "microsoft/deberta-v3-base",
3
  "architectures": [
4
  "DebertaV2ForMaskedLM"
5
  ],
6
  "attention_probs_dropout_prob": 0.1,
7
  "hidden_act": "gelu",
8
  "hidden_dropout_prob": 0.1,
9
+ "hidden_size": 768,
10
  "initializer_range": 0.02,
11
+ "intermediate_size": 3072,
12
  "layer_norm_eps": 1e-07,
13
  "max_position_embeddings": 512,
14
  "max_relative_positions": -1,
15
  "model_type": "deberta-v2",
16
  "norm_rel_ebd": "layer_norm",
17
+ "num_attention_heads": 12,
18
  "num_hidden_layers": 12,
19
  "pad_token_id": 0,
20
  "pooler_dropout": 0,
21
  "pooler_hidden_act": "gelu",
22
+ "pooler_hidden_size": 768,
23
  "pos_att_type": [
24
  "p2c",
25
  "c2p"
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:adca21531de52ba1622a8208366290326b1b08e9635e560c29c59041dd000c22
3
- size 283860016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aae86d32a9f0b6c1dea2ae74395163f52d7c9f5daccfdb2384bd9db40d20dddf
3
+ size 738231856
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b8843fd60452b2ee77050a224e132fba9e3f23d97e3fab65f26b6ed69f8dd70
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:075ae1fbccd329b3e256a3e7c66c8ecde732bae31e872953b8f24b031f0856a6
3
  size 4600