makifcevik committed on
Commit
e57771b
·
verified ·
1 Parent(s): b1a6c8e

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-7/config.json CHANGED
@@ -1,33 +1,41 @@
1
  {
2
  "architectures": [
3
- "BertForSequenceClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
 
6
  "classifier_dropout": null,
7
- "hidden_act": "gelu",
8
- "hidden_dropout_prob": 0.1,
9
- "hidden_size": 128,
 
10
  "id2label": {
11
  "LABEL_0": "negative",
12
  "LABEL_1": "positive"
13
  },
14
  "initializer_range": 0.02,
15
  "intermediate_size": 512,
 
 
16
  "label2id": {
17
  "negative": 0,
18
  "positive": 1
19
  },
20
  "layer_norm_eps": 1e-12,
21
  "max_position_embeddings": 512,
22
- "model_type": "bert",
23
- "num_attention_heads": 2,
24
- "num_hidden_layers": 2,
 
 
25
  "pad_token_id": 0,
26
- "position_embedding_type": "absolute",
27
  "problem_type": "single_label_classification",
28
  "torch_dtype": "float32",
29
  "transformers_version": "4.51.3",
 
 
30
  "type_vocab_size": 2,
31
- "use_cache": true,
 
32
  "vocab_size": 30522
33
  }
 
1
  {
2
  "architectures": [
3
+ "MobileBertForSequenceClassification"
4
  ],
5
  "attention_probs_dropout_prob": 0.1,
6
+ "classifier_activation": false,
7
  "classifier_dropout": null,
8
+ "embedding_size": 128,
9
+ "hidden_act": "relu",
10
+ "hidden_dropout_prob": 0.0,
11
+ "hidden_size": 512,
12
  "id2label": {
13
  "LABEL_0": "negative",
14
  "LABEL_1": "positive"
15
  },
16
  "initializer_range": 0.02,
17
  "intermediate_size": 512,
18
+ "intra_bottleneck_size": 128,
19
+ "key_query_shared_bottleneck": true,
20
  "label2id": {
21
  "negative": 0,
22
  "positive": 1
23
  },
24
  "layer_norm_eps": 1e-12,
25
  "max_position_embeddings": 512,
26
+ "model_type": "mobilebert",
27
+ "normalization_type": "no_norm",
28
+ "num_attention_heads": 4,
29
+ "num_feedforward_networks": 4,
30
+ "num_hidden_layers": 24,
31
  "pad_token_id": 0,
 
32
  "problem_type": "single_label_classification",
33
  "torch_dtype": "float32",
34
  "transformers_version": "4.51.3",
35
+ "trigram_input": true,
36
+ "true_hidden_size": 128,
37
  "type_vocab_size": 2,
38
+ "use_bottleneck": true,
39
+ "use_bottleneck_attention": false,
40
  "vocab_size": 30522
41
  }
checkpoint-7/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0053fef86ddfa093cdaccc6931a3dc51c243ed13d68523fc4d065afc87ab1604
3
- size 17549312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf83bce81e36c9be6ce3c489f440f7b2626836074b1f7b6963213bc7ebfabc36
3
+ size 98470112
checkpoint-7/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a287d2025c941c456eac19e5cbb1c2227ecbce1472440672dc1d742c82c83eb
3
- size 35123898
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcc0e7bf2ca72f2e8202e1b7f034ddd4a86824ada12c4deddcc567b259edefac
3
+ size 197593757
checkpoint-7/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f42508f1fa811c01793b47e142274e8086f1d7bcec910eff64443ea1ee4491a6
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85d6eca64aa942b1fb6242ccacdb356b249b16a5213116b7a463df59ba8a0592
3
  size 14244
checkpoint-7/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 7,
3
- "best_metric": 0.30054421768707484,
4
  "best_model_checkpoint": "./results\\checkpoint-7",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
@@ -11,12 +11,12 @@
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
- "eval_accuracy": 0.47,
15
- "eval_f1": 0.30054421768707484,
16
- "eval_loss": 0.7224627733230591,
17
- "eval_runtime": 0.1369,
18
- "eval_samples_per_second": 730.665,
19
- "eval_steps_per_second": 51.147,
20
  "step": 7
21
  }
22
  ],
@@ -37,7 +37,7 @@
37
  "attributes": {}
38
  }
39
  },
40
- "total_flos": 127048704000.0,
41
  "train_batch_size": 16,
42
  "trial_name": null,
43
  "trial_params": null
 
1
  {
2
  "best_global_step": 7,
3
+ "best_metric": 0.3671895424836601,
4
  "best_model_checkpoint": "./results\\checkpoint-7",
5
  "epoch": 1.0,
6
  "eval_steps": 500,
 
11
  "log_history": [
12
  {
13
  "epoch": 1.0,
14
+ "eval_accuracy": 0.53,
15
+ "eval_f1": 0.3671895424836601,
16
+ "eval_loss": 390876.71875,
17
+ "eval_runtime": 2.5345,
18
+ "eval_samples_per_second": 39.456,
19
+ "eval_steps_per_second": 2.762,
20
  "step": 7
21
  }
22
  ],
 
37
  "attributes": {}
38
  }
39
  },
40
+ "total_flos": 6270852096000.0,
41
  "train_batch_size": 16,
42
  "trial_name": null,
43
  "trial_params": null
checkpoint-7/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9bda51bd81b8a1c7f9c3de07b155661dcbc50fd649940b4dedccc037a1028b31
3
  size 5304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab0605f9ed33d05f165c2819fb33ed3f1442d423c372f77031105ed68bd9dbbb
3
  size 5304