k4black committed on
Commit
fc5d5ac
·
1 Parent(s): c393379

Model save

Browse files
last-checkpoint/config.json DELETED
@@ -1,33 +0,0 @@
1
- {
2
- "_name_or_path": "albert-base-v2",
3
- "architectures": [
4
- "AlbertForMaskedLM"
5
- ],
6
- "attention_probs_dropout_prob": 0,
7
- "bos_token_id": 2,
8
- "classifier_dropout_prob": 0.1,
9
- "down_scale_factor": 1,
10
- "embedding_size": 128,
11
- "eos_token_id": 3,
12
- "gap_size": 0,
13
- "hidden_act": "gelu_new",
14
- "hidden_dropout_prob": 0,
15
- "hidden_size": 768,
16
- "initializer_range": 0.02,
17
- "inner_group_num": 1,
18
- "intermediate_size": 3072,
19
- "layer_norm_eps": 1e-12,
20
- "max_position_embeddings": 512,
21
- "model_type": "albert",
22
- "net_structure_type": 0,
23
- "num_attention_heads": 12,
24
- "num_hidden_groups": 1,
25
- "num_hidden_layers": 12,
26
- "num_memory_blocks": 0,
27
- "pad_token_id": 0,
28
- "position_embedding_type": "absolute",
29
- "torch_dtype": "float32",
30
- "transformers_version": "4.23.1",
31
- "type_vocab_size": 2,
32
- "vocab_size": 30000
33
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0496b32513d75c8f410f18a7a7693cc1ca92ebccc07b0fb87b51fa3458bc31d6
3
- size 89789873
 
 
 
 
last-checkpoint/pytorch_model.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6b18a485539c6ced214f6f282b8a356c27c3f08b89cb37a05d973ed814d0b4e
3
- size 44900936
 
 
 
 
last-checkpoint/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:cde37b1d59ec8275aa116b67c6503ca997bd9a90886b106af365cbb8dfef4db9
3
- size 14575
 
 
 
 
last-checkpoint/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a758d7f80645ca7b6df48d736de4036b46f37bd0ee72c0a8f5b7db555d7202d4
3
- size 557
 
 
 
 
last-checkpoint/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3297467e71d3fc7db550ac11668566984d0914e69787cecd311b029149f474e3
3
- size 627
 
 
 
 
last-checkpoint/special_tokens_map.json DELETED
@@ -1,15 +0,0 @@
1
- {
2
- "bos_token": "[CLS]",
3
- "cls_token": "[CLS]",
4
- "eos_token": "[SEP]",
5
- "mask_token": {
6
- "content": "[MASK]",
7
- "lstrip": true,
8
- "normalized": false,
9
- "rstrip": false,
10
- "single_word": false
11
- },
12
- "pad_token": "<pad>",
13
- "sep_token": "[SEP]",
14
- "unk_token": "<unk>"
15
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/spiece.model DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fefb02b667a6c5c2fe27602d28e5fb3428f66ab89c7d6f388e7c8d44a02d0336
3
- size 760289
 
 
 
 
last-checkpoint/tokenizer.json DELETED
The diff for this file is too large to render. See raw diff
 
last-checkpoint/tokenizer_config.json DELETED
@@ -1,23 +0,0 @@
1
- {
2
- "bos_token": "[CLS]",
3
- "cls_token": "[CLS]",
4
- "do_lower_case": true,
5
- "eos_token": "[SEP]",
6
- "keep_accents": false,
7
- "mask_token": {
8
- "__type": "AddedToken",
9
- "content": "[MASK]",
10
- "lstrip": true,
11
- "normalized": false,
12
- "rstrip": false,
13
- "single_word": false
14
- },
15
- "model_max_length": 512,
16
- "name_or_path": "albert-base-v2",
17
- "pad_token": "<pad>",
18
- "remove_space": true,
19
- "sep_token": "[SEP]",
20
- "special_tokens_map_file": null,
21
- "tokenizer_class": "AlbertTokenizer",
22
- "unk_token": "<unk>"
23
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/trainer_state.json DELETED
@@ -1,86 +0,0 @@
1
- {
2
- "best_metric": 0.000184760894626379,
3
- "best_model_checkpoint": "./albert-results/checkpoint-500",
4
- "epoch": 0.32679738562091504,
5
- "global_step": 500,
6
- "is_hyper_param_search": false,
7
- "is_local_process_zero": true,
8
- "is_world_process_zero": true,
9
- "log_history": [
10
- {
11
- "epoch": 0.07,
12
- "learning_rate": 1.9925653594771244e-05,
13
- "loss": 3.3585,
14
- "step": 100
15
- },
16
- {
17
- "epoch": 0.07,
18
- "eval_loss": 0.14794819056987762,
19
- "eval_runtime": 16.5325,
20
- "eval_samples_per_second": 60.487,
21
- "eval_steps_per_second": 1.936,
22
- "step": 100
23
- },
24
- {
25
- "epoch": 0.13,
26
- "learning_rate": 1.9843954248366014e-05,
27
- "loss": 0.0929,
28
- "step": 200
29
- },
30
- {
31
- "epoch": 0.13,
32
- "eval_loss": 0.0728602185845375,
33
- "eval_runtime": 16.8991,
34
- "eval_samples_per_second": 59.175,
35
- "eval_steps_per_second": 1.894,
36
- "step": 200
37
- },
38
- {
39
- "epoch": 0.2,
40
- "learning_rate": 1.9762254901960787e-05,
41
- "loss": 0.0295,
42
- "step": 300
43
- },
44
- {
45
- "epoch": 0.2,
46
- "eval_loss": 0.0029316628351807594,
47
- "eval_runtime": 16.8378,
48
- "eval_samples_per_second": 59.39,
49
- "eval_steps_per_second": 1.9,
50
- "step": 300
51
- },
52
- {
53
- "epoch": 0.26,
54
- "learning_rate": 1.9680555555555557e-05,
55
- "loss": 0.0029,
56
- "step": 400
57
- },
58
- {
59
- "epoch": 0.26,
60
- "eval_loss": 0.0027500337455421686,
61
- "eval_runtime": 16.9348,
62
- "eval_samples_per_second": 59.05,
63
- "eval_steps_per_second": 1.89,
64
- "step": 400
65
- },
66
- {
67
- "epoch": 0.33,
68
- "learning_rate": 1.9598856209150327e-05,
69
- "loss": 0.0008,
70
- "step": 500
71
- },
72
- {
73
- "epoch": 0.33,
74
- "eval_loss": 0.000184760894626379,
75
- "eval_runtime": 16.883,
76
- "eval_samples_per_second": 59.231,
77
- "eval_steps_per_second": 1.895,
78
- "step": 500
79
- }
80
- ],
81
- "max_steps": 24480,
82
- "num_train_epochs": 16,
83
- "total_flos": 89897631744000.0,
84
- "trial_name": null,
85
- "trial_params": null
86
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
last-checkpoint/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:33bff3c131bd36da74e172c6d6a8e361cf13df6107f3da2909e49f51ec49a0fd
3
- size 3451
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6b18a485539c6ced214f6f282b8a356c27c3f08b89cb37a05d973ed814d0b4e
3
  size 44900936
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a246b08c8cf009af41cdc219512d6573aa6156680b27a56944baa66d4552c36c
3
  size 44900936
runs/Oct30_18-39-30_daccc72d0fea/events.out.tfevents.1667155186.daccc72d0fea.78.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a54b777c2922439609349f094c34bb405be8d44db7b023cf82fa4b4fdb4941ea
3
- size 6023
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:477b438414e2521b857e1158e474ca9901dfd08941926ddcfaf43618a87aa06f
3
+ size 6451