SaitejaJate commited on
Commit
c75105a
·
verified ·
1 Parent(s): 4485604

Delete checkpoint-400

Browse files
checkpoint-400/config.json DELETED
@@ -1,25 +0,0 @@
1
- {
2
- "_name_or_path": "distilbert-base-uncased",
3
- "activation": "gelu",
4
- "architectures": [
5
- "DistilBertForSequenceClassification"
6
- ],
7
- "attention_dropout": 0.1,
8
- "dim": 768,
9
- "dropout": 0.1,
10
- "hidden_dim": 3072,
11
- "initializer_range": 0.02,
12
- "max_position_embeddings": 512,
13
- "model_type": "distilbert",
14
- "n_heads": 12,
15
- "n_layers": 6,
16
- "pad_token_id": 0,
17
- "problem_type": "single_label_classification",
18
- "qa_dropout": 0.1,
19
- "seq_classif_dropout": 0.2,
20
- "sinusoidal_pos_embds": false,
21
- "tie_weights_": true,
22
- "torch_dtype": "float32",
23
- "transformers_version": "4.49.0",
24
- "vocab_size": 30522
25
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-400/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a75078d7a59b6799de31673f39d27b34af0df229c8e3941beebcec1fe94aff22
3
- size 267832560
 
 
 
 
checkpoint-400/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e861d35446023aa01f002cd372ae3f20f187ece1fbeacc408fd97f317f9b367
3
- size 535724410
 
 
 
 
checkpoint-400/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:06e55bfc8723f269a626afca0be6f7def5753f3bb265436b94c5580b703cfcc7
3
- size 13990
 
 
 
 
checkpoint-400/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6fe93f995d555235837eb9f033279025ea84b859d771a1c41c585f055a1dd1f4
3
- size 1064
 
 
 
 
checkpoint-400/trainer_state.json DELETED
@@ -1,107 +0,0 @@
1
- {
2
- "best_metric": 0.9985358711566618,
3
- "best_model_checkpoint": "./cbt_classifier/checkpoint-400",
4
- "epoch": 1.338358458961474,
5
- "eval_steps": 200,
6
- "global_step": 400,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.16750418760469013,
13
- "grad_norm": 0.858985424041748,
14
- "learning_rate": 2.5e-05,
15
- "loss": 0.5097,
16
- "step": 50
17
- },
18
- {
19
- "epoch": 0.33500837520938026,
20
- "grad_norm": 2.54575777053833,
21
- "learning_rate": 5e-05,
22
- "loss": 0.0863,
23
- "step": 100
24
- },
25
- {
26
- "epoch": 0.5025125628140703,
27
- "grad_norm": 38.31464767456055,
28
- "learning_rate": 4.495967741935484e-05,
29
- "loss": 0.0248,
30
- "step": 150
31
- },
32
- {
33
- "epoch": 0.6700167504187605,
34
- "grad_norm": 0.0192014928907156,
35
- "learning_rate": 3.991935483870968e-05,
36
- "loss": 0.0322,
37
- "step": 200
38
- },
39
- {
40
- "epoch": 0.6700167504187605,
41
- "eval_accuracy": 0.9941434846266471,
42
- "eval_loss": 0.023075200617313385,
43
- "eval_runtime": 7.8942,
44
- "eval_samples_per_second": 86.519,
45
- "eval_steps_per_second": 10.894,
46
- "step": 200
47
- },
48
- {
49
- "epoch": 0.8375209380234506,
50
- "grad_norm": 0.010706444270908833,
51
- "learning_rate": 3.487903225806452e-05,
52
- "loss": 0.0155,
53
- "step": 250
54
- },
55
- {
56
- "epoch": 1.003350083752094,
57
- "grad_norm": 0.030784547328948975,
58
- "learning_rate": 2.9838709677419357e-05,
59
- "loss": 0.0134,
60
- "step": 300
61
- },
62
- {
63
- "epoch": 1.170854271356784,
64
- "grad_norm": 0.012720568105578423,
65
- "learning_rate": 2.4798387096774196e-05,
66
- "loss": 0.015,
67
- "step": 350
68
- },
69
- {
70
- "epoch": 1.338358458961474,
71
- "grad_norm": 0.0057291556149721146,
72
- "learning_rate": 1.975806451612903e-05,
73
- "loss": 0.0028,
74
- "step": 400
75
- },
76
- {
77
- "epoch": 1.338358458961474,
78
- "eval_accuracy": 0.9985358711566618,
79
- "eval_loss": 0.003182810265570879,
80
- "eval_runtime": 7.8968,
81
- "eval_samples_per_second": 86.491,
82
- "eval_steps_per_second": 10.891,
83
- "step": 400
84
- }
85
- ],
86
- "logging_steps": 50,
87
- "max_steps": 596,
88
- "num_input_tokens_seen": 0,
89
- "num_train_epochs": 2,
90
- "save_steps": 200,
91
- "stateful_callbacks": {
92
- "TrainerControl": {
93
- "args": {
94
- "should_epoch_stop": false,
95
- "should_evaluate": false,
96
- "should_log": false,
97
- "should_save": true,
98
- "should_training_stop": false
99
- },
100
- "attributes": {}
101
- }
102
- },
103
- "total_flos": 211682903052288.0,
104
- "train_batch_size": 8,
105
- "trial_name": null,
106
- "trial_params": null
107
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-400/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb638b9ec3e9109a3efd288a3ca3e8f97fe303983495cc33a011258151b00099
3
- size 5240