SaitejaJate committed on
Commit
4485604
·
verified ·
1 Parent(s): 88b8fd6

Delete checkpoint-200

Browse files
checkpoint-200/config.json DELETED
@@ -1,25 +0,0 @@
1
- {
2
- "_name_or_path": "distilbert-base-uncased",
3
- "activation": "gelu",
4
- "architectures": [
5
- "DistilBertForSequenceClassification"
6
- ],
7
- "attention_dropout": 0.1,
8
- "dim": 768,
9
- "dropout": 0.1,
10
- "hidden_dim": 3072,
11
- "initializer_range": 0.02,
12
- "max_position_embeddings": 512,
13
- "model_type": "distilbert",
14
- "n_heads": 12,
15
- "n_layers": 6,
16
- "pad_token_id": 0,
17
- "problem_type": "single_label_classification",
18
- "qa_dropout": 0.1,
19
- "seq_classif_dropout": 0.2,
20
- "sinusoidal_pos_embds": false,
21
- "tie_weights_": true,
22
- "torch_dtype": "float32",
23
- "transformers_version": "4.49.0",
24
- "vocab_size": 30522
25
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-200/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ba1ed4009db0f14fe96f723225588f2732128715085903a163691ad19d1183e
3
- size 267832560
 
 
 
 
checkpoint-200/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:78129a9bf914880b817b2e7d52fc1084f4990cee96d77884966a0d07f850171d
3
- size 535724410
 
 
 
 
checkpoint-200/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b182573f61d8bcf5eaefcbf8f98d8734b6db51b44ad36aed3a305c431539fa1
3
- size 13990
 
 
 
 
checkpoint-200/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d3604dd67acb2c38b76741c9250cef6941c411bc49a9218ce93c4bfef9ecf1d
3
- size 1064
 
 
 
 
checkpoint-200/trainer_state.json DELETED
@@ -1,70 +0,0 @@
1
- {
2
- "best_metric": 0.9941434846266471,
3
- "best_model_checkpoint": "./cbt_classifier/checkpoint-200",
4
- "epoch": 0.6700167504187605,
5
- "eval_steps": 200,
6
- "global_step": 200,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.16750418760469013,
13
- "grad_norm": 0.858985424041748,
14
- "learning_rate": 2.5e-05,
15
- "loss": 0.5097,
16
- "step": 50
17
- },
18
- {
19
- "epoch": 0.33500837520938026,
20
- "grad_norm": 2.54575777053833,
21
- "learning_rate": 5e-05,
22
- "loss": 0.0863,
23
- "step": 100
24
- },
25
- {
26
- "epoch": 0.5025125628140703,
27
- "grad_norm": 38.31464767456055,
28
- "learning_rate": 4.495967741935484e-05,
29
- "loss": 0.0248,
30
- "step": 150
31
- },
32
- {
33
- "epoch": 0.6700167504187605,
34
- "grad_norm": 0.0192014928907156,
35
- "learning_rate": 3.991935483870968e-05,
36
- "loss": 0.0322,
37
- "step": 200
38
- },
39
- {
40
- "epoch": 0.6700167504187605,
41
- "eval_accuracy": 0.9941434846266471,
42
- "eval_loss": 0.023075200617313385,
43
- "eval_runtime": 7.8942,
44
- "eval_samples_per_second": 86.519,
45
- "eval_steps_per_second": 10.894,
46
- "step": 200
47
- }
48
- ],
49
- "logging_steps": 50,
50
- "max_steps": 596,
51
- "num_input_tokens_seen": 0,
52
- "num_train_epochs": 2,
53
- "save_steps": 200,
54
- "stateful_callbacks": {
55
- "TrainerControl": {
56
- "args": {
57
- "should_epoch_stop": false,
58
- "should_evaluate": false,
59
- "should_log": false,
60
- "should_save": true,
61
- "should_training_stop": false
62
- },
63
- "attributes": {}
64
- }
65
- },
66
- "total_flos": 105973918924800.0,
67
- "train_batch_size": 8,
68
- "trial_name": null,
69
- "trial_params": null
70
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
checkpoint-200/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb638b9ec3e9109a3efd288a3ca3e8f97fe303983495cc33a011258151b00099
3
- size 5240