aixk committed on
Commit
cec9b34
·
1 Parent(s): bf01a26

prune 1 old checkpoints

Browse files
slots/10/checkpoint-8/config.json DELETED
@@ -1,24 +0,0 @@
1
- {
2
- "architectures": [
3
- "TwinyForCausalLM"
4
- ],
5
- "attention_dropout": 0.0,
6
- "dtype": "float32",
7
- "hidden_dropout": 0.0,
8
- "hidden_size": 1024,
9
- "initializer_range": 0.02,
10
- "intermediate_size": 4096,
11
- "max_position_embeddings": 160,
12
- "model_type": "twiny",
13
- "neftune_alpha": 0.0,
14
- "num_attention_heads": 16,
15
- "num_hidden_layers": 16,
16
- "num_key_value_heads": 4,
17
- "qk_norm": true,
18
- "rezero_init": 1.0,
19
- "rms_norm_eps": 1e-06,
20
- "rope_theta": 10000.0,
21
- "transformers_version": "5.0.0",
22
- "use_cache": false,
23
- "vocab_size": 4352
24
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
slots/10/checkpoint-8/rng_state.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1971a7f5a4b2dbf37c7eaedcc9ddd90b7f2853c5557f35719c1a2082903b821
3
- size 14455
 
 
 
 
slots/10/checkpoint-8/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e688c2645bb5d27329e0fbc058117fd5a0ad178cc2b74ed044ab00aa4abbaee7
3
- size 1465
 
 
 
 
slots/10/checkpoint-8/trainer_state.json DELETED
@@ -1,41 +0,0 @@
1
- {
2
- "best_global_step": null,
3
- "best_metric": null,
4
- "best_model_checkpoint": null,
5
- "epoch": 0.06306661411115491,
6
- "eval_steps": 500,
7
- "global_step": 8,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.007883326763894364,
14
- "grad_norm": 48.64533615112305,
15
- "learning_rate": 5e-05,
16
- "loss": 342.7203674316406,
17
- "step": 1
18
- }
19
- ],
20
- "logging_steps": 20,
21
- "max_steps": 35,
22
- "num_input_tokens_seen": 0,
23
- "num_train_epochs": 1,
24
- "save_steps": 1000000000,
25
- "stateful_callbacks": {
26
- "TrainerControl": {
27
- "args": {
28
- "should_epoch_stop": false,
29
- "should_evaluate": false,
30
- "should_log": false,
31
- "should_save": true,
32
- "should_training_stop": false
33
- },
34
- "attributes": {}
35
- }
36
- },
37
- "total_flos": 81290974003200.0,
38
- "train_batch_size": 1,
39
- "trial_name": null,
40
- "trial_params": null
41
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
slots/10/checkpoint-8/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9dc6d9a344877db6a986f580384331fc3de64a080c896f8fe9b8f2f0f044470
3
- size 5201