aixk committed on
Commit
1f5e8dc
·
verified ·
1 Parent(s): fbce39c

update slot resume pointers for step 45

Browse files
slots/0/checkpoint-42/config.json DELETED
@@ -1,36 +0,0 @@
1
- {
2
- "architectures": [
3
- "LlamaForCausalLM"
4
- ],
5
- "attention_bias": false,
6
- "attention_dropout": 0.0,
7
- "bos_token_id": 1,
8
- "dtype": "float32",
9
- "eos_token_id": 2,
10
- "head_dim": 64,
11
- "hidden_act": "silu",
12
- "hidden_dropout": 0.0,
13
- "hidden_size": 960,
14
- "initializer_range": 0.02,
15
- "intermediate_size": 2560,
16
- "max_position_embeddings": 1024,
17
- "mlp_bias": false,
18
- "model_type": "llama",
19
- "neftune_alpha": 0.0,
20
- "num_attention_heads": 15,
21
- "num_hidden_layers": 34,
22
- "num_key_value_heads": 5,
23
- "pad_token_id": null,
24
- "pretraining_tp": 1,
25
- "qk_norm": true,
26
- "rezero_init": 1.0,
27
- "rms_norm_eps": 1e-06,
28
- "rope_parameters": {
29
- "rope_theta": 100000.0,
30
- "rope_type": "default"
31
- },
32
- "tie_word_embeddings": false,
33
- "transformers_version": "5.0.0",
34
- "use_cache": false,
35
- "vocab_size": 49152
36
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
slots/0/checkpoint-42/generation_config.json DELETED
@@ -1,9 +0,0 @@
1
- {
2
- "_from_model_config": true,
3
- "bos_token_id": 1,
4
- "eos_token_id": 2,
5
- "output_attentions": false,
6
- "output_hidden_states": false,
7
- "transformers_version": "5.0.0",
8
- "use_cache": false
9
- }
 
 
 
 
 
 
 
 
 
 
slots/0/checkpoint-42/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ea1ff2e568f9dcaed3fc5c55262d03e77f149db0723475a721ec256dfc493e2
3
- size 1714721544
 
 
 
 
slots/0/checkpoint-42/optimizer.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:9ea99e421d4a4f28e9c713137c202fededfb61902826551a78447f79fd36e768
3
- size 175903435
 
 
 
 
slots/0/checkpoint-42/scaler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:73724ecbb293c433e222e4ddd1118f0e5a681c1a3d5f69c3dce9929e331ed56a
3
- size 1383
 
 
 
 
slots/0/checkpoint-42/scheduler.pt DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:635ca6592eeca73857d83634649bd4b0175d13502975eda520dd7e1d931f902d
3
- size 1465
 
 
 
 
slots/0/checkpoint-42/trainer_state.json DELETED
@@ -1,55 +0,0 @@
1
- {
2
- "best_global_step": null,
3
- "best_metric": null,
4
- "best_model_checkpoint": null,
5
- "epoch": 0.49203734211971445,
6
- "eval_steps": 500,
7
- "global_step": 42,
8
- "is_hyper_param_search": false,
9
- "is_local_process_zero": true,
10
- "is_world_process_zero": true,
11
- "log_history": [
12
- {
13
- "epoch": 0.003905296558457408,
14
- "grad_norm": 2.961405038833618,
15
- "learning_rate": 5e-05,
16
- "loss": 11.042926788330078,
17
- "step": 1
18
- },
19
- {
20
- "epoch": 0.07810593116914816,
21
- "grad_norm": 2.913111925125122,
22
- "learning_rate": 4.994503670730125e-05,
23
- "loss": 10.412632992393092,
24
- "step": 20
25
- },
26
- {
27
- "epoch": 0.4686069924949661,
28
- "grad_norm": 3.2043919563293457,
29
- "learning_rate": 4.795731611254473e-05,
30
- "loss": 8.956547207302517,
31
- "step": 40
32
- }
33
- ],
34
- "logging_steps": 20,
35
- "max_steps": 301,
36
- "num_input_tokens_seen": 0,
37
- "num_train_epochs": 4,
38
- "save_steps": 1000000000,
39
- "stateful_callbacks": {
40
- "TrainerControl": {
41
- "args": {
42
- "should_epoch_stop": false,
43
- "should_evaluate": false,
44
- "should_log": false,
45
- "should_save": true,
46
- "should_training_stop": false
47
- },
48
- "attributes": {}
49
- }
50
- },
51
- "total_flos": 1.260052958674944e+16,
52
- "train_batch_size": 1,
53
- "trial_name": null,
54
- "trial_params": null
55
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
slots/0/checkpoint-42/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e69ada62714d958c25cca51829f8ea6cdd265294d59777b45e1eca279f136098
3
- size 5201
 
 
 
 
slots/0/latest.json CHANGED
@@ -1 +1 @@
1
- {"worker_id": "slot:0", "checkpoint": "slots/0/checkpoint-42", "step": 42, "updated_at": 1776838127}
 
1
+ {"worker_id": "slot:0", "checkpoint": "slots/0/checkpoint-45", "step": 45, "updated_at": 1776843653}