Basma2423 commited on
Commit
013610d
·
verified ·
1 Parent(s): d874c8b

Training in progress, step 3342

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:460494fca0f4acea2091375e6de05c014dcf0bfb165313b31bb5e67f778c2fd7
3
  size 558937304
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7fdb2b53096835a5a02597fbcbbb8b279b8398b05f1bdb4f9983b9ef5737b1fe
3
  size 558937304
runs/Apr27_12-02-54_ip-10-192-12-76/events.out.tfevents.1745755375.ip-10-192-12-76.2375.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2dce00904eb8a9eb57a26917dfd445c1295c0016e266de1444f683965cf0bb
3
+ size 6679
trainer_state.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "best_global_step": 2228,
3
- "best_metric": 0.7726060406484112,
4
- "best_model_checkpoint": "./checkpoints/checkpoint-2228",
5
- "epoch": 0.39987436622246153,
6
  "eval_steps": 1114,
7
- "global_step": 2228,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -54,6 +54,29 @@
54
  "eval_samples_per_second": 405.3,
55
  "eval_steps_per_second": 1.057,
56
  "step": 2228
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  }
58
  ],
59
  "logging_steps": 500,
@@ -73,7 +96,7 @@
73
  "attributes": {}
74
  }
75
  },
76
- "total_flos": 2.608386971617198e+17,
77
  "train_batch_size": 384,
78
  "trial_name": null,
79
  "trial_params": null
 
1
  {
2
+ "best_global_step": 3342,
3
+ "best_metric": 0.7720533296293449,
4
+ "best_model_checkpoint": "./checkpoints/checkpoint-3342",
5
+ "epoch": 0.5998115493336923,
6
  "eval_steps": 1114,
7
+ "global_step": 3342,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
54
  "eval_samples_per_second": 405.3,
55
  "eval_steps_per_second": 1.057,
56
  "step": 2228
57
+ },
58
+ {
59
+ "epoch": 0.44869206263741196,
60
+ "grad_norm": 0.04356146231293678,
61
+ "learning_rate": 4.970863550514242e-05,
62
+ "loss": 0.0398,
63
+ "step": 2500
64
+ },
65
+ {
66
+ "epoch": 0.5384304751648943,
67
+ "grad_norm": 0.03718848526477814,
68
+ "learning_rate": 4.767405209364289e-05,
69
+ "loss": 0.0348,
70
+ "step": 3000
71
+ },
72
+ {
73
+ "epoch": 0.5998115493336923,
74
+ "eval_cer": 0.7720533296293449,
75
+ "eval_loss": 0.022723019123077393,
76
+ "eval_runtime": 439.0491,
77
+ "eval_samples_per_second": 403.306,
78
+ "eval_steps_per_second": 1.052,
79
+ "step": 3342
80
  }
81
  ],
82
  "logging_steps": 500,
 
96
  "attributes": {}
97
  }
98
  },
99
+ "total_flos": 3.912580457425797e+17,
100
  "train_batch_size": 384,
101
  "trial_name": null,
102
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d196aaedfdfd5bf4cdd22a7af058a95539d2d015355bfb0a175769535634028
3
- size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bce4c2a570e5406234205443c86622d09135dc71fc8963eb2e85ed7f5af2b7c
3
+ size 5841