nour4286 commited on
Commit
18ae4a2
·
verified ·
1 Parent(s): 181c39b

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-3743/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "moussakam/Arabart",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
 
1
  {
2
+ "_name_or_path": "nour4286/ArabartModel",
3
  "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
checkpoint-3743/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c2930f8ab2dd0a46858cbba04e476117ffa46128c52f9ef92c761063c84326e
3
  size 557116312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1121eefca3b4957308588e5490479bc7e5dfe0e28c12dc1ef2b264a712dea926
3
  size 557116312
checkpoint-3743/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:699a98a7a52d70ff1d86e339f4d11b9683d24fddd3cbdceea50a59f1a8b05f05
3
  size 1113991930
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b00fab32c4b4a0c7467ab865cb82f3946a88826109286f603e3643b60531efbf
3
  size 1113991930
checkpoint-3743/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:557e659df0fae2e63fc7ba4fd94075ae8b0ea2a8d60d30519b66bc17dbd7e027
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e1af3b209edf367387ccd9ba32486ff7328abe4d196775ffadc967aab340f30
3
  size 1064
checkpoint-3743/tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 128,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
checkpoint-3743/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 26.0848,
3
  "best_model_checkpoint": "/content/drive/MyDrive/checkpoint-3743",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
@@ -10,62 +10,62 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.1335826876836762,
13
- "grad_norm": 4.480758190155029,
14
- "learning_rate": 4.7773621871938735e-05,
15
- "loss": 3.8388,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.2671653753673524,
20
- "grad_norm": 4.0973663330078125,
21
- "learning_rate": 4.554724374387746e-05,
22
- "loss": 3.534,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.4007480630510286,
27
- "grad_norm": 3.4115138053894043,
28
- "learning_rate": 4.332086561581619e-05,
29
- "loss": 3.4407,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.5343307507347048,
34
- "grad_norm": 4.144280910491943,
35
- "learning_rate": 4.1094487487754926e-05,
36
- "loss": 3.3758,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.667913438418381,
41
- "grad_norm": 4.332496643066406,
42
- "learning_rate": 3.886810935969365e-05,
43
- "loss": 3.3258,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.8014961261020572,
48
- "grad_norm": 3.689181089401245,
49
- "learning_rate": 3.6641731231632384e-05,
50
- "loss": 3.2834,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.9350788137857333,
55
- "grad_norm": 3.1737449169158936,
56
- "learning_rate": 3.441535310357111e-05,
57
- "loss": 3.2471,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 1.0,
62
- "eval_loss": 2.7515902519226074,
63
- "eval_rouge1": 26.0848,
64
- "eval_rouge2": 12.3268,
65
- "eval_rougeL": 23.6134,
66
- "eval_runtime": 766.0717,
67
- "eval_samples_per_second": 6.121,
68
- "eval_steps_per_second": 0.612,
69
  "step": 3743
70
  }
71
  ],
 
1
  {
2
+ "best_metric": 26.9521,
3
  "best_model_checkpoint": "/content/drive/MyDrive/checkpoint-3743",
4
  "epoch": 1.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.1335826876836762,
13
+ "grad_norm": 4.5242133140563965,
14
+ "learning_rate": 5e-05,
15
+ "loss": 3.2029,
16
  "step": 500
17
  },
18
  {
19
  "epoch": 0.2671653753673524,
20
+ "grad_norm": 4.41894006729126,
21
+ "learning_rate": 4.766986671637618e-05,
22
+ "loss": 2.8643,
23
  "step": 1000
24
  },
25
  {
26
  "epoch": 0.4007480630510286,
27
+ "grad_norm": 4.079468250274658,
28
+ "learning_rate": 4.533973343275236e-05,
29
+ "loss": 2.7844,
30
  "step": 1500
31
  },
32
  {
33
  "epoch": 0.5343307507347048,
34
+ "grad_norm": 3.858260154724121,
35
+ "learning_rate": 4.3009600149128535e-05,
36
+ "loss": 2.7501,
37
  "step": 2000
38
  },
39
  {
40
  "epoch": 0.667913438418381,
41
+ "grad_norm": 4.262380599975586,
42
+ "learning_rate": 4.0679466865504706e-05,
43
+ "loss": 2.6947,
44
  "step": 2500
45
  },
46
  {
47
  "epoch": 0.8014961261020572,
48
+ "grad_norm": 4.304072856903076,
49
+ "learning_rate": 3.834933358188088e-05,
50
+ "loss": 2.6785,
51
  "step": 3000
52
  },
53
  {
54
  "epoch": 0.9350788137857333,
55
+ "grad_norm": 3.803712844848633,
56
+ "learning_rate": 3.601920029825706e-05,
57
+ "loss": 2.6409,
58
  "step": 3500
59
  },
60
  {
61
  "epoch": 1.0,
62
+ "eval_loss": 2.9351165294647217,
63
+ "eval_rouge1": 26.9521,
64
+ "eval_rouge2": 12.8371,
65
+ "eval_rougeL": 24.3565,
66
+ "eval_runtime": 736.5698,
67
+ "eval_samples_per_second": 6.366,
68
+ "eval_steps_per_second": 0.637,
69
  "step": 3743
70
  }
71
  ],
checkpoint-3743/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d05d32a13e629e372fd63a6a56914009e5a295d344b7df97bfa8a0480ad14ed0
3
  size 7032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc12377bc5c5e926d6591071c08141a1e803bbd801c62b57f2957c80f9609e63
3
  size 7032