jerawincel committed on
Commit
deee812
·
1 Parent(s): 31f3c0b

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46014f2aa3cf12db55160a7ed802a0aebadd99bb4acc628f96b8f3d1bc0fd0fd
3
  size 498692800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f18a9c17794dcc64794600f514a20ec18ee99383447802910963fbc3fbd74a5
3
  size 498692800
run-3/checkpoint-272/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fec49f3a0b2296e4d011156d27067cbc32d943744daa803b56c53b9ce1820e6d
3
  size 498692800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f18a9c17794dcc64794600f514a20ec18ee99383447802910963fbc3fbd74a5
3
  size 498692800
run-3/checkpoint-272/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32802688230b2cca3f9e1a0a1db0bc0970bbc4a8132be3d86b2b86d3fd76da43
3
  size 997505402
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b25566a8dc0ae19360e446f27c6cff0afae23e4afeeaa3cf14ea0e99b9857a3b
3
  size 997505402
run-3/checkpoint-272/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7627164f6a838ab6071d3af2f4c07c4ae2a8a7750ab699aa23e9b7b2754037c0
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3646b4cdcd364d917497fd74fcfe29f7162e919c3f979cdb24aebb68f1f7cf36
3
+ size 14308
run-3/checkpoint-272/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cbb06ded40b0bac91743e26822e9c4748c00cbfadf00fae5289f79eb8b9670d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79a25765cf01b8c285d64615aacbe0ee01a4e20cc23d32d1d6fed0a37344b0cc
3
  size 1064
run-3/checkpoint-272/tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 64,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 64
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 128,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 128
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
run-3/checkpoint-272/tokenizer_config.json CHANGED
@@ -49,7 +49,7 @@
49
  "eos_token": "</s>",
50
  "errors": "replace",
51
  "mask_token": "<mask>",
52
- "model_max_length": 64,
53
  "pad_token": "<pad>",
54
  "sep_token": "</s>",
55
  "tokenizer_class": "RobertaTokenizer",
 
49
  "eos_token": "</s>",
50
  "errors": "replace",
51
  "mask_token": "<mask>",
52
+ "model_max_length": 128,
53
  "pad_token": "<pad>",
54
  "sep_token": "</s>",
55
  "tokenizer_class": "RobertaTokenizer",
run-3/checkpoint-272/trainer_state.json CHANGED
@@ -11,23 +11,23 @@
11
  {
12
  "epoch": 1.0,
13
  "eval_f1": 0.0,
14
- "eval_loss": 0.2641439437866211,
15
- "eval_runtime": 7.1825,
16
- "eval_samples_per_second": 755.446,
17
- "eval_steps_per_second": 5.987,
18
  "step": 272
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 1360,
23
- "num_train_epochs": 5,
24
  "save_steps": 500,
25
  "total_flos": 0,
26
  "trial_name": null,
27
  "trial_params": {
28
- "learning_rate": 2.4573800348719033e-06,
29
- "num_train_epochs": 5,
30
- "per_device_train_batch_size": 16,
31
- "seed": 4
32
  }
33
  }
 
11
  {
12
  "epoch": 1.0,
13
  "eval_f1": 0.0,
14
+ "eval_loss": 0.15121705830097198,
15
+ "eval_runtime": 1.7687,
16
+ "eval_samples_per_second": 153.22,
17
+ "eval_steps_per_second": 1.131,
18
  "step": 272
19
  }
20
  ],
21
  "logging_steps": 500,
22
+ "max_steps": 272,
23
+ "num_train_epochs": 1,
24
  "save_steps": 500,
25
  "total_flos": 0,
26
  "trial_name": null,
27
  "trial_params": {
28
+ "learning_rate": 3.4549942125392434e-05,
29
+ "num_train_epochs": 1,
30
+ "per_device_train_batch_size": 8,
31
+ "seed": 32
32
  }
33
  }
run-3/checkpoint-272/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cedcfdbe7c29e6f37dca0518c3a22279de6ad973240451544d5c9e7a0a75ce08
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a860ef08b878fc8a841fef69af13e56850d256386ceb720646e3b321efbbe86b
3
  size 4600
runs/Dec01_22-15-05_9632749e57d1/events.out.tfevents.1701469520.9632749e57d1.10239.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65e7551c3de41ea0f263bb3bdfb4bc35cf1a3072cc23a1ef12e69a26d9dee0d7
3
+ size 6092
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8b4b571495d2d3af592eaa59e396bd9f2868fc92a95d7c44c370053edc46bc9
3
  size 4600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a860ef08b878fc8a841fef69af13e56850d256386ceb720646e3b321efbbe86b
3
  size 4600