SodaXII committed on
Commit
bd0532a
·
verified ·
1 Parent(s): 243a08b

Model save

Browse files
README.md CHANGED
@@ -34,8 +34,8 @@ More information needed
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0003
37
- - train_batch_size: 64
38
- - eval_batch_size: 64
39
  - seed: 42
40
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
41
  - lr_scheduler_type: cosine_with_restarts
 
34
 
35
  The following hyperparameters were used during training:
36
  - learning_rate: 0.0003
37
+ - train_batch_size: 128
38
+ - eval_batch_size: 128
39
  - seed: 42
40
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
41
  - lr_scheduler_type: cosine_with_restarts
config.json CHANGED
@@ -57,6 +57,7 @@
57
  ],
58
  "patch_size": 4,
59
  "path_norm": true,
 
60
  "qkv_bias": true,
61
  "stage_names": [
62
  "stem",
 
57
  ],
58
  "patch_size": 4,
59
  "path_norm": true,
60
+ "problem_type": "single_label_classification",
61
  "qkv_bias": true,
62
  "stage_names": [
63
  "stem",
logs/events.out.tfevents.1740248341.943ca99e1f33.812.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50d7d9dcc74857039590802ccd1cc97ab45361b5a1501c87e33ba3dc58a609a6
3
- size 88
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11652482b8e3545cbbefc4f248adec4cc1105712f771b6ad18cdb574543a17b2
3
+ size 6058
logs/events.out.tfevents.1740248566.943ca99e1f33.812.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca696c031bd73372d3eefcbada800d8fa71291ae7cf91cc849cfd6fa7662017c
3
+ size 88
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26503754261fd4ee769194b7ed0db2f4e16009156e8f0275e203d29d61d0711e
3
  size 347523416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9883de3c1b05220773ab950916f65bf4fb80ee01e5cb8f0914e0df02e419822
3
  size 347523416
trainer_state.json ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 0,
5
+ "eval_steps": 500,
6
+ "global_step": 0,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [],
11
+ "logging_steps": 500,
12
+ "max_steps": 2500,
13
+ "num_input_tokens_seen": 0,
14
+ "num_train_epochs": 20,
15
+ "save_steps": 500,
16
+ "stateful_callbacks": {
17
+ "TrainerControl": {
18
+ "args": {
19
+ "should_epoch_stop": false,
20
+ "should_evaluate": false,
21
+ "should_log": false,
22
+ "should_save": false,
23
+ "should_training_stop": false
24
+ },
25
+ "attributes": {}
26
+ }
27
+ },
28
+ "total_flos": 0,
29
+ "train_batch_size": 64,
30
+ "trial_name": null,
31
+ "trial_params": null
32
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1432a45a87f78d16321d550a5eb80d944c53afb091422facf1b12e82e25c427
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2aa27d7b85cc841b9c04b978097c8a2456afee17bd48de31f3d9352e70815b48
3
  size 5496