sizhkhy committed on
Commit
75e85be
·
verified ·
1 Parent(s): abdeb96
adapter_config.json CHANGED
@@ -20,13 +20,13 @@
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
23
- "o_proj",
24
  "up_proj",
25
  "gate_proj",
26
- "k_proj",
27
- "q_proj",
28
  "v_proj",
29
- "down_proj"
 
 
 
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
 
20
  "rank_pattern": {},
21
  "revision": null,
22
  "target_modules": [
 
23
  "up_proj",
24
  "gate_proj",
 
 
25
  "v_proj",
26
+ "o_proj",
27
+ "down_proj",
28
+ "k_proj",
29
+ "q_proj"
30
  ],
31
  "task_type": "CAUSAL_LM",
32
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f4df28160aa2cacaeceebeac4b0ff96d4e2e2078aa9e6967cff0bfbe22f87ba
3
  size 1556140392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cf73554208b66e451d3bdaa3cf09c4c0809a22711e973fb5037e53716148ac2
3
  size 1556140392
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 0.6956521739130435,
3
- "eval_loss": 0.04214267060160637,
4
- "eval_runtime": 3.45,
5
- "eval_samples_per_second": 2.899,
6
- "eval_steps_per_second": 0.29,
7
  "total_flos": 3880733380509696.0,
8
- "train_loss": 0.029286871664226055,
9
- "train_runtime": 89.5279,
10
- "train_samples_per_second": 1.005,
11
- "train_steps_per_second": 0.022
12
  }
 
1
  {
2
  "epoch": 0.6956521739130435,
3
+ "eval_loss": 0.04213493689894676,
4
+ "eval_runtime": 3.3693,
5
+ "eval_samples_per_second": 2.968,
6
+ "eval_steps_per_second": 0.297,
7
  "total_flos": 3880733380509696.0,
8
+ "train_loss": 0.02928687445819378,
9
+ "train_runtime": 86.3619,
10
+ "train_samples_per_second": 1.042,
11
+ "train_steps_per_second": 0.023
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 0.6956521739130435,
3
- "eval_loss": 0.04214267060160637,
4
- "eval_runtime": 3.45,
5
- "eval_samples_per_second": 2.899,
6
- "eval_steps_per_second": 0.29
7
  }
 
1
  {
2
  "epoch": 0.6956521739130435,
3
+ "eval_loss": 0.04213493689894676,
4
+ "eval_runtime": 3.3693,
5
+ "eval_samples_per_second": 2.968,
6
+ "eval_steps_per_second": 0.297
7
  }
experiment.config ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ vision_config {
2
+ vision_api: TEXT_DETECTION
3
+ feature_element: WORD
4
+ word_confidence_threshold: -0.1
5
+ return_raw_response: true
6
+ }
7
+ preprocess_config {
8
+ label_overlap_threshold: 0.4
9
+ num_processes: 4
10
+ rotation_fixer: VISION_BASED_FAST
11
+ }
12
+ train_config {
13
+ num_epochs: 1
14
+ }
15
+ version: "3.0.2"
16
+ field_extraction {
17
+ sub_exp_config {
18
+ model_config {
19
+ architecture {
20
+ nova {
21
+ }
22
+ }
23
+ }
24
+ }
25
+ }
model.bin ADDED
File without changes
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 0.6956521739130435,
3
  "total_flos": 3880733380509696.0,
4
- "train_loss": 0.029286871664226055,
5
- "train_runtime": 89.5279,
6
- "train_samples_per_second": 1.005,
7
- "train_steps_per_second": 0.022
8
  }
 
1
  {
2
  "epoch": 0.6956521739130435,
3
  "total_flos": 3880733380509696.0,
4
+ "train_loss": 0.02928687445819378,
5
+ "train_runtime": 86.3619,
6
+ "train_samples_per_second": 1.042,
7
+ "train_steps_per_second": 0.023
8
  }
trainer_log.jsonl CHANGED
@@ -1,3 +1,3 @@
1
- {"current_steps": 1, "total_steps": 2, "loss": 0.0288, "lr": 0.0001, "epoch": 0.34782608695652173, "percentage": 50.0, "elapsed_time": "0:00:52", "remaining_time": "0:00:52"}
2
- {"current_steps": 2, "total_steps": 2, "loss": 0.0298, "lr": 0.0, "epoch": 0.6956521739130435, "percentage": 100.0, "elapsed_time": "0:01:22", "remaining_time": "0:00:00"}
3
- {"current_steps": 2, "total_steps": 2, "epoch": 0.6956521739130435, "percentage": 100.0, "elapsed_time": "0:01:28", "remaining_time": "0:00:00"}
 
1
+ {"current_steps": 1, "total_steps": 2, "loss": 0.0288, "lr": 0.0001, "epoch": 0.34782608695652173, "percentage": 50.0, "elapsed_time": "0:00:39", "remaining_time": "0:00:39"}
2
+ {"current_steps": 2, "total_steps": 2, "loss": 0.0298, "lr": 0.0, "epoch": 0.6956521739130435, "percentage": 100.0, "elapsed_time": "0:01:07", "remaining_time": "0:00:00"}
3
+ {"current_steps": 2, "total_steps": 2, "epoch": 0.6956521739130435, "percentage": 100.0, "elapsed_time": "0:01:24", "remaining_time": "0:00:00"}
trainer_state.json CHANGED
@@ -10,14 +10,14 @@
10
  "log_history": [
11
  {
12
  "epoch": 0.34782608695652173,
13
- "grad_norm": 0.07414738088846207,
14
  "learning_rate": 0.0001,
15
  "loss": 0.0288,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.6956521739130435,
20
- "grad_norm": 0.06888309866189957,
21
  "learning_rate": 0.0,
22
  "loss": 0.0298,
23
  "step": 2
@@ -26,10 +26,10 @@
26
  "epoch": 0.6956521739130435,
27
  "step": 2,
28
  "total_flos": 3880733380509696.0,
29
- "train_loss": 0.029286871664226055,
30
- "train_runtime": 89.5279,
31
- "train_samples_per_second": 1.005,
32
- "train_steps_per_second": 0.022
33
  }
34
  ],
35
  "logging_steps": 1,
 
10
  "log_history": [
11
  {
12
  "epoch": 0.34782608695652173,
13
+ "grad_norm": 0.0741637647151947,
14
  "learning_rate": 0.0001,
15
  "loss": 0.0288,
16
  "step": 1
17
  },
18
  {
19
  "epoch": 0.6956521739130435,
20
+ "grad_norm": 0.06889505684375763,
21
  "learning_rate": 0.0,
22
  "loss": 0.0298,
23
  "step": 2
 
26
  "epoch": 0.6956521739130435,
27
  "step": 2,
28
  "total_flos": 3880733380509696.0,
29
+ "train_loss": 0.02928687445819378,
30
+ "train_runtime": 86.3619,
31
+ "train_samples_per_second": 1.042,
32
+ "train_steps_per_second": 0.023
33
  }
34
  ],
35
  "logging_steps": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68b07d6117d888dc51d19e06cb48a53cb20d5edb3faef27e7da7fca291d4a00d
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f9d3edd57c685ba0165f354d6d438df2d7a056465c7e502c3ff099b11d297e
3
  size 5496