prthm29 committed on
Commit
4087805
·
verified ·
1 Parent(s): f9fb98f

End of training

Browse files
README.md CHANGED
@@ -20,10 +20,10 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  # smoke_test_glm4v_checkpoints
22
 
23
- This model is a fine-tuned version of [zai-org/GLM-OCR](https://huggingface.co/zai-org/GLM-OCR) on an unknown dataset.
24
  It achieves the following results on the evaluation set:
25
- - Loss: 2.5868
26
- - Accuracy: 0.5556
27
 
28
  ## Model description
29
 
 
20
 
21
  # smoke_test_glm4v_checkpoints
22
 
23
+ This model is a fine-tuned version of [zai-org/GLM-OCR](https://huggingface.co/zai-org/GLM-OCR) on the gujarati_ocr_stream dataset.
24
  It achieves the following results on the evaluation set:
25
+ - Loss: 2.5668
26
+ - Accuracy: 0.5594
27
 
28
  ## Model description
29
 
all_results.json CHANGED
@@ -2,12 +2,12 @@
2
  "epoch": 1.3076923076923077,
3
  "eval_accuracy": 0.5594251982846505,
4
  "eval_loss": 2.566760301589966,
5
- "eval_runtime": 2.0028,
6
- "eval_samples_per_second": 24.965,
7
- "eval_steps_per_second": 3.495,
8
  "total_flos": 197425390977024.0,
9
  "train_loss": 2.7674348831176756,
10
- "train_runtime": 14.1312,
11
- "train_samples_per_second": 5.661,
12
- "train_steps_per_second": 0.354
13
  }
 
2
  "epoch": 1.3076923076923077,
3
  "eval_accuracy": 0.5594251982846505,
4
  "eval_loss": 2.566760301589966,
5
+ "eval_runtime": 2.0398,
6
+ "eval_samples_per_second": 24.512,
7
+ "eval_steps_per_second": 3.432,
8
  "total_flos": 197425390977024.0,
9
  "train_loss": 2.7674348831176756,
10
+ "train_runtime": 14.3041,
11
+ "train_samples_per_second": 5.593,
12
+ "train_steps_per_second": 0.35
13
  }
eval_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 1.3076923076923077,
3
  "eval_accuracy": 0.5594251982846505,
4
  "eval_loss": 2.566760301589966,
5
- "eval_runtime": 2.0028,
6
- "eval_samples_per_second": 24.965,
7
- "eval_steps_per_second": 3.495
8
  }
 
2
  "epoch": 1.3076923076923077,
3
  "eval_accuracy": 0.5594251982846505,
4
  "eval_loss": 2.566760301589966,
5
+ "eval_runtime": 2.0398,
6
+ "eval_samples_per_second": 24.512,
7
+ "eval_steps_per_second": 3.432
8
  }
runs/Apr09_05-18-42_cs-01knr8f8jy7kcvx4v0ce8jkn3q-1tpz/events.out.tfevents.1775711944.cs-01knr8f8jy7kcvx4v0ce8jkn3q-1tpz.131664.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab4e73b6a031c0f4a80319852aa0106e65509edc06f2177c72ae89b158ea6685
3
+ size 405
train_results.json CHANGED
@@ -2,7 +2,7 @@
2
  "epoch": 1.3076923076923077,
3
  "total_flos": 197425390977024.0,
4
  "train_loss": 2.7674348831176756,
5
- "train_runtime": 14.1312,
6
- "train_samples_per_second": 5.661,
7
- "train_steps_per_second": 0.354
8
  }
 
2
  "epoch": 1.3076923076923077,
3
  "total_flos": 197425390977024.0,
4
  "train_loss": 2.7674348831176756,
5
+ "train_runtime": 14.3041,
6
+ "train_samples_per_second": 5.593,
7
+ "train_steps_per_second": 0.35
8
  }
trainer_state.json CHANGED
@@ -27,9 +27,9 @@
27
  "epoch": 0.6153846153846154,
28
  "eval_accuracy": 0.5348454543007923,
29
  "eval_loss": 2.749584436416626,
30
- "eval_runtime": 2.0771,
31
- "eval_samples_per_second": 24.072,
32
- "eval_steps_per_second": 3.37,
33
  "step": 2
34
  },
35
  {
@@ -50,9 +50,9 @@
50
  "epoch": 1.0,
51
  "eval_accuracy": 0.5556479950956826,
52
  "eval_loss": 2.586768388748169,
53
- "eval_runtime": 2.0364,
54
- "eval_samples_per_second": 24.553,
55
- "eval_steps_per_second": 3.437,
56
  "step": 4
57
  },
58
  {
@@ -67,9 +67,9 @@
67
  "step": 5,
68
  "total_flos": 197425390977024.0,
69
  "train_loss": 2.7674348831176756,
70
- "train_runtime": 14.1312,
71
- "train_samples_per_second": 5.661,
72
- "train_steps_per_second": 0.354
73
  }
74
  ],
75
  "logging_steps": 1,
 
27
  "epoch": 0.6153846153846154,
28
  "eval_accuracy": 0.5348454543007923,
29
  "eval_loss": 2.749584436416626,
30
+ "eval_runtime": 2.0604,
31
+ "eval_samples_per_second": 24.267,
32
+ "eval_steps_per_second": 3.397,
33
  "step": 2
34
  },
35
  {
 
50
  "epoch": 1.0,
51
  "eval_accuracy": 0.5556479950956826,
52
  "eval_loss": 2.586768388748169,
53
+ "eval_runtime": 2.0408,
54
+ "eval_samples_per_second": 24.5,
55
+ "eval_steps_per_second": 3.43,
56
  "step": 4
57
  },
58
  {
 
67
  "step": 5,
68
  "total_flos": 197425390977024.0,
69
  "train_loss": 2.7674348831176756,
70
+ "train_runtime": 14.3041,
71
+ "train_samples_per_second": 5.593,
72
+ "train_steps_per_second": 0.35
73
  }
74
  ],
75
  "logging_steps": 1,