koke143 committed on
Commit
58205cd
·
verified ·
1 Parent(s): 4f27c72

Date of push: 20240728222808

Browse files
README.md CHANGED
@@ -2,6 +2,9 @@
2
  license: mit
3
  base_model: microsoft/deberta-v3-base
4
  tags:
 
 
 
5
  - generated_from_trainer
6
  metrics:
7
  - f1
@@ -17,8 +20,8 @@ should probably proofread and complete it, then remove this comment. -->
17
 
18
  This model is a fine-tuned version of [microsoft/deberta-v3-base](https://huggingface.co/microsoft/deberta-v3-base) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - F1: 0.3068
21
- - Loss: 7.9021
22
 
23
  ## Model description
24
 
 
2
  license: mit
3
  base_model: microsoft/deberta-v3-base
4
  tags:
5
+ - deberta
6
+ - fine-tune
7
+ - huggingface
8
  - generated_from_trainer
9
  metrics:
10
  - f1
 
20
 
21
  This model is a fine-tuned version of [microsoft/deberta-v3-base](https://huggingface.co/microsoft/deberta-v3-base) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 7.9823
24
+ - F1: 0.3103
25
 
26
  ## Model description
27
 
all_results.json CHANGED
@@ -2,14 +2,14 @@
2
  "epoch": 9.275862068965518,
3
  "eval_f1": 0.31034482758620696,
4
  "eval_loss": 7.982325553894043,
5
- "eval_runtime": 0.1837,
6
  "eval_samples": 10,
7
- "eval_samples_per_second": 54.436,
8
- "eval_steps_per_second": 27.218,
9
  "total_flos": 202609940734866.0,
10
  "train_loss": 0.0,
11
- "train_runtime": 0.245,
12
  "train_samples": 87,
13
- "train_samples_per_second": 355.061,
14
- "train_steps_per_second": 32.649
15
  }
 
2
  "epoch": 9.275862068965518,
3
  "eval_f1": 0.31034482758620696,
4
  "eval_loss": 7.982325553894043,
5
+ "eval_runtime": 0.1806,
6
  "eval_samples": 10,
7
+ "eval_samples_per_second": 55.367,
8
+ "eval_steps_per_second": 27.683,
9
  "total_flos": 202609940734866.0,
10
  "train_loss": 0.0,
11
+ "train_runtime": 0.244,
12
  "train_samples": 87,
13
+ "train_samples_per_second": 356.519,
14
+ "train_steps_per_second": 32.783
15
  }
eval_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 9.275862068965518,
3
  "eval_f1": 0.31034482758620696,
4
  "eval_loss": 7.982325553894043,
5
- "eval_runtime": 0.1837,
6
  "eval_samples": 10,
7
- "eval_samples_per_second": 54.436,
8
- "eval_steps_per_second": 27.218
9
  }
 
2
  "epoch": 9.275862068965518,
3
  "eval_f1": 0.31034482758620696,
4
  "eval_loss": 7.982325553894043,
5
+ "eval_runtime": 0.1806,
6
  "eval_samples": 10,
7
+ "eval_samples_per_second": 55.367,
8
+ "eval_steps_per_second": 27.683
9
  }
runs/Jul28_20-17-26_766925b9bca5/events.out.tfevents.1722198477.766925b9bca5.538.24 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f41c2107145978f1c94e8c96495628f6dba6302749a4b25f5ef740d99e41c332
3
+ size 399
runs/Jul28_20-17-26_766925b9bca5/events.out.tfevents.1722198477.766925b9bca5.538.25 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa7c530342a64db60a01513fcfca76b6656c20fb6b982fb021b95fceeb870aa
3
+ size 399
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 9.275862068965518,
3
  "total_flos": 202609940734866.0,
4
  "train_loss": 0.0,
5
- "train_runtime": 0.245,
6
  "train_samples": 87,
7
- "train_samples_per_second": 355.061,
8
- "train_steps_per_second": 32.649
9
  }
 
2
  "epoch": 9.275862068965518,
3
  "total_flos": 202609940734866.0,
4
  "train_loss": 0.0,
5
+ "train_runtime": 0.244,
6
  "train_samples": 87,
7
+ "train_samples_per_second": 356.519,
8
+ "train_steps_per_second": 32.783
9
  }
trainer_state.json CHANGED
@@ -133,6 +133,15 @@
133
  "train_runtime": 0.245,
134
  "train_samples_per_second": 355.061,
135
  "train_steps_per_second": 32.649
 
 
 
 
 
 
 
 
 
136
  }
137
  ],
138
  "logging_steps": 500,
 
133
  "train_runtime": 0.245,
134
  "train_samples_per_second": 355.061,
135
  "train_steps_per_second": 32.649
136
+ },
137
+ {
138
+ "epoch": 9.275862068965518,
139
+ "step": 80,
140
+ "total_flos": 202609940734866.0,
141
+ "train_loss": 0.0,
142
+ "train_runtime": 0.244,
143
+ "train_samples_per_second": 356.519,
144
+ "train_steps_per_second": 32.783
145
  }
146
  ],
147
  "logging_steps": 500,