hf-tuner committed on
Commit
30dfe66
verified
1 Parent(s): 137cda9

End of training

Browse files
README.md CHANGED
@@ -16,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  This model is a fine-tuned version of [microsoft/MiniLM-L12-H384-uncased](https://huggingface.co/microsoft/MiniLM-L12-H384-uncased) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
- - Loss: nan
20
 
21
  ## Model description
22
 
@@ -42,13 +42,14 @@ The following hyperparameters were used during training:
42
  - optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - num_epochs: 2
 
45
 
46
  ### Training results
47
 
48
  | Training Loss | Epoch | Step | Validation Loss |
49
  |:-------------:|:-----:|:-----:|:---------------:|
50
- | 0.9316 | 1.0 | 8134 | nan |
51
- | 0.7836 | 2.0 | 16268 | nan |
52
 
53
 
54
  ### Framework versions
 
16
 
17
  This model is a fine-tuned version of [microsoft/MiniLM-L12-H384-uncased](https://huggingface.co/microsoft/MiniLM-L12-H384-uncased) on an unknown dataset.
18
  It achieves the following results on the evaluation set:
19
+ - Loss: 1.4653
20
 
21
  ## Model description
22
 
 
42
  - optimizer: Use OptimizerNames.ADAMW_TORCH_FUSED with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
43
  - lr_scheduler_type: linear
44
  - num_epochs: 2
45
+ - mixed_precision_training: Native AMP
46
 
47
  ### Training results
48
 
49
  | Training Loss | Epoch | Step | Validation Loss |
50
  |:-------------:|:-----:|:-----:|:---------------:|
51
+ | 1.3678 | 1.0 | 8134 | 1.4974 |
52
+ | 1.1809 | 2.0 | 16268 | 1.4653 |
53
 
54
 
55
  ### Framework versions
config.json CHANGED
@@ -20,5 +20,5 @@
20
  "transformers_version": "4.57.1",
21
  "type_vocab_size": 2,
22
  "use_cache": true,
23
- "vocab_size": 30523
24
  }
 
20
  "transformers_version": "4.57.1",
21
  "type_vocab_size": 2,
22
  "use_cache": true,
23
+ "vocab_size": 30522
24
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e20e70325bc2b04edfedb4e579e588f7cd79b760045af7a77c1b673953fb0d0
3
- size 132876360
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05f5ffd839326b9220d1c28a932e820badfad6bb2c8bc6b72d932140154a293c
3
+ size 132874824
runs/Nov20_03-14-07_26cd4a53f5b5/events.out.tfevents.1763608469.26cd4a53f5b5.285.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43eb94c897b5ff07d4efc529d48c6820577f3cfb22bbff0c0795655760a327d2
3
+ size 40020
tokenizer.json CHANGED
@@ -1,14 +1,7 @@
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
- "padding": {
5
- "strategy": "BatchLongest",
6
- "direction": "Right",
7
- "pad_to_multiple_of": null,
8
- "pad_id": 0,
9
- "pad_type_id": 0,
10
- "pad_token": "[PAD]"
11
- },
12
  "added_tokens": [
13
  {
14
  "id": 0,
@@ -54,15 +47,6 @@
54
  "rstrip": false,
55
  "normalized": false,
56
  "special": true
57
- },
58
- {
59
- "id": 30522,
60
- "content": "<no_answer>",
61
- "single_word": false,
62
- "lstrip": false,
63
- "rstrip": false,
64
- "normalized": true,
65
- "special": false
66
  }
67
  ],
68
  "normalizer": {
 
1
  {
2
  "version": "1.0",
3
  "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 0,
 
47
  "rstrip": false,
48
  "normalized": false,
49
  "special": true
 
 
 
 
 
 
 
 
 
50
  }
51
  ],
52
  "normalizer": {
tokenizer_config.json CHANGED
@@ -39,14 +39,6 @@
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
- },
43
- "30522": {
44
- "content": "<no_answer>",
45
- "lstrip": false,
46
- "normalized": true,
47
- "rstrip": false,
48
- "single_word": false,
49
- "special": false
50
  }
51
  },
52
  "clean_up_tokenization_spaces": true,
 
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
 
 
 
 
 
 
 
 
42
  }
43
  },
44
  "clean_up_tokenization_spaces": true,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6af54618a182499fbc4c29b222e2ef83f7628c325d27b2cd7d78932d872b0eb9
3
  size 5841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:498c5d0fc3f7a62a2d8f4e0d73a974ec2f3d7b792fb80caafbb5a0cc19250cad
3
  size 5841