ThomasCeraso committed on
Commit
a3e2c75
·
verified ·
1 Parent(s): ac67724

End of training

Browse files
Files changed (3) hide show
  1. README.md +4 -0
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
README.md CHANGED
@@ -8,6 +8,8 @@ tags:
8
  - trl
9
  - sft
10
  - generated_from_trainer
 
 
11
  model-index:
12
  - name: SmolLM2-FT-MyDataset
13
  results: []
@@ -41,6 +43,8 @@ The following hyperparameters were used during training:
41
  - train_batch_size: 1
42
  - eval_batch_size: 8
43
  - seed: 42
 
 
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: linear
46
  - training_steps: 300
 
8
  - trl
9
  - sft
10
  - generated_from_trainer
11
+ - trl
12
+ - sft
13
  model-index:
14
  - name: SmolLM2-FT-MyDataset
15
  results: []
 
43
  - train_batch_size: 1
44
  - eval_batch_size: 8
45
  - seed: 42
46
+ - gradient_accumulation_steps: 2
47
+ - total_train_batch_size: 2
48
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
49
  - lr_scheduler_type: linear
50
  - training_steps: 300
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0d245f3f614ad011aceacf08f21642cc9e8a7492077aa68d1ab32d48062b283
3
  size 538090408
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:304f52aa02ffbd39ed3fb708c192519ec2f6b5ba0a2929f15fb341de5dd87b56
3
  size 538090408
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:366b359d7cd0bbcce8b4a43d40256954e83866f68e2ab267e91d964e63709454
3
  size 5841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:782894cf779fb098b13323e0259499b49562828a0e85ce9369daae2b6d8241db
3
  size 5841