CharlesLi commited on
Commit
7bb756d
·
verified ·
1 Parent(s): 51cc130

Model save

Browse files
README.md CHANGED
@@ -5,6 +5,7 @@ base_model: mistralai/Mistral-7B-Instruct-v0.1
5
  tags:
6
  - trl
7
  - sft
 
8
  - generated_from_trainer
9
  datasets:
10
  - generator
 
5
  tags:
6
  - trl
7
  - sft
8
+ - alignment-handbook
9
  - generated_from_trainer
10
  datasets:
11
  - generator
all_results.json CHANGED
@@ -1,9 +1,14 @@
1
  {
2
  "epoch": 1.0,
 
 
 
 
 
3
  "total_flos": 4763387166720.0,
4
- "train_loss": 0.6144113825715106,
5
- "train_runtime": 264.9731,
6
  "train_samples": 7980,
7
- "train_samples_per_second": 5.54,
8
- "train_steps_per_second": 0.174
9
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_loss": 0.5740787982940674,
4
+ "eval_runtime": 0.7569,
5
+ "eval_samples": 20,
6
+ "eval_samples_per_second": 5.285,
7
+ "eval_steps_per_second": 1.321,
8
  "total_flos": 4763387166720.0,
9
+ "train_loss": 0.6139289477597112,
10
+ "train_runtime": 257.2977,
11
  "train_samples": 7980,
12
+ "train_samples_per_second": 5.705,
13
+ "train_steps_per_second": 0.179
14
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.0,
3
+ "eval_loss": 0.5740787982940674,
4
+ "eval_runtime": 0.7569,
5
+ "eval_samples": 20,
6
+ "eval_samples_per_second": 5.285,
7
+ "eval_steps_per_second": 1.321
8
+ }
model-00001-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5a40261db1b7ba32f05a98b0fb869b2d16a2e57af5606e3d48621954945dd154
3
  size 4943162336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9cb749dd61a277098adc6dddecc880eae82181df441523908716b6b635fb01d
3
  size 4943162336
model-00002-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f1cc43200f8473833f17758bcbf4b6dff0c2ec04ce281256ceaf3cdadd57c46d
3
  size 4999819336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05b4daee984a6496d68f5e1878c6deba6b6b90d3786a2425ddeae24ebc640a07
3
  size 4999819336
model-00003-of-00003.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df401546eb56b64a05e6d1457a13f0a09add2260daddcb7f3299bb6a54fad43c
3
  size 4540516344
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:377f888b1afb8888b3224ff5d6fe33683afb703590f41ee760693c95771dff4e
3
  size 4540516344
runs/Jan20_00-57-52_dgx-a100-13/events.out.tfevents.1737331762.dgx-a100-13.1005098.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9e83d318eca30f4d199171159cd0ecbad0e1be4813ea302677b1ca74896b732
3
+ size 354
runs/Jan20_01-06-27_dgx-a100-14/events.out.tfevents.1737331600.dgx-a100-14.655707.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dda58b7d97438b60452afb76c1b12f7826f24ebc9308abb67c0253373207dcd
3
- size 5858
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef1f19f44421045bc57a51baeaf73cdcdfc111edcf35c695cc0a7153be1928b
3
+ size 6206
train_results.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 4763387166720.0,
4
- "train_loss": 0.6144113825715106,
5
- "train_runtime": 264.9731,
6
  "train_samples": 7980,
7
- "train_samples_per_second": 5.54,
8
- "train_steps_per_second": 0.174
9
  }
 
1
  {
2
  "epoch": 1.0,
3
  "total_flos": 4763387166720.0,
4
+ "train_loss": 0.6139289477597112,
5
+ "train_runtime": 257.2977,
6
  "train_samples": 7980,
7
+ "train_samples_per_second": 5.705,
8
+ "train_steps_per_second": 0.179
9
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e13f48deecd588d69b971adc1201a810b6469443bf5f676437b7901e87e4966b
3
  size 7032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:432ce073d46aa8f991ef4ccf4b07b19bdb86a23939c22ec86368fd3459e48b7f
3
  size 7032