Ksjsjjdj committed on
Commit
a4d81aa
·
verified ·
1 Parent(s): 0922efa

Live Checkpoint 3

Browse files
adapter_config.json CHANGED
@@ -16,7 +16,7 @@
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
- "lora_alpha": 104,
20
  "lora_bias": false,
21
  "lora_dropout": 0.05,
22
  "megatron_config": null,
@@ -25,7 +25,7 @@
25
  "peft_type": "LORA",
26
  "peft_version": "0.18.0",
27
  "qalora_group_size": 16,
28
- "r": 200,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
16
  "layers_pattern": null,
17
  "layers_to_transform": null,
18
  "loftq_config": {},
19
+ "lora_alpha": 512,
20
  "lora_bias": false,
21
  "lora_dropout": 0.05,
22
  "megatron_config": null,
 
25
  "peft_type": "LORA",
26
  "peft_version": "0.18.0",
27
  "qalora_group_size": 16,
28
+ "r": 256,
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a2e3e3e6d69ab8bf663f5fa64ef76c4c16b91d3ad46935cab911fff52f21e330
3
- size 73747392
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36c7253b4ba70ab65aa934ce811f7be3a0cf368aad73b4ac1bff12f95e9577da
3
+ size 94391240
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e239d4c6af1c8fc4e6fce227710b73843ee6c02f69be2b6dd1ce43f619f08d8c
3
- size 147573899
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcbf02964e210661f85c4d37097b6f9327a6c0dd2b34d11224ee8d7d1d0b7850
3
+ size 188862155
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fb1feb2393d444411081aa60ebdb29ea2c48b3bc2ccfc9ce86899de522cb26ec
3
- size 14455
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9e13dd4ca4af08228a91634a046f6bdd24626ae522be4fbdf8f03b3a08819fb
3
+ size 14391
trainer_state.json CHANGED
@@ -11,23 +11,23 @@
11
  "log_history": [
12
  {
13
  "epoch": 0.3333333333333333,
14
- "grad_norm": 1.8294399976730347,
15
  "learning_rate": 0.0002,
16
  "loss": 2.2678,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.6666666666666666,
21
- "grad_norm": 1.3883302211761475,
22
  "learning_rate": 0.00013333333333333334,
23
- "loss": 1.8692,
24
  "step": 2
25
  },
26
  {
27
  "epoch": 1.0,
28
- "grad_norm": 1.213472843170166,
29
  "learning_rate": 6.666666666666667e-05,
30
- "loss": 1.8266,
31
  "step": 3
32
  }
33
  ],
@@ -48,7 +48,7 @@
48
  "attributes": {}
49
  }
50
  },
51
- "total_flos": 1813434904320.0,
52
  "train_batch_size": 1,
53
  "trial_name": null,
54
  "trial_params": null
 
11
  "log_history": [
12
  {
13
  "epoch": 0.3333333333333333,
14
+ "grad_norm": 8.043458938598633,
15
  "learning_rate": 0.0002,
16
  "loss": 2.2678,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.6666666666666666,
21
+ "grad_norm": 26.383363723754883,
22
  "learning_rate": 0.00013333333333333334,
23
+ "loss": 2.4716,
24
  "step": 2
25
  },
26
  {
27
  "epoch": 1.0,
28
+ "grad_norm": 9.134888648986816,
29
  "learning_rate": 6.666666666666667e-05,
30
+ "loss": 2.1976,
31
  "step": 3
32
  }
33
  ],
 
48
  "attributes": {}
49
  }
50
  },
51
+ "total_flos": 1892242763520.0,
52
  "train_batch_size": 1,
53
  "trial_name": null,
54
  "trial_params": null
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3078edd2666b04ce93c65237cae2b17a52d1969fdcd17bf5fde40b98b6a346f
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92ad46923c8c77887df1899b19b2cff8af20805ac59096ce09e3dac9d8652b47
3
  size 5905