bgglee committed on
Commit
1719518
·
1 Parent(s): e300ec8

v3 — added self-correction + optimized hyperparams

Browse files
README.md CHANGED
@@ -1,9 +1,9 @@
1
- # NL2SQL Fine-Tuned Model v2
2
  This is an updated version with self-correction and improved hyperparameters.
3
 
4
  ## Config
5
  {
6
- "version": "v2",
7
  "base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
8
  "merged_repo": "bgglee/NL2SQL_finetuned",
9
  "method": "LoRA (merged)",
 
1
+ # NL2SQL Fine-Tuned Model v3
2
  This is an updated version with self-correction and improved hyperparameters.
3
 
4
  ## Config
5
  {
6
+ "version": "v3",
7
  "base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
8
  "merged_repo": "bgglee/NL2SQL_finetuned",
9
  "method": "LoRA (merged)",
finetune_config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "version": "v2",
3
  "base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
4
  "merged_repo": "bgglee/NL2SQL_finetuned",
5
  "method": "LoRA (merged)",
 
1
  {
2
+ "version": "v3",
3
  "base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
4
  "merged_repo": "bgglee/NL2SQL_finetuned",
5
  "method": "LoRA (merged)",
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:327be157f17b9c75f03b065000ad4decd2e8627dfb2873a44c582969a63377a5
3
+ size 4965799096
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27a56c7c360ac1ce923510880488bcb82e88b359bfdd32b56e6ff73e62638e98
3
  size 1459729952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a25a2554bc877ae6efdd628c84985539c5b1542870310551a44427a6abd9448b
3
  size 1459729952
training_loss.csv CHANGED
@@ -1,37 +1,13 @@
1
  step,loss
2
- 10,6.7013
3
- 20,1.932
4
- 30,0.0372
5
- 40,0.0363
6
- 50,0.0271
7
- 60,0.0308
8
- 70,0.0333
9
- 80,0.0342
10
- 90,0.0275
11
- 100,0.0304
12
- 110,0.0202
13
- 120,0.0277
14
- 130,0.0359
15
- 140,0.0321
16
- 150,0.0316
17
- 160,0.0203
18
- 170,0.0272
19
- 180,0.0296
20
- 190,0.0302
21
- 200,0.0214
22
- 210,0.0271
23
- 220,0.0251
24
- 230,0.0244
25
- 240,0.0238
26
- 250,0.0267
27
- 260,0.0239
28
- 270,0.0199
29
- 280,0.037
30
- 290,0.0213
31
- 300,0.0224
32
- 310,0.0223
33
- 320,0.0314
34
- 330,0.0214
35
- 340,0.0271
36
- 350,0.0246
37
- 360,0.0287
 
1
  step,loss
2
+ 10,0.0329
3
+ 20,0.0293
4
+ 30,0.0239
5
+ 40,0.0236
6
+ 50,0.0187
7
+ 60,0.0224
8
+ 70,0.0248
9
+ 80,0.0261
10
+ 90,0.0212
11
+ 100,0.0233
12
+ 110,0.0159
13
+ 120,0.0228
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
training_loss.png CHANGED
wrong_ids.json CHANGED
@@ -0,0 +1 @@
 
 
1
+ []