v3 — added self-correction + optimized hyperparams
Browse files- README.md +2 -2
- finetune_config.json +1 -1
- model-00001-of-00002.safetensors +3 -0
- model-00002-of-00002.safetensors +1 -1
- training_loss.csv +12 -36
- training_loss.png +0 -0
- wrong_ids.json +1 -0
README.md
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
-
# NL2SQL Fine-Tuned Model
|
| 2 |
This is an updated version with self-correction and improved hyperparameters.
|
| 3 |
|
| 4 |
## Config
|
| 5 |
{
|
| 6 |
-
"version": "
|
| 7 |
"base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
|
| 8 |
"merged_repo": "bgglee/NL2SQL_finetuned",
|
| 9 |
"method": "LoRA (merged)",
|
|
|
|
| 1 |
+
# NL2SQL Fine-Tuned Model v3
|
| 2 |
This is an updated version with self-correction and improved hyperparameters.
|
| 3 |
|
| 4 |
## Config
|
| 5 |
{
|
| 6 |
+
"version": "v3",
|
| 7 |
"base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
|
| 8 |
"merged_repo": "bgglee/NL2SQL_finetuned",
|
| 9 |
"method": "LoRA (merged)",
|
finetune_config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"version": "
|
| 3 |
"base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
|
| 4 |
"merged_repo": "bgglee/NL2SQL_finetuned",
|
| 5 |
"method": "LoRA (merged)",
|
|
|
|
| 1 |
{
|
| 2 |
+
"version": "v3",
|
| 3 |
"base_model": "./hf_models/meta-llama--Llama-3.2-3B-Instruct",
|
| 4 |
"merged_repo": "bgglee/NL2SQL_finetuned",
|
| 5 |
"method": "LoRA (merged)",
|
model-00001-of-00002.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:327be157f17b9c75f03b065000ad4decd2e8627dfb2873a44c582969a63377a5
|
| 3 |
+
size 4965799096
|
model-00002-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1459729952
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a25a2554bc877ae6efdd628c84985539c5b1542870310551a44427a6abd9448b
|
| 3 |
size 1459729952
|
training_loss.csv
CHANGED
|
@@ -1,37 +1,13 @@
|
|
| 1 |
step,loss
|
| 2 |
-
10,
|
| 3 |
-
20,
|
| 4 |
-
30,0.
|
| 5 |
-
40,0.
|
| 6 |
-
50,0.
|
| 7 |
-
60,0.
|
| 8 |
-
70,0.
|
| 9 |
-
80,0.
|
| 10 |
-
90,0.
|
| 11 |
-
100,0.
|
| 12 |
-
110,0.
|
| 13 |
-
120,0.
|
| 14 |
-
130,0.0359
|
| 15 |
-
140,0.0321
|
| 16 |
-
150,0.0316
|
| 17 |
-
160,0.0203
|
| 18 |
-
170,0.0272
|
| 19 |
-
180,0.0296
|
| 20 |
-
190,0.0302
|
| 21 |
-
200,0.0214
|
| 22 |
-
210,0.0271
|
| 23 |
-
220,0.0251
|
| 24 |
-
230,0.0244
|
| 25 |
-
240,0.0238
|
| 26 |
-
250,0.0267
|
| 27 |
-
260,0.0239
|
| 28 |
-
270,0.0199
|
| 29 |
-
280,0.037
|
| 30 |
-
290,0.0213
|
| 31 |
-
300,0.0224
|
| 32 |
-
310,0.0223
|
| 33 |
-
320,0.0314
|
| 34 |
-
330,0.0214
|
| 35 |
-
340,0.0271
|
| 36 |
-
350,0.0246
|
| 37 |
-
360,0.0287
|
|
|
|
| 1 |
step,loss
|
| 2 |
+
10,0.0329
|
| 3 |
+
20,0.0293
|
| 4 |
+
30,0.0239
|
| 5 |
+
40,0.0236
|
| 6 |
+
50,0.0187
|
| 7 |
+
60,0.0224
|
| 8 |
+
70,0.0248
|
| 9 |
+
80,0.0261
|
| 10 |
+
90,0.0212
|
| 11 |
+
100,0.0233
|
| 12 |
+
110,0.0159
|
| 13 |
+
120,0.0228
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
training_loss.png
CHANGED
|
|
wrong_ids.json
CHANGED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
[]
|