Upload LoRA adapter (README written by author)

Browse files

Files changed (4) hide show

README.md +4 -4
adapter_config.json +7 -7
adapter_model.safetensors +2 -2
all_experiments_details.json +434 -0

README.md CHANGED Viewed

@@ -13,7 +13,7 @@ tags:
 - structured-output
 ---
-qwen3-4b-structured-output-lora-sample
 This repository provides a **LoRA adapter** fine-tuned from
 **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
@@ -34,9 +34,9 @@ while intermediate reasoning (Chain-of-Thought) is masked.
 - Base model: Qwen/Qwen3-4B-Instruct-2507
 - Method: QLoRA (4-bit)
 - Max sequence length: 512
-- Epochs: 1
-- Learning rate: 1e-06
-- LoRA: r=64, alpha=128
 ## Usage

 - structured-output
 ---
+# Qwen3-4B RSLoRA (R=256) for Structured Output
 This repository provides a **LoRA adapter** fine-tuned from
 **Qwen/Qwen3-4B-Instruct-2507** using **QLoRA (4-bit, Unsloth)**.
 - Base model: Qwen/Qwen3-4B-Instruct-2507
 - Method: QLoRA (4-bit)
 - Max sequence length: 512
+- Epochs: 2
+- Learning rate: 2e-04
+- LoRA: r=256, alpha=32
 ## Usage

adapter_config.json CHANGED Viewed

@@ -20,7 +20,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 128,
   "lora_bias": false,
   "lora_dropout": 0.0,
   "megatron_config": null,
@@ -29,22 +29,22 @@
   "peft_type": "LORA",
   "peft_version": "0.18.1",
   "qalora_group_size": 16,
-  "r": 64,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "k_proj",
-    "v_proj",
-    "q_proj",
     "gate_proj",
     "down_proj",
     "up_proj",
-    "o_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,
   "use_dora": false,
   "use_qalora": false,
-  "use_rslora": false
 }

   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 32,
   "lora_bias": false,
   "lora_dropout": 0.0,
   "megatron_config": null,
   "peft_type": "LORA",
   "peft_version": "0.18.1",
   "qalora_group_size": 16,
+  "r": 256,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "gate_proj",
     "down_proj",
+    "k_proj",
     "up_proj",
+    "o_proj",
+    "v_proj",
+    "q_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,
   "use_dora": false,
   "use_qalora": false,
+  "use_rslora": true
 }

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4153ae1cdb39b66371216d654822939f812dfffe97bec65d35b8eaaeda011817
-size 528550256

 version https://git-lfs.github.com/spec/v1
+oid sha256:9f7e32a8d79b5e697d84e7807625629d764aff33c2a8a303e7ff31d5cb7fe96d
+size 2113998360

all_experiments_details.json ADDED Viewed

	@@ -0,0 +1,434 @@

+{
+    "Experiment_1": {
+        "config": {
+            "BASE_MODEL_ID": "Qwen/Qwen3-4B-Instruct-2507",
+            "DATASET_ID": "u-10bei/structured_data_with_cot_dataset_512_v2",
+            "BASE_OUT_DIR": "./lora_experiments",
+            "SEED": 3407,
+            "VAL_RATIO": 0.05,
+            "MAX_SEQ_LEN": 512,
+            "LORA_R": 256,
+            "LORA_ALPHA": 32,
+            "LORA_DROPOUT": 0.0,
+            "LORA_TARGET_MODULES": [
+                "q_proj",
+                "k_proj",
+                "v_proj",
+                "o_proj",
+                "gate_proj",
+                "up_proj",
+                "down_proj"
+            ],
+            "EPOCHS": 2,
+            "PER_DEVICE_TRAIN_BS": 2,
+            "PER_DEVICE_EVAL_BS": 2,
+            "GRAD_ACCUM": 8,
+            "LR": 0.0002,
+            "WARMUP_RATIO": 0.1,
+            "WEIGHT_DECAY": 0.05,
+            "MAX_STEPS": -1,
+            "LOGGING_STEPS": 10,
+            "EVAL_STEPS": 50,
+            "SAVE_STEPS": 100,
+            "SAVE_TOTAL_LIMIT": 2,
+            "MASK_COT": true,
+            "OUTPUT_MARKERS": [
+                "Output:",
+                "OUTPUT:",
+                "Final:",
+                "Answer:",
+                "Result:",
+                "Response:"
+            ],
+            "OUTPUT_LEARN_MODE": "after_marker",
+            "UPSAMPLE_ENABLE": false,
+            "UPSAMPLE_RULES_JSON": "{\"xml_to_yaml\": 2.0}",
+            "Experiment_Name": "Method_RSLoRA_R256",
+            "USE_RSLORA": true
+        },
+        "history": [
+            {
+                "loss": 1.3966,
+                "grad_norm": 1.0872466564178467,
+                "learning_rate": 4e-05,
+                "epoch": 0.04501969611705121,
+                "step": 10
+            },
+            {
+                "loss": 0.9325,
+                "grad_norm": 0.9557391405105591,
+                "learning_rate": 8.444444444444444e-05,
+                "epoch": 0.09003939223410241,
+                "step": 20
+            },
+            {
+                "loss": 0.8011,
+                "grad_norm": 0.513979971408844,
+                "learning_rate": 0.00012888888888888892,
+                "epoch": 0.13505908835115363,
+                "step": 30
+            },
+            {
+                "loss": 0.8125,
+                "grad_norm": 0.5614296197891235,
+                "learning_rate": 0.00017333333333333334,
+                "epoch": 0.18007878446820483,
+                "step": 40
+            },
+            {
+                "loss": 0.7486,
+                "grad_norm": 0.32493776082992554,
+                "learning_rate": 0.0001999509018141497,
+                "epoch": 0.22509848058525606,
+                "step": 50
+            },
+            {
+                "eval_loss": 0.8527934551239014,
+                "eval_runtime": 25.8751,
+                "eval_samples_per_second": 7.227,
+                "eval_steps_per_second": 3.633,
+                "epoch": 0.22509848058525606,
+                "step": 50
+            },
+            {
+                "loss": 0.7415,
+                "grad_norm": 0.2533496022224426,
+                "learning_rate": 0.00019939910076582706,
+                "epoch": 0.27011817670230726,
+                "step": 60
+            },
+            {
+                "loss": 0.8629,
+                "grad_norm": 0.3107249438762665,
+                "learning_rate": 0.00019823752233636866,
+                "epoch": 0.31513787281935846,
+                "step": 70
+            },
+            {
+                "loss": 0.7151,
+                "grad_norm": 0.32290422916412354,
+                "learning_rate": 0.00019647329238755036,
+                "epoch": 0.36015756893640966,
+                "step": 80
+            },
+            {
+                "loss": 0.7843,
+                "grad_norm": 0.3160030245780945,
+                "learning_rate": 0.0001941172338293343,
+                "epoch": 0.4051772650534609,
+                "step": 90
+            },
+            {
+                "loss": 0.7931,
+                "grad_norm": 0.40372225642204285,
+                "learning_rate": 0.00019118380022524738,
+                "epoch": 0.4501969611705121,
+                "step": 100
+            },
+            {
+                "eval_loss": 0.7929844260215759,
+                "eval_runtime": 25.6248,
+                "eval_samples_per_second": 7.298,
+                "eval_steps_per_second": 3.668,
+                "epoch": 0.4501969611705121,
+                "step": 100
+            },
+            {
+                "loss": 0.812,
+                "grad_norm": 0.4371040165424347,
+                "learning_rate": 0.0001876909871250184,
+                "epoch": 0.4952166572875633,
+                "step": 110
+            },
+            {
+                "loss": 0.7258,
+                "grad_norm": 0.28696581721305847,
+                "learning_rate": 0.00018366022166841676,
+                "epoch": 0.5402363534046145,
+                "step": 120
+            },
+            {
+                "loss": 0.7824,
+                "grad_norm": 0.9101247787475586,
+                "learning_rate": 0.0001791162311375321,
+                "epoch": 0.5852560495216658,
+                "step": 130
+            },
+            {
+                "loss": 0.7643,
+                "grad_norm": 0.2658868730068207,
+                "learning_rate": 0.00017408689126387995,
+                "epoch": 0.6302757456387169,
+                "step": 140
+            },
+            {
+                "loss": 0.711,
+                "grad_norm": 0.43262964487075806,
+                "learning_rate": 0.0001686030552209133,
+                "epoch": 0.6752954417557682,
+                "step": 150
+            },
+            {
+                "eval_loss": 0.7660654783248901,
+                "eval_runtime": 24.682,
+                "eval_samples_per_second": 7.576,
+                "eval_steps_per_second": 3.808,
+                "epoch": 0.6752954417557682,
+                "step": 150
+            },
+            {
+                "loss": 0.6915,
+                "grad_norm": 0.36354902386665344,
+                "learning_rate": 0.00016269836435100934,
+                "epoch": 0.7203151378728193,
+                "step": 160
+            },
+            {
+                "loss": 0.7233,
+                "grad_norm": 0.3520168662071228,
+                "learning_rate": 0.0001564090417880529,
+                "epoch": 0.7653348339898706,
+                "step": 170
+            },
+            {
+                "loss": 0.6626,
+                "grad_norm": 0.33897820115089417,
+                "learning_rate": 0.0001497736702416662,
+                "epoch": 0.8103545301069218,
+                "step": 180
+            },
+            {
+                "loss": 0.6801,
+                "grad_norm": 0.4690793752670288,
+                "learning_rate": 0.00014283295530629877,
+                "epoch": 0.855374226223973,
+                "step": 190
+            },
+            {
+                "loss": 0.6281,
+                "grad_norm": 0.42146065831184387,
+                "learning_rate": 0.00013562947574718976,
+                "epoch": 0.9003939223410242,
+                "step": 200
+            },
+            {
+                "eval_loss": 0.6899478435516357,
+                "eval_runtime": 24.6215,
+                "eval_samples_per_second": 7.595,
+                "eval_steps_per_second": 3.818,
+                "epoch": 0.9003939223410242,
+                "step": 200
+            },
+            {
+                "loss": 0.6237,
+                "grad_norm": 0.38645192980766296,
+                "learning_rate": 0.00012820742229510817,
+                "epoch": 0.9454136184580754,
+                "step": 210
+            },
+            {
+                "loss": 0.5856,
+                "grad_norm": 0.4482150375843048,
+                "learning_rate": 0.00012061232655226964,
+                "epoch": 0.9904333145751266,
+                "step": 220
+            },
+            {
+                "loss": 0.4553,
+                "grad_norm": 0.5086686015129089,
+                "learning_rate": 0.00011289078167249402,
+                "epoch": 1.0315137872819358,
+                "step": 230
+            },
+            {
+                "loss": 0.5029,
+                "grad_norm": 0.8159873485565186,
+                "learning_rate": 0.00010509015652912966,
+                "epoch": 1.076533483398987,
+                "step": 240
+            },
+            {
+                "loss": 0.5179,
+                "grad_norm": 0.5635101199150085,
+                "learning_rate": 9.72583051242198e-05,
+                "epoch": 1.1215531795160383,
+                "step": 250
+            },
+            {
+                "eval_loss": 0.5836588144302368,
+                "eval_runtime": 24.7575,
+                "eval_samples_per_second": 7.553,
+                "eval_steps_per_second": 3.797,
+                "epoch": 1.1215531795160383,
+                "step": 250
+            },
+            {
+                "loss": 0.514,
+                "grad_norm": 0.661852240562439,
+                "learning_rate": 8.944327302158073e-05,
+                "epoch": 1.1665728756330895,
+                "step": 260
+            },
+            {
+                "loss": 0.4472,
+                "grad_norm": 0.4757942259311676,
+                "learning_rate": 8.169300260471818e-05,
+                "epoch": 1.2115925717501406,
+                "step": 270
+            },
+            {
+                "loss": 0.4286,
+                "grad_norm": 0.6126232743263245,
+                "learning_rate": 7.405503896771729e-05,
+                "epoch": 1.2566122678671918,
+                "step": 280
+            },
+            {
+                "loss": 0.4862,
+                "grad_norm": 0.5707330703735352,
+                "learning_rate": 6.65762382433589e-05,
+                "epoch": 1.301631963984243,
+                "step": 290
+            },
+            {
+                "loss": 0.4352,
+                "grad_norm": 0.3476680815219879,
+                "learning_rate": 5.930248015776325e-05,
+                "epoch": 1.3466516601012943,
+                "step": 300
+            },
+            {
+                "eval_loss": 0.4677433371543884,
+                "eval_runtime": 24.7074,
+                "eval_samples_per_second": 7.569,
+                "eval_steps_per_second": 3.805,
+                "epoch": 1.3466516601012943,
+                "step": 300
+            },
+            {
+                "loss": 0.3118,
+                "grad_norm": 0.6370311379432678,
+                "learning_rate": 5.227838657493396e-05,
+                "epoch": 1.3916713562183456,
+                "step": 310
+            },
+            {
+                "loss": 0.3847,
+                "grad_norm": 0.5159108638763428,
+                "learning_rate": 4.5547047757828985e-05,
+                "epoch": 1.4366910523353966,
+                "step": 320
+            },
+            {
+                "loss": 0.3931,
+                "grad_norm": 0.6911277174949646,
+                "learning_rate": 3.914975802524806e-05,
+                "epoch": 1.4817107484524479,
+                "step": 330
+            },
+            {
+                "loss": 0.5302,
+                "grad_norm": 0.5555063486099243,
+                "learning_rate": 3.312576242618511e-05,
+                "epoch": 1.5267304445694991,
+                "step": 340
+            },
+            {
+                "loss": 0.3183,
+                "grad_norm": 0.8983607292175293,
+                "learning_rate": 2.7512015985706418e-05,
+                "epoch": 1.5717501406865504,
+                "step": 350
+            },
+            {
+                "eval_loss": 0.3523830473423004,
+                "eval_runtime": 24.7895,
+                "eval_samples_per_second": 7.544,
+                "eval_steps_per_second": 3.792,
+                "epoch": 1.5717501406865504,
+                "step": 350
+            },
+            {
+                "loss": 0.3694,
+                "grad_norm": 0.5024566054344177,
+                "learning_rate": 2.234295699929413e-05,
+                "epoch": 1.6167698368036016,
+                "step": 360
+            },
+            {
+                "loss": 0.3502,
+                "grad_norm": 0.5496794581413269,
+                "learning_rate": 1.7650295766411605e-05,
+                "epoch": 1.6617895329206527,
+                "step": 370
+            },
+            {
+                "loss": 0.3006,
+                "grad_norm": 0.4716707766056061,
+                "learning_rate": 1.3462820059333403e-05,
+                "epoch": 1.7068092290377042,
+                "step": 380
+            },
+            {
+                "loss": 0.3471,
+                "grad_norm": 0.46408089995384216,
+                "learning_rate": 9.80621852061826e-06,
+                "epoch": 1.7518289251547552,
+                "step": 390
+            },
+            {
+                "loss": 0.2301,
+                "grad_norm": 0.41809141635894775,
+                "learning_rate": 6.702923072617129e-06,
+                "epoch": 1.7968486212718064,
+                "step": 400
+            },
+            {
+                "eval_loss": 0.3102871775627136,
+                "eval_runtime": 24.3436,
+                "eval_samples_per_second": 7.682,
+                "eval_steps_per_second": 3.861,
+                "epoch": 1.7968486212718064,
+                "step": 400
+            },
+            {
+                "loss": 0.2704,
+                "grad_norm": 0.4462619423866272,
+                "learning_rate": 4.171971305776945e-06,
+                "epoch": 1.8418683173888577,
+                "step": 410
+            },
+            {
+                "loss": 0.2168,
+                "grad_norm": 0.4414360523223877,
+                "learning_rate": 2.2288896899377186e-06,
+                "epoch": 1.8868880135059087,
+                "step": 420
+            },
+            {
+                "loss": 0.2626,
+                "grad_norm": 0.3277634084224701,
+                "learning_rate": 8.855983250793288e-07,
+                "epoch": 1.93190770962296,
+                "step": 430
+            },
+            {
+                "loss": 0.342,
+                "grad_norm": 0.4310093820095062,
+                "learning_rate": 1.5033781583758678e-07,
+                "epoch": 1.9769274057400112,
+                "step": 440
+            },
+            {
+                "train_runtime": 3776.627,
+                "train_samples_per_second": 1.882,
+                "train_steps_per_second": 0.118,
+                "total_flos": 7.57271106173184e+16,
+                "train_loss": 0.5718902958882763,
+                "epoch": 2.0,
+                "step": 446,
+                "total_runtime_sec": 3777.7196531295776
+            }
+        ]
+    }
+}