Training in progress, step 8

Files changed (7) hide show

adapter_config.json CHANGED Viewed

@@ -15,17 +15,17 @@
   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
-  "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
     "o_proj",
     "k_proj",
     "v_proj",
-    "up_proj",
-    "gate_proj",
-    "down_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

   "megatron_core": "megatron.core",
   "modules_to_save": null,
   "peft_type": "LORA",
+  "r": 32,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "down_proj",
+    "gate_proj",
     "o_proj",
+    "up_proj",
     "k_proj",
     "v_proj",
+    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8999f058226d361ada283f3e986c2872e9f9674cfea65279ee031054703ce940
-size 42002584

 version https://git-lfs.github.com/spec/v1
+oid sha256:553c30c183cde40f9dc125ac65099f9949ee8c99143b6267860860b9080235cb
+size 167832688

all_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
-    "epoch": 0.38,
-    "train_loss": 0.5409165602177382,
-    "train_runtime": 341.6545,
-    "train_samples_per_second": 2.997,
-    "train_steps_per_second": 0.375
 }

 {
+    "epoch": 24.04,
+    "train_loss": 0.24291648308280855,
+    "train_runtime": 18372.1559,
+    "train_samples_per_second": 3.567,
+    "train_steps_per_second": 0.223
 }

best_metrics.json CHANGED Viewed

	@@ -1 +1 @@
1	- {"eval_loss": 0.39877966046333313}


1	+ {"eval_loss": 0.3460787236690521}

train_results.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
-    "epoch": 0.38,
-    "train_loss": 0.5409165602177382,
-    "train_runtime": 341.6545,
-    "train_samples_per_second": 2.997,
-    "train_steps_per_second": 0.375
 }

 {
+    "epoch": 24.04,
+    "train_loss": 0.24291648308280855,
+    "train_runtime": 18372.1559,
+    "train_samples_per_second": 3.567,
+    "train_steps_per_second": 0.223
 }

trainer_state.json CHANGED Viewed

The diff for this file is too large to render. See raw diff

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c485d6200f718439cc6b80827291400c877c6d24b89a32f39136f8b555aac86c
 size 4920

 version https://git-lfs.github.com/spec/v1
+oid sha256:86ca0d6be3f70c59aac907f159da38482d01d742f7ac083384b35f094a87276e
 size 4920