Training in progress, step 110

Files changed (9) hide show

adapter_config.json CHANGED Viewed

@@ -29,13 +29,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "v_proj",
     "k_proj",
     "gate_proj",
-    "q_proj",
     "o_proj",
-    "up_proj",
-    "down_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "k_proj",
+    "v_proj",
     "gate_proj",
     "o_proj",
+    "q_proj",
+    "down_proj",
+    "up_proj"
   ],
   "target_parameters": null,
   "task_type": "CAUSAL_LM",

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:60d95b10b6e140a9626a7058d5038528f2ff80148dc4569b881db56052046509
-size 40

 version https://git-lfs.github.com/spec/v1
+oid sha256:1dc2767d43ff64fdc473d3da757398d1dbefb6920eb8b0523fec8c503ee7e7c8
+size 323014560

config.json CHANGED Viewed

@@ -3,7 +3,7 @@
     "Qwen2ForCausalLM"
   ],
   "attention_dropout": 0.0,
-  "bos_token_id": 151643,
   "dtype": "bfloat16",
   "eos_token_id": 151643,
   "hidden_act": "silu",
@@ -46,6 +46,7 @@
   "num_attention_heads": 28,
   "num_hidden_layers": 28,
   "num_key_value_heads": 4,
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,
   "rope_theta": 10000,

     "Qwen2ForCausalLM"
   ],
   "attention_dropout": 0.0,
+  "bos_token_id": 151646,
   "dtype": "bfloat16",
   "eos_token_id": 151643,
   "hidden_act": "silu",
   "num_attention_heads": 28,
   "num_hidden_layers": 28,
   "num_key_value_heads": 4,
+  "pad_token_id": 151643,
   "rms_norm_eps": 1e-06,
   "rope_scaling": null,
   "rope_theta": 10000,

generation_config.json CHANGED Viewed

@@ -2,7 +2,10 @@
   "_from_model_config": true,
   "bos_token_id": 151646,
   "do_sample": true,
-  "eos_token_id": 151643,
   "temperature": 0.6,
   "top_p": 0.95,
   "transformers_version": "4.57.1"

   "_from_model_config": true,
   "bos_token_id": 151646,
   "do_sample": true,
+  "eos_token_id": [
+    151643
+  ],
+  "pad_token_id": 151643,
   "temperature": 0.6,
   "top_p": 0.95,
   "transformers_version": "4.57.1"

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:64d2c6edd65794c79413c57f7b9ecb464a193a01e21e6db35b0b8149223abc58
 size 4877660776

 version https://git-lfs.github.com/spec/v1
+oid sha256:f33d404b24cd4296db6593cef4a200fbf897d26091bb29a925f44f5048212822
 size 4877660776

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:547cb05578bea1cd4dcea2fbbe29d92a5af252c312b74833ff2bcafbec22c19d
 size 4932751008

 version https://git-lfs.github.com/spec/v1
+oid sha256:5839f0133080f959019114927e11dfc999fc8c2eb4d58fc4ca73bc257921c67e
 size 4932751008

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b8b4c6b367ca75c3616aa92be096b0cca836aafc7c53c81e5615466bd0a16ae4
 size 4330865200

 version https://git-lfs.github.com/spec/v1
+oid sha256:be74946458476a35cf284f213926802097c0b9a7f7731d9b8785e19712c95cfb
 size 4330865200

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e20ddafc659ba90242154b55275402edeca0715e5dbb30f56815a4ce081f4893
-size 11422778

 version https://git-lfs.github.com/spec/v1
+oid sha256:a4256422650d141f228fe954acee98679da412984c29a569877eefd3af69315a
+size 11422959

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c61c93517da2b72eeb50829ab91aebcb7b8a3bc71c7559e58a3ed702f9d2d42c
 size 8760

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce150e95afc759cfdbebc809595f0ddd7785d8982327752b175192eea4eda04e
 size 8760