Upload task output test1334test1234test1234test34

Files changed (10) hide show

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ tags:
 - generated_from_trainer
 base_model: samoline/b7447218-27e6-491c-b3ab-ea03a5b93541
 model-index:
-- name: workspace/axolotl/outputs/test1334test1234test1234test12334/texttest
   results: []
 ---
@@ -23,7 +23,7 @@ chat_template: llama3
 dataset_prepared_path: null
 datasets:
 - data_files:
-  - test1334test1234test1234test12334_train_data.json
   ds_type: json
   format: custom
   path: /workspace/axolotl/data
@@ -60,11 +60,11 @@ lora_target_linear: true
 lr_scheduler: cosine
 max_steps: 1
 micro_batch_size: 2
-mlflow_experiment_name: /workspace/axolotl/data/test1334test1234test1234test12334_train_data.json
 model_type: AutoModelForCausalLM
 num_epochs: 1
 optimizer: adamw_bnb_8bit
-output_dir: /workspace/axolotl/outputs/test1334test1234test1234test12334/texttest
 pad_to_sequence_len: true
 resume_from_checkpoint: null
 s2_attention: null
@@ -79,10 +79,10 @@ trust_remote_code: true
 val_set_size: 0.05
 wandb_entity: null
 wandb_mode: offline
-wandb_name: test1334test1234test1234test12334_texttest
 wandb_project: Gradients-On-Demand
 wandb_run: your_name
-wandb_runid: test1334test1234test1234test12334_texttest
 warmup_steps: 1
 weight_decay: 0.0
 xformers_attention: null
@@ -91,7 +91,7 @@ xformers_attention: null
 </details><br>
-# workspace/axolotl/outputs/test1334test1234test1234test12334/texttest
 This model was trained from scratch on the None dataset.

 - generated_from_trainer
 base_model: samoline/b7447218-27e6-491c-b3ab-ea03a5b93541
 model-index:
+- name: workspace/axolotl/outputs/test1334test1234test1234test34/texttest
   results: []
 ---
 dataset_prepared_path: null
 datasets:
 - data_files:
+  - test1334test1234test1234test34_train_data.json
   ds_type: json
   format: custom
   path: /workspace/axolotl/data
 lr_scheduler: cosine
 max_steps: 1
 micro_batch_size: 2
+mlflow_experiment_name: /workspace/axolotl/data/test1334test1234test1234test34_train_data.json
 model_type: AutoModelForCausalLM
 num_epochs: 1
 optimizer: adamw_bnb_8bit
+output_dir: /workspace/axolotl/outputs/test1334test1234test1234test34/texttest
 pad_to_sequence_len: true
 resume_from_checkpoint: null
 s2_attention: null
 val_set_size: 0.05
 wandb_entity: null
 wandb_mode: offline
+wandb_name: test1334test1234test1234test34_texttest
 wandb_project: Gradients-On-Demand
 wandb_run: your_name
+wandb_runid: test1334test1234test1234test34_texttest
 warmup_steps: 1
 weight_decay: 0.0
 xformers_attention: null
 </details><br>
+# workspace/axolotl/outputs/test1334test1234test1234test34/texttest
 This model was trained from scratch on the None dataset.

adapter_config.json CHANGED Viewed

@@ -25,10 +25,10 @@
   "revision": null,
   "target_modules": [
     "gate_proj",
-    "k_proj",
-    "down_proj",
     "q_proj",
     "up_proj",
     "v_proj",
     "o_proj"
   ],

   "revision": null,
   "target_modules": [
     "gate_proj",
     "q_proj",
+    "k_proj",
     "up_proj",
+    "down_proj",
     "v_proj",
     "o_proj"
   ],

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a25b065eef1c3d7fc2341c739d39f9e5314db39eee10c9342acee52c4d7aee7
 size 22573704

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ea6929ca6dde2a3ac9c8a46014547707c434edda5748ced18cd7d5a5201fef2
 size 22573704

checkpoint-1/README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-base_model: /cache/test1334test1234test1234test12334/models/samoline--b7447218-27e6-491c-b3ab-ea03a5b93541
 library_name: peft
 ---

 ---
+base_model: /cache/test1334test1234test1234test34/models/samoline--b7447218-27e6-491c-b3ab-ea03a5b93541
 library_name: peft
 ---

checkpoint-1/adapter_config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "alpha_pattern": {},
   "auto_mapping": null,
-  "base_model_name_or_path": "/cache/test1334test1234test1234test12334/models/samoline--b7447218-27e6-491c-b3ab-ea03a5b93541",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
@@ -25,10 +25,10 @@
   "revision": null,
   "target_modules": [
     "gate_proj",
-    "k_proj",
-    "down_proj",
     "q_proj",
     "up_proj",
     "v_proj",
     "o_proj"
   ],

 {
   "alpha_pattern": {},
   "auto_mapping": null,
+  "base_model_name_or_path": "/cache/test1334test1234test1234test34/models/samoline--b7447218-27e6-491c-b3ab-ea03a5b93541",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
   "revision": null,
   "target_modules": [
     "gate_proj",
     "q_proj",
+    "k_proj",
     "up_proj",
+    "down_proj",
     "v_proj",
     "o_proj"
   ],

checkpoint-1/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a25b065eef1c3d7fc2341c739d39f9e5314db39eee10c9342acee52c4d7aee7
 size 22573704

 version https://git-lfs.github.com/spec/v1
+oid sha256:7ea6929ca6dde2a3ac9c8a46014547707c434edda5748ced18cd7d5a5201fef2
 size 22573704

checkpoint-1/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:10159d605898dbcbf79e301a5f5144c27286a025a489ac232e94d88acb2a6bee
 size 11710970

 version https://git-lfs.github.com/spec/v1
+oid sha256:984dce112fc24ae4eaba62d2904d0043a7f32ec1a9ca5e5894925adf96d89a5b
 size 11710970

checkpoint-1/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8898f6f7795fb6bc31316b2e35945a51a1fa3d28252626c221222713df549b8d
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:f97bb552d304801def1800311e9b4f0db4888641a7d6326f60a0099954973d2b
 size 14244

checkpoint-1/trainer_state.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.009216589861751152,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
@@ -10,10 +10,10 @@
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.009216589861751152,
-      "grad_norm": 0.6244447827339172,
       "learning_rate": 0.0,
-      "loss": 1.0026,
       "step": 1
     }
   ],

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.009900990099009901,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.009900990099009901,
+      "grad_norm": 0.472037672996521,
       "learning_rate": 0.0,
+      "loss": 0.9592,
       "step": 1
     }
   ],

checkpoint-1/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9a1ebb3a101775193404ad81edb57b0ce9d21fb9922f5caea612cd94c8bac42a
 size 7224

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d896a8d25c643391583d2ed5bb4dced3ad66e83c5f45be84dfcb518f2faa37f
 size 7224