Upload task output test1334test1234test1234test12334

Files changed (8) hide show

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ tags:
 - generated_from_trainer
 base_model: samoline/b7447218-27e6-491c-b3ab-ea03a5b93541
 model-index:
-- name: app/checkpoints/test13/texttest
   results: []
 ---
@@ -23,7 +23,7 @@ chat_template: llama3
 dataset_prepared_path: null
 datasets:
 - data_files:
-  - test13_train_data.json
   ds_type: json
   format: custom
   path: /workspace/axolotl/data
@@ -60,11 +60,11 @@ lora_target_linear: true
 lr_scheduler: cosine
 max_steps: 1
 micro_batch_size: 2
-mlflow_experiment_name: /workspace/axolotl/data/test13_train_data.json
 model_type: AutoModelForCausalLM
 num_epochs: 1
 optimizer: adamw_bnb_8bit
-output_dir: /app/checkpoints/test13/texttest
 pad_to_sequence_len: true
 resume_from_checkpoint: null
 s2_attention: null
@@ -79,10 +79,10 @@ trust_remote_code: true
 val_set_size: 0.05
 wandb_entity: null
 wandb_mode: offline
-wandb_name: test13_texttest
 wandb_project: Gradients-On-Demand
 wandb_run: your_name
-wandb_runid: test13_texttest
 warmup_steps: 1
 weight_decay: 0.0
 xformers_attention: null
@@ -91,7 +91,7 @@ xformers_attention: null
 </details><br>
-# app/checkpoints/test13/texttest
 This model was trained from scratch on the None dataset.

 - generated_from_trainer
 base_model: samoline/b7447218-27e6-491c-b3ab-ea03a5b93541
 model-index:
+- name: app/checkpoints/test1334test1234test1234test12334/texttest
   results: []
 ---
 dataset_prepared_path: null
 datasets:
 - data_files:
+  - test1334test1234test1234test12334_train_data.json
   ds_type: json
   format: custom
   path: /workspace/axolotl/data
 lr_scheduler: cosine
 max_steps: 1
 micro_batch_size: 2
+mlflow_experiment_name: /workspace/axolotl/data/test1334test1234test1234test12334_train_data.json
 model_type: AutoModelForCausalLM
 num_epochs: 1
 optimizer: adamw_bnb_8bit
+output_dir: /app/checkpoints/test1334test1234test1234test12334/texttest
 pad_to_sequence_len: true
 resume_from_checkpoint: null
 s2_attention: null
 val_set_size: 0.05
 wandb_entity: null
 wandb_mode: offline
+wandb_name: test1334test1234test1234test12334_texttest
 wandb_project: Gradients-On-Demand
 wandb_run: your_name
+wandb_runid: test1334test1234test1234test12334_texttest
 warmup_steps: 1
 weight_decay: 0.0
 xformers_attention: null
 </details><br>
+# app/checkpoints/test1334test1234test1234test12334/texttest
 This model was trained from scratch on the None dataset.

adapter_config.json CHANGED Viewed

@@ -24,13 +24,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "up_proj",
     "down_proj",
     "v_proj",
-    "k_proj",
     "gate_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
+    "up_proj",
     "v_proj",
     "gate_proj",
+    "q_proj",
+    "k_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0ce0bd8eaf01e7f731337e25a4c58b6b8c5f1a29af57f9f2c3d7d9df4b7d8b16
 size 22573704

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e5c010c04b0ed997c5bcbbdb8362a9c53e6bc5e50f2212fe5ff9c99d75273a4
 size 22573704

checkpoint-1/adapter_config.json CHANGED Viewed

@@ -24,13 +24,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "o_proj",
-    "up_proj",
     "down_proj",
     "v_proj",
-    "k_proj",
     "gate_proj",
-    "q_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "down_proj",
+    "up_proj",
     "v_proj",
     "gate_proj",
+    "q_proj",
+    "k_proj",
+    "o_proj"
   ],
   "task_type": "CAUSAL_LM",
   "trainable_token_indices": null,

checkpoint-1/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0ce0bd8eaf01e7f731337e25a4c58b6b8c5f1a29af57f9f2c3d7d9df4b7d8b16
 size 22573704

 version https://git-lfs.github.com/spec/v1
+oid sha256:7e5c010c04b0ed997c5bcbbdb8362a9c53e6bc5e50f2212fe5ff9c99d75273a4
 size 22573704

checkpoint-1/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4266f9a9cd3f58fb428f4ce578414368cae6358aca11e9e2347c3c1c08527ff7
 size 11710970

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab750e2213b220358059c8bb1238af05f822ff8058636d3ec44e2cd653d9a7e1
 size 11710970

checkpoint-1/trainer_state.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.010416666666666666,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
@@ -10,10 +10,10 @@
   "is_world_process_zero": true,
   "log_history": [
     {
-      "epoch": 0.010416666666666666,
-      "grad_norm": 0.8706836700439453,
       "learning_rate": 0.0,
-      "loss": 1.5137,
       "step": 1
     }
   ],

   "best_global_step": null,
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.008733624454148471,
   "eval_steps": 500,
   "global_step": 1,
   "is_hyper_param_search": false,
   "is_world_process_zero": true,
   "log_history": [
     {
+      "epoch": 0.008733624454148471,
+      "grad_norm": 0.692659318447113,
       "learning_rate": 0.0,
+      "loss": 1.6015,
       "step": 1
     }
   ],

checkpoint-1/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:064783a6f886a579701dc6537acb5b82984f533c5f775f5c3965481945d4547c
-size 7096

 version https://git-lfs.github.com/spec/v1
+oid sha256:f31b6c3abbe50418c0ea9a5853aed1f1ea7a05142bddae8aa159103fea461861
+size 7160