📦 Add model, tokenizer, and model card

Files changed (4)

README.md CHANGED Viewed

@@ -3,10 +3,10 @@ tags:
   - finetuned
 ---
-# meta-llama/Llama-3.1-8B-finetuned with Atomic
 ## Model Description
-This model was fine-tuned from `meta-llama/Llama-3.1-8B` on `fka/awesome-chatgpt-prompts` data using NOLA AI’s Atomic system.
 ## Training Data
 - **Dataset name:** fka/awesome-chatgpt-prompts
@@ -17,5 +17,6 @@ This model was fine-tuned from `meta-llama/Llama-3.1-8B` on `fka/awesome-chatgpt
 - **Used ATOMIC Speed:** True
 ## Final Metrics
-- **Training loss:** N/A
 ---

   - finetuned
 ---
+# meta-llama/Llama-3.2-1B-finetuned with Atomic
 ## Model Description
+This model was fine-tuned from `meta-llama/Llama-3.2-1B` on `fka/awesome-chatgpt-prompts` data using NOLA AI’s Atomic system.
 ## Training Data
 - **Dataset name:** fka/awesome-chatgpt-prompts
 - **Used ATOMIC Speed:** True
 ## Final Metrics
+- **Training loss:** 1.5815104802449544
+- **Training Runtime:** 0:00:46
 ---

adapter_config.json CHANGED Viewed

@@ -4,7 +4,7 @@
     "base_model_class": "LlamaForCausalLM",
     "parent_library": "transformers.models.llama.modeling_llama"
   },
-  "base_model_name_or_path": "meta-llama/Llama-3.1-8B",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
@@ -27,12 +27,12 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "v_proj",
     "gate_proj",
     "k_proj",
     "q_proj",
-    "o_proj",
-    "down_proj",
     "up_proj"
   ],
   "task_type": null,

     "base_model_class": "LlamaForCausalLM",
     "parent_library": "transformers.models.llama.modeling_llama"
   },
+  "base_model_name_or_path": "meta-llama/Llama-3.2-1B",
   "bias": "none",
   "corda_config": null,
   "eva_config": null,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
+    "o_proj",
     "v_proj",
     "gate_proj",
+    "down_proj",
     "k_proj",
     "q_proj",
     "up_proj"
   ],
   "task_type": null,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:36020e044dac18e4b1f3bc2bdd39e6a8f3a064be8bf47fdbfbee608db5afb45f
-size 167832240

 version https://git-lfs.github.com/spec/v1
+oid sha256:aa9cd83605777c79ba8bcea5eecf6b31323bb85d686823f9d1199355175168d7
+size 45118424

lorax_manifest.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "schema": "atomizer/lorax-manifest@v1",
-  "created_at": "2025-09-10T14:49:06.688825+00:00",
   "artifacts": {
     "base_model_id": "",
     "adapters_repo_id": "volfan6415/DemoDayModel_LoRA",
@@ -14,7 +14,7 @@
     "adapter_source": "hub",
     "private": true
   },
-  "runid": "a3c40e0c-ab71-43c1-9e2b-3c12e7647c93",
   "output_dir": "DemoDayModel",
   "training_args": {
     "bf16": true,
@@ -24,7 +24,7 @@
     "logging_steps": 10,
     "lr_scheduler_type": "linear",
     "max_grad_norm": 1,
-    "num_train_epochs": 3,
     "optim": "adamw_torch_fused",
     "output_dir": "DemoDayModel",
     "per_device_eval_batch_size": 16,

 {
   "schema": "atomizer/lorax-manifest@v1",
+  "created_at": "2025-09-18T17:43:05.756765+00:00",
   "artifacts": {
     "base_model_id": "",
     "adapters_repo_id": "volfan6415/DemoDayModel_LoRA",
     "adapter_source": "hub",
     "private": true
   },
+  "runid": "eff98df7-f8ad-4385-bb48-20b20626c6da",
   "output_dir": "DemoDayModel",
   "training_args": {
     "bf16": true,
     "logging_steps": 10,
     "lr_scheduler_type": "linear",
     "max_grad_norm": 1,
+    "num_train_epochs": 10,
     "optim": "adamw_torch_fused",
     "output_dir": "DemoDayModel",
     "per_device_eval_batch_size": 16,