Upload folder using huggingface_hub

Files changed (4) hide show

0000100_adapters.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:733d34934908187d60060aeb0a8c13a31f9a0c265c4519a3596d912cd5afe86c
+size 19947012

0000200_adapters.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5acb0abdd589aec63732c9affe03f610ef9f9212a6cbf52d7f40dbd2d80bd88
+size 19947012

adapter_config.json ADDED Viewed

+{
+    "adapter_path": "/Users/cagatay/strands-mlx/adapter_105_conservative",
+    "batch_size": 1,
+    "config": null,
+    "data": "/Users/cagatay/strands-mlx/strands_training",
+    "fine_tune_type": "lora",
+    "grad_accumulation_steps": 1,
+    "grad_checkpoint": true,
+    "iters": 200,
+    "learning_rate": 1e-05,
+    "lora_parameters": {
+        "rank": 8,
+        "scale": 16.0,
+        "dropout": 0.0
+    },
+    "lr_schedule": null,
+    "mask_prompt": false,
+    "max_seq_length": 2048,
+    "model": "mlx-community/Qwen3-1.7B-4bit",
+    "num_layers": 16,
+    "optimizer": "adam",
+    "optimizer_config": {
+        "adam": {},
+        "adamw": {},
+        "muon": {},
+        "sgd": {},
+        "adafactor": {}
+    },
+    "project_name": null,
+    "report_to": null,
+    "resume_adapter_file": null,
+    "save_every": 100,
+    "seed": 0,
+    "steps_per_eval": 50,
+    "steps_per_report": 20,
+    "steps_per_save": 100,
+    "test": false,
+    "test_batches": 500,
+    "train": true,
+    "val_batches": 25
+}

adapters.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:a5acb0abdd589aec63732c9affe03f610ef9f9212a6cbf52d7f40dbd2d80bd88
+size 19947012