Upload folder using huggingface_hub

Files changed (5) hide show

blue_cycle_1/README.md CHANGED Viewed

@@ -1,9 +1,9 @@
 ---
-base_model: unsloth/Qwen2.5-3B-Instruct-bnb-4bit
 library_name: peft
 pipeline_tag: text-generation
 tags:
-- base_model:adapter:unsloth/Qwen2.5-3B-Instruct-bnb-4bit
 - grpo
 - lora
 - transformers

 ---
+base_model: unsloth/Qwen2.5-0.5B-Instruct-bnb-4bit
 library_name: peft
 pipeline_tag: text-generation
 tags:
+- base_model:adapter:unsloth/Qwen2.5-0.5B-Instruct-bnb-4bit
 - grpo
 - lora
 - transformers

blue_cycle_1/adapter_config.json CHANGED Viewed

@@ -7,7 +7,7 @@
     "parent_library": "transformers.models.qwen2.modeling_qwen2",
     "unsloth_fixed": true
   },
-  "base_model_name_or_path": "unsloth/Qwen2.5-3B-Instruct-bnb-4bit",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
@@ -20,7 +20,7 @@
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
-  "lora_alpha": 32,
   "lora_bias": false,
   "lora_dropout": 0,
   "lora_ga_config": null,
@@ -30,16 +30,11 @@
   "peft_type": "LORA",
   "peft_version": "0.19.1",
   "qalora_group_size": 16,
-  "r": 16,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
-    "down_proj",
-    "gate_proj",
-    "o_proj",
-    "up_proj",
-    "k_proj",
     "v_proj"
   ],
   "target_parameters": null,

     "parent_library": "transformers.models.qwen2.modeling_qwen2",
     "unsloth_fixed": true
   },
+  "base_model_name_or_path": "unsloth/Qwen2.5-0.5B-Instruct-bnb-4bit",
   "bias": "none",
   "corda_config": null,
   "ensure_weight_tying": false,
   "layers_pattern": null,
   "layers_to_transform": null,
   "loftq_config": {},
+  "lora_alpha": 16,
   "lora_bias": false,
   "lora_dropout": 0,
   "lora_ga_config": null,
   "peft_type": "LORA",
   "peft_version": "0.19.1",
   "qalora_group_size": 16,
+  "r": 8,
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
     "v_proj"
   ],
   "target_parameters": null,

blue_cycle_1/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8851d689bbeba6aced1434b3a33338c1758f3907c145a95d87d9abe1929026a3
-size 119801528

 version https://git-lfs.github.com/spec/v1
+oid sha256:d81a8869746a3cce0238b90ae22f1555ede481ec8b1c4a6c5a4168189c996f2a
+size 2175168

blue_cycle_1/best_metrics.json ADDED Viewed

+{
+  "metric": "train/loss",
+  "best_loss": -0.01885230392217636,
+  "best_step": 155,
+  "agent_type": "blue"
+}

blue_cycle_1/tokenizer_config.json CHANGED Viewed

@@ -8,7 +8,7 @@
   "is_local": false,
   "model_max_length": 32768,
   "pad_token": "<|PAD_TOKEN|>",
-  "padding_side": "left",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null,

   "is_local": false,
   "model_max_length": 32768,
   "pad_token": "<|PAD_TOKEN|>",
+  "padding_side": "right",
   "split_special_tokens": false,
   "tokenizer_class": "Qwen2Tokenizer",
   "unk_token": null,