phammminhhieu
/

mamba-hypernetwork-personalization

mamba-hypernetwork-personalization

Model card Files Files and versions

phammminhhieu committed 15 days ago

Commit

df99066

·

verified ·

1 Parent(s): 51b4149

Upload config

Files changed (1) hide show

config.json +22 -0

config.json ADDED Viewed

	@@ -0,0 +1,22 @@

+{
+  "model_type": "mamba_hypernetwork",
+  "vocab_size": 128000,
+  "hidden_dim": 1024,
+  "state_dim": 16,
+  "expand": 4,
+  "num_llm_layers": 8,
+  "lora_rank": 16,
+  "q_proj_dim": 3072,
+  "v_proj_dim": 1024,
+  "llm_name": "meta-llama/Llama-3.2-3B-Instruct",
+  "reward_model": "phammminhhieu/persona-reward-model",
+  "training_config": {
+    "batch_size": 2,
+    "K": 4,
+    "epochs": 3,
+    "lr": 0.0005,
+    "lambda_grpo": 0.05,
+    "lambda_kl": 0.1,
+    "temperature": 0.8
+  }
+}