crystalballAI committed on
Commit
bd16cf8
·
verified ·
1 Parent(s): 9f9e25b

Add adapters/adapter_config.json

Browse files
Files changed (1) hide show
  1. adapters/adapter_config.json +47 -0
adapters/adapter_config.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "adapter_path": "trail-nexus-ai/models/qwen3-0.6b-routing-specialist/adapters",
3
+ "batch_size": 2,
4
+ "config": "trail-nexus-ai/models/qwen3-0.6b-routing-specialist/lora_config.yaml",
5
+ "data": "trail-nexus-ai/training/data/routing_sft_v1",
6
+ "fine_tune_type": "lora",
7
+ "grad_accumulation_steps": 2,
8
+ "grad_checkpoint": true,
9
+ "iters": 4000,
10
+ "learning_rate": 5e-05,
11
+ "lora_parameters": {
12
+ "alpha": 32,
13
+ "dropout": 0.05,
14
+ "keys": [
15
+ "self_attn.q_proj",
16
+ "self_attn.v_proj",
17
+ "self_attn.k_proj",
18
+ "self_attn.o_proj"
19
+ ],
20
+ "rank": 16,
21
+ "scale": 1.0
22
+ },
23
+ "lr_schedule": null,
24
+ "mask_prompt": false,
25
+ "max_seq_length": 2048,
26
+ "model": "/Users/justinraj/.cache/huggingface/hub/models--Qwen--Qwen3-0.6B/snapshots/c1899de289a04d12100db370d81485cdf75e47ca",
27
+ "num_layers": 16,
28
+ "optimizer": "adam",
29
+ "optimizer_config": {
30
+ "adam": {},
31
+ "adamw": {},
32
+ "muon": {},
33
+ "sgd": {},
34
+ "adafactor": {}
35
+ },
36
+ "project_name": null,
37
+ "report_to": null,
38
+ "resume_adapter_file": null,
39
+ "save_every": 500,
40
+ "seed": 42,
41
+ "steps_per_eval": 200,
42
+ "steps_per_report": 10,
43
+ "test": false,
44
+ "test_batches": 500,
45
+ "train": true,
46
+ "val_batches": 25
47
+ }