pandelis committed on
Commit
5fe06ee
·
verified ·
1 Parent(s): 888969a

Upload Laguna XS.2 zerolang editing step 75 LoRA

Browse files
loras/laguna-xs2-zerolang-editing-step75-hdznmf/README.md ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Laguna XS.2 Zerolang Editing LoRA
2
+
3
+ LoRA adapter from the best checkpoint of the Prime-hosted training run `hdznmfje3xv0clwhu9sx4b0n`.
4
+
5
+ - Base model: `poolside/Laguna-XS.2`
6
+ - Environment: `pandelis/zerolang-editing@0.1.11`
7
+ - Prime checkpoint: `qyxg7ya6x53ntmfjerp11gah`
8
+ - Training step: 75
9
+ - Held-out eval Avg@1: 0.6604
10
+ - Learning rate: `2e-5`
11
+ - Batch size: 64
12
+ - Rollouts per example: 8
13
+ - Sampling: `max_tokens=4096`, `temperature=0.3`, `enable_thinking=true`
14
+
15
+ This folder contains the PEFT LoRA adapter files extracted from the checkpoint:
16
+
17
+ - `adapter_config.json`
18
+ - `adapter_model.safetensors`
loras/laguna-xs2-zerolang-editing-step75-hdznmf/adapter_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "peft_type": "LORA",
3
+ "task_type": "CAUSAL_LM",
4
+ "base_model_name_or_path": "poolside/Laguna-XS.2",
5
+ "r": 16,
6
+ "lora_alpha": 32.0,
7
+ "lora_dropout": 0.0,
8
+ "bias": "none",
9
+ "target_modules": [
10
+ "down_proj",
11
+ "experts",
12
+ "gate_proj",
13
+ "k_proj",
14
+ "o_proj",
15
+ "q_proj",
16
+ "up_proj",
17
+ "v_proj"
18
+ ],
19
+ "modules_to_save": null
20
+ }
loras/laguna-xs2-zerolang-editing-step75-hdznmf/adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1d5fd8b5fcbd7ebf37b9fde9aae86b39db1295451ffea52dd266172e27ff52b
3
+ size 4982588672
loras/laguna-xs2-zerolang-editing-step75-hdznmf/prime_metadata.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "artifact_type": "peft_lora_adapter",
3
+ "base_model": "poolside/Laguna-XS.2",
4
+ "environment": {
5
+ "id": "pandelis/zerolang-editing",
6
+ "version": "0.1.11"
7
+ },
8
+ "prime_run_id": "hdznmfje3xv0clwhu9sx4b0n",
9
+ "prime_checkpoint_id": "qyxg7ya6x53ntmfjerp11gah",
10
+ "training_step": 75,
11
+ "eval_avg_at_1": 0.6604,
12
+ "training_config": {
13
+ "learning_rate": 2e-5,
14
+ "batch_size": 64,
15
+ "rollouts_per_example": 8,
16
+ "max_steps": 80,
17
+ "sampling": {
18
+ "max_tokens": 4096,
19
+ "temperature": 0.3,
20
+ "enable_thinking": true
21
+ }
22
+ },
23
+ "source_storage_url": "r2://pi-rft-prod/runs/hdznmfje3xv0clwhu9sx4b0n/checkpoints/step_75/"
24
+ }