mohdusman001 committed on
Commit
71b5b76
·
verified ·
1 Parent(s): 65254b0

Add pipeline_summary.json

Browse files
Files changed (1) hide show
  1. metrics/pipeline_summary.json +41 -0
metrics/pipeline_summary.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "completed_at": "2025-11-16 19:50:03",
3
+ "total_hours": 4.139640825125906,
4
+ "configuration": {
5
+ "base_model": "meta-llama/Meta-Llama-3.1-8B-Instruct",
6
+ "gpus": 2,
7
+ "lora_rank": 128,
8
+ "lora_alpha": 256,
9
+ "max_steps": 500
10
+ },
11
+ "stages": {
12
+ "stage1": {
13
+ "context_length": 2048,
14
+ "hours": 4.0,
15
+ "learning_rate": 0.00015,
16
+ "merged_model": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage1/merged_model_stage1",
17
+ "final_eval": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage1/metrics/final_eval.json",
18
+ "generations": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage1/generations.jsonl",
19
+ "quick_sanity": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage1/metrics/quick_sanity.json"
20
+ },
21
+ "stage2": {
22
+ "context_length": 4096,
23
+ "hours": 5.0,
24
+ "learning_rate": 8e-05,
25
+ "merged_model": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage2/merged_model_stage2",
26
+ "final_eval": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage2/metrics/final_eval.json",
27
+ "generations": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage2/generations.jsonl",
28
+ "quick_sanity": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage2/metrics/quick_sanity.json"
29
+ },
30
+ "stage3": {
31
+ "context_length": 8192,
32
+ "hours": 5.0,
33
+ "learning_rate": 5e-05,
34
+ "merged_model": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage3/merged_model_stage3",
35
+ "final_eval": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage3/metrics/final_eval.json",
36
+ "generations": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage3/generations.jsonl",
37
+ "quick_sanity": "/scratch/musmanme/pi2_table_sft_three_stage_output/stage3/metrics/quick_sanity.json"
38
+ }
39
+ },
40
+ "note": "\u03c0\u2082 SFT complete. Use any merged_model as initial policy/reference for Stage-2 RL."
41
+ }