Thimphou committed on
Commit
2a1b97e
·
verified ·
1 Parent(s): d3d1096

Add training configuration

Browse files
Files changed (1) hide show
  1. training_config.json +19 -0
training_config.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "timestamp": "2025-06-10T17:30:51.748843",
3
+ "model_name": "Thimphou/MNLP_M3_SFT_code_5percent",
4
+ "data_path": "data/enhanced_mcqa_training_format.tsv",
5
+ "use_context": true,
6
+ "eval_with_context": false,
7
+ "epochs": 3,
8
+ "batch_size": 2,
9
+ "learning_rate": 5e-05,
10
+ "test_size": 0.1,
11
+ "max_samples": 500,
12
+ "output_dir": "./qwen-mcqa-ft",
13
+ "baseline_only": false,
14
+ "eval_only": false,
15
+ "quantize_only": false,
16
+ "quantization": "none",
17
+ "device": "cuda",
18
+ "torch_version": "2.5.1+cu124"
19
+ }