clairedhx committed on
Commit
90fa8dd
·
verified ·
1 Parent(s): 3adf308

Upload config_train.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. config_train.json +26 -0
config_train.json ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "input_csv": "data/bdx_codes/train.csv",
3
+ "text_col": "text",
4
+ "label_col": "dp_code_tronque",
5
+ "output_dir": "checkpoints/camembert_dp_ft_top40_bdx",
6
+ "pretrained": "almanach/camembert-bio-base",
7
+ "epochs": 20,
8
+ "batch_size": 8,
9
+ "lr": 2e-05,
10
+ "fp16": true,
11
+ "bf16": false,
12
+ "warmup_ratio": 0.1,
13
+ "weight_decay": 0.01,
14
+ "max_length": 512,
15
+ "val_frac": 0.1,
16
+ "seed": 42,
17
+ "eval_every": 500,
18
+ "save_total_limit": 2,
19
+ "gradient_accumulation_steps": 4,
20
+ "do_chunk": true,
21
+ "chunk_size": 480,
22
+ "chunk_stride": 64,
23
+ "mlflow_run_name": "finetuning_top40_bdx",
24
+ "n_train": 8407,
25
+ "n_val": 956
26
+ }