sugiv committed on
Commit
977128f
·
verified ·
1 Parent(s): 0872cc9

Upload training_config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yaml +30 -0
training_config.yaml ADDED
@@ -0,0 +1,30 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model:
2
+ base_model: BAAI/bge-reranker-v2-m3
3
+ freeze_encoder: true
4
+ max_length: 8192
5
+ max_sentences: 500 # NEW: Prevent OOM/hang on very long docs
6
+ pruning_head:
7
+ hidden_dim: 512
8
+ dropout: 0.2
9
+ training:
10
+ labels_file: /workspace/data/labels/examples.jsonl
11
+ train_split: 0.9
12
+ epochs: 10
13
+ batch_size: 8 # Reduced from 16 for long docs
14
+ gradient_accumulation: 8 # Maintain effective batch 64
15
+ learning_rate: 0.0001 # Slightly lower
16
+ weight_decay: 0.02
17
+ warmup_steps: 200 # More warmup
18
+ max_grad_norm: 1.0
19
+ loss:
20
+ loss_type: bce
21
+ pos_weight: 70.0 # FIXED: Was 20; raised to 70 to better offset the 94:1 imbalance (still below the full ratio)
22
+ label_smoothing: 0.05
23
+ hardware:
24
+ mixed_precision: bf16
25
+ wandb:
26
+ enabled: false
27
+ global:
28
+ data_dir: /workspace/data
29
+ checkpoint_dir: /workspace/checkpoints/pruner_optimized
30
+ log_file: /workspace/logs/pruner_sentence_v2.log