File size: 1,301 Bytes
67cfa2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
{
  "config_name": "bge-base_lr5e6_ep5_bs16",
  "model": "BAAI/bge-base-en-v1.5",
  "hyperparameters": {
    "learning_rate": 5e-06,
    "epochs": 5,
    "batch_size": 16,
    "warmup_steps": 100,
    "max_grad_norm": 0.5
  },
  "training_time_seconds": 294.1,
  "synthetic_results": {
    "baseline_model": "all-MiniLM-L6-v2",
    "trained_model": "/home/ubuntu/sweep/data/model_sweep/bge-base_lr5e6_ep5_bs16",
    "sample_size": 200,
    "baseline_mean": 0.6809912909008563,
    "trained_mean": 0.7275207257270813,
    "improvement_mean": 0.04652943482622496,
    "improvement_pct": 6.832603507259692,
    "baseline_median": 0.7112560570240021,
    "trained_median": 0.7321392893791199,
    "improvement_median": 0.020883232355117798,
    "trained_std": 0.1384458249346926,
    "trained_min": 0.406196266412735,
    "trained_max": 0.9855192303657532
  },
  "real_world_results": {
    "test_pairs": 89,
    "baseline_model": "all-MiniLM-L6-v2",
    "trained_model": "/home/ubuntu/sweep/data/model_sweep/bge-base_lr5e6_ep5_bs16",
    "baseline_mean": 0.513227381021454,
    "trained_mean": 0.6044960109872765,
    "improvement": 0.09126862996582241,
    "improvement_pct": 17.783273718595147,
    "distraction_mean_margin": 0.17822580886621997,
    "distraction_positive_pct": 75.34246575342466
  }
}