consight-embeddings-v2 / sweep_result.json
magaja's picture
Add Consight v2 embeddings: bge-base fine-tuned with hard negatives
67cfa2a verified
{
"config_name": "bge-base_lr5e6_ep5_bs16",
"model": "BAAI/bge-base-en-v1.5",
"hyperparameters": {
"learning_rate": 5e-06,
"epochs": 5,
"batch_size": 16,
"warmup_steps": 100,
"max_grad_norm": 0.5
},
"training_time_seconds": 294.1,
"synthetic_results": {
"baseline_model": "all-MiniLM-L6-v2",
"trained_model": "/home/ubuntu/sweep/data/model_sweep/bge-base_lr5e6_ep5_bs16",
"sample_size": 200,
"baseline_mean": 0.6809912909008563,
"trained_mean": 0.7275207257270813,
"improvement_mean": 0.04652943482622496,
"improvement_pct": 6.832603507259692,
"baseline_median": 0.7112560570240021,
"trained_median": 0.7321392893791199,
"improvement_median": 0.020883232355117798,
"trained_std": 0.1384458249346926,
"trained_min": 0.406196266412735,
"trained_max": 0.9855192303657532
},
"real_world_results": {
"test_pairs": 89,
"baseline_model": "all-MiniLM-L6-v2",
"trained_model": "/home/ubuntu/sweep/data/model_sweep/bge-base_lr5e6_ep5_bs16",
"baseline_mean": 0.513227381021454,
"trained_mean": 0.6044960109872765,
"improvement": 0.09126862996582241,
"improvement_pct": 17.783273718595147,
"distraction_mean_margin": 0.17822580886621997,
"distraction_positive_pct": 75.34246575342466
}
}