File size: 1,260 Bytes
6a4aa16
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
{
  "version": "v3.0-hybrid",
  "config": {
    "epochs": 8,
    "batch_size": 32,
    "gradient_accumulation_steps": 2,
    "learning_rate": 2e-05,
    "warmup_ratio": 0.1,
    "save_steps": 50,
    "evaluation_steps": 50,
    "use_e5_prefixes": true,
    "shuffle_data": true,
    "weight_decay": 0.01,
    "use_cached_mnrl": true,
    "hard_negatives_per_sample": 3,
    "scale": 20.0,
    "eval_batch_size": 32,
    "primary_metric": "recall@10",
    "early_stopping_metric": "mrr@10",
    "early_stopping_patience": 1,
    "early_stopping_min_delta": 0.003,
    "save_best_model": true,
    "log_metrics_to_file": true,
    "verbose_evaluation": true
  },
  "training_time_minutes": 77.64942452907562,
  "total_examples": 9562,
  "examples_per_sample": 1.5048788164935474,
  "model_name": "intfloat/multilingual-e5-base",
  "timestamp": "202759",
  "loss_function": "CachedMultipleNegativesRankingLoss",
  "loss_scale": 20.0,
  "hard_negatives_per_sample": 3,
  "lr_scheduler": "cosine",
  "warmup_steps": 119,
  "total_steps": 1192,
  "resumed_from_checkpoint": false,
  "checkpoint_path": null,
  "early_stopping_used": true,
  "early_stopping_triggered": true,
  "best_metric_score": 0.9091547394004861,
  "stopped_epoch": 4,
  "total_evaluations": 7
}