File size: 1,186 Bytes
70c4776
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
{
  "best_score": 0.8707563891593045,
  "best_model_path": "/root/.AUQUA-S/VIPPLUS-A/iteration3_refine6_intelligibility_focus_var1.5_iter2_encoder_boost_iter3_noise_scale_1.2",
  "best_strategy": "intelligibility_focus_var1.5_iter2_encoder_boost_iter3_noise_scale_1.2",
  "best_metrics": {
    "mel_cepstral_distortion": 0.9589833174818487,
    "word_error_rate": 0.054760724732324996,
    "naturalness": 0.9245957330261779,
    "intelligibility": 0.9576635250307177,
    "speaker_similarity": 0.9452548157294308,
    "prosody": 0.9438130045261443,
    "overall_quality": 0.9845158845287313,
    "weighted_score": 0.8707563891593045
  },
  "iterations_performed": 3,
  "final_model_path": "/root/.AUQUA-S/VIPPLUS-A/top1_optimized_model",
  "optimization_timestamp": "2025-04-14T17:08:24.418693",
  "seed": 1744649962,
  "total_strategies_tested": 32,
  "strategy_effectiveness": {
    "attention_scale": 1.2800188790071496,
    "output_scale": 1.3800188790071495,
    "projection_scale": 1.6199811209928505,
    "encoder_scale": 1.6602483822531084,
    "decoder_scale": 1.2199811209928504,
    "base_enhancement": 0.0029400566370214485,
    "importance_factor": 1.5999056049642524
  }
}