{
  "repo_id": "faeea/custom-gopt-252-eval",
  "description": "Bundle of the locally downloaded best validation Streaming GOPT checkpoint plus the Whisper and Charsiu models required by the evaluation pipeline.",
  "artifacts": [
    {
      "path": "streaming_gopt_best/best_audio_model.pth",
      "type": "streaming_gopt_weights",
      "purpose": "Pronunciation scoring model selected by validation phone MSE."
    },
    {
      "path": "streaming_gopt_best/config.json",
      "type": "streaming_gopt_config",
      "purpose": "Network shape and training arguments used to restore the model."
    },
    {
      "path": "streaming_gopt_best/result.csv",
      "type": "training_metrics",
      "purpose": "Per-epoch train/validation metrics."
    },
    {
      "path": "streaming_gopt_best/test_metrics.json",
      "type": "test_metrics",
      "purpose": "Held-out test metrics for the best validation checkpoint."
    },
    {
      "path": "whisper_best_model",
      "type": "transformers_whisper_model",
      "purpose": "ASR model used to build streaming ASR-driven GOPT chunks."
    },
    {
      "path": "charsiu_en_w2v2_tiny_fc_10ms",
      "type": "charsiu_aligner_model",
      "purpose": "Frame-level phone alignment model used by preprocessing."
    },
    {
      "path": "examples/eval_streaming_gopt_test.py",
      "type": "example_script",
      "purpose": "Minimal evaluation script for val/test split using the bundled best GOPT checkpoint."
    },
    {
      "path": "examples/infer_one_audio.py",
      "type": "example_script",
      "purpose": "Minimal one-audio local inference script that prints the overall utterance score."
    },
    {
      "path": "streaming_gopt_best/inference_assets.json",
      "type": "inference_metadata",
      "purpose": "Normalization stats and phone-id mapping required for one-audio local inference."
    }
  ],
  "best_validation_summary": {
    "selection_metric": "phone_val_mse",
    "best_epoch": 15,
    "phone_val_mse": 0.04897475987672806,
    "phone_val_pcc": 0.24482591936290432,
    "utt_val_pcc_total": 0.6696266195414817,
    "word_val_pcc_total": 0.24699408632096473
  },
  "test_summary": {
    "phone_test_mse": 0.04749840870499611,
    "phone_test_pcc": 0.3332444625995981,
    "utt_test_pcc": [
      0.6184778675115561,
      -0.005628494483717365,
      0.7233702728305461,
      0.7387418272039076,
      0.6823243104620896
    ],
    "word_test_pcc": [
      0.3099214468824142,
      0.022433912396827224,
      0.321762854413528
    ]
  },
  "code_dependencies": {
    "custom_gopt_repo": "https://github.com/hf49w/custom-gopt.git",
    "charsiu_repo": "https://github.com/lingjzhu/charsiu",
    "charsiu_repo_commit": "13a69f2a22ca0c0962b75cc693399b0ae23a12c9"
  }
}