ModalTranscriberMCP / tests /cache /transcribe /speaker_diarization /comprehensive_test_results.json
richard-su's picture
Upload folder using huggingface_hub
76f9cd2 verified
[
{
"audio_file": "tests/cache/xyz_podcast_episode.mp3",
"file_size_mb": 11.427632331848145,
"tests": {
"without_speaker_diarization": {
"config": {
"name": "without_speaker_diarization",
"enable_speaker_diarization": false,
"model_size": "turbo",
"description": "Baseline transcription without speaker identification"
},
"result": {
"processing_status": "success",
"txt_file_path": "/root/cache/transcribe/distributed_transcription_1749529774.txt",
"srt_file_path": "/root/cache/transcribe/distributed_transcription_1749529774.srt",
"audio_duration": 749.98,
"segment_count": 232,
"language_detected": "zh",
"model_used": "turbo",
"distributed_processing": true,
"chunks_processed": 13,
"chunks_failed": 0,
"speaker_diarization_enabled": false
},
"processing_time": 60.62069916725159
},
"with_speaker_diarization": {
"config": {
"name": "with_speaker_diarization",
"enable_speaker_diarization": true,
"model_size": "turbo",
"description": "Full transcription with speaker identification"
},
"result": {
"processing_status": "success",
"txt_file_path": "/root/cache/transcribe/distributed_transcription_1749529901.txt",
"srt_file_path": "/root/cache/transcribe/distributed_transcription_1749529901.srt",
"audio_duration": 749.98,
"segment_count": 241,
"language_detected": "zh",
"model_used": "turbo",
"distributed_processing": true,
"chunks_processed": 13,
"chunks_failed": 0,
"speaker_diarization_enabled": true,
"global_speaker_count": 0,
"speakers_detected": [],
"speaker_summary": {}
},
"processing_time": 127.10918402671814
}
}
},
{
"audio_file": "tests/cache/apple_podcast_episode.mp3",
"file_size_mb": 32.30221080780029,
"tests": {
"without_speaker_diarization": {
"config": {
"name": "without_speaker_diarization",
"enable_speaker_diarization": false,
"model_size": "turbo",
"description": "Baseline transcription without speaker identification"
},
"result": {
"processing_status": "success",
"txt_file_path": "/root/cache/transcribe/distributed_transcription_1749529970.txt",
"srt_file_path": "/root/cache/transcribe/distributed_transcription_1749529970.srt",
"audio_duration": 1051.44,
"segment_count": 222,
"language_detected": "en",
"model_used": "turbo",
"distributed_processing": true,
"chunks_processed": 18,
"chunks_failed": 0,
"speaker_diarization_enabled": false
},
"processing_time": 68.2933440208435
},
"with_speaker_diarization": {
"config": {
"name": "with_speaker_diarization",
"enable_speaker_diarization": true,
"model_size": "turbo",
"description": "Full transcription with speaker identification"
},
"result": {
"processing_status": "success",
"txt_file_path": "/root/cache/transcribe/distributed_transcription_1749530106.txt",
"srt_file_path": "/root/cache/transcribe/distributed_transcription_1749530106.srt",
"audio_duration": 1051.44,
"segment_count": 219,
"language_detected": "en",
"model_used": "turbo",
"distributed_processing": true,
"chunks_processed": 18,
"chunks_failed": 0,
"speaker_diarization_enabled": true,
"global_speaker_count": 0,
"speakers_detected": [],
"speaker_summary": {}
},
"processing_time": 136.49856114387512
}
}
}
]