File size: 3,014 Bytes
b5a4032
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
{
  "ground_truth_file": "/home/daniel/repos/github/Long-Form-Audio-Eval/data/ground-truth/truth_1.txt",
  "total_runs_evaluated": 8,
  "results": [
    {
      "run_id": "run-1",
      "run_type": "local-stt",
      "provider": "local",
      "model": "whisper-base",
      "engine": "Buzz",
      "metrics": {
        "wer": 17.52,
        "cer": 5.38,
        "word_accuracy": 82.48,
        "insertions": 44,
        "deletions": 62,
        "substitutions": 726,
        "hits": 3960
      }
    },
    {
      "run_id": "run-2",
      "run_type": "local-stt",
      "provider": "local",
      "model": "whisper-tiny",
      "engine": "Buzz",
      "metrics": {
        "wer": 22.49,
        "cer": 8.39,
        "word_accuracy": 77.51,
        "insertions": 82,
        "deletions": 155,
        "substitutions": 831,
        "hits": 3762
      }
    },
    {
      "run_id": "run-3",
      "run_type": "local-stt",
      "provider": "local",
      "model": "whisper-base",
      "engine": "Buzz",
      "metrics": {
        "wer": 17.52,
        "cer": 5.38,
        "word_accuracy": 82.48,
        "insertions": 44,
        "deletions": 62,
        "substitutions": 726,
        "hits": 3960
      }
    },
    {
      "run_id": "manual-1",
      "run_type": "cloud-stt",
      "provider": "gladia",
      "model": "solaria-1",
      "engine": "api",
      "metrics": {
        "wer": 20.83,
        "cer": 6.3,
        "word_accuracy": 79.17,
        "insertions": 100,
        "deletions": 92,
        "substitutions": 797,
        "hits": 3859
      }
    },
    {
      "run_id": "manual-2",
      "run_type": "cloud-stt",
      "provider": "deepgram",
      "model": "nova-3",
      "engine": "api",
      "metrics": {
        "wer": 18.72,
        "cer": 7.33,
        "word_accuracy": 81.28,
        "insertions": 60,
        "deletions": 214,
        "substitutions": 615,
        "hits": 3919
      }
    },
    {
      "run_id": "manual-3",
      "run_type": "cloud-stt",
      "provider": "assemblyai",
      "model": "best",
      "engine": "api",
      "metrics": {
        "wer": 18.79,
        "cer": 6.24,
        "word_accuracy": 81.21,
        "insertions": 64,
        "deletions": 156,
        "substitutions": 672,
        "hits": 3920
      }
    },
    {
      "run_id": "manual-4",
      "run_type": "cloud-stt",
      "provider": "speechmatics",
      "model": "slam-1-global-english",
      "engine": "api",
      "metrics": {
        "wer": 21.65,
        "cer": 7.15,
        "word_accuracy": 78.35,
        "insertions": 158,
        "deletions": 51,
        "substitutions": 819,
        "hits": 3878
      }
    },
    {
      "run_id": "manual-5",
      "run_type": "cloud-stt",
      "provider": "openai",
      "model": "whisper-1",
      "engine": "api",
      "metrics": {
        "wer": 19.27,
        "cer": 6.4,
        "word_accuracy": 80.73,
        "insertions": 114,
        "deletions": 106,
        "substitutions": 695,
        "hits": 3947
      }
    }
  ]
}