File size: 1,223 Bytes
97d0228
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
{
  "model": "pyannote-segmentation-3.0",
  "format": "tflite",
  "mode": "streaming",
  "sample_rate": 16000,
  "chunk_duration": 1.0,
  "full_window_duration": 10.0,
  "full_window_step": 5.0,
  "num_chunks_per_window": 10,
  "num_powerset_classes": 7,
  "max_local_speakers": 3,
  "frames_per_chunk": 56,
  "frames_per_window": 560,
  "lstm_state_shape": [
    2,
    8,
    1,
    128
  ],
  "inputs": {
    "audio": {
      "shape": [
        1,
        1,
        16000
      ],
      "dtype": "float32"
    },
    "lstm_state": {
      "shape": [
        2,
        8,
        1,
        128
      ],
      "dtype": "float32",
      "note": "Pass zeros on the first chunk. On every later chunk, pass the lstm_state_out returned by the previous call."
    }
  },
  "outputs": {
    "posteriors": {
      "shape": [
        1,
        56,
        7
      ],
      "dtype": "float32"
    },
    "lstm_state_out": {
      "shape": [
        2,
        8,
        1,
        128
      ],
      "dtype": "float32",
      "note": "Feed back as lstm_state for the next chunk."
    }
  },
  "usage": "Run 10 consecutive 1-second chunks with state carried between calls to reconstruct a full 10-second segmentation window. Initialize lstm_state to zeros for the first chunk."
}