{
  "model_type": "gigaam",
  "auto_map": {
    "AutoConfig": "modeling_gigaam.GigaAMConfig",
    "AutoModel": "modeling_gigaam.GigaAMModel"
  },
  "cfg": {
    "model": {
      "cfg": {
        "model_class": "rnnt",
        "sample_rate": 16000,
        "preprocessor": {
          "_target_": "modeling_gigaam.FeatureExtractor",
          "sample_rate": 16000,
          "features": 64,
          "win_length": 320,
          "hop_length": 160,
          "mel_scale": "htk",
          "n_fft": 320,
          "mel_norm": null,
          "center": false
        },
        "encoder": {
          "_target_": "modeling_gigaam.ConformerEncoder",
          "feat_in": 64,
          "n_layers": 16,
          "d_model": 768,
          "subsampling_factor": 4,
          "ff_expansion_factor": 4,
          "self_attention_model": "rotary",
          "pos_emb_max_len": 5000,
          "n_heads": 16,
          "conv_kernel_size": 5,
          "flash_attn": false,
          "subs_kernel_size": 5,
          "subsampling": "conv1d",
          "conv_norm_type": "layer_norm"
        },
        "head": {
          "_target_": "modeling_gigaam.RNNTHead",
          "decoder": {
            "pred_hidden": 320,
            "pred_rnn_layers": 1,
            "num_classes": 1025
          },
          "joint": {
            "enc_hidden": 768,
            "pred_hidden": 320,
            "joint_hidden": 320,
            "num_classes": 1025
          }
        },
        "decoding": {
          "_target_": "modeling_gigaam.RNNTGreedyDecoding",
          "vocabulary": null,
          "model_path": "tokenizer.model"
        },
        "model_name": "v3_e2e_rnnt",
        "hashes": {
          "model": "72e2a9b5c7caad963b2bbfd2f298c252",
          "tokenizer": "3b3bf8370e882885d79731592fc99f98"
        }
      },
      "_target_": "modeling_gigaam.GigaAMASR"
    }
  }
}