JAEHYUK LEE committed on
Commit
3df0cd3
·
1 Parent(s): bcf4399

Add audio model (pth + model.py + labels + meta)

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.pth filter=lfs diff=lfs merge=lfs -text
__init__.py ADDED
File without changes
baseline_mean_female.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b83b047f116cefab3b0780856dd304dd69bfc461037f36e588c2c665394d60c
3
+ size 180
baseline_mean_male.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0d71d187a2dda7888286a3c9b68cefb7bc7c41dcc998ded431e9833b3d18ff3
3
+ size 180
baseline_std_female.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce87caf7c7a888500c0c8c612b8f49f1b401ec015512471bd8065805a428e18e
3
+ size 180
baseline_std_male.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30ee24a5ecd49255f381bdcc5de0bb5c1783871d2309596188336f652e8a041c
3
+ size 180
labels.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ [
2
+ "HAPPY",
3
+ "SAD",
4
+ "ANGRY",
5
+ "ANXIOUS",
6
+ "SURPRISE",
7
+ "FEAR"
8
+ ]
model.py ADDED
@@ -0,0 +1,26 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import torch
2
+ import torch.nn as nn
3
+ import torch.nn.functional as F
4
+
5
+
6
class PyTorchAudioModel(nn.Module):
    """Conv1d + bidirectional-LSTM classifier over framed audio features.

    Two Conv1d/BatchNorm/ReLU/MaxPool stages run along the time axis, a
    single-layer bidirectional LSTM summarises the resulting sequence, and
    two linear layers map the summary to ``num_labels`` scores.

    Submodule attribute names (``conv1``, ``bn1``, ..., ``dense2``) define
    the ``state_dict`` keys, so they must stay stable for saved checkpoints
    to keep loading.

    Args:
        num_labels: Number of output classes (size of the final layer).
        in_channels: Number of feature channels per time step. Defaults to
            13, the value that was previously hard-coded.
    """

    def __init__(self, num_labels=6, in_channels=13):
        super().__init__()
        # Stage 1: in_channels -> 64 channels; "same" padding keeps the
        # time length, then pooling halves it.
        self.conv1 = nn.Conv1d(in_channels, 64, kernel_size=5, padding="same")
        self.bn1 = nn.BatchNorm1d(64)
        self.pool1 = nn.MaxPool1d(2, 2)
        # Stage 2: 64 -> 128 channels; time length is halved again.
        self.conv2 = nn.Conv1d(64, 128, kernel_size=3, padding="same")
        self.bn2 = nn.BatchNorm1d(128)
        self.pool2 = nn.MaxPool1d(2, 2)
        # Hidden size 64 per direction -> 128 features once both
        # directions are concatenated, matching dense1's input width.
        self.bilstm = nn.LSTM(128, 64, bidirectional=True, batch_first=True)
        self.dense1 = nn.Linear(128, 128)
        self.dense2 = nn.Linear(128, num_labels)

    def forward(self, x):
        """Return unnormalised class scores for a batch of feature sequences.

        Args:
            x: Tensor laid out as ``(batch, in_channels, time)``, i.e.
                channels-first as required by ``nn.Conv1d``.
                NOTE(review): if upstream features are stored as
                ``(time, features)``, they must be transposed before being
                passed in -- confirm against the caller.

        Returns:
            Tensor of shape ``(batch, num_labels)``. No softmax is applied.
        """
        x = self.pool1(F.relu(self.bn1(self.conv1(x))))
        x = self.pool2(F.relu(self.bn2(self.conv2(x))))
        # The LSTM is batch_first, so move channels last: (B,C,L)->(B,L,C).
        x = x.permute(0, 2, 1)
        _, (h_n, _) = self.bilstm(x)
        # Final hidden states of the forward (h_n[-2]) and backward
        # (h_n[-1]) directions, concatenated along the feature axis.
        x = torch.cat([h_n[-2], h_n[-1]], dim=1)
        x = F.relu(self.dense1(x))
        return self.dense2(x)
model_meta.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_version": "v1.0",
3
+ "framework": "keras-3.x / tf-2.15+",
4
+ "input_shape": [
5
+ 100,
6
+ 13
7
+ ],
8
+ "output_classes": 6,
9
+ "labels_order": [
10
+ "HAPPY",
11
+ "SAD",
12
+ "ANGRY",
13
+ "ANXIOUS",
14
+ "SURPRISE",
15
+ "FEAR"
16
+ ],
17
+ "delta_required": true,
18
+ "delta_formula": "(X - mean) / (std + 1e-8)"
19
+ }
pytorch_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a560dc67d3063ae125e7be22753dcd8803f6b1b148b9e44c880a59f9a9bc942
3
+ size 593404