JAEHYUK LEE
committed on
Commit
·
3df0cd3
1
Parent(s):
bcf4399
Add audio model (pth + model.py + labels + meta)
Browse files- .gitattributes +1 -0
- __init__.py +0 -0
- baseline_mean_female.npy +3 -0
- baseline_mean_male.npy +3 -0
- baseline_std_female.npy +3 -0
- baseline_std_male.npy +3 -0
- labels.json +8 -0
- model.py +26 -0
- model_meta.json +19 -0
- pytorch_model.pth +3 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
*.pth filter=lfs diff=lfs merge=lfs -text
|
__init__.py
ADDED
|
File without changes
|
baseline_mean_female.npy
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4b83b047f116cefab3b0780856dd304dd69bfc461037f36e588c2c665394d60c
|
| 3 |
+
size 180
|
baseline_mean_male.npy
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0d71d187a2dda7888286a3c9b68cefb7bc7c41dcc998ded431e9833b3d18ff3
|
| 3 |
+
size 180
|
baseline_std_female.npy
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce87caf7c7a888500c0c8c612b8f49f1b401ec015512471bd8065805a428e18e
|
| 3 |
+
size 180
|
baseline_std_male.npy
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30ee24a5ecd49255f381bdcc5de0bb5c1783871d2309596188336f652e8a041c
|
| 3 |
+
size 180
|
labels.json
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
"HAPPY",
|
| 3 |
+
"SAD",
|
| 4 |
+
"ANGRY",
|
| 5 |
+
"ANXIOUS",
|
| 6 |
+
"SURPRISE",
|
| 7 |
+
"FEAR"
|
| 8 |
+
]
|
model.py
ADDED
|
@@ -0,0 +1,26 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import torch
|
| 2 |
+
import torch.nn as nn
|
| 3 |
+
import torch.nn.functional as F
|
| 4 |
+
|
| 5 |
+
|
| 6 |
+
class PyTorchAudioModel(nn.Module):
    """CNN + BiLSTM classifier over per-frame audio feature sequences.

    Architecture, in order:

    1. Two ``Conv1d -> BatchNorm1d -> ReLU -> MaxPool1d(2, 2)`` stages
       (``in_channels -> 64 -> 128`` channels). Each pooling stage halves
       the time axis, so the sequence reaching the LSTM is about a quarter
       of the input length.
    2. A single-layer bidirectional LSTM with 64 hidden units per direction.
       Only the final hidden state of each direction is kept.
    3. ``Linear(128, 128) -> ReLU -> Linear(128, num_labels)``.

    The output is raw logits; no softmax is applied here.

    Input layout is channels-first, ``(batch, in_channels, time)``.
    NOTE(review): the accompanying ``model_meta.json`` lists ``input_shape``
    as ``[100, 13]``, which looks like a (time, features) layout -- callers
    presumably need to transpose to ``(batch, 13, 100)`` before calling this
    module; confirm against the inference code.

    Args:
        num_labels: Number of output classes (size of the logit vector).
        in_channels: Number of features per frame, i.e. the channel
            dimension of the input. Defaults to 13, the value the original
            checkpoint layout was built with.
    """

    def __init__(self, num_labels: int = 6, *, in_channels: int = 13) -> None:
        super().__init__()
        # Attribute names and creation order are deliberately unchanged so
        # that existing state_dict checkpoints keep loading key-for-key.
        self.conv1 = nn.Conv1d(in_channels, 64, kernel_size=5, padding="same")
        self.bn1 = nn.BatchNorm1d(64)
        self.pool1 = nn.MaxPool1d(2, 2)
        self.conv2 = nn.Conv1d(64, 128, kernel_size=3, padding="same")
        self.bn2 = nn.BatchNorm1d(128)
        self.pool2 = nn.MaxPool1d(2, 2)
        self.bilstm = nn.LSTM(128, 64, bidirectional=True, batch_first=True)
        # 128 = 64 hidden units x 2 directions.
        self.dense1 = nn.Linear(128, 128)
        self.dense2 = nn.Linear(128, num_labels)

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Compute class logits for a batch of feature sequences.

        Args:
            x: Tensor of shape ``(batch, in_channels, time)``.

        Returns:
            Tensor of shape ``(batch, num_labels)`` holding unnormalised
            logits.
        """
        x = self.pool1(F.relu(self.bn1(self.conv1(x))))
        x = self.pool2(F.relu(self.bn2(self.conv2(x))))
        x = x.permute(0, 2, 1)  # (B,C,L)->(B,L,C), as batch_first LSTM expects
        _, (h_n, _) = self.bilstm(x)
        # h_n is (num_directions, B, 64) for this single-layer LSTM:
        # index -2 is the forward direction, -1 the backward direction.
        x = torch.cat([h_n[-2], h_n[-1]], dim=1)
        x = F.relu(self.dense1(x))
        return self.dense2(x)
|
model_meta.json
ADDED
|
@@ -0,0 +1,19 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"model_version": "v1.0",
|
| 3 |
+
"framework": "keras-3.x / tf-2.15+",
|
| 4 |
+
"input_shape": [
|
| 5 |
+
100,
|
| 6 |
+
13
|
| 7 |
+
],
|
| 8 |
+
"output_classes": 6,
|
| 9 |
+
"labels_order": [
|
| 10 |
+
"HAPPY",
|
| 11 |
+
"SAD",
|
| 12 |
+
"ANGRY",
|
| 13 |
+
"ANXIOUS",
|
| 14 |
+
"SURPRISE",
|
| 15 |
+
"FEAR"
|
| 16 |
+
],
|
| 17 |
+
"delta_required": true,
|
| 18 |
+
"delta_formula": "(X - mean) / (std + 1e-8)"
|
| 19 |
+
}
|
pytorch_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a560dc67d3063ae125e7be22753dcd8803f6b1b148b9e44c880a59f9a9bc942
|
| 3 |
+
size 593404
|