kesbeast23 committed on
Commit
4776de8
·
unverified ·
1 Parent(s): 1c29f6f
.gitignore ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ gradio_env/
2
+ .DS_Store
3
+ .env
4
+ .venv/
5
+ # Exclude large audio files (use parquet instead)
6
+ *.wav
7
+ *.mp3
8
+ *.flac
9
+ common_samples/
10
+ organized_samples/
11
+
12
+ # Keep parquet files (compact replacement for raw audio; tracked via Git LFS)
13
+ !parquet_samples/
14
+ !*.parquet
15
+
16
+ # Python
17
+ __pycache__/
18
+ *.py[cod]
19
+ *$py.class
211_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4a2376819631b88b8ed6bdcae272acece1d0a0f6a962be531b077632d239732
3
+ size 33996737
4014_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1cf39ba7ea2c895fe485db1235bfffe58b48f150b79834c2eb919deec3e2eb7
3
+ size 35781880
F02_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:051fed6bac89a4f6031970afdedf4cb17f15c1ad9c557efb562a7152045c7806
3
+ size 15836445
F04_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02339455600a256f8a2d35379546747a5edfc7e02dd92a35ebaf057b996780e2
3
+ size 16499443
FC02_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2abedd7a17821e894236af63b47291ee31877ab7a6df61628291c7b221e663aa
3
+ size 11918414
M02_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34d2884c27120fea60df11e5507ecd14373eecfdb4bb3d77d66636eaf7765eec
3
+ size 18661702
M04_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f54f7c7d0b22bbe39bbe70b4337dbf58480adc46b59cf1a0e063f5b2def08efe
3
+ size 9262819
MC01_audio_samples.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10b513c89b82b57a06b3206741092c7e72a7851550cc841971266803a61e529a
3
+ size 14827983
parquet_audio_index.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "format": "parquet_audio",
3
+ "description": "Audio samples stored as parquet files with audio arrays",
4
+ "sample_rate": 16000,
5
+ "total_speakers": 8,
6
+ "files": [
7
+ "211_audio_samples.parquet",
8
+ "F04_audio_samples.parquet",
9
+ "FC02_audio_samples.parquet",
10
+ "F02_audio_samples.parquet",
11
+ "MC01_audio_samples.parquet",
12
+ "M04_audio_samples.parquet",
13
+ "M02_audio_samples.parquet",
14
+ "4014_audio_samples.parquet"
15
+ ],
16
+ "usage": {
17
+ "load_audio": "json.loads(df[\"audio_array\"].iloc[0])",
18
+ "get_sample_rate": "df[\"sample_rate\"].iloc[0]",
19
+ "play_in_gradio": "gr.Audio((sample_rate, np.array(audio_array)))"
20
+ }
21
+ }
requirements.txt ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Pathological Speech Synthesis Comparison App
2
+ # Python dependencies for the interactive demonstration
3
+
4
+ # Web interface
5
+ gradio>=4.0.0
6
+
7
+ # Data manipulation
8
+ pandas>=1.5.0
9
+ numpy>=1.21.0
10
+
11
+ # Parquet file support
12
+ pyarrow>=10.0.0
13
+
14
+ # Audio processing (used in conversion scripts)
15
+ librosa>=0.9.0
16
+ soundfile>=0.12.0
17
+
18
+ # Utilities
19
+ pathlib2>=2.3.7; python_version < '3.4'
20
+
21
+ # Optional: For enhanced visualizations
22
+ matplotlib>=3.5.0
23
+ seaborn>=0.11.0
24
+
25
+ # Optional: For audio analysis
26
+ scipy>=1.9.0
27
+
28
+ # JSON handling (built-in; listed here for completeness only)
29
+ # json - built-in module
30
+
31
+ # File operations (built-in)
32
+ # shutil - built-in module
33
+ # os - built-in module
34
+
35
+ # Web server dependencies (usually installed with gradio)
36
+ uvicorn>=0.18.0
37
+ fastapi>=0.85.0
38
+
39
+ # Additional gradio dependencies
40
+ pillow>=9.0.0
41
+ requests>=2.25.0
42
+
43
+ # Packaging tools (build/install support)
44
+ wheel>=0.37.0
45
+ setuptools>=65.0.0