drixo committed on
Commit
78b083f
·
verified ·
1 Parent(s): 13efa6c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +20 -8
app.py CHANGED
@@ -5,7 +5,6 @@ import scipy.io.wavfile as wavfile
5
  import numpy as np
6
  import tempfile
7
 
8
-
9
  # -----------------------------
10
  # Load Bark Model + Processor
11
  # -----------------------------
@@ -19,6 +18,26 @@ model = AutoModelForTextToWaveform.from_pretrained(
19
  ).to(device)
20
 
21
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
22
  # -----------------------------
23
  # Audio Generation Function
24
  # -----------------------------
@@ -48,12 +67,6 @@ def generate_audio(text, voice):
48
  return fp.name
49
 
50
 
51
- # -----------------------------
52
- # Voice Presets
53
- # -----------------------------
54
- voices = sorted(processor.generation_config.voice_presets.keys())
55
-
56
-
57
  # -----------------------------
58
  # Gradio Interface
59
  # -----------------------------
@@ -76,7 +89,6 @@ demo = gr.Interface(
76
  description="Generates speech, singing, music, and sound effects using the open-source Bark model.",
77
  )
78
 
79
-
80
  # -----------------------------
81
  # Launch
82
  # -----------------------------
 
5
  import numpy as np
6
  import tempfile
7
 
 
8
  # -----------------------------
9
  # Load Bark Model + Processor
10
  # -----------------------------
 
18
  ).to(device)
19
 
20
 
21
+ # -----------------------------
22
+ # Voice Presets (Bark v2 manual list)
23
+ # -----------------------------
24
+ voices = [
25
+ "v2/en_speaker_0",
26
+ "v2/en_speaker_1",
27
+ "v2/en_speaker_2",
28
+ "v2/en_speaker_3",
29
+ "v2/en_speaker_4",
30
+ "v2/en_speaker_5",
31
+ "v2/en_speaker_6",
32
+ "v2/en_speaker_7",
33
+ "v2/en_speaker_8",
34
+ "v2/en_speaker_9",
35
+ ]
36
+
37
+ voices = sorted(voices)
38
+
39
+
40
+
41
  # -----------------------------
42
  # Audio Generation Function
43
  # -----------------------------
 
67
  return fp.name
68
 
69
 
 
 
 
 
 
 
70
  # -----------------------------
71
  # Gradio Interface
72
  # -----------------------------
 
89
  description="Generates speech, singing, music, and sound effects using the open-source Bark model.",
90
  )
91
 
 
92
  # -----------------------------
93
  # Launch
94
  # -----------------------------