roger committed on
Commit
cec4f00
·
1 Parent(s): bfd4a9b

feat: add conversion audio data flow img

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. app.py +21 -21
  3. asset/img/converted_audio.png +0 -0
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  *.wav filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  *.wav filter=lfs diff=lfs merge=lfs -text
37
+ *.png filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -8,43 +8,43 @@ print("os.path.dirname:", os.path.dirname(os.path.abspath(__file__)))
8
  # Define the audio file paths (replace with your actual paths)
9
  audio_files = {
10
  "EN": {
11
- "source1": os.path.join(curr_dir,"asset/audio/speech_clone_samples/source/-8014568635405176842.wav"),
12
- "source2": os.path.join(curr_dir,"asset/audio/speech_clone_samples/source/2188769758301752050.wav"),
13
  "prompt1": [
14
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt1/4813840990459345930.wav"),
15
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt1/-4261051484297537007.wav")
16
  ],
17
  "prompt2": [
18
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt2/-5427774732334682307.wav"),
19
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt2/-8434461861028245286.wav")
20
  ],
21
  "gen1": [
22
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen1/5518114099457736437.wav"),
23
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen1/7702800575106132714.wav")
24
  ],
25
  "gen2": [
26
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen2/-3552571881595006474.wav"),
27
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen2/1663763965594639195.wav")
28
  ]
29
  },
30
  "ZH": {
31
- "source1": os.path.join(curr_dir,"asset/audio/speech_clone_samples/source/6180100163014579264.wav"),
32
- "source2": os.path.join(curr_dir,"asset/audio/speech_clone_samples/source/3454520432972073544.wav"),
33
  "prompt3": [
34
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt3/-3133904573328901327.wav"),
35
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt3/-6807997165982172717.wav")
36
  ],
37
  "prompt4": [
38
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt4/3957690686751537502.wav"),
39
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/prompt/prompt4/-6025252638827969073.wav")
40
  ],
41
  "gen3": [
42
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen3/4648220778277450149.wav"),
43
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen3/3417274376341807017.wav")
44
  ],
45
  "gen4": [
46
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen4/8580165735770550130.wav"),
47
- os.path.join(curr_dir,"asset/audio/speech_clone_samples/generated/gen4/-2291633937079669023.wav")
48
  ]
49
  }
50
  }
@@ -52,8 +52,8 @@ audio_files = {
52
 
53
  def create_audio_demo():
54
  with gr.Blocks(title="Voice Conversion") as demo:
 
55
  gr.Markdown("# Voice Conversion")
56
-
57
  with gr.Tabs():
58
  with gr.TabItem("English (EN)"):
59
  with gr.Row():
 
8
  # Define the audio file paths (replace with your actual paths)
9
  audio_files = {
10
  "EN": {
11
+ "source1": os.path.join(curr_dir, "asset/audio/speech_clone_samples/source/-8014568635405176842.wav"),
12
+ "source2": os.path.join(curr_dir, "asset/audio/speech_clone_samples/source/2188769758301752050.wav"),
13
  "prompt1": [
14
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt1/4813840990459345930.wav"),
15
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt1/-4261051484297537007.wav")
16
  ],
17
  "prompt2": [
18
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt2/-5427774732334682307.wav"),
19
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt2/-8434461861028245286.wav")
20
  ],
21
  "gen1": [
22
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen1/5518114099457736437.wav"),
23
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen1/7702800575106132714.wav")
24
  ],
25
  "gen2": [
26
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen2/-3552571881595006474.wav"),
27
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen2/1663763965594639195.wav")
28
  ]
29
  },
30
  "ZH": {
31
+ "source1": os.path.join(curr_dir, "asset/audio/speech_clone_samples/source/6180100163014579264.wav"),
32
+ "source2": os.path.join(curr_dir, "asset/audio/speech_clone_samples/source/3454520432972073544.wav"),
33
  "prompt3": [
34
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt3/-3133904573328901327.wav"),
35
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt3/-6807997165982172717.wav")
36
  ],
37
  "prompt4": [
38
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt4/3957690686751537502.wav"),
39
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/prompt/prompt4/-6025252638827969073.wav")
40
  ],
41
  "gen3": [
42
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen3/4648220778277450149.wav"),
43
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen3/3417274376341807017.wav")
44
  ],
45
  "gen4": [
46
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen4/8580165735770550130.wav"),
47
+ os.path.join(curr_dir, "asset/audio/speech_clone_samples/generated/gen4/-2291633937079669023.wav")
48
  ]
49
  }
50
  }
 
52
 
53
  def create_audio_demo():
54
  with gr.Blocks(title="Voice Conversion") as demo:
55
+ gr.Image(os.path.join(curr_dir, "asset/img/converted_audio.png"), height=120)
56
  gr.Markdown("# Voice Conversion")
 
57
  with gr.Tabs():
58
  with gr.TabItem("English (EN)"):
59
  with gr.Row():
asset/img/converted_audio.png ADDED