Spaces:

soiz1
/

dall-e-x

Runtime error

App Files Files Community

soiz1 committed on Jan 28, 2025

Commit

61d7bec

verified ·

1 Parent(s): 47b843f

Create app.py

Browse files

Files changed (1) hide show

app.py +76 -0

app.py ADDED Viewed

	@@ -0,0 +1,76 @@

+import gradio as gr
+import tempfile
+import os
+# Directory in which saved .npz files are looked up (the system temp directory).
+npz_save_dir = tempfile.gettempdir()
+# The required helpers (`make_npz_prompt` and `infer_from_prompt`) are expected to be the ones already provided elsewhere.
+# NOTE(review): neither helper is imported or defined in the visible part of this file — confirm they are in scope before the handlers below run.
+def save_npz_file(name, uploaded_audio, recorded_audio, transcript_content):
+    result, file_path = make_npz_prompt(name, uploaded_audio, recorded_audio, transcript_content)
+    if file_path:
+        return result, gr.File(file_path)
+    return result, None
+def generate_from_npz(npz_file, text, language, accent, preset_prompt):
+    if npz_file:
+        prompt_path = npz_file.name
+    else:
+        prompt_path = None
+    message, output = infer_from_prompt(text, language, accent, preset_prompt, prompt_path)
+    if output:
+        return message, output
+    return message, None
+def get_available_npz_files():
+    # 一時ディレクトリ内のすべての .npz ファイルをリストアップ
+    return [f for f in os.listdir(npz_save_dir) if f.endswith(".npz")]
+# Gradio アプリのインターフェース作成
+with gr.Blocks() as app:
+    with gr.Tabs():
+        with gr.Tab("NPZファイルを作成"):
+            gr.Markdown("### 音声とテキストから .npz ファイルを作成")
+            name = gr.Textbox(label="ファイル名", placeholder="保存する .npz ファイル名を入力")
+            uploaded_audio = gr.Audio(label="アップロード音声", type="numpy")
+            recorded_audio = gr.Audio(label="録音音声", source="microphone", type="numpy")
+            transcript_content = gr.Textbox(label="テキスト内容", placeholder="音声に対応する文字起こしを入力")
+            result_message = gr.Textbox(label="結果", interactive=False)
+            npz_output = gr.File(label=".npz ファイル")
+            save_button = gr.Button("変換して保存")
+            save_button.click(
+                save_npz_file,
+                inputs=[name, uploaded_audio, recorded_audio, transcript_content],
+                outputs=[result_message, npz_output],
+            )
+        with gr.Tab("NPZファイルで生成"):
+            gr.Markdown("### 保存した .npz ファイルから音声を生成")
+            npz_files_dropdown = gr.Dropdown(
+                label="利用可能な .npz ファイル", choices=get_available_npz_files(), interactive=True
+            )
+            text_input = gr.Textbox(label="生成するテキスト", placeholder="150文字以内のテキストを入力")
+            language = gr.Radio(
+                label="言語選択",
+                choices=["auto-detect", "en", "ja", "zh"],
+                value="auto-detect"
+            )
+            accent = gr.Radio(
+                label="アクセント選択",
+                choices=["no-accent", "en-accent", "ja-accent", "zh-accent"],
+                value="no-accent"
+            )
+            preset_prompt = gr.Textbox(label="プロンプト名", placeholder="既存のプロンプトを選択")
+            synthesis_message = gr.Textbox(label="結果", interactive=False)
+            audio_output = gr.Audio(label="生成音声", type="numpy")
+            generate_button = gr.Button("生成開始")
+            generate_button.click(
+                generate_from_npz,
+                inputs=[npz_files_dropdown, text_input, language, accent, preset_prompt],
+                outputs=[synthesis_message, audio_output],
+            )
+app.launch()