Spaces:

ombhojane
/

outlines

Runtime error

App Files Files Community

ombhojane committed on Dec 16, 2023

Commit

e2c6f94

1 Parent(s): 9fa1ac5

Upload 3 files

Browse files

Files changed (3) hide show

app.py +59 -0
templates/index.html +25 -0
templates/result.html +15 -0

app.py ADDED Viewed

	@@ -0,0 +1,59 @@

+# app.py
+from flask import Flask, render_template, request
+import gradio as gr
+from transformers import pipeline
+app = Flask(__name__)
+MODEL_NAME = "openai/whisper-large-v3"
+BATCH_SIZE = 8
+device = 0 if torch.cuda.is_available() else "cpu"
+pipe = pipeline(
+    task="automatic-speech-recognition",
+    model=MODEL_NAME,
+    chunk_length_s=30,
+    device=device,
+)
+def transcribe(inputs, task):
+    if inputs is None:
+        raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
+    text = pipe(inputs, batch_size=BATCH_SIZE, generate_kwargs={"task": task}, return_timestamps=True)["text"]
+    return text
+audio_transcribe_interface = gr.Interface(
+    fn=transcribe,
+    inputs=[
+        gr.inputs.Audio(source="upload", type="filepath", optional=True, label="Audio file"),
+        gr.inputs.Radio(["transcribe", "translate"], label="Task", default="translate"),
+    ],
+    outputs="text",
+    theme="huggingface",
+    title="Whisper Large V3: Translate Audio",
+    description=(
+        "Translate long-form audio inputs with the click of a button! Demo uses the"
+        f" checkpoint [{MODEL_NAME}](https://huggingface.co/{MODEL_NAME}) and 🤗 Transformers to transcribe audio files"
+        " of arbitrary length."
+    ),
+)
+@app.route('/')
+def index():
+    return render_template('index.html')
+@app.route('/translate_audio', methods=['POST'])
+def translate_audio():
+    if request.method == 'POST':
+        audio_file = request.files['audio_file']
+        task = request.form['task']
+        result = audio_transcribe_interface.process(audio_file, task)
+        return render_template('result.html', result=result)
+if __name__ == '__main__':
+    app.run(debug=True)

templates/index.html ADDED Viewed

	@@ -0,0 +1,25 @@

+<!-- templates/index.html -->
+<!-- Upload form served at the site root; it posts to the /translate_audio route. -->
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta http-equiv="X-UA-Compatible" content="IE=edge">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Translate Audio</title>
+</head>
+<body>
+    <h1>Translate Audio</h1>
+    <!-- multipart/form-data is required so the browser actually sends the file contents. -->
+    <form action="/translate_audio" method="post" enctype="multipart/form-data">
+        <label for="audio_file">Choose an audio file:</label>
+        <!-- "required" stops the form from being submitted without a file. -->
+        <input type="file" id="audio_file" name="audio_file" accept="audio/*" required>
+        <br>
+        <label for="task">Choose a task:</label>
+        <!-- The field names audio_file and task are the keys the server reads. -->
+        <select id="task" name="task">
+            <option value="translate" selected>Translate</option>
+        </select>
+        <br>
+        <input type="submit" value="Submit">
+    </form>
+</body>
+</html>

templates/result.html ADDED Viewed

	@@ -0,0 +1,15 @@

+<!-- templates/result.html -->
+<!-- Result page rendered by the translate_audio view in app.py, which supplies the result variable. -->
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta http-equiv="X-UA-Compatible" content="IE=edge">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Translation Result</title>
+</head>
+<body>
+    <h1>Translation Result</h1>
+    <!-- NOTE(review): the value is presumably HTML-escaped by Flask's default Jinja autoescaping for .html templates; verify before marking it safe. -->
+    <p>{{ result }}</p>
+</body>
+</html>