Spaces:

quangchi
/

xmindlab

Sleeping

App Files Files Community

quangchi committed on Apr 7, 2025

Commit

16cac3d

verified ·

1 Parent(s): a31d210

Upload 2 files

Browse files

Files changed (2) hide show

app.py +59 -0
requirements.txt +2 -0

app.py ADDED Viewed

	@@ -0,0 +1,59 @@

+import gradio as gr
+import fal_client
+import os
+import replicate
+os.environ["REPLICATE_API_TOKEN"] = "r8_aFOI9wuwtOp7jnruY2XxJDdczL0YU5q1p6vPR"
+os.environ["FAL_KEY"] = "f202d2e1-aa0c-4b77-9949-3178755202f3:c83c90ba842d66be7cd1cef970a2e3e0"
+def on_queue_update(update):
+    if isinstance(update, fal_client.InProgress):
+        for log in update.logs:
+            print(log["message"])
+def transcribe_with_fal(audio_path):
+    try:
+        # Upload audio file to FAL API
+        url = fal_client.upload_file(audio_path)
+        # Call FAL API for speech-to-text
+        result = fal_client.subscribe(
+            "fal-ai/elevenlabs/speech-to-text",
+            arguments={"audio_url": url},
+            with_logs=True,
+            on_queue_update=on_queue_update,
+        )
+        # Get transcribed text from FAL
+        content = result['text']
+        # Prepare the input for LLM (Replicate)
+        input_data = {
+            "prompt": "Tóm tắt nội dung dưới đây theo các mục sau: - Chủ đề chính - Các vấn đề đã được thảo luận - Các quyết định đã đưa ra - Người chịu trách nhiệm cho các hành động tiếp theo - Thời hạn hoặc thời gian dự kiến cho các hành động Nội dung cuộc họp: '{}'".format(content)
+        }
+        # Call LLM for summarization
+        output = replicate.run(
+            "lucataco/qwq-32b:5a9425923f3ef1101dc663609a80cbd597dea6554a6b0c06483b949cb72603ed",
+            input=input_data,
+            max_tokens=24000
+        )
+        # Return both transcribed text and summary
+        return content, "".join(output)
+    except Exception as e:
+        return f"❌ Lỗi: {str(e)}", ""
+# Create Gradio Interface
+demo = gr.Interface(
+    fn=transcribe_with_fal,
+    inputs=gr.Audio(type="filepath", label="Upload file âm thanh"),
+    outputs=[
+        gr.Textbox(label="Text từ Speech-to-Text"),
+        gr.Textbox(label="Tóm tắt nội dung cuộc họp")
+    ],
+    title="xmind lab"
+)
+if __name__ == "__main__":
+    demo.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ fal_client
2	+ replicate