Spaces:

Nx-Neuralon
/

ASD

Sleeping

App Files Files Community

Nx-Neuralon committed on Mar 19

Commit

3988574

verified ·

1 Parent(s): 0d68d47

Update app/audio_utils.py

Browse files

Files changed (1) hide show

app/audio_utils.py +95 -114

app/audio_utils.py CHANGED Viewed

@@ -1,114 +1,95 @@
-from __future__ import annotations
-import base64
-import os
-import shutil
-import subprocess
-from dataclasses import dataclass
-from typing import List
-@dataclass
-class AudioChunk:
-    path: str
-    start_sec: float
-    end_sec: float
-def check_ffmpeg_available() -> bool:
-    return shutil.which("ffmpeg") is not None and shutil.which("ffprobe") is not None
-def ensure_dir(path: str) -> None:
-    os.makedirs(path, exist_ok=True)
-def get_media_duration(path: str) -> float:
-    cmd = [
-        "ffprobe",
-        "-v", "error",
-        "-show_entries", "format=duration",
-        "-of", "default=noprint_wrappers=1:nokey=1",
-        path,
-    ]
-    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
-    if proc.returncode != 0:
-        raise RuntimeError(f"ffprobe 获取时长失败: {proc.stderr}")
-    return float(proc.stdout.strip())
-def extract_audio_from_video(
-    video_path: str,
-    output_audio_path: str,
-    bitrate: str = "64k",
-) -> str:
-    """
-    从视频中抽取音频，转成 16k 单声道 mp3，便于后续 ASR。
-    """
-    if not os.path.exists(video_path):
-        raise FileNotFoundError(f"视频不存在: {video_path}")
-    if not check_ffmpeg_available():
-        raise RuntimeError("未检测到 ffmpeg/ffprobe，请先安装 ffmpeg。")
-    ensure_dir(os.path.dirname(output_audio_path))
-    cmd = [
-        "ffmpeg",
-        "-y",
-        "-i", video_path,
-        "-vn",
-        "-ac", "1",
-        "-ar", "16000",
-        "-c:a", "mp3",
-        "-b:a", bitrate,
-        output_audio_path,
-    ]
-    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
-    if proc.returncode != 0:
-        raise RuntimeError(f"抽取音频失败:\n{proc.stderr}")
-    return output_audio_path
-def split_audio_to_chunks(
-    audio_path: str,
-    output_dir: str,
-    chunk_seconds: int = 290,
-) -> List[AudioChunk]:
-    """
-    按固定时长切音频，避免超过 qwen3-asr-flash 的单次时长限制。
-    """
-    ensure_dir(output_dir)
-    duration = get_media_duration(audio_path)
-    chunks: List[AudioChunk] = []
-    start = 0.0
-    idx = 0
-    while start < duration:
-        end = min(duration, start + chunk_seconds)
-        chunk_path = os.path.join(output_dir, f"audio_chunk_{idx:03d}.mp3")
-        cmd = [
-            "ffmpeg",
-            "-y",
-            "-i", audio_path,
-            "-ss", str(start),
-            "-t", str(end - start),
-            "-acodec", "copy",
-            chunk_path,
-        ]
-        proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
-        if proc.returncode != 0:
-            raise RuntimeError(f"切分音频失败:\n{proc.stderr}")
-        chunks.append(AudioChunk(path=chunk_path, start_sec=start, end_sec=end))
-        start = end
-        idx += 1
-    return chunks
-def audio_file_to_data_uri(audio_path: str, mime_type: str = "audio/mpeg") -> str:
-    with open(audio_path, "rb") as f:
-        b64 = base64.b64encode(f.read()).decode("utf-8")
-    return f"data:{mime_type};base64,{b64}"

+from __future__ import annotations
+import base64
+import os
+import shutil
+import subprocess
+from dataclasses import dataclass
+from typing import List
+@dataclass
+class AudioChunk:
+    """One segment cut out of a longer audio file."""
+    # Filesystem path of the chunk file.
+    path: str
+    # Offset in the source audio, in seconds, at which the chunk starts.
+    start_sec: float
+    # Offset in the source audio, in seconds, at which the chunk ends.
+    end_sec: float
+def check_ffmpeg_available() -> bool:
+    """Report whether both the ``ffmpeg`` and ``ffprobe`` executables are on PATH."""
+    required_tools = ("ffmpeg", "ffprobe")
+    return all(shutil.which(tool) is not None for tool in required_tools)
+def ensure_dir(path: str) -> None:
+    """Create directory *path*, including missing parents, if it does not exist.
+
+    An empty *path* is treated as "the current directory" and is a no-op.
+    ``os.path.dirname`` returns ``""`` for a bare file name, and passing that
+    straight to ``os.makedirs`` would raise ``FileNotFoundError``.
+    """
+    if not path:
+        return
+    os.makedirs(path, exist_ok=True)
+def get_media_duration(path: str) -> float:
+    """Return the duration of the media file at *path*, in seconds.
+
+    The value is read from ``ffprobe``'s ``format=duration`` entry.
+
+    Raises:
+        RuntimeError: if ``ffprobe`` exits with a non-zero status, or if its
+            output cannot be parsed as a number (for example ``N/A``).
+    """
+    cmd = [
+        "ffprobe",
+        "-v", "error",
+        "-show_entries", "format=duration",
+        "-of", "default=noprint_wrappers=1:nokey=1",
+        path,
+    ]
+    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+    # Fail loudly with ffprobe's own diagnostics instead of letting float("")
+    # raise an uninformative ValueError further down.
+    if proc.returncode != 0:
+        raise RuntimeError(f"ffprobe 获取时长失败: {proc.stderr}")
+    raw_duration = proc.stdout.strip()
+    try:
+        return float(raw_duration)
+    except ValueError as err:
+        raise RuntimeError(
+            f"ffprobe 获取时长失败: 无法解析输出 {raw_duration!r}"
+        ) from err
+def extract_audio_from_video(
+    video_path: str,
+    output_audio_path: str,
+    bitrate: str = "64k",
+) -> str:
+    """Extract the audio track of a video into a 16 kHz mono MP3 file.
+
+    Args:
+        video_path: input passed to ``ffmpeg -i``.
+        output_audio_path: destination file; its parent directory is created
+            when missing, and an existing file is overwritten (``-y``).
+        bitrate: audio bitrate passed to ``-b:a``.
+
+    Returns:
+        ``output_audio_path``.
+
+    Raises:
+        RuntimeError: if ``ffmpeg`` exits with a non-zero status.
+    """
+    # dirname is "" for a bare file name; there is no directory to create then.
+    output_dir = os.path.dirname(output_audio_path)
+    if output_dir:
+        ensure_dir(output_dir)
+    cmd = [
+        "ffmpeg",
+        "-y",
+        "-i", video_path,
+        "-vn",
+        "-ac", "1",
+        "-ar", "16000",
+        "-c:a", "mp3",
+        "-b:a", bitrate,
+        output_audio_path,
+    ]
+    proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+    # Without this check a failed extraction would hand callers a path to a
+    # missing or truncated file.
+    if proc.returncode != 0:
+        raise RuntimeError(f"抽取音频失败:\n{proc.stderr}")
+    return output_audio_path
+def split_audio_to_chunks(
+    audio_path: str,
+    output_dir: str,
+    chunk_seconds: int = 290,
+) -> List[AudioChunk]:
+    """Cut an audio file into consecutive chunks of at most *chunk_seconds*.
+
+    Chunks are written to *output_dir* as ``audio_chunk_000.mp3``,
+    ``audio_chunk_001.mp3``, ... using stream copy (no re-encoding). The last
+    chunk may be shorter than *chunk_seconds*.
+
+    Returns:
+        One ``AudioChunk`` per file written, in order, each carrying its start
+        and end offset within the source audio.
+
+    Raises:
+        ValueError: if *chunk_seconds* is not positive.
+        RuntimeError: if ``ffmpeg`` fails while cutting a chunk.
+    """
+    # A non-positive chunk length never advances `start`, so the loop below
+    # would spawn ffmpeg forever; reject it before doing any work.
+    if chunk_seconds <= 0:
+        raise ValueError(f"chunk_seconds 必须大于 0: {chunk_seconds}")
+    ensure_dir(output_dir)
+    duration = get_media_duration(audio_path)
+    chunks: List[AudioChunk] = []
+    start = 0.0
+    idx = 0
+    while start < duration:
+        # Clamp the final chunk to the end of the audio.
+        end = min(duration, start + chunk_seconds)
+        chunk_path = os.path.join(output_dir, f"audio_chunk_{idx:03d}.mp3")
+        cmd = [
+            "ffmpeg",
+            "-y",
+            "-i", audio_path,
+            "-ss", str(start),
+            "-t", str(end - start),
+            "-acodec", "copy",
+            chunk_path,
+        ]
+        proc = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+        if proc.returncode != 0:
+            raise RuntimeError(f"切分音频失败:\n{proc.stderr}")
+        chunks.append(AudioChunk(path=chunk_path, start_sec=start, end_sec=end))
+        start = end
+        idx += 1
+    return chunks
+def audio_file_to_data_uri(audio_path: str, mime_type: str = "audio/mpeg") -> str:
+    """Read the file at *audio_path* and return it as a base64 ``data:`` URI.
+
+    *mime_type* is placed verbatim in the URI's media-type slot.
+    """
+    with open(audio_path, "rb") as audio_file:
+        raw_bytes = audio_file.read()
+    encoded = base64.b64encode(raw_bytes)
+    payload = encoded.decode("utf-8")
+    return f"data:{mime_type};base64,{payload}"