Add Web WASM support and Update README

by luckyxin - opened Jun 9, 2025

base: refs/heads/main

←

from: refs/pr/5

Discussion Files changed

+106

-10248

This view is limited to 50 files because it contains too many changes. See the raw diff here.

Files changed (50) hide show

.gitattributes +0 -6
LICENSE +0 -46
NOTICES +0 -68
README.md +35 -181
config.json +1 -1
examples/.gitattributes +1 -0
examples/CMakeLists.txt +0 -6
examples/build-and-deploy-android.sh +0 -6
examples/build-and-deploy-ios.sh +0 -6
examples/build-and-deploy-linux.sh +0 -6
examples/build-and-deploy-mac.sh +0 -6
examples/build-and-deploy-windows.bat +0 -7
examples/images/.gitattributes +2 -0
examples/main.c +6 -14
examples/plot_pr_curves.py +5 -6
examples/sample_array.h +0 -6
examples/test.py +3 -4
examples/test_node.js +0 -529
examples_onnx/CMakeLists.txt +0 -24
examples_onnx/build-and-deploy-linux.sh +0 -37
include/ten_vad.h +3 -4
include/ten_vad.py +17 -55
lib/Web/ten_vad.d.ts +0 -111
lib/Web/ten_vad.js +0 -30
lib/Windows/x64/ten_vad.lib +0 -0
lib/Windows/x86/ten_vad.lib +0 -0
lib/iOS/ten_vad.framework/Headers/ten_vad.h +3 -90
lib/iOS/ten_vad.framework/Info.plist +0 -0
lib/iOS/ten_vad.framework/Modules/module.modulemap +3 -5
lib/macOS/ten_vad.framework/Headers +0 -1
lib/{Web/ten_vad.wasm → macOS/ten_vad.framework/Headers/ten_vad.h} +2 -2
lib/macOS/ten_vad.framework/Resources +0 -1
src/onnx_model/ten-vad.onnx → lib/macOS/ten_vad.framework/Resources/Info.plist +2 -2
lib/macOS/ten_vad.framework/Versions/A/Headers/ten_vad.h +3 -90
lib/macOS/ten_vad.framework/Versions/A/Resources/Info.plist +3 -44
lib/macOS/ten_vad.framework/Versions/Current +0 -1
lib/macOS/ten_vad.framework/Versions/Current/Headers/ten_vad.h +3 -0
lib/macOS/ten_vad.framework/Versions/Current/Resources/Info.plist +3 -0
lib/macOS/ten_vad.framework/Versions/Current/ten_vad +3 -0
lib/macOS/ten_vad.framework/ten_vad +0 -1
lib/macOS/ten_vad.framework/ten_vad +3 -0
setup.py +3 -26
src/aed.cc +0 -993
src/aed.h +0 -226
src/aed_st.h +0 -132
src/biquad.cc +0 -354
src/biquad.h +0 -190
src/biquad_st.h +0 -37
src/coeff.h +0 -246
src/fftw.c +0 -0

.gitattributes CHANGED Viewed

@@ -33,9 +33,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
-*.so filter=lfs diff=lfs merge=lfs -text
-*.dll filter=lfs diff=lfs merge=lfs -text
-ten_vad filter=lfs diff=lfs merge=lfs -text
-*.png filter=lfs diff=lfs merge=lfs -text
-*.scv filter=lfs diff=lfs merge=lfs -text
-*.wav filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

LICENSE DELETED Viewed

@@ -1,46 +0,0 @@
-Open Source License
-The ten-vad is licensed pursuant to the Apache License v2.0(provided
-for your convenience below), with the following additional conditions.
-You may reproduce, prepare Derivative Works of, publicly display, publicly perform,
-sublicense, distribute, or otherwise make available (together, "Deploy") the ten-vad,
-for commercial or non-commercial purposes, provided that you agree to abide by the terms below:
-    1. You may not Deploy the ten-vad in a way that competes with Agora's
-       offerings and/or that allows others to compete with Agora's offerings,
-       including without limitation enabling any third party to develop or
-       deploy Applications.
-    2. You may Deploy the ten-vad solely to create and enable deployment
-       of your Application(s) solely for your benefit and the benefit of your
-       direct End Users. If you prefer, you may include the following notice in
-       the documentation of your Application(s): "Powered by ten-vad".
-    3. Derivative Works of the ten-vad remain subject to this Open Source
-       License.
-    4. "End Users" shall mean the end-users of your Application(s) who access
-       the ten-vad solely to the extent necessary to access and use the
-       Application(s) you create or deploy using ten-vad.
-    5. "Application(s)" shall mean your software programs designed or developed
-       by using the ten-vad or where deployment is enabled by the ten-vad.
-    6. Note that the project contains derived code from other open source project
-       with BSD-3-Clause and BSD-2-Clause license, refer to the "NOTICES"
-        file in the root directory for detailed information.
-  Copyright © 2025 Agora
-  Licensed under the Apache License, Version 2.0 (the "License");
-  you may not use this file except in compliance with the License.
-  You may obtain a copy of the License at
-      http://www.apache.org/licenses/LICENSE-2.0
-  Unless required by applicable law or agreed to in writing, software
-  distributed under the License is distributed on an "AS IS" BASIS,
-  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-  See the License for the specific language governing permissions and
-  limitations under the License.

NOTICES DELETED Viewed

@@ -1,68 +0,0 @@
-This project includes modified code from the following third-party component:
-1. File: lpcnet_enc.c
-   - Source: LPCNet (https://github.com/xiph/LPCNet)
-   - License: BSD-2-Clause
-   - Copyright: 2017-2019, Mozilla
-   - Original License Text:
-        Copyright (c) 2017-2019 Mozilla
-        Redistribution and use in source and binary forms, with or without modification,
-        are permitted provided that the following conditions are met:
-        - Redistributions of source code must retain the above copyright notice,
-          this list of conditions and the following disclaimer.
-        - Redistributions in binary form must reproduce the above copyright notice,
-          this list of conditions and the following disclaimer in the documentation
-          and/or other materials provided with the distribution.
-        THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
-        ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
-        LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
-        A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
-        CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
-        EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
-        PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
-        PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
-        LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
-        NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
-        SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
-2. Project: LPCNet
-    - Source: LPCNet (https://github.com/xiph/LPCNet)
-    - License: BSD-3-Clause
-    - Copyright: 2017-2018, Mozilla, 2007-2017, Jean-Marc Valin, 2005-2017, Xiph.Org Foundation, 2003-2004, Mark Borgerding
-    - Original License Text of LPCNet open source project:
-        Copyright (c) 2017-2018, Mozilla
-        Copyright (c) 2007-2017, Jean-Marc Valin
-        Copyright (c) 2005-2017, Xiph.Org Foundation
-        Copyright (c) 2003-2004, Mark Borgerding
-        Redistribution and use in source and binary forms, with or without
-        modification, are permitted provided that the following conditions
-        are met:
-        - Redistributions of source code must retain the above copyright
-        notice, this list of conditions and the following disclaimer.
-        - Redistributions in binary form must reproduce the above copyright
-        notice, this list of conditions and the following disclaimer in the
-        documentation and/or other materials provided with the distribution.
-        - Neither the name of the Xiph.Org Foundation nor the names of its
-        contributors may be used to endorse or promote products derived from
-        this software without specific prior written permission.
-        THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
-        ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
-        LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
-        A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION
-        OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
-        SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
-        LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
-        DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
-        THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
-        (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
-        OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

README.md CHANGED Viewed

@@ -1,6 +1,5 @@
 ---
 tags:
-- Voice Acticity Detection
 - voice activity detection
 - speech activity detection
 - real time
@@ -11,92 +10,11 @@ tags:
 - silero vad
 - conversational
 - automatic speech recognition
 ---
-![TEN VAD banner][ten-vad-banner]
-[![Discussion posts](https://img.shields.io/github/discussions/TEN-framework/ten-vad?labelColor=gray&color=%20%23f79009)](https://github.com/TEN-framework/ten-vad/discussions/)
-[![Commits](https://img.shields.io/github/commit-activity/m/TEN-framework/ten-vad?labelColor=gray&color=pink)](https://github.com/TEN-framework/ten-vad/graphs/commit-activity)
-[![Issues closed](https://img.shields.io/github/issues-search?query=repo%3ATEN-framework%2Ften-vad%20is%3Aclosed&label=issues%20closed&labelColor=gray&color=green)](https://github.com/TEN-framework/ten-vad/issues)
-![](https://img.shields.io/github/contributors/ten-framework/ten-vad?color=c4f042&labelColor=gray&style=flat-square)
-[![PRs Welcome](https://img.shields.io/badge/PRs-welcome!-brightgreen.svg?style=flat-square)](https://github.com/TEN-framework/ten-vad/pulls)
-[![Ask DeepWiki](https://deepwiki.com/badge.svg)](https://deepwiki.com/TEN-framework/TEN-vad)
-[![GitHub watchers](https://img.shields.io/github/watchers/TEN-framework/ten-vad?style=social&label=Watch)](https://GitHub.com/TEN-framework/ten-vad/watchers/?WT.mc_id=academic-105485-koreyst)
-[![GitHub forks](https://img.shields.io/github/forks/TEN-framework/ten-vad?style=social&label=Fork)](https://GitHub.com/TEN-framework/ten-vad/network/?WT.mc_id=academic-105485-koreyst)
-[![GitHub stars](https://img.shields.io/github/stars/TEN-framework/ten-vad?style=social&label=Star)](https://GitHub.com/TEN-framework/ten-vad/stargazers/?WT.mc_id=academic-105485-koreyst)
-*Latest News* 🔥
-- [2025/11] **WASM** build guide and browser test demo are now available in `lib/Web` and `examples`.
-- [2025/11] We supported **Python** inference with **ONNX model** on **Linux**, **macOS** thanks to Guy Nicholson!
-- [2025/11] We supported **Golang** on **Linux**, **macOS** and **Windows** with usage of the prebuilt-libs thanks to hylarucoder!
-- [2025/11] We supported Java on **Linux, macOS, Windows, Android** with usage of the prebuilt-libs thanks to ZhangYang!
-- [2025/07] 🎉 Exciting news! **TEN VAD** is now integrated into **k2-fsa/sherpa-onnx**, thanks to the fantastic work by Fangjun Kuang! You can now achieve more precise speech segment extraction and enjoy an enhanced ASR experience! Refer to the [documentation](https://k2-fsa.github.io/sherpa/onnx/vad/ten-vad.html) and give it a try!
-- [2025/07] We support **Python inference** on **macOS** and **Windows** with usage of the prebuilt-lib!
-- [2025/06] We **finally** released and **open-sourced** the **ONNX** model and the corresponding **preprocessing code**! Now you can deploy **TEN VAD** on **any platform** and **any hardware architecture**!
-- [2025/06] We are excited to announce the release of **WASM+JS** for Web WASM Support.
-## Table of Contents
-- [Welcome to TEN](#welcome-to-ten)
-- [TEN Hugging Face Space](#ten-hugging-face-space)
-- [Introduction](#introduction)
-- [Key Features](#key-features)
-  - [High-Performance](#1-high-performance)
-    - [Performance Comparison](#11-performance-comparison)
-  - [Agent-Friendly](#2-agent-friendly)
-  - [Lightweight](#3-lightweight)
-  - [Multiple Programming Languages and Platforms](#4-multiple-programming-languages-and-platforms)
-  - [Supported Sampling Rate and Hop Size](#5-supproted-sampling-rate-and-hop-size)
-- [Developers Testimonial](#developers-testimonial)
-- [Installation](#installation)
-- [Quick Start](#quick-start)
-  - [Python Usage](#python-usage)
-    - [Linux](#1-linux)
-  - [JS Usage](#js-usage)
-    - [Web](#1-web)
-  - [C Usage](#c-usage)
-    - [Linux](#1-linux-1)
-    - [Windows](#2-windows)
-    - [macOS](#3-macos)
-    - [Android](#4-android)
-    - [iOS](#5-ios)
-- [TEN Ecosystem](#ten-ecosystem)
-- [Ask Questions](#ask-questions)
-- [Citations](#citations)
-- [License](#license)
-## Welcome to TEN
-TEN is a collection of open-source projects for building real-time, multimodal conversational voice agents. It includes [ TEN Framework ](https://github.com/ten-framework/ten-framework), [ TEN VAD ](https://github.com/ten-framework/ten-vad), [ TEN Turn Detection ](https://github.com/ten-framework/ten-turn-detection), TEN Agent, TMAN Designer, and [ TEN Portal ](https://github.com/ten-framework/portal), all fully open-source.
-| Community Channel | Purpose |
-| ---------------- | ------- |
-| [![Follow on X](https://img.shields.io/twitter/follow/TenFramework?logo=X&color=%20%23f5f5f5)](https://twitter.com/intent/follow?screen_name=TenFramework) | Follow TEN Framework on X for updates and announcements |
-| [![Follow on LinkedIn](https://custom-icon-badges.demolab.com/badge/LinkedIn-TEN_Framework-0A66C2?logo=linkedin-white&logoColor=fff)](https://www.linkedin.com/company/ten-framework) | Follow TEN Framework on LinkedIn for updates and announcements |
-| [![Discord TEN Community](https://dcbadge.vercel.app/api/server/VnPftUzAMJ?&style=flat&theme=light&color=lightgray)](https://discord.gg/VnPftUzAMJ) | Join our Discord community to connect with developers |
-| [![Hugging Face Space](https://img.shields.io/badge/Hugging%20Face-TEN%20Framework-yellow?style=flat&logo=huggingface)](https://huggingface.co/TEN-framework) | Join our Hugging Face community to explore our spaces and models |
-| [![WeChat](https://img.shields.io/badge/TEN_Framework-WeChat_Group-%2307C160?logo=wechat&labelColor=darkgreen&color=gray)](https://github.com/TEN-framework/ten-agent/discussions/170) | Join our WeChat group for Chinese community discussions |
-> \[!IMPORTANT]
->
-> **Star TEN Repositories** ⭐️
->
-> Get instant notifications for new releases and updates. Your support helps us grow and improve TEN!
-![TEN star us gif](https://github.com/user-attachments/assets/eeebe996-8c14-4bf7-82ae-f1a1f7e30705)
-## TEN Hugging Face Space
-<https://github.com/user-attachments/assets/725a8318-d679-4b17-b9e4-e3dce999b298>
-You are more than welcome to [Visit TEN Hugging Face Space](https://huggingface.co/spaces/TEN-framework/ten-agent-demo) to try VAD and Turn Detection together.
 ## **Introduction**
@@ -115,23 +33,21 @@ The precision-recall curves comparing the performance of WebRTC VAD (pitch-based
   <img src="./examples/images/PR_Curves_testset.png" width="800">
 </div>
-Note that the default threshold of 0.5 is used to generate binary speech indicators (0 for non-speech signal, 1 for speech signal). This threshold needs to be tuned according to your domain-specific task.
-#### **1.1 Performance Comparison**
-Developers can reproduce the performance comparison PR curves for **TEN VAD** and **Silero VAD** on the open-source testset (as shown in the figure above) by executing the following script on Linux x64 with a simply one line of code. The output figure will be saved in the same directory as the script.
 ```
 cd ./examples
 python plot_pr_curves.py
 ```
 ### **2. Agent-Friendly:**
 As illustrated in the figure below, TEN VAD rapidly detects speech-to-non-speech transitions, whereas Silero VAD suffers from a delay of several hundred milliseconds, resulting in increased end-to-end latency in human-agent interaction systems. In addition, as demonstrated in the 6.5s-7.0s audio segment, Silero VAD fails to identify short silent durations between adjacent speech segments.
 <div style="text-align:">
   <img src="./examples/images/Agent-Friendly-image.png" width="800">
 </div>
 ### **3. Lightweight:**
 We evaluated the RTF (Real-Time Factor) across five distinct platforms, each equipped with varying CPUs. TEN VAD demonstrates much lower computational complexity and smaller library size than Silero VAD.
@@ -199,6 +115,7 @@ We evaluated the RTF (Real-Time Factor) across five distinct platforms, each equ
     <td align="center"> 0.0050 </td>
   </tr>
 </table>
 <style>
   th, td {
     border: 1px solid #ddd;
@@ -207,17 +124,12 @@ We evaluated the RTF (Real-Time Factor) across five distinct platforms, each equ
 </style>
 ### **4. Multiple programming languages and platforms:**
-TEN VAD provides cross-platform C compatibility across five operating systems (Linux x64, Windows, macOS, Android, iOS), with Python bindings optimized for Linux x64, with wasm for Web.
 ### **5. Supported sampling rate and hop size:**
 TEN VAD operates on 16kHz audio input with configurable hop sizes (optimized frame configurations: 160/256 samples=10/16ms). Other sampling rates must be resampled to 16kHz.
-## **Developers Testimonial**
-> "We selected TEN VAD because it provides faster and more accurate sentence-end detection in Japanese compared to other VADs, while still being lightweight and fast enough for live use." - LiveCap,Hakase shojo.
-> "TEN VAD's overall performance is better than Silero VAD. Its high accuracy and low resource consumption helped us improve efficiency and significantly reduce costs." - Rustpbx.
 ## **Installation**
 ```
@@ -273,8 +185,9 @@ The project supports five major platforms with dynamic library linking.
   </tr>
 </table>
 ### **Python Usage**
-#### **1. Linux / macOS / Windows**
 #### **Requirements**
 - numpy (Version 1.17.4/1.26.4 verified)
 - scipy (Version >= 1.5.0)
@@ -288,7 +201,7 @@ Note: You could use other versions of above packages, but we didn't test other v
 <br>
-The **lib** only depend on numpy, you have to install the dependency via requirements.txt:
 ```pip install -r requirements.txt```
@@ -306,7 +219,6 @@ sudo apt install libc++1
 <br>
 #### **Usage**
 Note: For usage in python, you can either use it by **git clone** or **pip**.
@@ -314,7 +226,7 @@ Note: For usage in python, you can either use it by **git clone** or **pip**.
 1. Clone the repository
 ```
-git clone https://github.com/TEN-framework/ten-vad.git
 ```
 2. Enter examples directory
@@ -327,7 +239,6 @@ cd ./examples
 python test.py s0724-s0730.wav out.txt
 ```
 ##### **By using pip:**
 1. Install via pip
@@ -342,24 +253,9 @@ pip install -U --force-reinstall -v git+https://github.com/TEN-framework/ten-vad
 from ten_vad import TenVad
 ```
-### **JS Usage**
-####  **1. Web**
-##### **Requirements**
-- Node.js (macOS v14.18.2, Linux v16.20.2 verified)
-- Terminal
-##### **Usage**
-```
-1) cd ./examples
-2) node test_node.js s0724-s0730.wav out.txt
-```
 ### **C Usage**
 #### **Build Scripts**
-Located in examples/ directory and examples_onnx (for **ONNX** usage on Linux):
 - Linux: build-and-deploy-linux.sh
 - Windows: build-and-deploy-windows.bat
@@ -379,14 +275,13 @@ Runtime library path configuration:
 - Configure toolchain and architecture settings
 #### **Overview of Usage**
-- Navigate to examples/ or examples_onx/ (for **ONNX** usage on Linux)
 - Execute platform-specific build script
 - Configure dynamic library path
 - Run demo with sample audio s0724-s0730.wav
 - Processed results saved to out.txt
 The detailed usage methods of each platform are as follows <br>
 ####  **1. Linux**
@@ -395,30 +290,18 @@ The detailed usage methods of each platform are as follows <br>
 - CMake
 - Terminal
-Note that if you did not install **libc++1** (Linux), you have to run the code below to install it:
 ```
 sudo apt update
 sudo apt install libc++1
 ```
-##### **Usage (prebuilt-lib)**
 ```
 1) cd ./examples
 2) ./build-and-deploy-linux.sh
 ```
-##### **Usage (ONNX)**
-You have to download the **onnxruntime** packages from the [microsoft official onnxruntime github website](https://github.com/microsoft/onnxruntime). Note that the version of onnxruntime must be higher than or equal to 1.17.1 (e.g. onnxruntime-linux-x64-1.17.1.tgz).
-<br>
-You can check the official **ONNX Runtime releases** from [this website](https://github.com/microsoft/onnxruntime/tags). And for example, to download version 1.17.1 (Linux x64), use [this link](https://github.com/microsoft/onnxruntime/releases/download/v1.17.1/onnxruntime-linux-x64-1.17.1.tgz). After extracting the compressed file, you'll find two important directories:`include/` - header files, `lib/` - library files
-```
-1) cd examples_onnx/
-2) ./build-and-deploy-linux.sh --ort-path /absolute/path/to/your/onnxruntime/root/dir
-```
-Note 1: If executing the onnx demo from a different directory than the one used when running build-and-deploy-linux.sh, ensure to create a symbolic link to src/onnx_model/ to prevent ONNX model file loading failures.
-<br>
-Note 2: The **ONNX model** locates in `src/onnx_model` directory.
 ####  **2. Windows**
 ##### **Requirements**
 - Visual Studio (2017, 2019, 2022 verified)
@@ -434,7 +317,6 @@ Note 2: The **ONNX model** locates in `src/onnx_model` directory.
 3) ./build-and-deploy-windows.bat
 ```
 ####  **3. macOS**
 ##### **Requirements**
 - Xcode (15.2 verified)
@@ -449,7 +331,6 @@ Note 2: The **ONNX model** locates in `src/onnx_model` directory.
 3) ./build-and-deploy-mac.sh
 ```
 ####  **4. Android**
 ##### **Requirements**
 - NDK (r25b, macOS verified)
@@ -466,7 +347,6 @@ Note 2: The **ONNX model** locates in `src/onnx_model` directory.
 4) ./build-and-deploy-android.sh
 ```
 ####  **5. iOS**
 ##### **Requirements**
 Xcode (15.2, macOS verified)
@@ -517,28 +397,6 @@ cd ./examples
     3.5. Build in Xcode and run demo on your device.
-## TEN Ecosystem
-| Project | Preview |
-| ------- | ------- |
-| [**🏚️ TEN Framework**][ten-framework-link]<br>TEN is an open-source framework for real-time, multimodal conversational AI.<br><br>![][ten-framework-shield] | ![][ten-framework-banner] |
-| [**️🔂 TEN Turn Detection**][ten-turn-detection-link]<br>TEN is for full-duplex dialogue communication.<br><br>![][ten-turn-detection-shield] | ![][ten-turn-detection-banner] |
-| [**🔉 TEN VAD**][ten-vad-link]<br>TEN VAD is a low-latency, lightweight and high-performance streaming voice activity detector (VAD).<br><br>![][ten-vad-shield] | ![][ten-vad-banner] |
-| [**🎙️ TEN Agent**][ten-agent-link]<br>TEN Agent is a showcase of TEN Framewrok.<br><br> | ![][ten-agent-banner] |
-| **🎨 TMAN Designer** <br>TMAN Designer is low/no code option to make a voice agent with easy to use workflow UI.<br><br> | ![][tman-designer-banner] |
-| [**📒 TEN Portal**][ten-portal-link]<br>The official site of TEN framework, it has documentation and blog.<br><br>![][ten-portal-shield] | ![][ten-portal-banner] |
-<br>
-##  Ask Questions
-[![Ask DeepWiki](https://deepwiki.com/badge.svg)](https://deepwiki.com/TEN-framework/TEN-vad)
-Most questions can be answered by using DeepWiki, it is fast, intutive to use and supports multiple languages.
 ## **Citations**
 ```
 @misc{TEN VAD,
@@ -552,32 +410,28 @@ Most questions can be answered by using DeepWiki, it is fast, intutive to use an
 }
 ```
-## License
-This project is licensed pursuant to the Apache 2.0 with additional conditions. Refer to the "LICENSE" file in the root directory for detailed information. Note that `pitch_est.cc` contains modified code derived from [LPCNet](https://github.com/xiph/LPCNet), which is [BSD-2-Clause](https://spdx.org/licenses/BSD-2-Clause.html) and [BSD-3-Clause](https://spdx.org/licenses/BSD-3-Clause.html) licensed, refer to the NOTICES file in the root directory for detailed information.
-[back-to-top]: https://img.shields.io/badge/-Back_to_top-gray?style=flat-square
-[ten-framework-shield]: https://img.shields.io/github/stars/ten-framework/ten_framework?color=ffcb47&labelColor=gray&style=flat-square&logo=github
-[ten-framework-banner]: https://github.com/user-attachments/assets/7c8f72d7-3993-4d01-8504-b71578a22944
-[ten-framework-link]: https://github.com/ten-framework/ten_framework
-[ten-vad-link]: https://github.com/ten-framework/ten-vad
-[ten-vad-shield]: https://img.shields.io/github/stars/ten-framework/ten-vad?color=ffcb47&labelColor=gray&style=flat-square&logo=github
-[ten-vad-banner]: https://github.com/user-attachments/assets/d45870e4-9453-4047-8163-08737f82863f
-[ten-turn-detection-link]: https://github.com/ten-framework/ten-turn-detection
-[ten-turn-detection-shield]: https://img.shields.io/github/stars/ten-framework/ten-turn-detection?color=ffcb47&labelColor=gray&style=flat-square&logo=github
-[ten-turn-detection-banner]: https://github.com/user-attachments/assets/8d0ec716-5d0e-43e4-ad9a-d97b17305658
-[ten-agent-link]: https://github.com/TEN-framework/ten-framework/tree/main/ai_agents
-[ten-agent-banner]: https://github.com/user-attachments/assets/38de2207-939b-4702-a0aa-04491f5b5275
-[tman-designer-banner]: https://github.com/user-attachments/assets/804c3543-0a47-42b7-b40b-ef32b742fb8f
-[ten-portal-link]: https://github.com/ten-framework/portal
-[ten-portal-shield]: https://img.shields.io/github/stars/ten-framework/portal?color=ffcb47&labelColor=gray&style=flat-square&logo=github
-[ten-portal-banner]: https://github.com/user-attachments/assets/e17d8aaa-5928-45dd-ac71-814928e26a89

 ---
 tags:
 - voice activity detection
 - speech activity detection
 - real time
 - silero vad
 - conversational
 - automatic speech recognition
+pipeline_tag: voice-activity-detection
 ---
+# **TEN VAD**
+***A Low-Latency, Lightweight and High-Performance Streaming VAD***
 ## **Introduction**
   <img src="./examples/images/PR_Curves_testset.png" width="800">
 </div>
+Note that the default threshold of 0.5 is used to generate binary speech indicators (0 for non-speech signal, 1 for speech signal). This threshold needs to be tuned according to your domain-specific task. The precision-recall curve can be obtained by executing the following script on Linux x64. The output figure will be saved in the same directory as the script.
 ```
 cd ./examples
 python plot_pr_curves.py
 ```
 ### **2. Agent-Friendly:**
 As illustrated in the figure below, TEN VAD rapidly detects speech-to-non-speech transitions, whereas Silero VAD suffers from a delay of several hundred milliseconds, resulting in increased end-to-end latency in human-agent interaction systems. In addition, as demonstrated in the 6.5s-7.0s audio segment, Silero VAD fails to identify short silent durations between adjacent speech segments.
 <div style="text-align:">
   <img src="./examples/images/Agent-Friendly-image.png" width="800">
 </div>
 ### **3. Lightweight:**
 We evaluated the RTF (Real-Time Factor) across five distinct platforms, each equipped with varying CPUs. TEN VAD demonstrates much lower computational complexity and smaller library size than Silero VAD.
     <td align="center"> 0.0050 </td>
   </tr>
 </table>
 <style>
   th, td {
     border: 1px solid #ddd;
 </style>
 ### **4. Multiple programming languages and platforms:**
+TEN VAD provides cross-platform C compatibility across five operating systems (Linux x64, Windows, macOS, Android, iOS), with Python bindings optimized for Linux x64.
 ### **5. Supported sampling rate and hop size:**
 TEN VAD operates on 16kHz audio input with configurable hop sizes (optimized frame configurations: 160/256 samples=10/16ms). Other sampling rates must be resampled to 16kHz.
 ## **Installation**
 ```
   </tr>
 </table>
 ### **Python Usage**
+#### **1. Linux**
 #### **Requirements**
 - numpy (Version 1.17.4/1.26.4 verified)
 - scipy (Version >= 1.5.0)
 <br>
+The **lib** depends only on numpy; install the dependency via requirements.txt:
 ```pip install -r requirements.txt```
 <br>
 #### **Usage**
 Note: For usage in python, you can either use it by **git clone** or **pip**.
 1. Clone the repository
 ```
+git clone https://huggingface.co/TEN-framework/ten-vad
 ```
 2. Enter examples directory
 python test.py s0724-s0730.wav out.txt
 ```
 ##### **By using pip:**
 1. Install via pip
 from ten_vad import TenVad
 ```
 ### **C Usage**
 #### **Build Scripts**
+Located in examples/ directory:
 - Linux: build-and-deploy-linux.sh
 - Windows: build-and-deploy-windows.bat
 - Configure toolchain and architecture settings
 #### **Overview of Usage**
+- Navigate to examples/
 - Execute platform-specific build script
 - Configure dynamic library path
 - Run demo with sample audio s0724-s0730.wav
 - Processed results saved to out.txt
 The detailed usage methods of each platform are as follows <br>
 ####  **1. Linux**
 - CMake
 - Terminal
+Note: if **libc++1** is not installed, run the commands below to install it:
 ```
 sudo apt update
 sudo apt install libc++1
 ```
+##### **Usage**
 ```
 1) cd ./examples
 2) ./build-and-deploy-linux.sh
 ```
 ####  **2. Windows**
 ##### **Requirements**
 - Visual Studio (2017, 2019, 2022 verified)
 3) ./build-and-deploy-windows.bat
 ```
 ####  **3. macOS**
 ##### **Requirements**
 - Xcode (15.2 verified)
 3) ./build-and-deploy-mac.sh
 ```
 ####  **4. Android**
 ##### **Requirements**
 - NDK (r25b, macOS verified)
 4) ./build-and-deploy-android.sh
 ```
 ####  **5. iOS**
 ##### **Requirements**
 Xcode (15.2, macOS verified)
     3.5. Build in Xcode and run demo on your device.
 ## **Citations**
 ```
 @misc{TEN VAD,
 }
 ```
+## Usage Guidance
+1. You may not (i) host the TEN VAD or the Derivative Works on any End
+   User devices, including but not limited to any mobile terminal devices
+   or (ii) Deploy the TEN VAD in a way that competes with Agora's
+   offerings and/or that allows others to compete with Agora's offerings,
+   including without limitation enabling any third party to develop or
+   deploy Applications.
+2. You may Deploy the TEN VAD solely to create and enable deployment
+   of your Application(s) solely for your benefit and the benefit of your
+   direct End Users. If you prefer, you may include the following notice in
+   the documentation of your Application(s): "Powered by TEN VAD".
+3. "End Users" shall mean the end-users of your Application(s) who access
+   the TEN VAD solely to the extent necessary to access and use the
+   Application(s) you create or deploy using TEN VAD.
+4. "Application(s)" shall mean your software programs designed or developed
+   by using the TEN VAD or where deployment is enabled by the TEN
+   VAD.
+## Future Open Source Plan
+TEN-VAD is currently released as a binary. Based on community feedback and interest, we plan to progressively open source the internal components of the binary.

config.json CHANGED Viewed

@@ -1,3 +1,3 @@
 {
-  "_comment": "This json file is only used to count downloads"
 }

 {
+  "_comment": "This json file is only used to count downloads",
 }

examples/.gitattributes ADDED Viewed

	@@ -0,0 +1 @@


1	+ *.wav filter=lfs diff=lfs merge=lfs -text

examples/CMakeLists.txt CHANGED Viewed

@@ -1,9 +1,3 @@
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 cmake_minimum_required(VERSION 3.10)
 get_filename_component(ROOT ${CMAKE_CURRENT_SOURCE_DIR}/../ ABSOLUTE)








1	cmake_minimum_required(VERSION 3.10)
2	get_filename_component(ROOT ${CMAKE_CURRENT_SOURCE_DIR}/../ ABSOLUTE)
3

examples/build-and-deploy-android.sh CHANGED Viewed

@@ -1,10 +1,4 @@
 #!/bin/bash
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 set -eo pipefail
 # Customize the arch and toolchain

 #!/bin/bash
 set -eo pipefail
 # Customize the arch and toolchain

examples/build-and-deploy-ios.sh CHANGED Viewed

@@ -1,10 +1,4 @@
 #!/usr/bin/env bash
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 set -euo pipefail
 work_dir=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

 #!/usr/bin/env bash
 set -euo pipefail
 work_dir=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

examples/build-and-deploy-linux.sh CHANGED Viewed

@@ -1,10 +1,4 @@
 #!/bin/bash
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 set -euo pipefail
 arch=x64

 #!/bin/bash
 set -euo pipefail
 arch=x64

examples/build-and-deploy-mac.sh CHANGED Viewed

@@ -1,10 +1,4 @@
 #!/bin/bash
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 set -euo pipefail
 # Customize the arch

 #!/bin/bash
 set -euo pipefail
 # Customize the arch

examples/build-and-deploy-windows.bat CHANGED Viewed

@@ -1,13 +1,6 @@
 @echo off
 setlocal
-@REM
-@REM  Copyright © 2025 Agora
-@REM  This file is part of TEN Framework, an open source project.
-@REM  Licensed under the Apache License, Version 2.0, with certain conditions.
-@REM  Refer to the "LICENSE" file in the root directory for more information.
-@REM
 @REM Customize the arch
 set arch=x64
 @REM set arch=x86

 @echo off
 setlocal
 @REM Customize the arch
 set arch=x64
 @REM set arch=x86

examples/images/.gitattributes ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ *.jpg filter=lfs diff=lfs merge=lfs -text
2	+ *.png filter=lfs diff=lfs merge=lfs -text

examples/main.c CHANGED Viewed

@@ -1,8 +1,7 @@
 //
-// Copyright © 2025 Agora
 // This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
 //
 #include <stdio.h>
 #include <stdint.h>
@@ -87,16 +86,9 @@ int vad_process(int16_t *input_buf, uint32_t frame_num,
   for (int i = 0; i < frame_num; ++i)
   {
     int16_t *audio_data = input_buf + i * hop_size;
-    int res = ten_vad_process(ten_vad_handle, audio_data, hop_size,
-                              &out_probs[i], &out_flags[i]);
-    if (res == 0)
-    {
-      printf("[%d] %0.6f, %d\n", i, out_probs[i], out_flags[i]);
-    }
-    else
-    {
-      printf("ten_vad_process failed res %d\n", res);
-    }
   }
   uint64_t end = get_timestamp_ms();
   *use_time = (float)(end - start);
@@ -303,4 +295,4 @@ int read_wav_file(FILE *fp, wav_info_t *info)
   // restore original file position
   fseek(fp, orig_pos, SEEK_SET);
   return 0;
-}

 //
 // This file is part of TEN Framework, an open source project.
+// Licensed under the Apache License, Version 2.0.
+// See the LICENSE file for more information.
 //
 #include <stdio.h>
 #include <stdint.h>
   for (int i = 0; i < frame_num; ++i)
   {
     int16_t *audio_data = input_buf + i * hop_size;
+    ten_vad_process(ten_vad_handle, audio_data, hop_size,
+                    &out_probs[i], &out_flags[i]);
+    printf("[%d] %0.6f, %d\n", i, out_probs[i], out_flags[i]);
   }
   uint64_t end = get_timestamp_ms();
   *use_time = (float)(end - start);
   // restore original file position
   fseek(fp, orig_pos, SEEK_SET);
   return 0;
+}

examples/plot_pr_curves.py CHANGED Viewed

@@ -1,8 +1,7 @@
 #
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
 #
 import os, glob, sys, torchaudio
 import numpy as np
@@ -10,7 +9,7 @@ import scipy.io.wavfile as Wavfile
 import matplotlib.pyplot as plt
 from sklearn.metrics import confusion_matrix
-os.system('git clone https://github.com/snakers4/silero-vad.git && cd silero-vad && git checkout bbf22a00640614309d60aba5467189b48c7c6ecc && cd ..')  # Clone the silero-vad repo, using Silero V5
 sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), "./silero-vad/src")))
 from silero_vad.utils_vad import VADIterator, init_jit_model
@@ -115,7 +114,7 @@ if __name__ == "__main__":
     # Get the directory of the script
     script_dir = os.path.dirname(os.path.abspath(__file__))
-    # TEN-VAD-TestSet dir
     test_dir = f"{script_dir}/../testset"
     # Initialization

 #
+# This file is part of TEN Framework, an open source project.
+# Licensed under the Apache License, Version 2.0.
+# See the LICENSE file for more information.
 #
 import os, glob, sys, torchaudio
 import numpy as np
 import matplotlib.pyplot as plt
 from sklearn.metrics import confusion_matrix
+os.system('git clone https://github.com/snakers4/silero-vad.git')  # Clone the silero-vad repo, using Silero V5
 sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), "./silero-vad/src")))
 from silero_vad.utils_vad import VADIterator, init_jit_model
     # Get the directory of the script
     script_dir = os.path.dirname(os.path.abspath(__file__))
+    # testset dir
     test_dir = f"{script_dir}/../testset"
     # Initialization

examples/sample_array.h CHANGED Viewed

@@ -1,9 +1,3 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
 // Used for iOS APP demo
 unsigned char sample_array[] = {
 	0xe3, 0xff, 0xd4, 0xff, 0xdc, 0xff, 0xe0, 0xff, 0xf6, 0xff, 0xf5, 0xff, 0xf6, 0xff, 0xfc, 0xff,

 // Used for iOS APP demo
 unsigned char sample_array[] = {
 	0xe3, 0xff, 0xd4, 0xff, 0xdc, 0xff, 0xe0, 0xff, 0xf6, 0xff, 0xf5, 0xff, 0xf6, 0xff, 0xfc, 0xff,

examples/test.py CHANGED Viewed

@@ -1,8 +1,7 @@
 #
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
 #
 import sys, os

 #
+# This file is part of TEN Framework, an open source project.
+# Licensed under the Apache License, Version 2.0.
+# See the LICENSE file for more information.
 #
 import sys, os

examples/test_node.js DELETED Viewed

@@ -1,529 +0,0 @@
-#!/usr/bin/env node
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-/**
- * TEN VAD WebAssembly Node.js Test
- * Simplified and clean version based on main.c
- */
-const fs = require('fs');
-const path = require('path');
-// Configuration
-const HOP_SIZE = 256;          // 16ms per frame
-const VOICE_THRESHOLD = 0.5;   // Voice detection threshold
-// WASM module paths
-const WASM_DIR = './../lib/Web';
-const WASM_JS_FILE = path.join(WASM_DIR, 'ten_vad.js');
-const WASM_BINARY_FILE = path.join(WASM_DIR, 'ten_vad.wasm');
-// Global state
-let vadModule = null;
-let vadHandle = null;
-let vadHandlePtr = null;
-// ============================================================================
-// UTILITY FUNCTIONS
-// ============================================================================
-function getTimestamp() {
-    return Date.now();
-}
-function addHelperFunctions() {
-    if (!vadModule.getValue) {
-        vadModule.getValue = function(ptr, type) {
-            switch (type) {
-                case 'i32': return vadModule.HEAP32[ptr >> 2];
-                case 'float': return vadModule.HEAPF32[ptr >> 2];
-                default: throw new Error(`Unsupported type: ${type}`);
-            }
-        };
-    }
-    if (!vadModule.UTF8ToString) {
-        vadModule.UTF8ToString = function(ptr) {
-            if (!ptr) return '';
-            let result = '';
-            let i = ptr;
-            while (vadModule.HEAPU8[i]) {
-                result += String.fromCharCode(vadModule.HEAPU8[i++]);
-            }
-            return result;
-        };
-    }
-}
-// ============================================================================
-// AUDIO GENERATION
-// ============================================================================
-function generateTestAudio(durationMs = 5000) {
-    const sampleRate = 16000;
-    const totalSamples = Math.floor(durationMs * sampleRate / 1000);
-    const audioData = new Int16Array(totalSamples);
-    console.log(`Generating ${totalSamples} samples for ${durationMs}ms audio...`);
-    for (let i = 0; i < totalSamples; i++) {
-        const t = i / sampleRate;
-        let sample = 0;
-        if (t < 2.0) {
-            // Voice frequencies (440Hz + 880Hz)
-            sample = Math.sin(2 * Math.PI * 440 * t) * 8000 +
-                    Math.sin(2 * Math.PI * 880 * t) * 4000;
-        } else if (t < 3.0) {
-            // Noise
-            sample = (Math.random() - 0.5) * 3000;
-        } else if (t < 4.0) {
-            // Mixed voice (220Hz + 660Hz)
-            sample = Math.sin(2 * Math.PI * 220 * t) * 6000 +
-                    Math.sin(2 * Math.PI * 660 * t) * 3000;
-        } else {
-            // Silence with minimal noise
-            sample = Math.random() * 50;
-        }
-        audioData[i] = Math.max(-32768, Math.min(32767, Math.floor(sample)));
-    }
-    return audioData;
-}
-// ============================================================================
-// VAD OPERATIONS
-// ============================================================================
-function getVADVersion() {
-    if (!vadModule) return "unknown";
-    try {
-        const versionPtr = vadModule._ten_vad_get_version();
-        return vadModule.UTF8ToString(versionPtr);
-    } catch (error) {
-        return "unknown";
-    }
-}
-function createVADInstance() {
-    try {
-        vadHandlePtr = vadModule._malloc(4);
-        const result = vadModule._ten_vad_create(vadHandlePtr, HOP_SIZE, VOICE_THRESHOLD);
-        if (result === 0) {
-            vadHandle = vadModule.getValue(vadHandlePtr, 'i32');
-            return true;
-        } else {
-            console.error(`VAD creation failed with code: ${result}`);
-            vadModule._free(vadHandlePtr);
-            return false;
-        }
-    } catch (error) {
-        console.error(`Error creating VAD instance: ${error.message}`);
-        return false;
-    }
-}
-function destroyVADInstance() {
-    if (vadHandlePtr && vadModule) {
-        vadModule._ten_vad_destroy(vadHandlePtr);
-        vadModule._free(vadHandlePtr);
-        vadHandlePtr = null;
-        vadHandle = null;
-    }
-}
-async function processAudio(inputBuf, frameNum, outProbs, outFlags) {
-    console.log(`VAD version: ${getVADVersion()}`);
-    if (!createVADInstance()) {
-        return -1;
-    }
-    const startTime = getTimestamp();
-    for (let i = 0; i < frameNum; i++) {
-        const frameStart = i * HOP_SIZE;
-        const frameData = inputBuf.slice(frameStart, frameStart + HOP_SIZE);
-        const audioPtr = vadModule._malloc(HOP_SIZE * 2);
-        const probPtr = vadModule._malloc(4);
-        const flagPtr = vadModule._malloc(4);
-        try {
-            vadModule.HEAP16.set(frameData, audioPtr / 2);
-            const result = vadModule._ten_vad_process(
-                vadHandle, audioPtr, HOP_SIZE, probPtr, flagPtr
-            );
-            if (result === 0) {
-                const probability = vadModule.getValue(probPtr, 'float');
-                const flag = vadModule.getValue(flagPtr, 'i32');
-                outProbs[i] = probability;
-                outFlags[i] = flag;
-                console.log(`[${i}] ${probability.toFixed(6)}, ${flag}`);
-            } else {
-                console.error(`Frame ${i} processing failed with code: ${result}`);
-                outProbs[i] = 0.0;
-                outFlags[i] = 0;
-            }
-        } finally {
-            vadModule._free(audioPtr);
-            vadModule._free(probPtr);
-            vadModule._free(flagPtr);
-        }
-    }
-    const endTime = getTimestamp();
-    const processingTime = endTime - startTime;
-    destroyVADInstance();
-    return processingTime;
-}
-// ============================================================================
-// RESULT HANDLING
-// ============================================================================
-function printResults(processingTime, totalAudioTime, outFlags, frameNum) {
-    const rtf = processingTime / totalAudioTime;
-    const voiceFrames = outFlags.filter(flag => flag === 1).length;
-    const voicePercentage = (voiceFrames / frameNum * 100).toFixed(1);
-    console.log(`\n=== Processing Results ===`);
-    console.log(`Time: ${processingTime}ms, Audio: ${totalAudioTime.toFixed(2)}ms, RTF: ${rtf.toFixed(6)}`);
-    console.log(`Voice frames: ${voiceFrames}/${frameNum} (${voicePercentage}%)`);
-}
-function saveResults(outProbs, outFlags, frameNum, filename = 'out.txt') {
-    let output = '';
-    for (let i = 0; i < frameNum; i++) {
-        output += `[${i}] ${outProbs[i].toFixed(6)}, ${outFlags[i]}\n`;
-    }
-    try {
-        fs.writeFileSync(filename, output);
-        console.log(`Results saved to ${filename}`);
-    } catch (error) {
-        console.error(`Failed to save results: ${error.message}`);
-    }
-}
-// ============================================================================
-// TEST FUNCTIONS
-// ============================================================================
-async function testWithArray() {
-    console.log("=== Array Test ===\n");
-    const inputBuf = generateTestAudio(5000);
-    const byteNum = inputBuf.byteLength;
-    const sampleNum = byteNum / 2;
-    const totalAudioTime = sampleNum / 16.0;
-    const frameNum = Math.floor(sampleNum / HOP_SIZE);
-    console.log(`Audio info: ${byteNum} bytes, ${frameNum} frames, ${totalAudioTime.toFixed(2)}ms`);
-    const outProbs = new Float32Array(frameNum);
-    const outFlags = new Int32Array(frameNum);
-    const processingTime = await processAudio(inputBuf, frameNum, outProbs, outFlags);
-    if (processingTime > 0) {
-        printResults(processingTime, totalAudioTime, outFlags, frameNum);
-    }
-    return 0;
-}
-// WAV File parsing utilities
-function parseWAVHeader(buffer) {
-    if (buffer.length < 44) {
-        throw new Error('Invalid WAV file: too small');
-    }
-    // Check RIFF header
-    const riffHeader = buffer.toString('ascii', 0, 4);
-    if (riffHeader !== 'RIFF') {
-        throw new Error('Invalid WAV file: missing RIFF header');
-    }
-    // Check WAVE format
-    const waveHeader = buffer.toString('ascii', 8, 12);
-    if (waveHeader !== 'WAVE') {
-        throw new Error('Invalid WAV file: not WAVE format');
-    }
-    let offset = 12;
-    let dataOffset = -1;
-    let dataSize = 0;
-    let sampleRate = 0;
-    let channels = 0;
-    let bitsPerSample = 0;
-    // Parse chunks
-    while (offset < buffer.length - 8) {
-        const chunkId = buffer.toString('ascii', offset, offset + 4);
-        const chunkSize = buffer.readUInt32LE(offset + 4);
-        if (chunkId === 'fmt ') {
-            // Format chunk
-            const audioFormat = buffer.readUInt16LE(offset + 8);
-            channels = buffer.readUInt16LE(offset + 10);
-            sampleRate = buffer.readUInt32LE(offset + 12);
-            bitsPerSample = buffer.readUInt16LE(offset + 22);
-            if (audioFormat !== 1) {
-                throw new Error('Unsupported WAV format: only PCM is supported');
-            }
-            if (bitsPerSample !== 16) {
-                throw new Error('Unsupported bit depth: only 16-bit is supported');
-            }
-        } else if (chunkId === 'data') {
-            // Data chunk
-            dataOffset = offset + 8;
-            dataSize = chunkSize;
-            break;
-        }
-        offset += 8 + chunkSize;
-        // Align to even byte boundary
-        if (chunkSize % 2 === 1) {
-            offset++;
-        }
-    }
-    if (dataOffset === -1) {
-        throw new Error('Invalid WAV file: no data chunk found');
-    }
-    return {
-        sampleRate,
-        channels,
-        bitsPerSample,
-        dataOffset,
-        dataSize,
-        totalSamples: dataSize / (bitsPerSample / 8),
-        samplesPerChannel: dataSize / (bitsPerSample / 8) / channels
-    };
-}
-async function testWithWAV(inputFile, outputFile) {
-    console.log("=== WAV File Test ===\n");
-    if (!fs.existsSync(inputFile)) {
-        console.error(`Input file not found: ${inputFile}`);
-        return 1;
-    }
-    try {
-        const buffer = fs.readFileSync(inputFile);
-        // Parse WAV header properly
-        const wavInfo = parseWAVHeader(buffer);
-        console.log(`WAV Format: ${wavInfo.channels} channel(s), ${wavInfo.sampleRate}Hz, ${wavInfo.bitsPerSample}-bit`);
-        console.log(`Total samples: ${wavInfo.totalSamples}, samples per channel: ${wavInfo.samplesPerChannel}`);
-        // Validate format requirements
-        if (wavInfo.sampleRate !== 16000) {
-            console.warn(`Warning: Sample rate is ${wavInfo.sampleRate}Hz, expected 16000Hz`);
-        }
-        if (wavInfo.channels !== 1) {
-            console.warn(`Warning: ${wavInfo.channels} channels detected, only first channel will be used`);
-        }
-        // Extract audio data
-        const audioBuffer = buffer.slice(wavInfo.dataOffset, wavInfo.dataOffset + wavInfo.dataSize);
-        const inputBuf = new Int16Array(audioBuffer.buffer.slice(audioBuffer.byteOffset));
-        // Calculate correct sample number (for mono audio)
-        const sampleNum = wavInfo.channels === 1 ?
-            wavInfo.samplesPerChannel :
-            Math.floor(wavInfo.samplesPerChannel); // Use only first channel if stereo
-        const totalAudioTime = sampleNum / wavInfo.sampleRate * 1000; // in milliseconds
-        const frameNum = Math.floor(sampleNum / HOP_SIZE);
-        console.log(`Audio info: ${audioBuffer.length} bytes, ${sampleNum} samples, ${frameNum} frames, ${totalAudioTime.toFixed(2)}ms`);
-        // If stereo, extract only the first channel
-        let processedInput = inputBuf;
-        if (wavInfo.channels > 1) {
-            console.log(`Extracting mono from ${wavInfo.channels} channels...`);
-            processedInput = new Int16Array(Math.floor(inputBuf.length / wavInfo.channels));
-            for (let i = 0; i < processedInput.length; i++) {
-                processedInput[i] = inputBuf[i * wavInfo.channels]; // Take first channel
-            }
-        }
-        const outProbs = new Float32Array(frameNum);
-        const outFlags = new Int32Array(frameNum);
-        const processingTime = await processAudio(processedInput, frameNum, outProbs, outFlags);
-        if (processingTime > 0) {
-            printResults(processingTime, totalAudioTime, outFlags, frameNum);
-            saveResults(outProbs, outFlags, frameNum, outputFile);
-        }
-        return 0;
-    } catch (error) {
-        console.error(`Error processing WAV file: ${error.message}`);
-        return 1;
-    }
-}
-async function runBenchmark() {
-    console.log("=== Performance Benchmark ===\n");
-    if (!createVADInstance()) return;
-    const testData = new Int16Array(HOP_SIZE);
-    for (let i = 0; i < HOP_SIZE; i++) {
-        testData[i] = Math.sin(2 * Math.PI * 440 * i / 16000) * 8000;
-    }
-    const testCases = [100, 1000, 10000];
-    for (const numFrames of testCases) {
-        const audioPtr = vadModule._malloc(HOP_SIZE * 2);
-        const probPtr = vadModule._malloc(4);
-        const flagPtr = vadModule._malloc(4);
-        vadModule.HEAP16.set(testData, audioPtr / 2);
-        const startTime = getTimestamp();
-        for (let i = 0; i < numFrames; i++) {
-            vadModule._ten_vad_process(vadHandle, audioPtr, HOP_SIZE, probPtr, flagPtr);
-        }
-        const endTime = getTimestamp();
-        const totalTime = endTime - startTime;
-        const avgTime = totalTime / numFrames;
-        // Calculate RTF (Real-time Factor)
-        // Each frame represents 16ms of audio (HOP_SIZE=256 samples at 16kHz)
-        const frameAudioTime = (HOP_SIZE / 16000) * 1000; // 16ms
-        const totalAudioTime = numFrames * frameAudioTime;
-        const rtf = totalTime / totalAudioTime;
-        console.log(`${numFrames} frames: ${totalTime}ms total, ${avgTime.toFixed(3)}ms/frame, RTF: ${rtf.toFixed(3)}`);
-        vadModule._free(audioPtr);
-        vadModule._free(probPtr);
-        vadModule._free(flagPtr);
-    }
-    destroyVADInstance();
-}
-// ============================================================================
-// MODULE INITIALIZATION
-// ============================================================================
-async function loadModule() {
-    try {
-        console.log("Loading WebAssembly module...");
-        if (!fs.existsSync(WASM_JS_FILE)) {
-            throw new Error(`ten_vad.js not found at ${WASM_JS_FILE}`);
-        }
-        if (!fs.existsSync(WASM_BINARY_FILE)) {
-            throw new Error(`ten_vad.wasm not found at ${WASM_BINARY_FILE}`);
-        }
-        // Read and modify the module file for Node.js compatibility
-        const wasmJsContent = fs.readFileSync(WASM_JS_FILE, 'utf8');
-        const modifiedContent = wasmJsContent
-            .replace(/import\.meta\.url/g, `"${path.resolve(WASM_JS_FILE)}"`)
-            .replace(/export default createVADModule;/, 'module.exports = createVADModule;');
-        // Write temporary file
-        const tempPath = './ten_vad_temp.js';
-        fs.writeFileSync(tempPath, modifiedContent);
-        // Load WASM binary
-        const wasmBinary = fs.readFileSync(WASM_BINARY_FILE);
-        // Load module
-        const createVADModule = require(path.resolve(tempPath));
-        vadModule = await createVADModule({
-            wasmBinary: wasmBinary,
-            locateFile: (filePath) => filePath.endsWith('.wasm') ? WASM_BINARY_FILE : filePath,
-            noInitialRun: false,
-            noExitRuntime: true
-        });
-        // Cleanup
-        fs.unlinkSync(tempPath);
-        // Add missing helper functions
-        addHelperFunctions();
-        console.log(`Module loaded successfully. Version: ${getVADVersion()}\n`);
-        return true;
-    } catch (error) {
-        console.error(`Failed to load module: ${error.message}`);
-        return false;
-    }
-}
-// ============================================================================
-// MAIN FUNCTION
-// ============================================================================
-async function main() {
-    const args = process.argv.slice(2);
-    // Initialize module
-    if (!await loadModule()) {
-        process.exit(1);
-    }
-    try {
-        if (args.length >= 2) {
-            // Test with WAV file
-            const [inputFile, outputFile] = args;
-            console.log(`Input: ${inputFile}, Output: ${outputFile}\n`);
-            await testWithWAV(inputFile, outputFile);
-        } else {
-            // Test with generated array
-            await testWithArray();
-        }
-        await runBenchmark();
-        return 0;
-    } catch (error) {
-        console.error(`Test failed: ${error.message}`);
-        return 1;
-    }
-}
-// ============================================================================
-// EXECUTION
-// ============================================================================
-if (require.main === module) {
-    main().then(exitCode => {
-        process.exit(exitCode);
-    }).catch(error => {
-        console.error(`Fatal error: ${error.message}`);
-        process.exit(1);
-    });
-}
-module.exports = { main, testWithArray, testWithWAV, runBenchmark };

examples_onnx/CMakeLists.txt DELETED Viewed

@@ -1,24 +0,0 @@
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
-cmake_minimum_required(VERSION 3.10)
-get_filename_component(ROOT ${CMAKE_CURRENT_SOURCE_DIR}/../ ABSOLUTE)
-project(ten_vad)
-set(CMAKE_BUILD_TYPE Release)
-add_compile_options(-Wno-write-strings -Wno-unused-result)
-include_directories(${ROOT}/src)
-include_directories(${ROOT}/include)
-include_directories(${ORT_ROOT}/include)
-file(GLOB LIBRARY_SOURCES "${ROOT}/src/*.cc" "${ROOT}/src/*.c")
-add_library(ten_vad SHARED ${LIBRARY_SOURCES})
-link_directories(${ORT_ROOT}/lib)
-target_link_libraries(ten_vad "${ORT_ROOT}/lib/libonnxruntime.so")
-set(EXECUTABLE_SOURCES ${ROOT}/examples/main.c)
-add_executable(ten_vad_demo ${EXECUTABLE_SOURCES})
-target_link_libraries(ten_vad_demo ten_vad)

examples_onnx/build-and-deploy-linux.sh DELETED Viewed

@@ -1,37 +0,0 @@
-#!/bin/bash
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
-set -euo pipefail
-if [[ "$#" -lt 2 || "$1" != "--ort-path" ]]; then
-    echo "usage: $0 --ort-path <path_to_onnxruntime>" >&2
-    exit 1
-fi
-ORT_ROOT="$2"
-shift 2
-if [[ ! -d "$ORT_ROOT" || ! -d "$ORT_ROOT/lib" || ! -d "$ORT_ROOT/include" ]]; then
-    echo "invalid onnxruntime library path: $ORT_ROOT" >&2
-    exit 1
-fi
-arch=x64
-build_dir=build-linux/$arch
-rm -rf $build_dir
-mkdir -p $build_dir
-cd $build_dir
-# Step 1: Build the demo
-cmake ../../ -DORT_ROOT="$ORT_ROOT"
-cmake --build . --config Release
-# Step 2: Run the demo
-ln -s ../../../src/onnx_model/
-./ten_vad_demo ../../../examples/s0724-s0730.wav out.txt
-cd ../../

include/ten_vad.h CHANGED Viewed

@@ -1,8 +1,7 @@
 //
-// Copyright © 2025 Agora
 // This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
 //
 #ifndef TEN_VAD_H
 #define TEN_VAD_H
@@ -84,4 +83,4 @@ extern "C"
 }
 #endif
-#endif /* TEN_VAD_H */

 //
 // This file is part of TEN Framework, an open source project.
+// Licensed under the Apache License, Version 2.0.
+// See the LICENSE file for more information.
 //
 #ifndef TEN_VAD_H
 #define TEN_VAD_H
 }
 #endif
+#endif /* TEN_VAD_H */

include/ten_vad.py CHANGED Viewed

@@ -1,74 +1,36 @@
 #
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
 #
 from ctypes import c_int, c_int32, c_float, c_size_t, CDLL, c_void_p, POINTER
 import numpy as np
 import os
-import platform
 class TenVad:
     def __init__(self, hop_size: int = 256, threshold: float = 0.5):
         self.hop_size = hop_size
         self.threshold = threshold
-        if platform.system() == "Linux" and platform.machine() == "x86_64":
-            git_path = os.path.join(
                 os.path.dirname(os.path.relpath(__file__)),
-                "../lib/Linux/x64/libten_vad.so"
             )
-            if os.path.exists(git_path):
-                self.vad_library = CDLL(git_path)
-            else:
-                pip_path = os.path.join(
-                    os.path.dirname(os.path.relpath(__file__)),
-                    "./ten_vad_library/libten_vad.so"
                 )
-                self.vad_library = CDLL(pip_path)
-        elif platform.system() == "Darwin":
-            git_path = os.path.join(
-                os.path.dirname(os.path.relpath(__file__)),
-                "../lib/macOS/ten_vad.framework/Versions/A/ten_vad"
             )
-            if os.path.exists(git_path):
-                self.vad_library = CDLL(git_path)
-            else:
-                pip_path = os.path.join(
-                    os.path.dirname(os.path.relpath(__file__)),
-                    "./ten_vad_library/libten_vad"
-                )
-                self.vad_library = CDLL(pip_path)
-        elif platform.system().upper() == 'WINDOWS':
-            if platform.machine().upper() in ['X64', 'X86_64', 'AMD64']:
-                git_path = os.path.join(
-                    os.path.dirname(os.path.realpath(__file__)),
-                    "../lib/Windows/x64/ten_vad.dll"
-                )
-                if os.path.exists(git_path):
-                    self.vad_library = CDLL(git_path)
-                else:
-                    pip_path = os.path.join(
-                        os.path.dirname(os.path.realpath(__file__)),
-                        "./ten_vad_library/ten_vad.dll"
                     )
-                    self.vad_library = CDLL(pip_path)
-            else:
-                git_path = os.path.join(
-                    os.path.dirname(os.path.realpath(__file__)),
-                    "../lib/Windows/x86/ten_vad.dll"
                 )
-                if os.path.exists(git_path):
-                    self.vad_library = CDLL(git_path)
-                else:
-                    pip_path = os.path.join(
-                        os.path.dirname(os.path.realpath(__file__)),
-                        "./ten_vad_library/ten_vad.dll"
-                    )
-                    self.vad_library = CDLL(pip_path)
-        else:
-            raise NotImplementedError(f"Unsupported platform: {platform.system()} {platform.machine()}")
         self.vad_handler = c_void_p(0)
         self.out_probability = c_float()
         self.out_flags = c_int32()

 #
+# This file is part of TEN Framework, an open source project.
+# Licensed under the Apache License, Version 2.0.
+# See the LICENSE file for more information.
 #
 from ctypes import c_int, c_int32, c_float, c_size_t, CDLL, c_void_p, POINTER
 import numpy as np
 import os
 class TenVad:
     def __init__(self, hop_size: int = 256, threshold: float = 0.5):
         self.hop_size = hop_size
         self.threshold = threshold
+        if os.path.exists(
+            os.path.join(
                 os.path.dirname(os.path.relpath(__file__)),
+                "../lib/Linux/x64/libten_vad.so",
             )
+        ):
+            self.vad_library = CDLL(
+                os.path.join(
+                    os.path.dirname(os.path.relpath(__file__)),
+                    "../lib/Linux/x64/libten_vad.so",
                 )
             )
+        else:
+            self.vad_library = CDLL(
+                os.path.join(
+                    os.path.dirname(
+                        os.path.relpath(__file__)),
+                        "./ten_vad_library/libten_vad.so",
                     )
                 )
         self.vad_handler = c_void_p(0)
         self.out_probability = c_float()
         self.out_flags = c_int32()

lib/Web/ten_vad.d.ts DELETED Viewed

@@ -1,111 +0,0 @@
-/**
- * This file is part of TEN Framework, an open source project.
- * Licensed under the Apache License, Version 2.0.
- * See the LICENSE file for more information.
- *
- * TEN VAD (Voice Activity Detection) WebAssembly Module
- * TypeScript type definitions
- */
-export interface TenVADModule {
-  /**
-   * Create and initialize a VAD instance
-   * @param handlePtr Pointer to store the VAD handle
-   * @param hopSize Number of samples between consecutive analysis frames (e.g., 256)
-   * @param threshold VAD detection threshold [0.0, 1.0]
-   * @returns 0 on success, -1 on error
-   */
-  _ten_vad_create(handlePtr: number, hopSize: number, threshold: number): number;
-  /**
-   * Process audio frame for voice activity detection
-   * @param handle Valid VAD handle from ten_vad_create
-   * @param audioDataPtr Pointer to int16 audio samples array
-   * @param audioDataLength Length of audio data (should equal hopSize)
-   * @param outProbabilityPtr Pointer to output probability [0.0, 1.0]
-   * @param outFlagPtr Pointer to output flag (0: no voice, 1: voice detected)
-   * @returns 0 on success, -1 on error
-   */
-  _ten_vad_process(
-    handle: number,
-    audioDataPtr: number,
-    audioDataLength: number,
-    outProbabilityPtr: number,
-    outFlagPtr: number
-  ): number;
-  /**
-   * Destroy VAD instance and release resources
-   * @param handlePtr Pointer to the VAD handle
-   * @returns 0 on success, -1 on error
-   */
-  _ten_vad_destroy(handlePtr: number): number;
-  /**
-   * Get library version string
-   * @returns Version string pointer
-   */
-  _ten_vad_get_version(): number;
-  // WebAssembly Memory Management
-  _malloc(size: number): number;
-  _free(ptr: number): void;
-  // Memory access helpers
-  HEAP16: Int16Array;
-  HEAPF32: Float32Array;
-  HEAP32: Int32Array;
-  HEAPU8: Uint8Array;
-  // Value access methods
-  getValue(ptr: number, type: 'i8' | 'i16' | 'i32' | 'float' | 'double'): number;
-  setValue(ptr: number, value: number, type: 'i8' | 'i16' | 'i32' | 'float' | 'double'): void;
-  // String utilities
-  UTF8ToString(ptr: number): string;
-  lengthBytesUTF8(str: string): number;
-  stringToUTF8(str: string, outPtr: number, maxBytesToWrite: number): void;
-}
-/**
- * High-level TypeScript wrapper for TEN VAD
- */
-export class TenVAD {
-  private module: TenVADModule;
-  private handle: number | null;
-  private hopSize: number;
-  constructor(module: TenVADModule, hopSize: number, threshold: number);
-  /**
-   * Process audio samples for voice activity detection
-   * @param audioData Int16Array of audio samples (length must equal hopSize)
-   * @returns Object with probability and voice detection flag
-   */
-  process(audioData: Int16Array): {
-    probability: number;
-    isVoice: boolean;
-  } | null;
-  /**
-   * Get library version
-   */
-  getVersion(): string;
-  /**
-   * Destroy VAD instance
-   */
-  destroy(): void;
-  /**
-   * Check if VAD instance is valid
-   */
-  isValid(): boolean;
-}
-/**
- * Create TEN VAD WebAssembly module
- */
-declare function createVADModule(): Promise<TenVADModule>;
-export default createVADModule;

lib/Web/ten_vad.js DELETED Viewed

@@ -1,30 +0,0 @@
-var createVADModule = (() => {
-  var _scriptDir = import.meta.url;
-  return (
-function(createVADModule) {
-  createVADModule = createVADModule || {};
-var a;a||(a=typeof createVADModule !== 'undefined' ? createVADModule : {});var k,l;a.ready=new Promise(function(b,c){k=b;l=c});var p=Object.assign({},a),r="object"==typeof window,u="function"==typeof importScripts,v="",w;
-if(r||u)u?v=self.location.href:"undefined"!=typeof document&&document.currentScript&&(v=document.currentScript.src),_scriptDir&&(v=_scriptDir),0!==v.indexOf("blob:")?v=v.substr(0,v.replace(/[?#].*/,"").lastIndexOf("/")+1):v="",u&&(w=b=>{var c=new XMLHttpRequest;c.open("GET",b,!1);c.responseType="arraybuffer";c.send(null);return new Uint8Array(c.response)});var aa=a.print||console.log.bind(console),x=a.printErr||console.warn.bind(console);Object.assign(a,p);p=null;var y;a.wasmBinary&&(y=a.wasmBinary);
-var noExitRuntime=a.noExitRuntime||!0;"object"!=typeof WebAssembly&&z("no native wasm support detected");var A,B=!1,C="undefined"!=typeof TextDecoder?new TextDecoder("utf8"):void 0,D,E,F;function J(){var b=A.buffer;D=b;a.HEAP8=new Int8Array(b);a.HEAP16=new Int16Array(b);a.HEAP32=new Int32Array(b);a.HEAPU8=E=new Uint8Array(b);a.HEAPU16=new Uint16Array(b);a.HEAPU32=F=new Uint32Array(b);a.HEAPF32=new Float32Array(b);a.HEAPF64=new Float64Array(b)}var K=[],L=[],M=[];
-function ba(){var b=a.preRun.shift();K.unshift(b)}var N=0,O=null,P=null;function z(b){if(a.onAbort)a.onAbort(b);b="Aborted("+b+")";x(b);B=!0;b=new WebAssembly.RuntimeError(b+". Build with -sASSERTIONS for more info.");l(b);throw b;}function Q(){return R.startsWith("data:application/octet-stream;base64,")}var R;if(a.locateFile){if(R="ten_vad.wasm",!Q()){var S=R;R=a.locateFile?a.locateFile(S,v):v+S}}else R=(new URL("ten_vad.wasm",import.meta.url)).href;
-function T(){var b=R;try{if(b==R&&y)return new Uint8Array(y);if(w)return w(b);throw"both async and sync fetching of the wasm failed";}catch(c){z(c)}}function ca(){return y||!r&&!u||"function"!=typeof fetch?Promise.resolve().then(function(){return T()}):fetch(R,{credentials:"same-origin"}).then(function(b){if(!b.ok)throw"failed to load wasm binary file at '"+R+"'";return b.arrayBuffer()}).catch(function(){return T()})}function U(b){for(;0<b.length;)b.shift()(a)}
-var da=[null,[],[]],ea={a:function(){z("")},f:function(b,c,m){E.copyWithin(b,c,c+m)},c:function(b){var c=E.length;b>>>=0;if(2147483648<b)return!1;for(var m=1;4>=m;m*=2){var h=c*(1+.2/m);h=Math.min(h,b+100663296);var d=Math;h=Math.max(b,h);d=d.min.call(d,2147483648,h+(65536-h%65536)%65536);a:{try{A.grow(d-D.byteLength+65535>>>16);J();var e=1;break a}catch(W){}e=void 0}if(e)return!0}return!1},e:function(){return 52},b:function(){return 70},d:function(b,c,m,h){for(var d=0,e=0;e<m;e++){var W=F[c>>2],
-X=F[c+4>>2];c+=8;for(var G=0;G<X;G++){var f=E[W+G],H=da[b];if(0===f||10===f){f=H;for(var n=0,q=n+NaN,t=n;f[t]&&!(t>=q);)++t;if(16<t-n&&f.buffer&&C)f=C.decode(f.subarray(n,t));else{for(q="";n<t;){var g=f[n++];if(g&128){var I=f[n++]&63;if(192==(g&224))q+=String.fromCharCode((g&31)<<6|I);else{var Y=f[n++]&63;g=224==(g&240)?(g&15)<<12|I<<6|Y:(g&7)<<18|I<<12|Y<<6|f[n++]&63;65536>g?q+=String.fromCharCode(g):(g-=65536,q+=String.fromCharCode(55296|g>>10,56320|g&1023))}}else q+=String.fromCharCode(g)}f=q}(1===
-b?aa:x)(f);H.length=0}else H.push(f)}d+=X}F[h>>2]=d;return 0}};
-(function(){function b(d){a.asm=d.exports;A=a.asm.g;J();L.unshift(a.asm.h);N--;a.monitorRunDependencies&&a.monitorRunDependencies(N);0==N&&(null!==O&&(clearInterval(O),O=null),P&&(d=P,P=null,d()))}function c(d){b(d.instance)}function m(d){return ca().then(function(e){return WebAssembly.instantiate(e,h)}).then(function(e){return e}).then(d,function(e){x("failed to asynchronously prepare wasm: "+e);z(e)})}var h={a:ea};N++;a.monitorRunDependencies&&a.monitorRunDependencies(N);if(a.instantiateWasm)try{return a.instantiateWasm(h,
-b)}catch(d){x("Module.instantiateWasm callback failed with error: "+d),l(d)}(function(){return y||"function"!=typeof WebAssembly.instantiateStreaming||Q()||"function"!=typeof fetch?m(c):fetch(R,{credentials:"same-origin"}).then(function(d){return WebAssembly.instantiateStreaming(d,h).then(c,function(e){x("wasm streaming compile failed: "+e);x("falling back to ArrayBuffer instantiation");return m(c)})})})().catch(l);return{}})();
-a.___wasm_call_ctors=function(){return(a.___wasm_call_ctors=a.asm.h).apply(null,arguments)};a._malloc=function(){return(a._malloc=a.asm.i).apply(null,arguments)};a._free=function(){return(a._free=a.asm.j).apply(null,arguments)};a._ten_vad_create=function(){return(a._ten_vad_create=a.asm.k).apply(null,arguments)};a._ten_vad_process=function(){return(a._ten_vad_process=a.asm.l).apply(null,arguments)};a._ten_vad_destroy=function(){return(a._ten_vad_destroy=a.asm.m).apply(null,arguments)};
-a._ten_vad_get_version=function(){return(a._ten_vad_get_version=a.asm.n).apply(null,arguments)};var V;P=function fa(){V||Z();V||(P=fa)};
-function Z(){function b(){if(!V&&(V=!0,a.calledRun=!0,!B)){U(L);k(a);if(a.onRuntimeInitialized)a.onRuntimeInitialized();if(a.postRun)for("function"==typeof a.postRun&&(a.postRun=[a.postRun]);a.postRun.length;){var c=a.postRun.shift();M.unshift(c)}U(M)}}if(!(0<N)){if(a.preRun)for("function"==typeof a.preRun&&(a.preRun=[a.preRun]);a.preRun.length;)ba();U(K);0<N||(a.setStatus?(a.setStatus("Running..."),setTimeout(function(){setTimeout(function(){a.setStatus("")},1);b()},1)):b())}}
-if(a.preInit)for("function"==typeof a.preInit&&(a.preInit=[a.preInit]);0<a.preInit.length;)a.preInit.pop()();Z();
-  return createVADModule.ready
-}
-);
-})();
-export default createVADModule;

lib/Windows/x64/ten_vad.lib CHANGED Viewed

Binary files a/lib/Windows/x64/ten_vad.lib and b/lib/Windows/x64/ten_vad.lib differ

lib/Windows/x86/ten_vad.lib CHANGED Viewed

Binary files a/lib/Windows/x86/ten_vad.lib and b/lib/Windows/x86/ten_vad.lib differ

lib/iOS/ten_vad.framework/Headers/ten_vad.h CHANGED Viewed

@@ -1,90 +1,3 @@
-/*
- * @file ten_vad.h
- * @brief Ten Voice Activity Detection (ten_vad) C API
- * Version: 1.0.0
- *
- * Provides functions to create, process, and destroy a VAD instance.
- */
-#ifndef TEN_VAD_H
-#define TEN_VAD_H
-#if defined(__APPLE__) || defined(__ANDROID__) || defined(__linux__)
-#define TENVAD_API __attribute__((visibility("default")))
-#elif defined(_WIN32) || defined(__CYGWIN__)
-/**
- * @def TENVAD_API
- * @brief Export/import macro for ten_vad shared library symbols.
- */
-#ifdef TENVAD_EXPORTS
-#define TENVAD_API __declspec(dllexport)
-#else
-#define TENVAD_API __declspec(dllimport)
-#endif
-#else
-#define TENVAD_API
-#endif
-#include <stddef.h> /* size_t */
-#include <stdint.h> /* int16_t */
-#ifdef __cplusplus
-extern "C"
-{
-#endif
-  /**
-   * @typedef ten_vad_handle
-   * @brief Opaque handle for ten_vad instance.
-   */
-  typedef void *ten_vad_handle_t;
-  /**
-   * @brief Create and initialize a ten_vad instance.
-   *
-   * @param[out] handle       Pointer to receive the vad handle.
-   * @param[in]  hop_size     The number of samples between the start points of
-   * two consecutive analysis frames. (e.g., 256).
-   * @param[in]  threshold    VAD detection threshold ranging from [0.0, 1.0]
-   * (default: 0.5).
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_create(ten_vad_handle_t *handle, size_t hop_size,
-                                float threshold);
-  /**
-   * @brief Process one audio frame for voice activity detection.
-   * Must call ten_vad_init() before calling this, and ten_vad_destroy() when done.
-   *
-   * @param[in]  handle           Valid VAD handle returned by ten_vad_create().
-   * @param[in]  audio_data       Pointer to an array of int16_t samples,
-   * buffer length must equal the hop size specified at ten_vad_create.
-   * @param[in]  audio_data_length  size of audio_data buffer, here should be equal to hop_size.
-   * @param[out] out_probability  Pointer to a float (size 1) that receives the
-   * voice activity probability in the range [0.0, 1.0].
-   * @param[out] out_flag         Pointer to an int (size 1) that receives the
-   * detection result: 0 = no voice, 1 = voice detected.
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_process(ten_vad_handle_t handle, const int16_t *audio_data, size_t audio_data_length,
-                                 float *out_probability, int *out_flag);
-  /**
-   * @brief Destroy a ten_vad instance and release its resources.
-   *
-   * @param[in,out] handle Pointer to the ten_vad handle; set to NULL on return.
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_destroy(ten_vad_handle_t *handle);
-  /**
-   * @brief Get the ten_vad library version string.
-   *
-   * @return The version string (e.g., "1.0.0").
-   */
-  TENVAD_API const char *ten_vad_get_version(void);
-#ifdef __cplusplus
-}
-#endif
-#endif /* TEN_VAD_H */

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bbf0ab2d2ee30d9c170556efb9a7200a53725053cfa7c66a0dff79e7c9351e8
+size 2885

lib/iOS/ten_vad.framework/Info.plist CHANGED Viewed

Binary files a/lib/iOS/ten_vad.framework/Info.plist and b/lib/iOS/ten_vad.framework/Info.plist differ

lib/iOS/ten_vad.framework/Modules/module.modulemap CHANGED Viewed

@@ -1,5 +1,3 @@
-framework module ten_vad {
-        umbrella header "ten_vad.h"
-        export *
-        module * { export * }
-    }

+version https://git-lfs.github.com/spec/v1
+oid sha256:ac22f2ff0291876b7d5069f957825d01abc06a3da84c9f4385154a8e99964096
+size 115

lib/macOS/ten_vad.framework/Headers DELETED Viewed

	@@ -1 +0,0 @@
1	- Versions/Current/Headers

lib/{Web/ten_vad.wasm → macOS/ten_vad.framework/Headers/ten_vad.h} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ec0b9640683987e15a4e54e4ce5642b2447c6e5d82b1be889b5099c75434fc3
-size 283349

 version https://git-lfs.github.com/spec/v1
+oid sha256:9bbf0ab2d2ee30d9c170556efb9a7200a53725053cfa7c66a0dff79e7c9351e8
+size 2885

lib/macOS/ten_vad.framework/Resources DELETED Viewed

	@@ -1 +0,0 @@
1	- Versions/Current/Resources

src/onnx_model/ten-vad.onnx → lib/macOS/ten_vad.framework/Resources/Info.plist RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e10b98a0cab1c98e847fbdda14cb3d45a38336d47535a3f63a0fb6c4e0f4cdf4
-size 315449

 version https://git-lfs.github.com/spec/v1
+oid sha256:5aa8df4f544b3143b819d6ffd5c21574c02884bf41cb2b7a8df45c7f10f75c3a
+size 1216

lib/macOS/ten_vad.framework/Versions/A/Headers/ten_vad.h CHANGED Viewed

@@ -1,90 +1,3 @@
-/*
- * @file ten_vad.h
- * @brief Ten Voice Activity Detection (ten_vad) C API
- * Version: 1.0.0
- *
- * Provides functions to create, process, and destroy a VAD instance.
- */
-#ifndef TEN_VAD_H
-#define TEN_VAD_H
-#if defined(__APPLE__) || defined(__ANDROID__) || defined(__linux__)
-#define TENVAD_API __attribute__((visibility("default")))
-#elif defined(_WIN32) || defined(__CYGWIN__)
-/**
- * @def TENVAD_API
- * @brief Export/import macro for ten_vad shared library symbols.
- */
-#ifdef TENVAD_EXPORTS
-#define TENVAD_API __declspec(dllexport)
-#else
-#define TENVAD_API __declspec(dllimport)
-#endif
-#else
-#define TENVAD_API
-#endif
-#include <stddef.h> /* size_t */
-#include <stdint.h> /* int16_t */
-#ifdef __cplusplus
-extern "C"
-{
-#endif
-  /**
-   * @typedef ten_vad_handle
-   * @brief Opaque handle for ten_vad instance.
-   */
-  typedef void *ten_vad_handle_t;
-  /**
-   * @brief Create and initialize a ten_vad instance.
-   *
-   * @param[out] handle       Pointer to receive the vad handle.
-   * @param[in]  hop_size     The number of samples between the start points of
-   * two consecutive analysis frames. (e.g., 256).
-   * @param[in]  threshold    VAD detection threshold ranging from [0.0, 1.0]
-   * (default: 0.5).
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_create(ten_vad_handle_t *handle, size_t hop_size,
-                                float threshold);
-  /**
-   * @brief Process one audio frame for voice activity detection.
-   * Must call ten_vad_init() before calling this, and ten_vad_destroy() when done.
-   *
-   * @param[in]  handle           Valid VAD handle returned by ten_vad_create().
-   * @param[in]  audio_data       Pointer to an array of int16_t samples,
-   * buffer length must equal the hop size specified at ten_vad_create.
-   * @param[in]  audio_data_length  size of audio_data buffer, here should be equal to hop_size.
-   * @param[out] out_probability  Pointer to a float (size 1) that receives the
-   * voice activity probability in the range [0.0, 1.0].
-   * @param[out] out_flag         Pointer to an int (size 1) that receives the
-   * detection result: 0 = no voice, 1 = voice detected.
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_process(ten_vad_handle_t handle, const int16_t *audio_data, size_t audio_data_length,
-                                 float *out_probability, int *out_flag);
-  /**
-   * @brief Destroy a ten_vad instance and release its resources.
-   *
-   * @param[in,out] handle Pointer to the ten_vad handle; set to NULL on return.
-   * @return 0 on success, or -1 error occurs.
-   */
-  TENVAD_API int ten_vad_destroy(ten_vad_handle_t *handle);
-  /**
-   * @brief Get the ten_vad library version string.
-   *
-   * @return The version string (e.g., "1.0.0").
-   */
-  TENVAD_API const char *ten_vad_get_version(void);
-#ifdef __cplusplus
-}
-#endif
-#endif /* TEN_VAD_H */

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bbf0ab2d2ee30d9c170556efb9a7200a53725053cfa7c66a0dff79e7c9351e8
+size 2885

lib/macOS/ten_vad.framework/Versions/A/Resources/Info.plist CHANGED Viewed

@@ -1,44 +1,3 @@
-<?xml version="1.0" encoding="UTF-8"?>
-<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN" "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
-<plist version="1.0">
-<dict>
-	<key>BuildMachineOSBuild</key>
-	<string>23D60</string>
-	<key>CFBundleDevelopmentRegion</key>
-	<string>English</string>
-	<key>CFBundleExecutable</key>
-	<string>ten_vad</string>
-	<key>CFBundleIdentifier</key>
-	<string>com.yourcompany.ten_vad</string>
-	<key>CFBundleInfoDictionaryVersion</key>
-	<string>6.0</string>
-	<key>CFBundlePackageType</key>
-	<string>FMWK</string>
-	<key>CFBundleSignature</key>
-	<string>????</string>
-	<key>CFBundleSupportedPlatforms</key>
-	<array>
-		<string>MacOSX</string>
-	</array>
-	<key>CSResourcesFileMapped</key>
-	<true/>
-	<key>DTCompiler</key>
-	<string>com.apple.compilers.llvm.clang.1_0</string>
-	<key>DTPlatformBuild</key>
-	<string></string>
-	<key>DTPlatformName</key>
-	<string>macosx</string>
-	<key>DTPlatformVersion</key>
-	<string>14.2</string>
-	<key>DTSDKBuild</key>
-	<string>23C53</string>
-	<key>DTSDKName</key>
-	<string>macosx14.2</string>
-	<key>DTXcode</key>
-	<string>1520</string>
-	<key>DTXcodeBuild</key>
-	<string>15C500b</string>
-	<key>LSMinimumSystemVersion</key>
-	<string>10.10</string>
-</dict>
-</plist>

+version https://git-lfs.github.com/spec/v1
+oid sha256:5aa8df4f544b3143b819d6ffd5c21574c02884bf41cb2b7a8df45c7f10f75c3a
+size 1216

lib/macOS/ten_vad.framework/Versions/Current DELETED Viewed

	@@ -1 +0,0 @@
1	- A

lib/macOS/ten_vad.framework/Versions/Current/Headers/ten_vad.h ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9bbf0ab2d2ee30d9c170556efb9a7200a53725053cfa7c66a0dff79e7c9351e8
+size 2885

lib/macOS/ten_vad.framework/Versions/Current/Resources/Info.plist ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5aa8df4f544b3143b819d6ffd5c21574c02884bf41cb2b7a8df45c7f10f75c3a
+size 1216

lib/macOS/ten_vad.framework/Versions/Current/ten_vad ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81b2de13710670bb94fef315ab50fedc903a21c04c4290c6c2ac28d8b42e715a
+size 744600

lib/macOS/ten_vad.framework/ten_vad DELETED Viewed

	@@ -1 +0,0 @@
1	- Versions/Current/ten_vad

lib/macOS/ten_vad.framework/ten_vad ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:81b2de13710670bb94fef315ab50fedc903a21c04c4290c6c2ac28d8b42e715a
+size 744600

setup.py CHANGED Viewed

@@ -1,11 +1,5 @@
-#
-#  Copyright © 2025 Agora
-#  This file is part of TEN Framework, an open source project.
-#  Licensed under the Apache License, Version 2.0, with certain conditions.
-#  Refer to the "LICENSE" file in the root directory for more information.
-#
 from setuptools import setup
-import os, shutil, platform
 from setuptools.command.install import install
 class custom_install_command(install):
@@ -13,25 +7,8 @@ class custom_install_command(install):
         install.run(self)
         target_dir = os.path.join(self.install_lib, "ten_vad_library")
         os.makedirs(target_dir, exist_ok=True)
-        if platform.system() == "Linux" and platform.machine() == "x86_64":
-            shutil.copy("lib/Linux/x64/libten_vad.so", target_dir)
-            print(f"Linux x64 library installed to: {target_dir}")
-        elif platform.system() == "Darwin":
-            shutil.copy("lib/macOS/ten_vad.framework/Versions/A/ten_vad",
-                       os.path.join(target_dir, "libten_vad"))
-            print(f"macOS library installed to: {target_dir}")
-        elif platform.system().upper() == 'WINDOWS':
-            if platform.machine().upper() in ['X64', 'X86_64', 'AMD64']:
-                shutil.copy("lib/Windows/x64/ten_vad.dll",
-                       os.path.join(target_dir, "ten_vad.dll"))
-                print(f"Windows x64 library installed to: {target_dir}")
-            else:
-                shutil.copy("lib/Windows/x86/ten_vad.dll",
-                       os.path.join(target_dir, "ten_vad.dll"))
-                print(f"Windows x86 library installed to: {target_dir}")
-        else:
-            raise NotImplementedError(f"Unsupported platform: {platform.system()} {platform.machine()}")
 root_dir = os.path.dirname(os.path.abspath(__file__))
 shutil.copy(f"{root_dir}/include/ten_vad.py", f"{root_dir}/ten_vad.py")

 from setuptools import setup
+import os, shutil
 from setuptools.command.install import install
 class custom_install_command(install):
         install.run(self)
         target_dir = os.path.join(self.install_lib, "ten_vad_library")
         os.makedirs(target_dir, exist_ok=True)
+        shutil.copy("lib/Linux/x64/libten_vad.so", target_dir)
+        print(f"Files installed to: {target_dir}")
 root_dir = os.path.dirname(os.path.abspath(__file__))
 shutil.copy(f"{root_dir}/include/ten_vad.py", f"{root_dir}/ten_vad.py")

src/aed.cc DELETED Viewed

@@ -1,993 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#include <string.h>
-#include <stdlib.h>
-#include <algorithm>
-#include <math.h>
-#include "aed.h"
-#include "aed_st.h"
-#include "coeff.h"
-#include "pitch_est.h"
-#include "stft.h"
-#include <assert.h>
-#define AUP_AED_ALIGN8(o) (((o) + 7) & (~7))
-#define AUP_AED_MAX(x, y) (((x) > (y)) ? (x) : (y))
-#define AUP_AED_MIN(x, y) (((x) > (y)) ? (y) : (x))
-#define AUP_AED_EPS (1e-20f)
-/// ///////////////////////////////////////////////////////////////////////
-/// Internal Utils
-/// ///////////////////////////////////////////////////////////////////////
-AUP_MODULE_AIVAD::AUP_MODULE_AIVAD(char* onnx_path) {
-  ort_api = OrtGetApiBase()->GetApi(ORT_API_VERSION);
-  OrtStatus* status =
-      ort_api->CreateEnv(ORT_LOGGING_LEVEL_WARNING, "TEN-VAD", &ort_env);
-  if (status) {
-    printf("Failed to create env: %s\n", ort_api->GetErrorMessage(status));
-    ort_api->ReleaseStatus(status);
-    ort_api->ReleaseEnv(ort_env);
-    ort_env = NULL;
-    return;
-  }
-  OrtSessionOptions* session_options;
-  ort_api->CreateSessionOptions(&session_options);
-  ort_api->SetIntraOpNumThreads(session_options, 1);
-  status =
-      ort_api->CreateSession(ort_env, onnx_path, session_options, &ort_session);
-  ort_api->ReleaseSessionOptions(session_options);
-  if (status) {
-    printf("Failed to create ort_session: %s\n",
-           ort_api->GetErrorMessage(status));
-    ort_api->ReleaseStatus(status);
-    ort_api->ReleaseEnv(ort_env);
-    ort_env = NULL;
-    return;
-  }
-  ort_api->GetAllocatorWithDefaultOptions(&ort_allocator);
-  size_t num_inputs;
-  ort_api->SessionGetInputCount(ort_session, &num_inputs);
-  assert(num_inputs == AUP_AED_MODEL_IO_NUM);
-  for (size_t i = 0; i < num_inputs; i++) {
-    char* input_name;
-    ort_api->SessionGetInputName(ort_session, i, ort_allocator, &input_name);
-    strncpy(input_names_buf[i], input_name, sizeof(input_names_buf[i]));
-    input_names[i] = input_names_buf[i];
-    ort_api->AllocatorFree(ort_allocator, input_name);
-  }
-  size_t num_outputs;
-  ort_api->SessionGetOutputCount(ort_session, &num_outputs);
-  assert(num_outputs == AUP_AED_MODEL_IO_NUM);
-  for (size_t i = 0; i < num_outputs; i++) {
-    char* output_name;
-    ort_api->SessionGetOutputName(ort_session, i, ort_allocator, &output_name);
-    strncpy(output_names_buf[i], output_name, sizeof(output_names_buf[i]));
-    output_names[i] = output_names_buf[i];
-    ort_api->AllocatorFree(ort_allocator, output_name);
-  }
-  OrtMemoryInfo* memory_info;
-  status = ort_api->CreateCpuMemoryInfo(OrtDeviceAllocator, OrtMemTypeDefault,
-                                        &memory_info);
-  if (status != NULL) {
-    printf("Failed to create memory info: %s\n",
-           ort_api->GetErrorMessage(status));
-    ort_api->ReleaseStatus(status);
-    ort_api->ReleaseSession(ort_session);
-    ort_api->ReleaseEnv(ort_env);
-    ort_session = NULL;
-    ort_env = NULL;
-    return;
-  }
-  int64_t input_shapes0[] = {1, AUP_AED_CONTEXT_WINDOW_LEN, AUP_AED_FEA_LEN};
-  int64_t input_shapes1234[] = {1, AUP_AED_MODEL_HIDDEN_DIM};
-  for (int i = 0; i < num_inputs; i++) {
-    status = ort_api->CreateTensorWithDataAsOrtValue(
-        memory_info, i == 0 ? input_data_buf_0 : input_data_buf_1234[i - 1],
-        i == 0 ? sizeof(input_data_buf_0) : sizeof(input_data_buf_1234[i - 1]),
-        i == 0 ? input_shapes0 : input_shapes1234,
-        i == 0 ? sizeof(input_shapes0) / sizeof(input_shapes0[0])
-               : sizeof(input_shapes1234) / sizeof(input_shapes1234[0]),
-        ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT, &ort_input_tensors[i]);
-    if (status != NULL) {
-      printf("Failed to create input tensor %d: %s\n", i,
-             ort_api->GetErrorMessage(status));
-      ort_api->ReleaseStatus(status);
-      ort_api->ReleaseSession(ort_session);
-      ort_api->ReleaseEnv(ort_env);
-      ort_session = NULL;
-      ort_env = NULL;
-      return;
-    }
-  }
-  int64_t output_shapes0[] = {1, 1, 1};
-  int64_t output_shapes1234[] = {1, AUP_AED_MODEL_HIDDEN_DIM};
-  for (int i = 0; i < num_outputs; i++) {
-    status = ort_api->CreateTensorAsOrtValue(
-        ort_allocator, i == 0 ? output_shapes0 : output_shapes1234,
-        i == 0 ? sizeof(output_shapes0) / sizeof(output_shapes0[0])
-               : sizeof(output_shapes1234) / sizeof(output_shapes1234[0]),
-        ONNX_TENSOR_ELEMENT_DATA_TYPE_FLOAT, &ort_output_tensors[i]);
-    if (status != NULL) {
-      printf("Failed to create output tensor %d: %s\n", i,
-             ort_api->GetErrorMessage(status));
-      ort_api->ReleaseStatus(status);
-      ort_api->ReleaseSession(ort_session);
-      ort_api->ReleaseEnv(ort_env);
-      ort_session = NULL;
-      ort_env = NULL;
-      return;
-    }
-  }
-  inited = 1;
-}
-AUP_MODULE_AIVAD::~AUP_MODULE_AIVAD() {
-  for (int i = 0; i < AUP_AED_MODEL_IO_NUM; i++) {
-    if (ort_output_tensors[i]) {
-      ort_api->ReleaseValue(ort_output_tensors[i]);
-    }
-  }
-  if (ort_session) {
-    ort_api->ReleaseSession(ort_session);
-  }
-  if (ort_env) {
-    ort_api->ReleaseEnv(ort_env);
-  }
-}
-int AUP_MODULE_AIVAD::Process(float* input, float* output) {
-  if (!inited) {
-    printf("not inited!\n");
-    return -1;
-  }
-  memcpy(input_data_buf_0, input, sizeof(input_data_buf_0));
-  if (clear_hidden) {
-    memset(input_data_buf_1234, 0, sizeof(input_data_buf_1234));
-    clear_hidden = 0;
-  }
-  OrtStatus* status = ort_api->Run(
-      ort_session, NULL, input_names, ort_input_tensors, AUP_AED_MODEL_IO_NUM,
-      output_names, AUP_AED_MODEL_IO_NUM, ort_output_tensors);
-  float* output_data;
-  ort_api->GetTensorMutableData(ort_output_tensors[0], (void**)&output_data);
-  *output = output_data[0];
-  for (int i = 1; i < AUP_AED_MODEL_IO_NUM; i++) {
-    ort_api->GetTensorMutableData(ort_output_tensors[i], (void**)&output_data);
-    memcpy(input_data_buf_1234[i - 1], output_data,
-           sizeof(input_data_buf_1234[i - 1]));
-  }
-  return 0;
-}
-int AUP_MODULE_AIVAD::Reset() {
-  if (!inited) {
-    return -1;
-  }
-  clear_hidden = 1;
-  return 0;
-}
-static int AUP_Aed_checkStatCfg(Aed_StaticCfg* pCfg) {
-  if (pCfg == NULL) {
-    return -1;
-  }
-#if AUP_AED_FEA_LEN < AUP_AED_MEL_FILTER_BANK_NUM
-  return -1;
-#endif
-  if (pCfg->hopSz < 32) {
-    return -1;
-  }
-  if (pCfg->frqInputAvailableFlag == 1) {
-    if (pCfg->fftSz < 128 || pCfg->fftSz < pCfg->hopSz) {
-      return -1;
-    }
-    if (pCfg->anaWindowSz > pCfg->fftSz || pCfg->anaWindowSz < pCfg->hopSz) {
-      return -1;
-    }
-  }
-  return 0;
-}
-static int AUP_Aed_publishStaticCfg(Aed_St* stHdl) {
-  const Aed_StaticCfg* pStatCfg;
-  if (stHdl == NULL) {
-    return -1;
-  }
-  pStatCfg = (const Aed_StaticCfg*)(&(stHdl->stCfg));
-  stHdl->extFftSz = 0;
-  stHdl->extNBins = 0;
-  stHdl->extWinSz = 0;
-  if (pStatCfg->frqInputAvailableFlag == 1) {
-    stHdl->extFftSz = pStatCfg->fftSz;
-    stHdl->extNBins = (stHdl->extFftSz >> 1) + 1;
-    stHdl->extWinSz = pStatCfg->anaWindowSz;
-  }
-  stHdl->extHopSz = pStatCfg->hopSz;
-  stHdl->intFftSz = AUP_AED_ASSUMED_FFTSZ;
-  stHdl->intHopSz = AUP_AED_ASSUMED_HOPSZ;
-  stHdl->intWinSz = AUP_AED_ASSUMED_WINDOWSZ;
-  stHdl->intNBins = (stHdl->intFftSz >> 1) + 1;
-  stHdl->intAnalyWindowPtr = AUP_AED_STFTWindow_Hann768;
-  if (pStatCfg->frqInputAvailableFlag == 0 ||
-      stHdl->extHopSz != stHdl->intHopSz) {
-    // external STFT analysis framework is not supported at all
-    stHdl->intAnalyFlag =
-        2;  // internally redo analysis based on input time signal
-  } else if (stHdl->extFftSz == stHdl->intFftSz) {
-    // external STFT analysis framework completely match with internal
-    // requirement
-    stHdl->intAnalyFlag = 0;  // directly use external spectrum
-  } else {  // external spectrum need to be interpolated or extrapolated before
-            // AIVAD
-    stHdl->intAnalyFlag =
-        1;  // use external spectrum with interpolation / exterpolation
-  }
-  stHdl->inputTimeFIFOLen = stHdl->extHopSz + stHdl->intHopSz;
-  // for aiaed release2.0.0, pre-emphasis for input time-signal is needed,
-  // therefore, we need redo analysis based on input time signal preprocessed by
-  // pre-emphasis.
-  stHdl->intAnalyFlag =
-      2;  // internally redo analysis based on input time signal
-  stHdl->feaSz = (size_t)AUP_AED_FEA_LEN;
-  stHdl->melFbSz = (size_t)AUP_AED_MEL_FILTER_BANK_NUM;
-  stHdl->algDelay = (size_t)AUP_AED_LOOKAHEAD_NFRM;
-  stHdl->algCtxtSz = (size_t)AUP_AED_CONTEXT_WINDOW_LEN;
-  stHdl->frmRmsBufLen = AUP_AED_MAX(1, stHdl->algDelay);
-  return 0;
-}
-static int AUP_Aed_publishDynamCfg(Aed_St* stHdl) {
-  const Aed_DynamCfg* pDynmCfg;
-  PE_DynamCfg peDynmCfg;
-  if (stHdl == NULL) {
-    return -1;
-  }
-  pDynmCfg = (const Aed_DynamCfg*)(&(stHdl->dynamCfg));
-  stHdl->aivadResetFrmNum = pDynmCfg->resetFrameNum;
-  stHdl->voiceDecideThresh = pDynmCfg->extVoiceThr;
-  if (stHdl->pitchEstStPtr != NULL) {
-    peDynmCfg.voicedThr = pDynmCfg->pitchEstVoicedThr;
-    AUP_PE_setDynamCfg(stHdl->pitchEstStPtr, &peDynmCfg);
-  }
-  return 0;
-}
-// Resets all run-time state of the AED instance so that processing can start
-// from scratch: zeroes the dynamic work memory, restores counters and score
-// defaults, rebuilds the triangular mel filter-bank and re-initialises the
-// attached sub-modules (pitch estimator, AI-VAD, STFT analyzer).
-//
-// Returns 0 on success and -1 when stHdl is NULL, when the dynamic work
-// buffers have not been set up yet, when two consecutive mel band edges fall
-// onto the same FFT bin, or when a sub-module fails to initialise.
-static int AUP_Aed_resetVariables(Aed_St* stHdl) {
-  if (stHdl == NULL) {
-    return -1;
-  }
-  // The work buffers only exist after AUP_Aed_memAllocate(); without this
-  // guard an early AUP_Aed_init() would write through NULL pointers below.
-  if (stHdl->dynamMemPtr == NULL || stHdl->melFilterBankCoef == NULL ||
-      stHdl->melFilterBinBuff == NULL) {
-    return -1;
-  }
-  // first clear all the dynamic memory, all the dynamic variables which are
-  // not listed below are cleared to 0 by this step
-  memset(stHdl->dynamMemPtr, 0, stHdl->dynamMemSize);
-  float* melFbCoef = stHdl->melFilterBankCoef;
-  size_t* melBinBuff = stHdl->melFilterBinBuff;
-  size_t i, j;
-  size_t nBins = stHdl->intNBins;
-  size_t melFbSz = stHdl->melFbSz;
-  stHdl->aedProcFrmCnt = 0;
-  stHdl->inputTimeFIFOIdx = 0;
-  stHdl->aivadResetCnt = 0;
-  stHdl->timeSignalPre = 0.0f;
-  stHdl->aivadScore =
-      -1.0f;  // as default value, labeling as aed is not working yet
-  stHdl->aivadScorePre = -1.0f;
-  stHdl->pitchFreq = 0.0f;
-  // generate mel filter-bank coefficients: melFbSz + 2 band edges spaced
-  // uniformly on the mel scale between 0 Hz and 8000 Hz
-  float low_mel = 2595.0f * log10f(1.0f + 0.0f / 700.0f);
-  float high_mel = 2595.0f * log10f(1.0f + 8000.0f / 700.0f);
-  float mel_points = 0.0f;
-  float hz_points = 0.0f;
-  size_t idx = 0;
-  for (i = 0; i < melFbSz + 2; i++) {
-    mel_points = i * (high_mel - low_mel) / ((float)melFbSz + 1.0f) + low_mel;
-    hz_points = 700.0f * (powf(10.0f, mel_points / 2595.0f) - 1.0f);
-    melBinBuff[i] =
-        (size_t)((stHdl->intFftSz + 1.0f) * hz_points / (float)AUP_AED_FS);
-    // identical neighbouring edges would make the ramp widths below zero
-    // (division by zero), so such a configuration is rejected
-    if (i > 0 && melBinBuff[i] == melBinBuff[i - 1]) {
-      return -1;
-    }
-  }
-  for (j = 0; j < melFbSz; j++) {
-    // rising ramp from edge j up to edge j + 1
-    for (i = melBinBuff[j]; i < melBinBuff[j + 1]; i++) {
-      idx = j * nBins + i;
-      melFbCoef[idx] = (float)(i - melBinBuff[j]) /
-                       (float)(melBinBuff[j + 1] - melBinBuff[j]);
-    }
-    // falling ramp from edge j + 1 down to edge j + 2
-    for (i = melBinBuff[j + 1]; i < melBinBuff[j + 2]; i++) {
-      idx = j * nBins + i;
-      melFbCoef[idx] = (float)(melBinBuff[j + 2] - i) /
-                       (float)(melBinBuff[j + 2] - melBinBuff[j + 1]);
-    }
-  }
-  if (stHdl->pitchEstStPtr != NULL) {
-    if (AUP_PE_init(stHdl->pitchEstStPtr) < 0) {
-      return -1;
-    }
-  }
-  if (stHdl->aivadInf != NULL) {
-    stHdl->aivadInf->Reset();
-  }
-  if (stHdl->timeInAnalysis != NULL) {
-    if (AUP_Analyzer_init(stHdl->timeInAnalysis) < 0) {
-      return -1;
-    }
-  }
-  return 0;
-}
-// Returns cnter + 1, wrapping back to 0 once the incremented value reaches
-// 1000000000 (the original note calls this a reset "every half year").
-static int AUP_Aed_addOneCnter(int cnter) {
-  const int next = cnter + 1;
-  return (next >= 1000000000) ? 0 : next;
-}
-// Resamples a power spectrum from srcNBins bins to tgtNBins bins by picking,
-// for every target bin, the source bin at the proportional position
-// (truncated towards zero and clamped to the valid source range).
-//
-//   src      : [srcNBins] input power spectrum
-//   tgt      : [tgtNBins] output power spectrum
-//
-// Nothing is written when a pointer is NULL or a bin count is not positive.
-static void AUP_Aed_binPowerConvert(const float* src, float* tgt, int srcNBins,
-                                    int tgtNBins) {
-  float rate;
-  int srcIdx, tgtIdx;
-  if (src == NULL || tgt == NULL || srcNBins <= 0 || tgtNBins <= 0) {
-    return;
-  }
-  if (srcNBins == tgtNBins) {
-    memcpy(tgt, src, sizeof(float) * tgtNBins);
-    return;
-  }
-  // A single target bin has no span to stretch over: (tgtNBins - 1) would be
-  // a zero divisor, so map it straight onto source bin 0.
-  rate = (tgtNBins > 1) ? (float)(srcNBins - 1) / (float)(tgtNBins - 1) : 0.0f;
-  for (tgtIdx = 0; tgtIdx < tgtNBins; tgtIdx++) {
-    srcIdx = (int)(tgtIdx * rate);
-    if (srcIdx < 0) {
-      srcIdx = 0;
-    }
-    if (srcIdx > srcNBins - 1) {
-      srcIdx = srcNBins - 1;
-    }
-    tgt[tgtIdx] = src[srcIdx];
-  }
-  return;
-}
-// Converts a packed complex spectrum into per-bin power.
-// Layout read from cmplxSpctr: element 0 holds the (real-only) value of bin 0,
-// element 1 the (real-only) value of bin nBins - 1, and every bin k in
-// between is stored as the pair (cmplxSpctr[2k], cmplxSpctr[2k + 1]).
-//   binPow : [nBins] output, |X[k]|^2 for every bin
-static void AUP_Aed_CalcBinPow(int nBins, const float* cmplxSpctr,
-                               float* binPow) {
-  const int lastBin = nBins - 1;
-  // the two edge bins carry a single component each
-  binPow[0] = cmplxSpctr[0] * cmplxSpctr[0];
-  binPow[lastBin] = cmplxSpctr[1] * cmplxSpctr[1];
-  // interior bins: squared real part plus squared imaginary part
-  const float* pair = cmplxSpctr + 2;
-  for (int bin = 1; bin < lastBin; ++bin, pair += 2) {
-    binPow[bin] = pair[0] * pair[0] + pair[1] * pair[1];
-  }
-}
-// Packs one frame (time signal + power spectrum) into the pitch estimator's
-// input structure and runs AUP_PE_proc on it.
-// pOut is preset to "no pitch" (pitchFreq = 0, voiced = -1) before the call;
-// the return value is whatever AUP_PE_proc returns.
-static int AUP_Aed_pitch_proc(void* pitchModule, const float* timeSignal,
-                              size_t timeLen, const float* binPow, size_t nBins,
-                              PE_OutputData* pOut) {
-  pOut->voiced = -1;
-  pOut->pitchFreq = 0;
-  PE_InputData frame;
-  frame.inBinPow = binPow;
-  frame.nBins = (int)nBins;
-  frame.timeSignal = timeSignal;
-  frame.hopSz = (int)timeLen;
-  return AUP_PE_proc(pitchModule, &frame, pOut);
-}
-// Builds the feature vector of the current frame, appends it to the context
-// stack and runs the AI-VAD network on the whole stack.
-//
-//   stHdl      : AED state (feature stack, mel filter-bank, inference engine)
-//   inBinPow   : [intNBins] power spectrum of the current frame
-//   aivadScore : receives the network output; -1 when no inference engine is
-//                attached
-//
-// Returns 0 on success, -1 on a NULL argument or when inference fails.
-static int AUP_Aed_aivad_proc(Aed_St* stHdl, const float* inBinPow,
-                              float* aivadScore) {
-  if (stHdl == NULL || inBinPow == NULL || aivadScore == NULL) {
-    return -1;
-  }
-  size_t i, j;
-  size_t nBins = stHdl->intNBins;
-  size_t melFbSz = stHdl->melFbSz;
-  size_t srcOffset;
-  size_t srcLen;
-  float* aivadInputFeatStack = stHdl->aivadInputFeatStack;
-  float* melFbCoef = stHdl->melFilterBankCoef;
-  const float* aivadFeatMean = AUP_AED_FEATURE_MEANS;
-  const float* aivadFeatStd = AUP_AED_FEATURE_STDS;
-  float* curMelFbCoefPtr = NULL;
-  float* curInputFeatPtr = NULL;
-  float perBandValue = 0.0f;
-  float powerNormal = 32768.0f * 32768.0f;
-  // update aivad feature buff.: drop the oldest frame, the newest one is
-  // written into the freed slot at the end of the stack
-  srcOffset = stHdl->feaSz;
-  srcLen = (stHdl->algCtxtSz - 1) * stHdl->feaSz;
-  memmove(aivadInputFeatStack, aivadInputFeatStack + srcOffset,
-          sizeof(float) * srcLen);
-  curInputFeatPtr = aivadInputFeatStack + srcLen;
-  // cal. mel-filter-bank feature: log band energy, then mean/std normalised
-  for (i = 0; i < melFbSz; i++) {
-    perBandValue = 0.0f;
-    curMelFbCoefPtr = melFbCoef + i * nBins;
-    for (j = 0; j < nBins; j++) {
-      perBandValue += (inBinPow[j] * curMelFbCoefPtr[j]);
-    }
-    perBandValue = perBandValue / powerNormal;
-    perBandValue = logf(perBandValue + AUP_AED_EPS);
-    curInputFeatPtr[i] =
-        (perBandValue - aivadFeatMean[i]) / (aivadFeatStd[i] + AUP_AED_EPS);
-  }
-  // extra feat.: the remaining slots carry the normalised pitch frequency
-  for (i = melFbSz; i < stHdl->feaSz; i++) {
-    curInputFeatPtr[i] =
-        (stHdl->pitchFreq - aivadFeatMean[i]) / (aivadFeatStd[i] + AUP_AED_EPS);
-  }
-  // exe. aivad
-  // Without an inference engine no score can be produced; start from the
-  // "not available" value (-1) instead of reading an uninitialised local.
-  float aivadOutput = -1.0f;
-  if (stHdl->aivadInf != NULL &&
-      stHdl->aivadInf->Process(stHdl->aivadInputFeatStack, &aivadOutput) != 0) {
-    return -1;
-  }
-  (*aivadScore) = aivadOutput;
-  // reset the network every aivadResetFrmNum processed frames; as before, the
-  // result of Reset() is not acted upon
-  stHdl->aivadResetCnt += 1;
-  if (stHdl->aivadResetCnt >= stHdl->aivadResetFrmNum) {
-    if (stHdl->aivadInf != NULL) {
-      (void)stHdl->aivadInf->Reset();
-    }
-    stHdl->aivadResetCnt = 0;
-  }
-  return 0;
-}
-// Lays out every per-instance work buffer inside one contiguous memory block.
-//
-// Two modes:
-//   * memPtrExt == NULL : query only, no pointer in stHdl is touched and the
-//     number of bytes required is returned;
-//   * memPtrExt != NULL : the buffer pointers in stHdl are pointed into the
-//     block, which must provide at least the required number of bytes
-//     (memSize).
-// Every region size goes through AUP_AED_ALIGN8 (presumably rounding up to a
-// multiple of 8 bytes; the macro is defined outside this function).
-//
-// Returns the required size in bytes, or -1 for a NULL handle or a block that
-// is too small.
-static int AUP_Aed_dynamMemPrepare(Aed_St* stHdl, void* memPtrExt,
-                                   size_t memSize) {
-  if (stHdl == NULL) {
-    return -1;
-  }
-  // ---- size of each region -------------------------------------------------
-  const size_t timeFifoBytes =
-      AUP_AED_ALIGN8(sizeof(float) * stHdl->inputTimeFIFOLen);
-  const size_t emphFifoBytes =
-      AUP_AED_ALIGN8(sizeof(float) * stHdl->inputTimeFIFOLen);
-  const size_t spectrumBytes = AUP_AED_ALIGN8(sizeof(float) * stHdl->intFftSz);
-  const size_t binPowBytes = AUP_AED_ALIGN8(sizeof(float) * stHdl->intNBins);
-  const size_t featStackBytes =
-      AUP_AED_ALIGN8(sizeof(float) * stHdl->algCtxtSz * stHdl->feaSz);
-  // a second feature stack is accounted for in the total but never handed
-  // out below, so it ends up as slack at the end of the block
-  const size_t spareFeatStackBytes =
-      AUP_AED_ALIGN8(sizeof(float) * stHdl->algCtxtSz * stHdl->feaSz);
-  const size_t melCoefBytes =
-      AUP_AED_ALIGN8(sizeof(float) * stHdl->intNBins * stHdl->feaSz);
-  const size_t melEdgeBytes =
-      AUP_AED_ALIGN8(sizeof(size_t) * (stHdl->feaSz + 2));
-  const size_t rmsBytes = AUP_AED_ALIGN8(stHdl->frmRmsBufLen * sizeof(float));
-  const size_t floatInBytes = AUP_AED_ALIGN8(stHdl->extHopSz * sizeof(float));
-  const size_t requiredBytes = timeFifoBytes + emphFifoBytes + spectrumBytes +
-                               binPowBytes + featStackBytes +
-                               spareFeatStackBytes + melCoefBytes +
-                               melEdgeBytes + rmsBytes + floatInBytes;
-  if (memPtrExt == NULL) {
-    return ((int)requiredBytes);  // query mode
-  }
-  if (requiredBytes > memSize) {
-    return -1;
-  }
-  // ---- carve the block, one region after the other --------------------------
-  char* const base = (char*)memPtrExt;
-  char* cursor = base;
-  stHdl->inputTimeFIFO = (float*)cursor;
-  cursor += timeFifoBytes;
-  stHdl->inputEmphTimeFIFO = (float*)cursor;
-  cursor += emphFifoBytes;
-  stHdl->aivadInputCmplxSptrm = (float*)cursor;
-  cursor += spectrumBytes;
-  stHdl->aivadInputBinPow = (float*)cursor;
-  cursor += binPowBytes;
-  stHdl->aivadInputFeatStack = (float*)cursor;
-  cursor += featStackBytes;
-  stHdl->melFilterBankCoef = (float*)cursor;
-  cursor += melCoefBytes;
-  stHdl->melFilterBinBuff = (size_t*)cursor;
-  cursor += melEdgeBytes;
-  stHdl->frameRmsBuff = (float*)cursor;
-  cursor += rmsBytes;
-  stHdl->inputFloatBuff = (float*)cursor;
-  cursor += floatInBytes;
-  // sanity check: the carved regions must not exceed the computed total
-  if (((size_t)(cursor - base)) > requiredBytes) {
-    return -1;
-  }
-  return ((int)requiredBytes);
-}
-// Runs the per-frame pipeline: pitch estimation first, then the AI-VAD
-// network (which consumes the freshly stored pitch as a feature).
-// On success stHdl->pitchFreq and stHdl->aivadScore hold the results of this
-// frame. Returns 0 on success, -1 when either stage fails.
-static int AUP_Aed_runOneFrm(Aed_St* stHdl, const float* tSignal, int hopSz,
-                             const float* binPowPtr, int nBins) {
-  PE_OutputData peOutData = {0, 0};
-  float aivadScore = -1.0f;
-  if (AUP_Aed_pitch_proc(stHdl->pitchEstStPtr, tSignal, hopSz, binPowPtr, nBins,
-                         &peOutData) < 0) {
-    return -1;
-  }
-  // must be stored before the AI-VAD call, which reads stHdl->pitchFreq
-  stHdl->pitchFreq = peOutData.pitchFreq;
-  if (AUP_Aed_aivad_proc(stHdl, binPowPtr, &aivadScore) < 0) {
-    return -1;
-  }
-  stHdl->aivadScore = aivadScore;
-  return 0;
-}
-/// ///////////////////////////////////////////////////////////////////////
-/// Public API
-/// ///////////////////////////////////////////////////////////////////////
-// Allocates a zero-initialised AED state, creates its pitch-estimator and
-// STFT-analyzer sub-modules and fills in the default static/dynamic
-// configuration. The returned handle is not ready for processing until
-// AUP_Aed_memAllocate() and AUP_Aed_init() have been called.
-//
-//   stPtr : receives the new handle on success; left untouched on failure
-//
-// Returns 0 on success, -1 on a NULL argument or when an allocation or
-// sub-module creation fails (everything allocated so far is released).
-int AUP_Aed_create(void** stPtr) {
-  if (stPtr == NULL) {
-    return -1;
-  }
-  Aed_St* tmpPtr = (Aed_St*)malloc(sizeof(Aed_St));
-  if (tmpPtr == NULL) {
-    return -1;
-  }
-  memset(tmpPtr, 0, sizeof(Aed_St));
-  if (AUP_PE_create(&(tmpPtr->pitchEstStPtr)) < 0) {
-    free(tmpPtr);  // do not leak the half-built state
-    return -1;
-  }
-  if (AUP_Analyzer_create(&(tmpPtr->timeInAnalysis)) < 0) {
-    // roll back the pitch estimator created above, then the state itself
-    AUP_PE_destroy(&(tmpPtr->pitchEstStPtr));
-    free(tmpPtr);
-    return -1;
-  }
-  tmpPtr->stCfg.enableFlag = 1;  // as default, module enabled
-  tmpPtr->stCfg.fftSz = 1024;
-  tmpPtr->stCfg.hopSz = 256;
-  tmpPtr->stCfg.anaWindowSz = 768;
-  tmpPtr->stCfg.frqInputAvailableFlag = 0;
-  tmpPtr->dynamCfg.extVoiceThr = 0.5f;
-  tmpPtr->dynamCfg.extMusicThr = 0.5f;
-  tmpPtr->dynamCfg.extEnergyThr = 10.0f;
-  tmpPtr->dynamCfg.resetFrameNum = 1875;  // TODO
-  tmpPtr->dynamCfg.pitchEstVoicedThr = AUP_AED_PITCH_EST_DEFAULT_VOICEDTHR;
-  (*stPtr) = (void*)tmpPtr;
-  return 0;
-}
-// Releases an AED instance together with everything it owns: the AI-VAD
-// inference object, the pitch estimator, the STFT analyzer and the dynamic
-// work memory.
-//
-//   stPtr : address of the handle; *stPtr is set to NULL once the instance
-//           has been released
-//
-// Returns 0 on success and -1 on a NULL argument or when a sub-module
-// reported an error while being destroyed. Even in the latter case the
-// remaining resources are still released, so nothing is leaked and the
-// handle is never left half-destroyed.
-int AUP_Aed_destroy(void** stPtr) {
-  if (stPtr == NULL || (*stPtr) == NULL) {
-    return -1;
-  }
-  Aed_St* stHdl = (Aed_St*)(*stPtr);
-  int ret = 0;
-  delete stHdl->aivadInf;  // deleting a NULL pointer is a no-op
-  stHdl->aivadInf = NULL;
-  if (AUP_PE_destroy(&(stHdl->pitchEstStPtr)) < 0) {
-    ret = -1;  // remember the failure but keep releasing the rest
-  }
-  if (AUP_Analyzer_destroy(&(stHdl->timeInAnalysis)) < 0) {
-    ret = -1;
-  }
-  free(stHdl->dynamMemPtr);  // free(NULL) is a no-op
-  stHdl->dynamMemPtr = NULL;
-  free(stHdl);
-  (*stPtr) = NULL;
-  return ret;
-}
-// Applies a static configuration and (re)allocates everything that depends
-// on it: the AI-VAD inference object, the pitch-estimator and STFT-analyzer
-// memory and the contiguous block holding all work buffers. The dynamic
-// configuration currently stored in the state is re-published at the end.
-//
-//   stPtr : handle returned by AUP_Aed_create
-//   pCfg  : static configuration to apply (copied into the state)
-//
-// Returns 0 on success, -1 on a NULL argument, an invalid configuration, or
-// when any allocation / sub-module step fails.
-int AUP_Aed_memAllocate(void* stPtr, const Aed_StaticCfg* pCfg) {
-  Aed_St* stHdl = (Aed_St*)(stPtr);
-  Aed_StaticCfg aedStatCfg;
-  PE_StaticCfg pitchStatCfg;
-  Analyzer_StaticCfg analyzerStatCfg;
-  int totalMemSize = 0;
-  if (stPtr == NULL || pCfg == NULL) {
-    return -1;
-  }
-  // 1st: check static cfg. on a local copy before committing it
-  memcpy(&aedStatCfg, pCfg, sizeof(Aed_StaticCfg));
-  if (AUP_Aed_checkStatCfg(&aedStatCfg) < 0) {
-    return -1;
-  }
-  memcpy(&(stHdl->stCfg), &aedStatCfg, sizeof(Aed_StaticCfg));
-  // 2nd: publish static configuration to internal static configuration
-  // registers
-  if (AUP_Aed_publishStaticCfg(stHdl) < 0) {
-    return -1;
-  }
-  // 3rd: create aivad instance
-  // NOTE(review): a plain `new` reports failure by throwing, so the NULL
-  // check below is only effective with a non-throwing allocator.
-  if (stHdl->aivadInf == NULL) {
-    stHdl->aivadInf = new AUP_MODULE_AIVAD("onnx_model/ten-vad.onnx");
-    if (stHdl->aivadInf == NULL) {
-      return -1;
-    }
-  }
-  stHdl->aivadInf->Reset();
-  // 4th: memAllocate operation for Pitch-Estimator ............
-  if (AUP_PE_getStaticCfg(stHdl->pitchEstStPtr, &pitchStatCfg) < 0) {
-    return -1;
-  }
-  pitchStatCfg.fftSz = stHdl->intFftSz;
-  pitchStatCfg.anaWindowSz = stHdl->intWinSz;
-  pitchStatCfg.hopSz = stHdl->intHopSz;
-  pitchStatCfg.useLPCPreFiltering = AUP_AED_PITCH_EST_USE_LPC;
-  pitchStatCfg.procFs = AUP_AED_PITCH_EST_PROCFS;
-  if (AUP_PE_memAllocate(stHdl->pitchEstStPtr, &pitchStatCfg) < 0) {
-    return -1;
-  }
-  // creation and initialization with time-analysis module ......
-  // The analyzer config is only partially overwritten below, so a failed
-  // read must not be ignored: the remaining fields would be uninitialised.
-  if (AUP_Analyzer_getStaticCfg(stHdl->timeInAnalysis, &analyzerStatCfg) < 0) {
-    return -1;
-  }
-  analyzerStatCfg.win_len = (int)stHdl->intWinSz;
-  analyzerStatCfg.hop_size = (int)stHdl->intHopSz;
-  analyzerStatCfg.fft_size = (int)stHdl->intFftSz;
-  analyzerStatCfg.ana_win_coeff = stHdl->intAnalyWindowPtr;
-  if (AUP_Analyzer_memAllocate(stHdl->timeInAnalysis, &analyzerStatCfg) < 0) {
-    return -1;
-  }
-  // 5th: check memory requirement ..............................
-  totalMemSize = AUP_Aed_dynamMemPrepare(stHdl, NULL, 0);
-  if (totalMemSize < 0) {
-    return -1;
-  }
-  // 6th: allocate dynamic memory (an existing block is reused when it is
-  // already large enough)
-  if (totalMemSize > (int)stHdl->dynamMemSize) {
-    if (stHdl->dynamMemPtr != NULL) {
-      free(stHdl->dynamMemPtr);
-      stHdl->dynamMemPtr = NULL;
-      stHdl->dynamMemSize = 0;
-    }
-    stHdl->dynamMemPtr = malloc(totalMemSize);
-    if (stHdl->dynamMemPtr == NULL) {
-      return -1;
-    }
-    stHdl->dynamMemSize = totalMemSize;
-  }
-  memset(stHdl->dynamMemPtr, 0, stHdl->dynamMemSize);
-  // 7th: setup the pointers/variable
-  if (AUP_Aed_dynamMemPrepare(stHdl, stHdl->dynamMemPtr, stHdl->dynamMemSize) <
-      0) {
-    return -1;
-  }
-  // 8th: publish internal dynamic config registers
-  if (AUP_Aed_publishDynamCfg(stHdl) < 0) {
-    return -1;
-  }
-  return 0;
-}
-// (Re)initialises an AED instance: re-publishes the dynamic configuration and
-// then resets all run-time variables.
-// Returns 0 on success, -1 on a NULL handle or when either step fails.
-int AUP_Aed_init(void* stPtr) {
-  if (stPtr == NULL) {
-    return -1;
-  }
-  Aed_St* const state = static_cast<Aed_St*>(stPtr);
-  // the reset only runs when publishing succeeded (short-circuit evaluation)
-  const bool ok = (AUP_Aed_publishDynamCfg(state) >= 0) &&
-                  (AUP_Aed_resetVariables(state) >= 0);
-  return ok ? 0 : -1;
-}
-// Stores a new dynamic configuration in the state and publishes it to the
-// internal registers right away.
-// Returns 0 on success, -1 on a NULL argument or when publishing fails.
-int AUP_Aed_setDynamCfg(void* stPtr, const Aed_DynamCfg* pCfg) {
-  if (stPtr == NULL || pCfg == NULL) {
-    return -1;
-  }
-  Aed_St* const state = static_cast<Aed_St*>(stPtr);
-  memcpy(&(state->dynamCfg), pCfg, sizeof(Aed_DynamCfg));
-  return (AUP_Aed_publishDynamCfg(state) < 0) ? -1 : 0;
-}
-// Copies the static configuration stored in the state into *pCfg.
-// Returns 0 on success, -1 when either pointer is NULL.
-int AUP_Aed_getStaticCfg(const void* stPtr, Aed_StaticCfg* pCfg) {
-  if (stPtr != NULL && pCfg != NULL) {
-    const Aed_St* const state = static_cast<const Aed_St*>(stPtr);
-    memcpy(pCfg, &(state->stCfg), sizeof(Aed_StaticCfg));
-    return 0;
-  }
-  return -1;
-}
-// Copies the dynamic configuration stored in the state into *pCfg.
-// Returns 0 on success, -1 when either pointer is NULL.
-int AUP_Aed_getDynamCfg(const void* stPtr, Aed_DynamCfg* pCfg) {
-  if (stPtr != NULL && pCfg != NULL) {
-    const Aed_St* const state = static_cast<const Aed_St*>(stPtr);
-    memcpy(pCfg, &(state->dynamCfg), sizeof(Aed_DynamCfg));
-    return 0;
-  }
-  return -1;
-}
-// Reports the algorithmic delay of the module, in processing frames.
-// Returns 0 on success, -1 when either pointer is NULL.
-int AUP_Aed_getAlgDelay(const void* stPtr, int* delayInFrms) {
-  if (stPtr != NULL && delayInFrms != NULL) {
-    const Aed_St* const state = static_cast<const Aed_St*>(stPtr);
-    *delayInFrms = static_cast<int>(state->algDelay);
-    return 0;
-  }
-  return -1;
-}
-// Processes one hop of input audio.
-//
-// The hop's energy / RMS are computed, the samples (raw and pre-emphasised)
-// are appended to the input FIFOs and, depending on intAnalyFlag, zero or
-// more internal frames are run through pitch estimation and AI-VAD:
-//   0 : the caller's power spectrum is used as is
-//   1 : the caller's power spectrum is resampled to the internal bin count
-//   2 : the spectrum is recomputed from the pre-emphasised time signal
-//
-//   stPtr : handle that went through create, memAllocate and init
-//   pIn   : input hop (time signal, optionally a power spectrum)
-//   pOut  : receives frame energy, (delayed) frame RMS, pitch, voice
-//           probability and the VAD decision (-1 while no score exists)
-//
-// Returns 0 on success (also when the module is disabled, in which case pOut
-// is not written) and -1 on invalid arguments, an unprepared handle, a FIFO
-// overflow or a failing sub-module.
-int AUP_Aed_proc(void* stPtr, const Aed_InputData* pIn, Aed_OutputData* pOut) {
-  Analyzer_InputData analyzerInput;
-  Analyzer_OutputData analyzerOutput;
-  Aed_St* stHdl = (Aed_St*)(stPtr);
-  const float* binPowPtr = NULL;
-  float frameRms = 0.0f;
-  float frameEnergy = 0.0f;
-  float powerNormal = 32768.0f * 32768.0f;
-  int idx;
-  if (stPtr == NULL) {
-    return -1;
-  }
-  if (stHdl->stCfg.enableFlag == 0) {  // this module is disabled
-    return 0;
-  }
-  if (pIn == NULL || pIn->timeSignal == NULL || pOut == NULL) {
-    return -1;
-  }
-  // An empty hop would turn the RMS into 0/0 and a negative length would be
-  // converted into a huge size for the copies below.
-  if (pIn->hopSz <= 0) {
-    return -1;
-  }
-  // The work buffers only exist after AUP_Aed_memAllocate().
-  if (stHdl->dynamMemPtr == NULL || stHdl->frmRmsBufLen == 0) {
-    return -1;
-  }
-  if (stHdl->intAnalyFlag != 2) {  // the external spectra is going to be used
-    if (pIn->binPower == NULL) {
-      return -1;
-    }
-    if (pIn->nBins != (int)((stHdl->stCfg.fftSz >> 1) + 1) ||
-        pIn->hopSz != (int)(stHdl->stCfg.hopSz)) {
-      return -1;
-    }
-  }
-  // cal. input frame energy ....
-  for (idx = 0; idx < pIn->hopSz; idx++) {
-    frameRms += (pIn->timeSignal[idx] * pIn->timeSignal[idx]);
-  }
-  frameEnergy = frameRms;
-  frameRms = sqrtf(frameRms / (float)pIn->hopSz);
-  // the RMS goes through a FIFO so that it lines up with the delayed VAD
-  // result; the oldest entry is what gets reported
-  memmove(stHdl->frameRmsBuff, stHdl->frameRmsBuff + 1,
-          sizeof(float) * (stHdl->frmRmsBufLen - 1));
-  stHdl->frameRmsBuff[stHdl->frmRmsBufLen - 1] = frameRms;
-  // input signal conversion .........
-  if ((stHdl->inputTimeFIFOIdx + pIn->hopSz) > (int)stHdl->inputTimeFIFOLen) {
-    return -1;
-  }
-  // update pre-emphasis time signal FIFO: y[n] = x[n] - 0.97 * x[n - 1]
-  float* timeSigEphaPtr = stHdl->inputEmphTimeFIFO + stHdl->inputTimeFIFOIdx;
-  for (idx = 0; idx < pIn->hopSz; idx++) {
-    timeSigEphaPtr[idx] = pIn->timeSignal[idx] - 0.97f * stHdl->timeSignalPre;
-    stHdl->timeSignalPre = pIn->timeSignal[idx];
-  }
-  memcpy(stHdl->inputTimeFIFO + stHdl->inputTimeFIFOIdx, pIn->timeSignal,
-         sizeof(float) * (pIn->hopSz));
-  stHdl->inputTimeFIFOIdx += pIn->hopSz;
-  if (stHdl->intAnalyFlag == 0) {  // directly use external spectra
-    if (stHdl->inputTimeFIFOIdx != (int)(stHdl->intHopSz) ||
-        (int)(stHdl->intNBins) != pIn->nBins) {
-      return -1;
-    }
-    // one-time processing ...
-    stHdl->aedProcFrmCnt = AUP_Aed_addOneCnter(stHdl->aedProcFrmCnt);
-    binPowPtr = pIn->binPower;
-    // update: stHdl->pitchFreq, stHdl->aivadScore
-    if (AUP_Aed_runOneFrm(stHdl, stHdl->inputTimeFIFO, (int)stHdl->intHopSz,
-                          binPowPtr, (int)stHdl->intNBins) < 0) {
-      return -1;
-    }
-    // update the inputTimeFIFO
-    stHdl->inputTimeFIFOIdx = 0;
-  } else if (stHdl->intAnalyFlag ==
-             1) {  // do interpolation or extrapolation with external spectra
-    if (stHdl->inputTimeFIFOIdx != (int)(stHdl->intHopSz) ||
-        (int)(stHdl->extNBins) != pIn->nBins) {
-      return -1;
-    }
-    // one-time processing ....
-    stHdl->aedProcFrmCnt = AUP_Aed_addOneCnter(stHdl->aedProcFrmCnt);
-    AUP_Aed_binPowerConvert(pIn->binPower, stHdl->aivadInputBinPow,
-                            (int)stHdl->extNBins, (int)stHdl->intNBins);
-    binPowPtr = stHdl->aivadInputBinPow;
-    // update: stHdl->pitchFreq, stHdl->aivadScore
-    if (AUP_Aed_runOneFrm(stHdl, stHdl->inputTimeFIFO, (int)stHdl->intHopSz,
-                          binPowPtr, (int)stHdl->intNBins) < 0) {
-      return -1;
-    }
-    // update the inputTimeFIFO
-    stHdl->inputTimeFIFOIdx = 0;
-  } else {  // we need to do STFT on the input time-signal
-    if (stHdl->timeInAnalysis == NULL) {
-      return -1;
-    }
-    // loop processing: consume one internal hop per iteration
-    while (stHdl->inputTimeFIFOIdx >= (int)stHdl->intHopSz) {
-      stHdl->aedProcFrmCnt = AUP_Aed_addOneCnter(stHdl->aedProcFrmCnt);
-      analyzerInput.input = stHdl->inputEmphTimeFIFO;
-      analyzerInput.iLength = (int)stHdl->intHopSz;
-      analyzerOutput.output = stHdl->aivadInputCmplxSptrm;
-      analyzerOutput.oLength = (int)stHdl->intFftSz;
-      if (AUP_Analyzer_proc(stHdl->timeInAnalysis, &analyzerInput,
-                            &analyzerOutput) < 0) {
-        return -1;
-      }
-      AUP_Aed_CalcBinPow((int)stHdl->intNBins, stHdl->aivadInputCmplxSptrm,
-                         stHdl->aivadInputBinPow);
-      binPowPtr = stHdl->aivadInputBinPow;
-      // update: stHdl->pitchFreq, stHdl->aivadScore
-      if (AUP_Aed_runOneFrm(stHdl, stHdl->inputTimeFIFO, (int)stHdl->intHopSz,
-                            binPowPtr, (int)stHdl->intNBins) < 0) {
-        return -1;
-      }
-      // update the inputTimeFIFO & inputEmphTimeFIFO.....
-      // memmove, not memcpy: source and destination overlap as soon as more
-      // than one internal hop is left in the FIFO
-      if (stHdl->inputTimeFIFOIdx > (int)stHdl->intHopSz) {
-        memmove(stHdl->inputTimeFIFO, stHdl->inputTimeFIFO + stHdl->intHopSz,
-                sizeof(float) * (stHdl->inputTimeFIFOIdx - stHdl->intHopSz));
-        memmove(stHdl->inputEmphTimeFIFO,
-                stHdl->inputEmphTimeFIFO + stHdl->intHopSz,
-                sizeof(float) * (stHdl->inputTimeFIFOIdx - stHdl->intHopSz));
-      }
-      stHdl->inputTimeFIFOIdx -= (int)stHdl->intHopSz;
-    }
-  }
-  // write to output res.
-  pOut->frameEnergy = frameEnergy / powerNormal;
-  pOut->frameRms = stHdl->frameRmsBuff[0];
-  pOut->pitchFreq = stHdl->pitchFreq;
-  pOut->voiceProb = stHdl->aivadScore;
-  if (pOut->voiceProb < 0.0f) {
-    pOut->vadRes = -1;  // no score available yet
-  } else if (pOut->voiceProb <= stHdl->voiceDecideThresh) {
-    pOut->vadRes = 0;
-  } else {
-    pOut->vadRes = 1;
-  }
-  return 0;
-}

src/aed.h DELETED Viewed

@@ -1,226 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#ifndef __AED_H__
-#define __AED_H__
-#include <stdint.h>
-#include <stdlib.h>
-#define AUP_AED_MAX_FFT_SZ (1024)  // the max. fft-size supported by the module
-#define AUP_AED_MAX_NBINS ((AUP_AED_MAX_FFT_SZ >> 1) + 1)  // bin count at the max. fft-size: fftSz / 2 + 1
-#define AUP_AED_FS (16000)  // assumed input sampling rate, in Hz
-// Configuration parameters which impact the dynamic memory occupation; they
-// can only be set during allocation (AUP_Aed_memAllocate)
-typedef struct Aed_StaticCfg_ {
-  int enableFlag;  // flag to enable or disable this module
-  // 0: disable, otherwise: enable
-  size_t fftSz;               // fft-size, only support: 128, 256, 512, 1024
-  size_t hopSz;               // fft-Hop Size, will be used to check
-  size_t anaWindowSz;         // fft-window Size, will be used to calc rms
-  int frqInputAvailableFlag;  // whether Aed_InputData will contain external
-                              // freq. power-spectra
-} Aed_StaticCfg;
-// Configuration parameters which can be modified/set every frame
-typedef struct Aed_DynamCfg_ {
-  float extVoiceThr;        // threshold for ai based voice decision [0,1]
-  float extMusicThr;        // threshold for ai based music decision [0,1]
-  float extEnergyThr;       // threshold for energy based vad decision [0, ---]
-  size_t resetFrameNum;     // frame number for aivad reset [1875, 75000]
-  float pitchEstVoicedThr;  // threshold for pitch-estimator to output estimated
-                            // pitch
-} Aed_DynamCfg;
-// Spectra are assumed to be generated from time-domain samples in [-32768,
-// 32767], with or without pre-emphasis operation
-typedef struct Aed_InputData_ {
-  const float* binPower;  // [NBins], power spectrum of 16KHz samples
-  int nBins;  // number of entries in binPower
-  const float*
-      timeSignal;  // [hopSz]   // this frame's input signal, in [-32768, 32767]
-  int hopSz;       // should be equal to StaticCfg->hopSz
-} Aed_InputData;
-// per-frame results returned by AUP_Aed_proc
-typedef struct Aed_OutputData_ {
-  float frameEnergy;  // frame energy for input normalized data
-  float frameRms;     // rms for input int16 data
-  int energyVadRes;  // vad res 0/1 with extEnergyThreshold based on input frame
-                     // energy; NOTE(review): AUP_Aed_proc in aed.cc does not write this field
-  float voiceProb;   // vad score [0,1]; negative while no score is available yet
-  int vadRes;  // vad res 0/1 with extVoiceThr based on ai method, t + 16ms res
-               // correspond to the t input; -1 while voiceProb is negative
-  float pitchFreq;  // estimated pitch freq.
-} Aed_OutputData;
-#ifdef __cplusplus
-extern "C" {
-#endif
-/****************************************************************************
- * AUP_Aed_create(...)
- *
- * This function creates a state handler from nothing, which is NOT ready for
- * processing
- *
- * Input:
- *
- * Output:
- *      - stPtr         : buffer to store the returned state handler
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_create(void** stPtr);
-/****************************************************************************
- * AUP_Aed_destroy(...)
- *
- * destroys the VAD instance and releases all the dynamically allocated
- * memory; this interface also releases the AI-VAD inference instance that
- * was created internally by the memAllocate interface
- *
- * Input:
- *      - stPtr         : buffer of State Handler, after this method, this
- *                        handler won't be usable anymore
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_destroy(void** stPtr);
-/****************************************************************************
- * AUP_Aed_memAllocate(...)
- *
- * This function sets Static Config params and does memory allocation
- * operation; the stored dynamCfg values are kept and re-published
- *
- * Input:
- *      - stPtr         : State Handler which was returned by _create
- *      - pCfg          : static configuration parameters
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_memAllocate(void* stPtr, const Aed_StaticCfg* pCfg);
-/****************************************************************************
- * AUP_Aed_init(...)
- *
- * This function resets (initializes) the VAD module and gets it prepared for
- * processing
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_init(void* stPtr);
-/****************************************************************************
- * AUP_Aed_setDynamCfg(...)
- *
- * This function sets the dynamic (per-frame variable) configuration
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *      - pCfg          : configuration content
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_setDynamCfg(void* stPtr, const Aed_DynamCfg* pCfg);
-/****************************************************************************
- * AUP_Aed_getStaticCfg(...)
- *
- * This function gets the static configuration status from the VAD module
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *      - pCfg          : configuration content
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_getStaticCfg(const void* stPtr, Aed_StaticCfg* pCfg);
-/****************************************************************************
- * AUP_Aed_getDynamCfg(...)
- *
- * This function gets the dynamic (per-frame variable) configuration status
- * from the VAD module
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *      - pCfg          : configuration content
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_getDynamCfg(const void* stPtr, Aed_DynamCfg* pCfg);
-/****************************************************************************
- * AUP_Aed_getAlgDelay(...)
- *
- * This function gets the algorithm delay from the VAD module
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *      - delayInFrms   : algorithm delay in terms of frames
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_getAlgDelay(const void* stPtr, int* delayInFrms);
-/****************************************************************************
- * AUP_Aed_proc(...)
- *
- * process a single frame
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate and init
- *      - pIn           : input data stream (time signal and, optionally,
- *                        its power spectrum)
- *
- * Output:
- *      - pOut          : output data (frame energy/rms, voice probability,
- *                        vad decision, pitch)
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Aed_proc(void* stPtr, const Aed_InputData* pIn, Aed_OutputData* pOut);
-#ifdef __cplusplus
-}
-#endif
-#endif

src/aed_st.h DELETED Viewed

@@ -1,132 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#ifndef __AED_ST_H__
-#define __AED_ST_H__
-#include <stdio.h>
-#include <onnxruntime_c_api.h>
-#include "aed.h"
-#define AUP_AED_FS (16000)  // input sampling rate in Hz (also defined with the same value in aed.h)
-#define AUP_AED_MAX_IN_BUFF_SIZE (256)
-#define AUP_AED_POWER_SPCTR_NORMALIZER (9.3132e-10f)  // = 1/(32768^2)
-#define AUP_AED_OUTPUT_SMOOTH_FILTER_LEN (10)         // 160ms
-#define AUP_AED_MEL_FILTER_BANK_NUM (40)  // number of mel filter-bank bands
-#define AUP_AED_LOOKAHEAD_NFRM (1)  // algorithm delay, in frames
-#define AUP_AED_CONTEXT_WINDOW_LEN (3)  // context window length of AIVAD
-#define AUP_AED_FEA_LEN \
-  (AUP_AED_MEL_FILTER_BANK_NUM + 1)  // feature length of AIVAD: mel bands plus one extra (pitch) feature
-#define AUP_AED_PITCH_EST_USE_LPC (1)
-#define AUP_AED_PITCH_EST_PROCFS (4000)
-#if AUP_AED_PITCH_EST_PROCFS == 2000
-#define AUP_AED_PITCH_EST_DEFAULT_VOICEDTHR (0.45f)
-#else
-#define AUP_AED_PITCH_EST_DEFAULT_VOICEDTHR (0.4f)
-#endif
-#define AUP_AED_MODEL_IO_NUM (5)  // number of model inputs and of model outputs
-#define AUP_AED_MODEL_NAME_LENGTH (32)  // size of each tensor-name buffer, in chars
-#define AUP_AED_MODEL_HIDDEN_DIM (64)  // floats per input_data_buf_1234 row
-class AUP_MODULE_AIVAD {  // AI-VAD inference wrapper; the members are ONNX Runtime C-API handles plus model I/O buffers
- public:
-  AUP_MODULE_AIVAD(char* onnx_path);  // NOTE(review): aed.cc passes a string literal here; const char* would be the conforming type (the definition must change with it)
-  ~AUP_MODULE_AIVAD();
-  int Process(float* input, float* output);  // aed.cc treats a non-zero return as failure
-  int Reset();  // aed.cc treats a non-zero return as failure
- private:
-  const OrtApi* ort_api = NULL;
-  OrtAllocator* ort_allocator = NULL;
-  OrtEnv* ort_env = NULL;
-  OrtSession* ort_session = NULL;
-  int inited = 0;
-  int clear_hidden = 0;
-  char input_names_buf[AUP_AED_MODEL_IO_NUM][AUP_AED_MODEL_NAME_LENGTH] = {0};
-  const char* input_names[AUP_AED_MODEL_IO_NUM] = {NULL};
-  float input_data_buf_0[AUP_AED_CONTEXT_WINDOW_LEN * AUP_AED_FEA_LEN] = {0};  // sized for the stacked feature frames
-  float input_data_buf_1234[AUP_AED_MODEL_IO_NUM - 1]
-                           [AUP_AED_MODEL_HIDDEN_DIM] = {0};  // presumably the recurrent hidden states (see clear_hidden) - confirm in the implementation
-  OrtValue* ort_input_tensors[AUP_AED_MODEL_IO_NUM] = {NULL};
-  char output_names_buf[AUP_AED_MODEL_IO_NUM][AUP_AED_MODEL_NAME_LENGTH] = {0};
-  const char* output_names[AUP_AED_MODEL_IO_NUM] = {NULL};
-  OrtValue* ort_output_tensors[AUP_AED_MODEL_IO_NUM] = {NULL};
-};
-typedef struct Aed_St_ {
-  void* dynamMemPtr;    // memory pointer holding the dynamic memory
-  size_t dynamMemSize;  // size of the buffer *dynamMemPtr
-  Aed_StaticCfg stCfg;
-  Aed_DynamCfg dynamCfg;
-  // Internal Static Config Registers, which are generated from stCfg
-  size_t extFftSz;  // externally decided FFT-Sz
-  size_t extHopSz;  // externally decided FFT-Hop-Sz
-  size_t extNBins;  // (FFTSz/2) + 1
-  size_t extWinSz;  // externally decided FFT-Window-Sz
-  size_t intFftSz;                 // internal FFT Sz
-  size_t intHopSz;                 // internal Hop Sz
-  size_t intWinSz;                 // internal Window Sz
-  size_t intNBins;                 // internal NBins
-  const float* intAnalyWindowPtr;  // internal analysis window coefficients
-  int intAnalyFlag;                // whether to do internal analysis
-  // 0: directly use external spectrum
-  // 1: use external spectrum with interpolation / extrapolation
-  // 2: need to redo analysis based on input time-domain signal
-  size_t inputTimeFIFOLen;  // length of input FIFO buffer
-  // if = 0: no need for input time-domain FIFO Queue
-  // Internal static config registers for the AI-VAD feature pipeline
-  size_t feaSz;  // features per frame
-  size_t melFbSz;  // number of mel filter-bank bands
-  size_t algDelay;  // in terms of processing frames
-  size_t algCtxtSz;  // number of frames kept in aivadInputFeatStack
-  size_t frmRmsBufLen;  // frameRmsBuff: buffer-length of frameRmsBuff (FIFO)
-  // Internal dynamic Config Registers, which are generated from dynamCfg
-  size_t aivadResetFrmNum;
-  float voiceDecideThresh;
-  // SubModules
-  AUP_MODULE_AIVAD* aivadInf;
-  void* pitchEstStPtr;  // pitch-estimation module handler
-  void* timeInAnalysis;
-  // state handler of STFT analysis module
-  // Variables
-  int aedProcFrmCnt;  // counter of consecutive AI-VAD processed frames
-  int inputTimeFIFOIdx;  // number of samples currently held in the input FIFOs
-  float* inputTimeFIFO;  // [inputTimeFIFOLen]
-  // input fifo buffer of time-signal to adjust between extHopSz and intHopSz
-  float* inputEmphTimeFIFO;     // [inputTimeFIFOLen], pre-emphasised copy of inputTimeFIFO
-  float* aivadInputCmplxSptrm;  // [intFftSz]
-  float* aivadInputBinPow;      // [intNBins]  // AIVAD input power spectrum
-  size_t aivadResetCnt;  // frames processed since the last AI-VAD reset
-  float timeSignalPre;  // previous input sample, used by the pre-emphasis filter
-  float aivadScore;
-  float aivadScorePre;
-  float pitchFreq;      // input audio pitch in Hz
-  float* frameRmsBuff;  // [frmRmsBufLen], FIFO, to delay frmRms result so that
-                        // it aligns with AIVAD result
-  float* aivadInputFeatStack;  // [...] = [AUP_AED_CONTEXT_WINDOW_LEN *
-                               // AUP_AED_FEA_LEN]
-  float* melFilterBankCoef;    // [melFbSz][nBins]
-  size_t* melFilterBinBuff;    // [melFbSz + 2]
-  float* inputFloatBuff;       // [hopSz]
-} Aed_St;
-#endif

src/biquad.cc DELETED Viewed

@@ -1,354 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#include "biquad.h"
-#include <math.h>
-#include <stdlib.h>
-#include <string.h>
-#include <stdio.h>
-#include "biquad_st.h"
-#define AUP_BIQUAD_NUM_DUMP_FILES (20)
-#define AUP_BIQUAD_DUMP_FILENAMES (200)
-// ==========================================================================================
-// internal tools
-// ==========================================================================================
-// Validates a caller-supplied static configuration.
-// Returns 0 when the configuration is usable, -1 otherwise.
-static int AUP_Biquad_checkStatCfg(const Biquad_StaticCfg* pCfg) {
-  if (pCfg == NULL) {
-    return -1;
-  }
-  // maxNSample must lie in (0, AGORA_UAP_BIQUAD_MAX_INPUT_LEN]
-  if (pCfg->maxNSample == 0) {
-    return -1;
-  }
-  if (pCfg->maxNSample > AGORA_UAP_BIQUAD_MAX_INPUT_LEN) {
-    return -1;
-  }
-  if (pCfg->nsect > AGORA_UAP_BIQUAD_MAX_SECTION) {
-    return -1;
-  }
-  // nsect <= 0 means no external coefficient tables are requested, so there
-  // are no pointers to validate
-  if (pCfg->nsect <= 0) {
-    return 0;
-  }
-  // external coefficients requested: every section needs both its B and A
-  // table, and the gain table must be present
-  for (int sect = 0; sect < pCfg->nsect; sect++) {
-    if (pCfg->B[sect] == NULL) {
-      return -1;
-    }
-    if (pCfg->A[sect] == NULL) {
-      return -1;
-    }
-  }
-  return (pCfg->G == NULL) ? -1 : 0;
-}
-// Derives the internal working registers (maxNSample, nsect and the
-// per-section B/A/G coefficients) from the static configuration stored in
-// stHdl->stCfg. Returns 0 on success, -1 if stHdl is NULL.
-static int AUP_Biquad_publishStaticCfg(Biquad_St* stHdl) {
-  const Biquad_StaticCfg* cfg;
-  int sect, tap;
-  if (stHdl == NULL) {
-    return -1;
-  }
-  cfg = (const Biquad_StaticCfg*)(&(stHdl->stCfg));
-  stHdl->maxNSample = (int)cfg->maxNSample;
-  // start every section as a pass-through: B = A = {1, 0, 0}, G = 1
-  for (sect = 0; sect < AGORA_UAP_BIQUAD_MAX_SECTION; sect++) {
-    for (tap = 0; tap < 3; tap++) {
-      stHdl->BCoeff[sect][tap] = (tap == 0) ? 1.0f : 0.0f;
-      stHdl->ACoeff[sect][tap] = (tap == 0) ? 1.0f : 0.0f;
-    }
-    stHdl->GCoeff[sect] = 1.0f;
-  }
-  if (cfg->nsect > 0) {
-    // caller-provided coefficient tables
-    stHdl->nsect = cfg->nsect;
-    for (sect = 0; sect < stHdl->nsect; sect++) {
-      for (tap = 0; tap < 3; tap++) {
-        stHdl->BCoeff[sect][tap] = cfg->B[sect][tap];
-        stHdl->ACoeff[sect][tap] = cfg->A[sect][tap];
-      }
-      stHdl->GCoeff[sect] = cfg->G[sect];
-    }
-    return 0;
-  }
-  // nsect <= 0: fall back to the built-in _BIQUAD_DC_REMOVAL_* tables
-  stHdl->nsect = _BIQUAD_DC_REMOVAL_NSECT;
-  for (sect = 0; sect < stHdl->nsect; sect++) {
-    for (tap = 0; tap < 3; tap++) {
-      stHdl->BCoeff[sect][tap] = _BIQUAD_DC_REMOVAL_B[sect][tap];
-      stHdl->ACoeff[sect][tap] = _BIQUAD_DC_REMOVAL_A[sect][tap];
-    }
-    stHdl->GCoeff[sect] = _BIQUAD_DC_REMOVAL_G[sect];
-  }
-  return 0;
-}
-// Clears all run-time state: the dynamic work buffer and the per-section
-// delay registers (sectW). Always returns 0.
-static int AUP_Biquad_resetVariables(Biquad_St* stHdl) {
-  // dynamMemPtr is still NULL when init runs before memAllocate; handing a
-  // NULL pointer to memset is undefined behaviour even for a zero length
-  if (stHdl->dynamMemPtr != NULL && stHdl->dynamMemSize > 0) {
-    memset(stHdl->dynamMemPtr, 0, stHdl->dynamMemSize);
-  }
-  memset(stHdl->sectW, 0, sizeof(stHdl->sectW));
-  return 0;
-}
-// ==========================================================================================
-// public APIS
-// ==========================================================================================
-// Allocates a zeroed Biquad_St and stores it in *stPtr. The new handle
-// carries default static settings only (maxNSample = 768, nsect = 0, no
-// external coefficient tables) and owns no work buffer yet.
-// Returns 0 on success, -1 if stPtr is NULL or the allocation fails.
-int AUP_Biquad_create(void** stPtr) {
-  Biquad_St* st;
-  int sect;
-  if (stPtr == NULL) {
-    return -1;
-  }
-  st = (Biquad_St*)malloc(sizeof(Biquad_St));
-  *stPtr = (void*)st;  // also publishes NULL to the caller on failure
-  if (st == NULL) {
-    return -1;
-  }
-  memset(st, 0, sizeof(Biquad_St));
-  st->dynamMemPtr = NULL;
-  st->dynamMemSize = 0;
-  st->stCfg.maxNSample = 768;
-  st->stCfg.nsect = 0;
-  st->stCfg.G = NULL;
-  for (sect = 0; sect < AGORA_UAP_BIQUAD_MAX_SECTION; sect++) {
-    st->stCfg.A[sect] = NULL;
-    st->stCfg.B[sect] = NULL;
-  }
-  return 0;
-}
-// Releases the work buffer and the handle itself, then sets *stPtr to NULL.
-// A NULL stPtr or a NULL *stPtr is accepted as a no-op. Always returns 0.
-int AUP_Biquad_destroy(void** stPtr) {
-  Biquad_St* st = (stPtr != NULL) ? (Biquad_St*)(*stPtr) : NULL;
-  if (st == NULL) {
-    return 0;
-  }
-  // free(NULL) is a no-op, so no separate NULL test is needed here
-  free(st->dynamMemPtr);
-  st->dynamMemPtr = NULL;
-  free(st);
-  *stPtr = NULL;
-  return 0;
-}
-// Applies the static configuration in pCfg to the handle and (re)allocates
-// the single work buffer that backs inputTempBuf and the per-section output
-// buffers. An existing buffer is reused when it is already large enough.
-// Returns 0 on success, -1 on a NULL argument, an invalid configuration or
-// an allocation failure.
-int AUP_Biquad_memAllocate(void* stPtr, const Biquad_StaticCfg* pCfg) {
-  Biquad_St* stHdl = NULL;
-  char* memPtr = NULL;
-  int maxNSample, nsect, idx;
-  int inputTempBufMemSize = 0;
-  int sectOutputBufMemSize_EACH = 0;
-  int totalMemSize = 0;
-  if (stPtr == NULL || pCfg == NULL) {
-    return -1;
-  }
-  stHdl = (Biquad_St*)(stPtr);
-  if (AUP_Biquad_checkStatCfg(pCfg) < 0) {
-    return -1;
-  }
-  memcpy(&(stHdl->stCfg), pCfg, sizeof(Biquad_StaticCfg));
-  if (AUP_Biquad_publishStaticCfg(stHdl) < 0) {
-    return -1;
-  }
-  maxNSample = stHdl->maxNSample;
-  nsect = stHdl->nsect;
-  // memory layout: [inputTempBuf][sectOutputBuf 0] ... [sectOutputBuf nsect-1],
-  // each slice rounded up to a multiple of 8 bytes
-  inputTempBufMemSize = AGORA_UAP_BIQUAD_ALIGN8(sizeof(float) * maxNSample);
-  totalMemSize += inputTempBufMemSize;
-  sectOutputBufMemSize_EACH =
-      AGORA_UAP_BIQUAD_ALIGN8(sizeof(float) * maxNSample);
-  totalMemSize += sectOutputBufMemSize_EACH * nsect;
-  // allocate dynamic memory
-  if ((size_t)totalMemSize > stHdl->dynamMemSize) {
-    // The current block (if any) is too small and is about to be released.
-    // Drop every pointer carved out of it first so nothing dangles should
-    // the new allocation fail.
-    stHdl->inputTempBuf = NULL;
-    for (idx = 0; idx < AGORA_UAP_BIQUAD_MAX_SECTION; idx++) {
-      stHdl->sectOutputBuf[idx] = NULL;
-    }
-    if (stHdl->dynamMemPtr != NULL) {
-      free(stHdl->dynamMemPtr);
-      stHdl->dynamMemPtr = NULL;
-      stHdl->dynamMemSize = 0;
-    }
-    stHdl->dynamMemPtr = malloc(totalMemSize);
-    if (stHdl->dynamMemPtr == NULL) {
-      // no work buffer: zero the frame-size limit so the size check in
-      // AUP_Biquad_proc rejects any non-empty frame on this handle
-      stHdl->maxNSample = 0;
-      stHdl->nsect = 0;
-      return -1;
-    }
-    stHdl->dynamMemSize = totalMemSize;
-  }
-  memset(stHdl->dynamMemPtr, 0, stHdl->dynamMemSize);
-  // carve the block into the input staging buffer and one output buffer per
-  // active section
-  memPtr = (char*)(stHdl->dynamMemPtr);
-  stHdl->inputTempBuf = (float*)memPtr;
-  memPtr += inputTempBufMemSize;
-  for (idx = 0; idx < nsect; idx++) {
-    stHdl->sectOutputBuf[idx] = (float*)memPtr;
-    memPtr += sectOutputBufMemSize_EACH;
-  }
-  // sections beyond nsect own no buffer
-  for (; idx < AGORA_UAP_BIQUAD_MAX_SECTION; idx++) {
-    stHdl->sectOutputBuf[idx] = NULL;
-  }
-  // sanity check: the carved slices must not run past the computed total
-  if (((int)(memPtr - (char*)(stHdl->dynamMemPtr))) > totalMemSize) {
-    return -1;
-  }
-  return 0;
-}
-// Resets the run-time state of the handle via AUP_Biquad_resetVariables.
-// Returns 0 on success, -1 if stPtr is NULL or the reset reports an error.
-int AUP_Biquad_init(void* stPtr) {
-  if (stPtr == NULL) {
-    return -1;
-  }
-  return (AUP_Biquad_resetVariables((Biquad_St*)stPtr) < 0) ? -1 : 0;
-}
-// Copies the handle's stored static configuration into *pCfg.
-// Returns 0 on success, -1 if either pointer is NULL.
-int AUP_Biquad_getStaticCfg(const void* stPtr, Biquad_StaticCfg* pCfg) {
-  if (stPtr != NULL && pCfg != NULL) {
-    const Biquad_St* st = (const Biquad_St*)stPtr;
-    memcpy(pCfg, &st->stCfg, sizeof(Biquad_StaticCfg));
-    return 0;
-  }
-  return -1;
-}
-// Writes the module's reported delay to *delayInSamples; the value reported
-// is the number of active sections (nsect).
-// Returns 0 on success, -1 if either pointer is NULL.
-int AUP_Biquad_getAlgDelay(const void* stPtr, int* delayInSamples) {
-  if (stPtr != NULL && delayInSamples != NULL) {
-    *delayInSamples = ((const Biquad_St*)stPtr)->nsect;
-    return 0;
-  }
-  return -1;
-}
-// Filters one frame through the cascade of biquad sections.
-//
-// pIn->sampleType selects the sample format for BOTH input and output:
-// 0 means 16-bit shorts, anything else means floats. The output of the last
-// section is written to pOut->outputBuff (nsamples elements).
-// Returns 0 on success, -1 on NULL arguments/buffers, on a handle without
-// active sections or work buffers (i.e. not set up by
-// AUP_Biquad_memAllocate), or when nsamples exceeds maxNSample.
-int AUP_Biquad_proc(void* stPtr, const Biquad_InputData* pIn,
-                    Biquad_OutputData* pOut) {
-  Biquad_St* stHdl = NULL;
-  int isFloatIO = 0;
-  int inputNSamples, nSect;
-  int sectIdx, smplIdx;
-  float tmp1;
-  const short* pShortTemp;
-  float* src;
-  float* tgt;
-  if (stPtr == NULL || pIn == NULL || pOut == NULL) {
-    return -1;
-  }
-  if (pIn->samplesPtr == NULL || pOut->outputBuff == NULL) {
-    return -1;
-  }
-  stHdl = (Biquad_St*)(stPtr);
-  if (((int)pIn->nsamples) > stHdl->maxNSample) {
-    return -1;
-  }
-  nSect = stHdl->nsect;
-  // Without at least one section and a staging buffer the output stage below
-  // would index sectOutputBuf[-1] and pass NULL to memcpy; this is the state
-  // of a freshly created handle, which a zero-length frame could otherwise
-  // slip past the size check above.
-  if (nSect <= 0 || nSect > AGORA_UAP_BIQUAD_MAX_SECTION ||
-      stHdl->inputTempBuf == NULL || stHdl->sectOutputBuf[nSect - 1] == NULL) {
-    return -1;
-  }
-  isFloatIO = 0;
-  if (pIn->sampleType != 0) {
-    isFloatIO = 1;
-  }
-  inputNSamples = (int)pIn->nsamples;
-  // stage the input as floats, converting from short when necessary
-  if (isFloatIO == 0) {
-    pShortTemp = (const short*)pIn->samplesPtr;
-    for (smplIdx = 0; smplIdx < inputNSamples; smplIdx++) {
-      stHdl->inputTempBuf[smplIdx] = (float)pShortTemp[smplIdx];
-    }
-  } else {
-    memcpy(stHdl->inputTempBuf, (const float*)pIn->samplesPtr,
-           sizeof(float) * inputNSamples);
-  }
-  // run the cascade: section k reads the output of section k-1 (the staged
-  // input for k == 0) and writes its own output buffer
-  for (sectIdx = 0; sectIdx < nSect; sectIdx++) {
-    if (sectIdx == 0) {
-      src = stHdl->inputTempBuf;
-    } else {
-      src = stHdl->sectOutputBuf[sectIdx - 1];
-    }
-    tgt = stHdl->sectOutputBuf[sectIdx];
-    for (smplIdx = 0; smplIdx < inputNSamples; smplIdx++) {
-      // Direct Form II:
-      //   w[n] = x[n] - a1 * w[n-1] - a2 * w[n-2]
-      //   y[n] = g * (b0 * w[n] + b1 * w[n-1] + b2 * w[n-2])
-      // sectW[k][0] holds w[n-1], sectW[k][1] holds w[n-2]
-      tmp1 = src[smplIdx] -
-             stHdl->ACoeff[sectIdx][1] * stHdl->sectW[sectIdx][0] -
-             stHdl->ACoeff[sectIdx][2] * stHdl->sectW[sectIdx][1];
-      tgt[smplIdx] = stHdl->GCoeff[sectIdx] *
-                     (stHdl->BCoeff[sectIdx][0] * tmp1 +
-                      stHdl->BCoeff[sectIdx][1] * stHdl->sectW[sectIdx][0] +
-                      stHdl->BCoeff[sectIdx][2] * stHdl->sectW[sectIdx][1]);
-      stHdl->sectW[sectIdx][1] = stHdl->sectW[sectIdx][0];
-      stHdl->sectW[sectIdx][0] = tmp1;
-    }
-  }
-  // deliver the last section's output in the caller's sample format
-  if (isFloatIO == 0) {
-    for (smplIdx = 0; smplIdx < inputNSamples; smplIdx++) {
-      // saturating, rounding conversion back to 16-bit
-      ((short*)pOut->outputBuff)[smplIdx] =
-          (short)_BIQUAD_FLOAT2SHORT(stHdl->sectOutputBuf[nSect - 1][smplIdx]);
-    }
-  } else {
-    memcpy(pOut->outputBuff, stHdl->sectOutputBuf[nSect - 1],
-           sizeof(float) * inputNSamples);
-  }
-  return 0;
-}

src/biquad.h DELETED Viewed

@@ -1,190 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#ifndef __BIQUAD_H__
-#define __BIQUAD_H__
-#include <stdio.h>
-#define AGORA_UAP_BIQUAD_MAX_SECTION (20)
-// the max. number of sections supported by this Biquad module
-#define AGORA_UAP_BIQUAD_MAX_INPUT_LEN (3840)
-// max. number of samples that can be fed in per call
-#define AGORA_UAP_BIQUAD_ALIGN8(o) (((o) + 7) & (~7))  // round o up to a multiple of 8
-#define _BIQUAD_FLOAT2SHORT(x) \
-  ((x) < -32767.5f ? -32768 : ((x) > 32766.5f ? 32767 : (short)floor(.5 + (x))))  // saturate to [-32768, 32767], else floor(x + .5); NOTE(review): floor() needs <math.h> where the macro is used
-#define _BIQUAD_DC_REMOVAL_NSECT (2)  // number of sections in the built-in tables below
-const float _BIQUAD_DC_REMOVAL_B[_BIQUAD_DC_REMOVAL_NSECT][3] = {
-    {1.0f, -2.0f, 1.0f}, {1.0f, -1.0f, 0.0f}};  // built-in B (numerator) coefficients, one row per section
-const float _BIQUAD_DC_REMOVAL_A[_BIQUAD_DC_REMOVAL_NSECT][3] = {
-    {1.0f, -1.93944294f, 0.94281253f}, {1.0f, -0.94276431f, 0.0f}};  // built-in A (denominator) coefficients, one row per section
-// Previous gain table, kept commented out for reference:
-// const float _BIQUAD_DC_REMOVAL_G[_BIQUAD_DC_REMOVAL_NSECT] = {0.97056387f, 0.97138215f};
-const float _BIQUAD_DC_REMOVAL_G[_BIQUAD_DC_REMOVAL_NSECT] = {0.97056387f,
-                                                              0.8655014957f};  // built-in per-section gains
-// Configuration Parameters, which impacts dynamic memory occupation, can only
-// be set during allocation
-typedef struct Biquad_StaticCfg_ {
-  size_t maxNSample;  // max. number of samples that can be fed in per call
-  // (0, AGORA_UAP_BIQUAD_MAX_INPUT_LEN]
-  int nsect;  // the number of sections to be processed by this Biquad module
-  // (-inf, AGORA_UAP_BIQUAD_MAX_SECTION]
-  // if <= 0, use internal default filter coefficients
-  const float* B[AGORA_UAP_BIQUAD_MAX_SECTION];  // B[k]: 3 coefficients of section k
-  const float* A[AGORA_UAP_BIQUAD_MAX_SECTION];  // A[k]: 3 coefficients of section k
-  // always assume A[...][0] = 1.0f
-  const float* G;  // G[k]: gain of section k, nsect entries
-} Biquad_StaticCfg;
-typedef struct Biquad_InputData_ {
-  const void*
-      samplesPtr;  // externally provided buffer containing input time samples
-  // either in short or float type
-  short sampleType;  // = 0: samplesPtr = short*; o.w. samplesPtr = float*
-  size_t nsamples;   // number of samples fed in this time (at most maxNSample)
-} Biquad_InputData;
-typedef struct Biquad_OutputData_ {
-  void* outputBuff;  // externally provided output buffer, assumed to hold at
-                     // least nsamples elements of the input's sample type:
-                     // nsamples * sizeof(short) bytes for short input,
-                     // nsamples * sizeof(float) bytes for float input
-} Biquad_OutputData;
-#ifdef __cplusplus
-extern "C" {
-#endif
-/****************************************************************************
- * AUP_Biquad_create(...)
- *
- * This function creates a new state handler, which is NOT yet ready for
- * processing
- *
- * Input:
- *
- * Output:
- *      - stPtr         : buffer to store the returned state handler
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_create(void** stPtr);
-/****************************************************************************
- * AUP_Biquad_destroy(...)
- *
- * destroy biquad instance, and releasing all the dynamically allocated memory
- *
- * Input:
- *      - stPtr         : buffer of State Handler, after this method, this
- *                        handler won't be usable anymore
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_destroy(void** stPtr);
-/****************************************************************************
- * AUP_Biquad_memAllocate(...)
- *
- * This function sets Static Config params and does memory allocation
- * operation
- *
- * Input:
- *      - stPtr         : State Handler which was returned by _create
- *      - pCfg          : static configuration parameters
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_memAllocate(void* stPtr, const Biquad_StaticCfg* pCfg);
-/****************************************************************************
- * AUP_Biquad_init(...)
- *
- * This function resets (initialize) the biquad module and gets it prepared for
- * processing
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_init(void* stPtr);
-/****************************************************************************
- * AUP_Biquad_getStaticCfg(...)
- *
- * This function get static configuration status from Biquad module
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *      - pCfg          : configuration content
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_getStaticCfg(const void* stPtr, Biquad_StaticCfg* pCfg);
-/****************************************************************************
- * AUP_Biquad_getAlgDelay(...)
- *
- * This function get algorithm delay from biquad module
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *
- * Output:
- *      - delayInSamples   : algorithm delay in terms of samples
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_getAlgDelay(const void* stPtr, int* delayInSamples);
-/****************************************************************************
- * AUP_Biquad_proc(...)
- *
- * process a single frame
- *
- * Input:
- *      - stPtr         : State Handler which has gone through create and
- *                        memAllocate
- *      - pCtrl         : per-frame variable control parameters
- *      - pIn           : input data stream
- *
- * Output:
- *      - pOut          : output data (filtered samples, same type as the input)
- *
- * Return value         :  0 - Ok
- *                        -1 - Error
- */
-int AUP_Biquad_proc(void* stPtr, const Biquad_InputData* pIn,
-                    Biquad_OutputData* pOut);
-#ifdef __cplusplus
-}
-#endif
-#endif  // __BIQUAD_H__

src/biquad_st.h DELETED Viewed

@@ -1,37 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#ifndef __BIQUAD_ST_H__
-#define __BIQUAD_ST_H__
-#include <stdio.h>
-#include "biquad.h"
-typedef struct Biquad_St_ {
-  void* dynamMemPtr;    // heap block backing inputTempBuf and sectOutputBuf[]
-  size_t dynamMemSize;  // size in bytes of the block at dynamMemPtr
-  // Static configuration (defaults from create, then the pCfg of memAllocate)
-  Biquad_StaticCfg stCfg;
-  // ---------------------------------------------------------------
-  // Internal Static Config Registers, which are generated from stCfg
-  int maxNSample;  // largest frame (in samples) accepted per processing call
-  int nsect;  // number of active sections
-  float BCoeff[AGORA_UAP_BIQUAD_MAX_SECTION][3];  // per-section B coefficients
-  float ACoeff[AGORA_UAP_BIQUAD_MAX_SECTION][3];  // per-section A coefficients
-  float GCoeff[AGORA_UAP_BIQUAD_MAX_SECTION];  // gain for each section
-  // Variables
-  float* inputTempBuf;  // [maxNSample], input frame staged as floats
-  float sectW[AGORA_UAP_BIQUAD_MAX_SECTION][2];
-  // each section's two delay registers (the two most recent intermediate values)
-  float* sectOutputBuf
-      [AGORA_UAP_BIQUAD_MAX_SECTION];  // [nsect][maxNSample] in use
-                                       // each section's output buffer
-} Biquad_St;
-#endif  // __BIQUAD_ST_H__

src/coeff.h DELETED Viewed

@@ -1,246 +0,0 @@
-//
-// Copyright © 2025 Agora
-// This file is part of TEN Framework, an open source project.
-// Licensed under the Apache License, Version 2.0, with certain conditions.
-// Refer to the "LICENSE" file in the root directory for more information.
-//
-#ifndef __COEFF_H__
-#define __COEFF_H__
-#include "aed_st.h"
-#define AUP_AED_MEAN_STD_NBINS AUP_AED_FEA_LEN
-#define AUP_AED_ASSUMED_HOPSZ (256)
-#define AUP_AED_ASSUMED_WINDOWSZ (768)
-#define AUP_AED_ASSUMED_FFTSZ (1024)
-// means of input-mel-filterbank
-const float AUP_AED_FEATURE_MEANS[AUP_AED_MEAN_STD_NBINS] = {
-    -8.198236465454e+00f, -6.265716552734e+00f, -5.483818531036e+00f,
-    -4.758691310883e+00f, -4.417088985443e+00f, -4.142892837524e+00f,
-    -3.912850379944e+00f, -3.845927953720e+00f, -3.657090425491e+00f,
-    -3.723418712616e+00f, -3.876134157181e+00f, -3.843890905380e+00f,
-    -3.690405130386e+00f, -3.756065845490e+00f, -3.698696136475e+00f,
-    -3.650463104248e+00f, -3.700468778610e+00f, -3.567321300507e+00f,
-    -3.498900175095e+00f, -3.477807044983e+00f, -3.458816051483e+00f,
-    -3.444923877716e+00f, -3.401328563690e+00f, -3.306261301041e+00f,
-    -3.278556823730e+00f, -3.233250856400e+00f, -3.198616027832e+00f,
-    -3.204526424408e+00f, -3.208798646927e+00f, -3.257838010788e+00f,
-    -3.381376743317e+00f, -3.534021377563e+00f, -3.640867948532e+00f,
-    -3.726858854294e+00f, -3.773730993271e+00f, -3.804667234421e+00f,
-    -3.832901000977e+00f, -3.871120452881e+00f, -3.990592956543e+00f,
-    -4.480289459229e+00f, 9.235690307617e+01f};
-// stds of input-mel-filterbank
-const float AUP_AED_FEATURE_STDS[AUP_AED_MEAN_STD_NBINS] = {
-    5.166063785553e+00f, 4.977209568024e+00f, 4.698895931244e+00f,
-    4.630621433258e+00f, 4.634347915649e+00f, 4.641156196594e+00f,
-    4.640676498413e+00f, 4.666367053986e+00f, 4.650534629822e+00f,
-    4.640020847321e+00f, 4.637400150299e+00f, 4.620099067688e+00f,
-    4.596316337585e+00f, 4.562654972076e+00f, 4.554360389709e+00f,
-    4.566910743713e+00f, 4.562489986420e+00f, 4.562412738800e+00f,
-    4.585299491882e+00f, 4.600179672241e+00f, 4.592845916748e+00f,
-    4.585922718048e+00f, 4.583496570587e+00f, 4.626092910767e+00f,
-    4.626957893372e+00f, 4.626289367676e+00f, 4.637005805969e+00f,
-    4.683015823364e+00f, 4.726813793182e+00f, 4.734289646149e+00f,
-    4.753227233887e+00f, 4.849722862244e+00f, 4.869434833527e+00f,
-    4.884482860565e+00f, 4.921327114105e+00f, 4.959212303162e+00f,
-    4.996619224548e+00f, 5.044823646545e+00f, 5.072216987610e+00f,
-    5.096439361572e+00f, 1.152136917114e+02f};
-const float AUP_AED_STFTWindow_Hann768[768] = {
-    0.0000000e+00f, 1.6733041e-05f, 6.6931045e-05f, 1.5059065e-04f,
-    2.6770626e-04f, 4.1827004e-04f, 6.0227190e-04f, 8.1969953e-04f,
-    1.0705384e-03f, 1.3547717e-03f, 1.6723803e-03f, 2.0233432e-03f,
-    2.4076367e-03f, 2.8252351e-03f, 3.2761105e-03f, 3.7602327e-03f,
-    4.2775693e-03f, 4.8280857e-03f, 5.4117450e-03f, 6.0285082e-03f,
-    6.6783340e-03f, 7.3611788e-03f, 8.0769970e-03f, 8.8257407e-03f,
-    9.6073598e-03f, 1.0421802e-02f, 1.1269013e-02f, 1.2148935e-02f,
-    1.3061510e-02f, 1.4006678e-02f, 1.4984373e-02f, 1.5994532e-02f,
-    1.7037087e-02f, 1.8111967e-02f, 1.9219101e-02f, 2.0358415e-02f,
-    2.1529832e-02f, 2.2733274e-02f, 2.3968661e-02f, 2.5235910e-02f,
-    2.6534935e-02f, 2.7865651e-02f, 2.9227967e-02f, 3.0621794e-02f,
-    3.2047037e-02f, 3.3503601e-02f, 3.4991388e-02f, 3.6510300e-02f,
-    3.8060234e-02f, 3.9641086e-02f, 4.1252752e-02f, 4.2895122e-02f,
-    4.4568088e-02f, 4.6271536e-02f, 4.8005353e-02f, 4.9769424e-02f,
-    5.1563629e-02f, 5.3387849e-02f, 5.5241962e-02f, 5.7125844e-02f,
-    5.9039368e-02f, 6.0982406e-02f, 6.2954829e-02f, 6.4956504e-02f,
-    6.6987298e-02f, 6.9047074e-02f, 7.1135695e-02f, 7.3253021e-02f,
-    7.5398909e-02f, 7.7573217e-02f, 7.9775799e-02f, 8.2006508e-02f,
-    8.4265194e-02f, 8.6551706e-02f, 8.8865891e-02f, 9.1207593e-02f,
-    9.3576658e-02f, 9.5972925e-02f, 9.8396234e-02f, 1.0084642e-01f,
-    1.0332333e-01f, 1.0582679e-01f, 1.0835663e-01f, 1.1091268e-01f,
-    1.1349477e-01f, 1.1610274e-01f, 1.1873640e-01f, 1.2139558e-01f,
-    1.2408010e-01f, 1.2678978e-01f, 1.2952444e-01f, 1.3228389e-01f,
-    1.3506796e-01f, 1.3787646e-01f, 1.4070919e-01f, 1.4356597e-01f,
-    1.4644661e-01f, 1.4935091e-01f, 1.5227868e-01f, 1.5522973e-01f,
-    1.5820385e-01f, 1.6120085e-01f, 1.6422052e-01f, 1.6726267e-01f,
-    1.7032709e-01f, 1.7341358e-01f, 1.7652192e-01f, 1.7965192e-01f,
-    1.8280336e-01f, 1.8597603e-01f, 1.8916971e-01f, 1.9238420e-01f,
-    1.9561929e-01f, 1.9887474e-01f, 2.0215035e-01f, 2.0544589e-01f,
-    2.0876115e-01f, 2.1209590e-01f, 2.1544993e-01f, 2.1882300e-01f,
-    2.2221488e-01f, 2.2562536e-01f, 2.2905421e-01f, 2.3250119e-01f,
-    2.3596607e-01f, 2.3944863e-01f, 2.4294863e-01f, 2.4646583e-01f,
-    2.5000000e-01f, 2.5355090e-01f, 2.5711830e-01f, 2.6070196e-01f,
-    2.6430163e-01f, 2.6791708e-01f, 2.7154806e-01f, 2.7519434e-01f,
-    2.7885565e-01f, 2.8253178e-01f, 2.8622245e-01f, 2.8992744e-01f,
-    2.9364649e-01f, 2.9737934e-01f, 3.0112576e-01f, 3.0488549e-01f,
-    3.0865828e-01f, 3.1244388e-01f, 3.1624203e-01f, 3.2005248e-01f,
-    3.2387498e-01f, 3.2770926e-01f, 3.3155507e-01f, 3.3541216e-01f,
-    3.3928027e-01f, 3.4315913e-01f, 3.4704849e-01f, 3.5094809e-01f,
-    3.5485766e-01f, 3.5877695e-01f, 3.6270569e-01f, 3.6664362e-01f,
-    3.7059048e-01f, 3.7454600e-01f, 3.7850991e-01f, 3.8248196e-01f,
-    3.8646187e-01f, 3.9044938e-01f, 3.9444422e-01f, 3.9844613e-01f,
-    4.0245484e-01f, 4.0647007e-01f, 4.1049157e-01f, 4.1451906e-01f,
-    4.1855226e-01f, 4.2259092e-01f, 4.2663476e-01f, 4.3068351e-01f,
-    4.3473690e-01f, 4.3879466e-01f, 4.4285652e-01f, 4.4692220e-01f,
-    4.5099143e-01f, 4.5506394e-01f, 4.5913946e-01f, 4.6321772e-01f,
-    4.6729844e-01f, 4.7138134e-01f, 4.7546616e-01f, 4.7955263e-01f,
-    4.8364046e-01f, 4.8772939e-01f, 4.9181913e-01f, 4.9590943e-01f,
-    5.0000000e-01f, 5.0409057e-01f, 5.0818087e-01f, 5.1227061e-01f,
-    5.1635954e-01f, 5.2044737e-01f, 5.2453384e-01f, 5.2861866e-01f,
-    5.3270156e-01f, 5.3678228e-01f, 5.4086054e-01f, 5.4493606e-01f,
-    5.4900857e-01f, 5.5307780e-01f, 5.5714348e-01f, 5.6120534e-01f,
-    5.6526310e-01f, 5.6931649e-01f, 5.7336524e-01f, 5.7740908e-01f,
-    5.8144774e-01f, 5.8548094e-01f, 5.8950843e-01f, 5.9352993e-01f,
-    5.9754516e-01f, 6.0155387e-01f, 6.0555578e-01f, 6.0955062e-01f,
-    6.1353813e-01f, 6.1751804e-01f, 6.2149009e-01f, 6.2545400e-01f,
-    6.2940952e-01f, 6.3335638e-01f, 6.3729431e-01f, 6.4122305e-01f,
-    6.4514234e-01f, 6.4905191e-01f, 6.5295151e-01f, 6.5684087e-01f,
-    6.6071973e-01f, 6.6458784e-01f, 6.6844493e-01f, 6.7229074e-01f,
-    6.7612502e-01f, 6.7994752e-01f, 6.8375797e-01f, 6.8755612e-01f,
-    6.9134172e-01f, 6.9511451e-01f, 6.9887424e-01f, 7.0262066e-01f,
-    7.0635351e-01f, 7.1007256e-01f, 7.1377755e-01f, 7.1746822e-01f,
-    7.2114435e-01f, 7.2480566e-01f, 7.2845194e-01f, 7.3208292e-01f,
-    7.3569837e-01f, 7.3929804e-01f, 7.4288170e-01f, 7.4644910e-01f,
-    7.5000000e-01f, 7.5353417e-01f, 7.5705137e-01f, 7.6055137e-01f,
-    7.6403393e-01f, 7.6749881e-01f, 7.7094579e-01f, 7.7437464e-01f,
-    7.7778512e-01f, 7.8117700e-01f, 7.8455007e-01f, 7.8790410e-01f,
-    7.9123885e-01f, 7.9455411e-01f, 7.9784965e-01f, 8.0112526e-01f,
-    8.0438071e-01f, 8.0761580e-01f, 8.1083029e-01f, 8.1402397e-01f,
-    8.1719664e-01f, 8.2034808e-01f, 8.2347808e-01f, 8.2658642e-01f,
-    8.2967291e-01f, 8.3273733e-01f, 8.3577948e-01f, 8.3879915e-01f,
-    8.4179615e-01f, 8.4477027e-01f, 8.4772132e-01f, 8.5064909e-01f,
-    8.5355339e-01f, 8.5643403e-01f, 8.5929081e-01f, 8.6212354e-01f,
-    8.6493204e-01f, 8.6771611e-01f, 8.7047556e-01f, 8.7321022e-01f,
-    8.7591990e-01f, 8.7860442e-01f, 8.8126360e-01f, 8.8389726e-01f,
-    8.8650523e-01f, 8.8908732e-01f, 8.9164337e-01f, 8.9417321e-01f,
-    8.9667667e-01f, 8.9915358e-01f, 9.0160377e-01f, 9.0402708e-01f,
-    9.0642334e-01f, 9.0879241e-01f, 9.1113411e-01f, 9.1344829e-01f,
-    9.1573481e-01f, 9.1799349e-01f, 9.2022420e-01f, 9.2242678e-01f,
-    9.2460109e-01f, 9.2674698e-01f, 9.2886431e-01f, 9.3095293e-01f,
-    9.3301270e-01f, 9.3504350e-01f, 9.3704517e-01f, 9.3901759e-01f,
-    9.4096063e-01f, 9.4287416e-01f, 9.4475804e-01f, 9.4661215e-01f,
-    9.4843637e-01f, 9.5023058e-01f, 9.5199465e-01f, 9.5372846e-01f,
-    9.5543191e-01f, 9.5710488e-01f, 9.5874725e-01f, 9.6035891e-01f,
-    9.6193977e-01f, 9.6348970e-01f, 9.6500861e-01f, 9.6649640e-01f,
-    9.6795296e-01f, 9.6937821e-01f, 9.7077203e-01f, 9.7213435e-01f,
-    9.7346506e-01f, 9.7476409e-01f, 9.7603134e-01f, 9.7726673e-01f,
-    9.7847017e-01f, 9.7964159e-01f, 9.8078090e-01f, 9.8188803e-01f,
-    9.8296291e-01f, 9.8400547e-01f, 9.8501563e-01f, 9.8599332e-01f,
-    9.8693849e-01f, 9.8785107e-01f, 9.8873099e-01f, 9.8957820e-01f,
-    9.9039264e-01f, 9.9117426e-01f, 9.9192300e-01f, 9.9263882e-01f,
-    9.9332167e-01f, 9.9397149e-01f, 9.9458825e-01f, 9.9517191e-01f,
-    9.9572243e-01f, 9.9623977e-01f, 9.9672389e-01f, 9.9717476e-01f,
-    9.9759236e-01f, 9.9797666e-01f, 9.9832762e-01f, 9.9864523e-01f,
-    9.9892946e-01f, 9.9918030e-01f, 9.9939773e-01f, 9.9958173e-01f,
-    9.9973229e-01f, 9.9984941e-01f, 9.9993307e-01f, 9.9998327e-01f,
-    1.0000000e+00f, 9.9998327e-01f, 9.9993307e-01f, 9.9984941e-01f,
-    9.9973229e-01f, 9.9958173e-01f, 9.9939773e-01f, 9.9918030e-01f,
-    9.9892946e-01f, 9.9864523e-01f, 9.9832762e-01f, 9.9797666e-01f,
-    9.9759236e-01f, 9.9717476e-01f, 9.9672389e-01f, 9.9623977e-01f,
-    9.9572243e-01f, 9.9517191e-01f, 9.9458825e-01f, 9.9397149e-01f,
-    9.9332167e-01f, 9.9263882e-01f, 9.9192300e-01f, 9.9117426e-01f,
-    9.9039264e-01f, 9.8957820e-01f, 9.8873099e-01f, 9.8785107e-01f,
-    9.8693849e-01f, 9.8599332e-01f, 9.8501563e-01f, 9.8400547e-01f,
-    9.8296291e-01f, 9.8188803e-01f, 9.8078090e-01f, 9.7964159e-01f,
-    9.7847017e-01f, 9.7726673e-01f, 9.7603134e-01f, 9.7476409e-01f,
-    9.7346506e-01f, 9.7213435e-01f, 9.7077203e-01f, 9.6937821e-01f,
-    9.6795296e-01f, 9.6649640e-01f, 9.6500861e-01f, 9.6348970e-01f,
-    9.6193977e-01f, 9.6035891e-01f, 9.5874725e-01f, 9.5710488e-01f,
-    9.5543191e-01f, 9.5372846e-01f, 9.5199465e-01f, 9.5023058e-01f,
-    9.4843637e-01f, 9.4661215e-01f, 9.4475804e-01f, 9.4287416e-01f,
-    9.4096063e-01f, 9.3901759e-01f, 9.3704517e-01f, 9.3504350e-01f,
-    9.3301270e-01f, 9.3095293e-01f, 9.2886431e-01f, 9.2674698e-01f,
-    9.2460109e-01f, 9.2242678e-01f, 9.2022420e-01f, 9.1799349e-01f,
-    9.1573481e-01f, 9.1344829e-01f, 9.1113411e-01f, 9.0879241e-01f,
-    9.0642334e-01f, 9.0402708e-01f, 9.0160377e-01f, 8.9915358e-01f,
-    8.9667667e-01f, 8.9417321e-01f, 8.9164337e-01f, 8.8908732e-01f,
-    8.8650523e-01f, 8.8389726e-01f, 8.8126360e-01f, 8.7860442e-01f,
-    8.7591990e-01f, 8.7321022e-01f, 8.7047556e-01f, 8.6771611e-01f,
-    8.6493204e-01f, 8.6212354e-01f, 8.5929081e-01f, 8.5643403e-01f,
-    8.5355339e-01f, 8.5064909e-01f, 8.4772132e-01f, 8.4477027e-01f,
-    8.4179615e-01f, 8.3879915e-01f, 8.3577948e-01f, 8.3273733e-01f,
-    8.2967291e-01f, 8.2658642e-01f, 8.2347808e-01f, 8.2034808e-01f,
-    8.1719664e-01f, 8.1402397e-01f, 8.1083029e-01f, 8.0761580e-01f,
-    8.0438071e-01f, 8.0112526e-01f, 7.9784965e-01f, 7.9455411e-01f,
-    7.9123885e-01f, 7.8790410e-01f, 7.8455007e-01f, 7.8117700e-01f,
-    7.7778512e-01f, 7.7437464e-01f, 7.7094579e-01f, 7.6749881e-01f,
-    7.6403393e-01f, 7.6055137e-01f, 7.5705137e-01f, 7.5353417e-01f,
-    7.5000000e-01f, 7.4644910e-01f, 7.4288170e-01f, 7.3929804e-01f,
-    7.3569837e-01f, 7.3208292e-01f, 7.2845194e-01f, 7.2480566e-01f,
-    7.2114435e-01f, 7.1746822e-01f, 7.1377755e-01f, 7.1007256e-01f,
-    7.0635351e-01f, 7.0262066e-01f, 6.9887424e-01f, 6.9511451e-01f,
-    6.9134172e-01f, 6.8755612e-01f, 6.8375797e-01f, 6.7994752e-01f,
-    6.7612502e-01f, 6.7229074e-01f, 6.6844493e-01f, 6.6458784e-01f,
-    6.6071973e-01f, 6.5684087e-01f, 6.5295151e-01f, 6.4905191e-01f,
-    6.4514234e-01f, 6.4122305e-01f, 6.3729431e-01f, 6.3335638e-01f,
-    6.2940952e-01f, 6.2545400e-01f, 6.2149009e-01f, 6.1751804e-01f,
-    6.1353813e-01f, 6.0955062e-01f, 6.0555578e-01f, 6.0155387e-01f,
-    5.9754516e-01f, 5.9352993e-01f, 5.8950843e-01f, 5.8548094e-01f,
-    5.8144774e-01f, 5.7740908e-01f, 5.7336524e-01f, 5.6931649e-01f,
-    5.6526310e-01f, 5.6120534e-01f, 5.5714348e-01f, 5.5307780e-01f,
-    5.4900857e-01f, 5.4493606e-01f, 5.4086054e-01f, 5.3678228e-01f,
-    5.3270156e-01f, 5.2861866e-01f, 5.2453384e-01f, 5.2044737e-01f,
-    5.1635954e-01f, 5.1227061e-01f, 5.0818087e-01f, 5.0409057e-01f,
-    5.0000000e-01f, 4.9590943e-01f, 4.9181913e-01f, 4.8772939e-01f,
-    4.8364046e-01f, 4.7955263e-01f, 4.7546616e-01f, 4.7138134e-01f,
-    4.6729844e-01f, 4.6321772e-01f, 4.5913946e-01f, 4.5506394e-01f,
-    4.5099143e-01f, 4.4692220e-01f, 4.4285652e-01f, 4.3879466e-01f,
-    4.3473690e-01f, 4.3068351e-01f, 4.2663476e-01f, 4.2259092e-01f,
-    4.1855226e-01f, 4.1451906e-01f, 4.1049157e-01f, 4.0647007e-01f,
-    4.0245484e-01f, 3.9844613e-01f, 3.9444422e-01f, 3.9044938e-01f,
-    3.8646187e-01f, 3.8248196e-01f, 3.7850991e-01f, 3.7454600e-01f,
-    3.7059048e-01f, 3.6664362e-01f, 3.6270569e-01f, 3.5877695e-01f,
-    3.5485766e-01f, 3.5094809e-01f, 3.4704849e-01f, 3.4315913e-01f,
-    3.3928027e-01f, 3.3541216e-01f, 3.3155507e-01f, 3.2770926e-01f,
-    3.2387498e-01f, 3.2005248e-01f, 3.1624203e-01f, 3.1244388e-01f,
-    3.0865828e-01f, 3.0488549e-01f, 3.0112576e-01f, 2.9737934e-01f,
-    2.9364649e-01f, 2.8992744e-01f, 2.8622245e-01f, 2.8253178e-01f,
-    2.7885565e-01f, 2.7519434e-01f, 2.7154806e-01f, 2.6791708e-01f,
-    2.6430163e-01f, 2.6070196e-01f, 2.5711830e-01f, 2.5355090e-01f,
-    2.5000000e-01f, 2.4646583e-01f, 2.4294863e-01f, 2.3944863e-01f,
-    2.3596607e-01f, 2.3250119e-01f, 2.2905421e-01f, 2.2562536e-01f,
-    2.2221488e-01f, 2.1882300e-01f, 2.1544993e-01f, 2.1209590e-01f,
-    2.0876115e-01f, 2.0544589e-01f, 2.0215035e-01f, 1.9887474e-01f,
-    1.9561929e-01f, 1.9238420e-01f, 1.8916971e-01f, 1.8597603e-01f,
-    1.8280336e-01f, 1.7965192e-01f, 1.7652192e-01f, 1.7341358e-01f,
-    1.7032709e-01f, 1.6726267e-01f, 1.6422052e-01f, 1.6120085e-01f,
-    1.5820385e-01f, 1.5522973e-01f, 1.5227868e-01f, 1.4935091e-01f,
-    1.4644661e-01f, 1.4356597e-01f, 1.4070919e-01f, 1.3787646e-01f,
-    1.3506796e-01f, 1.3228389e-01f, 1.2952444e-01f, 1.2678978e-01f,
-    1.2408010e-01f, 1.2139558e-01f, 1.1873640e-01f, 1.1610274e-01f,
-    1.1349477e-01f, 1.1091268e-01f, 1.0835663e-01f, 1.0582679e-01f,
-    1.0332333e-01f, 1.0084642e-01f, 9.8396234e-02f, 9.5972925e-02f,
-    9.3576658e-02f, 9.1207593e-02f, 8.8865891e-02f, 8.6551706e-02f,
-    8.4265194e-02f, 8.2006508e-02f, 7.9775799e-02f, 7.7573217e-02f,
-    7.5398909e-02f, 7.3253021e-02f, 7.1135695e-02f, 6.9047074e-02f,
-    6.6987298e-02f, 6.4956504e-02f, 6.2954829e-02f, 6.0982406e-02f,
-    5.9039368e-02f, 5.7125844e-02f, 5.5241962e-02f, 5.3387849e-02f,
-    5.1563629e-02f, 4.9769424e-02f, 4.8005353e-02f, 4.6271536e-02f,
-    4.4568088e-02f, 4.2895122e-02f, 4.1252752e-02f, 3.9641086e-02f,
-    3.8060234e-02f, 3.6510300e-02f, 3.4991388e-02f, 3.3503601e-02f,
-    3.2047037e-02f, 3.0621794e-02f, 2.9227967e-02f, 2.7865651e-02f,
-    2.6534935e-02f, 2.5235910e-02f, 2.3968661e-02f, 2.2733274e-02f,
-    2.1529832e-02f, 2.0358415e-02f, 1.9219101e-02f, 1.8111967e-02f,
-    1.7037087e-02f, 1.5994532e-02f, 1.4984373e-02f, 1.4006678e-02f,
-    1.3061510e-02f, 1.2148935e-02f, 1.1269013e-02f, 1.0421802e-02f,
-    9.6073598e-03f, 8.8257407e-03f, 8.0769970e-03f, 7.3611788e-03f,
-    6.6783340e-03f, 6.0285082e-03f, 5.4117450e-03f, 4.8280857e-03f,
-    4.2775693e-03f, 3.7602327e-03f, 3.2761105e-03f, 2.8252351e-03f,
-    2.4076367e-03f, 2.0233432e-03f, 1.6723803e-03f, 1.3547717e-03f,
-    1.0705384e-03f, 8.1969953e-04f, 6.0227190e-04f, 4.1827004e-04f,
-    2.6770626e-04f, 1.5059065e-04f, 6.6931045e-05f, 1.6733041e-05f};
-#endif

src/fftw.c DELETED Viewed

The diff for this file is too large to render. See raw diff