//
// Copyright © 2025 Agora
// This file is part of TEN Framework, an open source project.
// Licensed under the Apache License, Version 2.0, with certain conditions.
// Refer to the "LICENSE" file in the root directory for more information.
//
/*
 * Public C API of the ten_vad voice activity detector.
 *
 * Typical call order: ten_vad_create() -> ten_vad_process() (once per audio
 * frame) -> ten_vad_destroy().
 */

/* Fallback so the declarations below still parse when the build has not
 * supplied an export/visibility definition for TENVAD_API. */
#ifndef TENVAD_API
#define TENVAD_API
#endif

#include <stddef.h> /* size_t */
#include <stdint.h> /* int16_t */

/* Only C++ understands the linkage specification; plain C must not see it. */
#ifdef __cplusplus
extern "C"
{
#endif

    /**
     * @typedef ten_vad_handle_t
     * @brief Opaque handle for a ten_vad instance.
     */
    typedef void *ten_vad_handle_t;

    /**
     * @brief Create and initialize a ten_vad instance.
     *
     * @param[out] handle     Pointer that receives the VAD handle.
     * @param[in]  hop_size   The number of samples between the start points
     *                        of two consecutive analysis frames (e.g., 256).
     * @param[in]  threshold  VAD detection threshold in the range [0.0, 1.0].
     *                        It is compared with the output probability:
     *                        when probability >= threshold, voice is detected.
     * @return 0 on success, or -1 if an error occurs.
     */
    TENVAD_API int ten_vad_create(ten_vad_handle_t *handle, size_t hop_size,
                                  float threshold);

    /**
     * @brief Process one audio frame for voice activity detection.
     *
     * ten_vad_create() must be called before this function, and
     * ten_vad_destroy() when done.
     *
     * @param[in]  handle             Valid VAD handle returned by
     *                                ten_vad_create().
     * @param[in]  audio_data         Pointer to an array of int16_t samples;
     *                                the buffer length must equal the hop size
     *                                specified at ten_vad_create().
     * @param[in]  audio_data_length  Size of the audio_data buffer; should be
     *                                equal to hop_size.
     * @param[out] out_probability    Pointer to a float (size 1) that receives
     *                                the voice activity probability in the
     *                                range [0.0, 1.0], where higher values
     *                                indicate higher confidence in voice
     *                                presence.
     * @param[out] out_flag           Pointer to an int (size 1) that receives
     *                                the binary voice activity decision:
     *                                0: no voice, 1: voice detected. The flag
     *                                is set to 1 when out_probability >=
     *                                threshold, and 0 otherwise.
     * @return 0 on success, or -1 if an error occurs.
     */
    TENVAD_API int ten_vad_process(ten_vad_handle_t handle,
                                   const int16_t *audio_data,
                                   size_t audio_data_length,
                                   float *out_probability, int *out_flag);

    /**
     * @brief Destroy a ten_vad instance and release its resources.
     *
     * @param[in,out] handle  Pointer to the ten_vad handle; set to NULL on
     *                        return.
     * @return 0 on success, or -1 if an error occurs.
     */
    TENVAD_API int ten_vad_destroy(ten_vad_handle_t *handle);

    /**
     * @brief Get the ten_vad library version string.
     *
     * @return The version string (e.g., "1.0.0").
     */
    TENVAD_API const char *ten_vad_get_version(void);

#ifdef __cplusplus
}
#endif