/* * Copyright (c) 2019 The WebRTC project authors. All Rights Reserved. * * Use of this source code is governed by a BSD-style license * that can be found in the LICENSE file in the root of the source * tree. An additional intellectual property rights grant can be found * in the file PATENTS. All contributing project authors may * be found in the AUTHORS file in the root of the source tree. */ #ifndef MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_ #define MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_ #include #include #include "modules/audio_processing/include/audio_processing.h" namespace webrtc { class AudioBuffer; // The voice activity detection (VAD) component analyzes the stream to // determine if voice is present. class VoiceDetection { public: // Specifies the likelihood that a frame will be declared to contain voice. // A higher value makes it more likely that speech will not be clipped, at // the expense of more noise being detected as voice. enum Likelihood { kVeryLowLikelihood, kLowLikelihood, kModerateLikelihood, kHighLikelihood }; VoiceDetection(int sample_rate_hz, Likelihood likelihood); ~VoiceDetection(); VoiceDetection(VoiceDetection&) = delete; VoiceDetection& operator=(VoiceDetection&) = delete; // Returns true if voice is detected in the current frame. bool ProcessCaptureAudio(AudioBuffer* audio); Likelihood likelihood() const { return likelihood_; } private: class Vad; int sample_rate_hz_; size_t frame_size_samples_; Likelihood likelihood_; std::unique_ptr vad_; }; } // namespace webrtc #endif // MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_