1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859 |
- /*
- * Copyright (c) 2019 The WebRTC project authors. All Rights Reserved.
- *
- * Use of this source code is governed by a BSD-style license
- * that can be found in the LICENSE file in the root of the source
- * tree. An additional intellectual property rights grant can be found
- * in the file PATENTS. All contributing project authors may
- * be found in the AUTHORS file in the root of the source tree.
- */
- #ifndef MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
- #define MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
- #include <stddef.h>
- #include <memory>
- #include "modules/audio_processing/include/audio_processing.h"
- namespace webrtc {
- class AudioBuffer;
- // The voice activity detection (VAD) component analyzes the stream to
- // determine if voice is present.
- class VoiceDetection {
- public:
- // Specifies the likelihood that a frame will be declared to contain voice.
- // A higher value makes it more likely that speech will not be clipped, at
- // the expense of more noise being detected as voice.
- enum Likelihood {
- kVeryLowLikelihood,
- kLowLikelihood,
- kModerateLikelihood,
- kHighLikelihood
- };
- VoiceDetection(int sample_rate_hz, Likelihood likelihood);
- ~VoiceDetection();
- VoiceDetection(VoiceDetection&) = delete;
- VoiceDetection& operator=(VoiceDetection&) = delete;
- // Returns true if voice is detected in the current frame.
- bool ProcessCaptureAudio(AudioBuffer* audio);
- Likelihood likelihood() const { return likelihood_; }
- private:
- class Vad;
- int sample_rate_hz_;
- size_t frame_size_samples_;
- Likelihood likelihood_;
- std::unique_ptr<Vad> vad_;
- };
- } // namespace webrtc
- #endif // MODULES_AUDIO_PROCESSING_VOICE_DETECTION_H_
|