| /* |
| * Copyright (c) 2016 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| #include <vector> |
| |
| #include "testing/gtest/include/gtest/gtest.h" |
| #include "webrtc/base/array_view.h" |
| #include "webrtc/modules/audio_processing/audio_buffer.h" |
| #include "webrtc/modules/audio_processing/voice_detection_impl.h" |
| #include "webrtc/modules/audio_processing/test/audio_buffer_tools.h" |
| #include "webrtc/modules/audio_processing/test/bitexactness_tools.h" |
| |
| namespace webrtc { |
| namespace { |
| |
// Number of capture frames pushed through the detector in each test run.
constexpr int kNumFramesToProcess = 1000;
| |
| // Process one frame of data and produce the output. |
| void ProcessOneFrame(int sample_rate_hz, |
| AudioBuffer* audio_buffer, |
| VoiceDetectionImpl* voice_detection) { |
| if (sample_rate_hz > AudioProcessing::kSampleRate16kHz) { |
| audio_buffer->SplitIntoFrequencyBands(); |
| } |
| |
| voice_detection->ProcessCaptureAudio(audio_buffer); |
| } |
| |
| // Processes a specified amount of frames, verifies the results and reports |
| // any errors. |
| void RunBitexactnessTest(int sample_rate_hz, |
| size_t num_channels, |
| int frame_size_ms_reference, |
| bool stream_has_voice_reference, |
| VoiceDetection::Likelihood likelihood_reference) { |
| rtc::CriticalSection crit_capture; |
| VoiceDetectionImpl voice_detection(&crit_capture); |
| voice_detection.Initialize(sample_rate_hz > 16000 ? 16000 : sample_rate_hz); |
| voice_detection.Enable(true); |
| |
| int samples_per_channel = rtc::CheckedDivExact(sample_rate_hz, 100); |
| const StreamConfig capture_config(sample_rate_hz, num_channels, false); |
| AudioBuffer capture_buffer( |
| capture_config.num_frames(), capture_config.num_channels(), |
| capture_config.num_frames(), capture_config.num_channels(), |
| capture_config.num_frames()); |
| test::InputAudioFile capture_file( |
| test::GetApmCaptureTestVectorFileName(sample_rate_hz)); |
| std::vector<float> capture_input(samples_per_channel * num_channels); |
| for (int frame_no = 0; frame_no < kNumFramesToProcess; ++frame_no) { |
| ReadFloatSamplesFromStereoFile(samples_per_channel, num_channels, |
| &capture_file, capture_input); |
| |
| test::CopyVectorToAudioBuffer(capture_config, capture_input, |
| &capture_buffer); |
| |
| ProcessOneFrame(sample_rate_hz, &capture_buffer, &voice_detection); |
| } |
| |
| int frame_size_ms = voice_detection.frame_size_ms(); |
| bool stream_has_voice = voice_detection.stream_has_voice(); |
| VoiceDetection::Likelihood likelihood = voice_detection.likelihood(); |
| |
| // Compare the outputs to the references. |
| EXPECT_EQ(frame_size_ms_reference, frame_size_ms); |
| EXPECT_EQ(stream_has_voice_reference, stream_has_voice); |
| EXPECT_EQ(likelihood_reference, likelihood); |
| } |
| |
| const int kFrameSizeMsReference = 10; |
| const bool kStreamHasVoiceReference = true; |
| const VoiceDetection::Likelihood kLikelihoodReference = |
| VoiceDetection::kLowLikelihood; |
| |
| } // namespace |
| |
| TEST(VoiceDetectionBitExactnessTest, Mono8kHz) { |
| RunBitexactnessTest(8000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Mono16kHz) { |
| RunBitexactnessTest(16000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Mono32kHz) { |
| RunBitexactnessTest(32000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Mono48kHz) { |
| RunBitexactnessTest(48000, 1, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Stereo8kHz) { |
| RunBitexactnessTest(8000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Stereo16kHz) { |
| RunBitexactnessTest(16000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Stereo32kHz) { |
| RunBitexactnessTest(32000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| TEST(VoiceDetectionBitExactnessTest, Stereo48kHz) { |
| RunBitexactnessTest(48000, 2, kFrameSizeMsReference, kStreamHasVoiceReference, |
| kLikelihoodReference); |
| } |
| |
| } // namespace webrtc |