blob: 89cc209d9dd918c14d3c11b75b8519dc6e3c8a1b [file] [log] [blame]
/*
* Copyright (c) 2022 The WebRTC project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*/
#include "modules/audio_processing/agc2/speech_probability_buffer.h"
#include <algorithm>
#include "test/gtest.h"
namespace webrtc {
namespace {
constexpr float kAbsError = 0.001f;
constexpr float kActivityThreshold = 0.9f;
constexpr float kLowProbabilityThreshold = 0.2f;
constexpr int kNumAnalysisFrames = 100;
} // namespace
TEST(SpeechProbabilityBufferTest, CheckSumAfterInitialization) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
EXPECT_EQ(buffer.GetSumProbabilities(), 0.0f);
}
TEST(SpeechProbabilityBufferTest, CheckSumAfterUpdate) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
buffer.Update(0.7f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 0.7f, kAbsError);
buffer.Update(0.6f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 1.3f, kAbsError);
for (int i = 0; i < kNumAnalysisFrames - 1; ++i) {
buffer.Update(1.0f);
}
EXPECT_NEAR(buffer.GetSumProbabilities(), 99.6f, kAbsError);
}
TEST(SpeechProbabilityBufferTest, CheckSumAfterReset) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
buffer.Update(0.7f);
buffer.Update(0.6f);
buffer.Update(0.3f);
EXPECT_GT(buffer.GetSumProbabilities(), 0.0f);
buffer.Reset();
EXPECT_EQ(buffer.GetSumProbabilities(), 0.0f);
}
TEST(SpeechProbabilityBufferTest, CheckSumAfterTransientNotRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(0.0f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 9.0f, kAbsError);
buffer.Update(0.0f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 9.0f, kAbsError);
}
TEST(SpeechProbabilityBufferTest, CheckSumAfterTransientRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
buffer.Update(0.0f);
buffer.Update(0.0f);
buffer.Update(0.0f);
buffer.Update(0.0f);
buffer.Update(0.0f);
buffer.Update(0.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
buffer.Update(1.0f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 3.0f, kAbsError);
buffer.Update(0.0f);
EXPECT_NEAR(buffer.GetSumProbabilities(), 0.0f, kAbsError);
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsNotActiveAfterNoUpdates) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsActiveChangesFromFalseToTrue) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
// Add low probabilities until the buffer is full. That's not enough
// to make `IsActiveSegment()` to return true.
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(0.0f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
// Add high probabilities until `IsActiveSegment()` returns true.
for (int i = 0; i < kActivityThreshold * kNumAnalysisFrames - 1; ++i) {
buffer.Update(1.0f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsActiveChangesFromTrueToFalse) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
// Add high probabilities until the buffer is full. That's enough to
// make `IsActiveSegment()` to return true.
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(1.0f);
}
EXPECT_TRUE(buffer.IsActiveSegment());
// Add low probabilities until `IsActiveSegment()` returns false.
for (int i = 0; i < (1.0f - kActivityThreshold) * kNumAnalysisFrames - 1;
++i) {
buffer.Update(0.0f);
}
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsActiveAfterUpdatesWithHighProbabilities) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames - 1; ++i) {
buffer.Update(1.0f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsNotActiveAfterUpdatesWithLowProbabilities) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames - 1; ++i) {
buffer.Update(0.3f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.3f);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsActiveAfterBufferIsFull) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames - 1; ++i) {
buffer.Update(1.0f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsNotActiveAfterBufferIsFull) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames - 1; ++i) {
buffer.Update(0.29f);
}
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.29f);
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.29f);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsNotActiveAfterReset) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(1.0f);
}
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Reset();
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsNotActiveAfterTransientRemovedAfterFewUpdates) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
buffer.Update(0.4f);
buffer.Update(0.4f);
buffer.Update(0.0f);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsActiveAfterTransientNotRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(1.0f);
}
buffer.Update(0.7f);
buffer.Update(0.8f);
buffer.Update(0.9f);
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(0.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(0.7f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsNotActiveAfterTransientNotRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(0.1f);
}
buffer.Update(0.7f);
buffer.Update(0.8f);
buffer.Update(0.9f);
buffer.Update(1.0f);
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.0f);
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.7f);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest,
CheckSegmentIsNotActiveAfterTransientRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(0.1f);
}
buffer.Update(0.7f);
buffer.Update(0.8f);
buffer.Update(0.9f);
buffer.Update(1.0f);
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.0f);
EXPECT_FALSE(buffer.IsActiveSegment());
buffer.Update(0.7f);
EXPECT_FALSE(buffer.IsActiveSegment());
}
TEST(SpeechProbabilityBufferTest, CheckSegmentIsActiveAfterTransientRemoved) {
SpeechProbabilityBuffer buffer(kLowProbabilityThreshold);
for (int i = 0; i < kNumAnalysisFrames; ++i) {
buffer.Update(1.0f);
}
buffer.Update(0.7f);
buffer.Update(0.8f);
buffer.Update(0.9f);
buffer.Update(1.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(0.0f);
EXPECT_TRUE(buffer.IsActiveSegment());
buffer.Update(0.7f);
EXPECT_TRUE(buffer.IsActiveSegment());
}
} // namespace webrtc