modules/audio_coding/test/TestVADDTX.cc - src - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_coding/test/TestVADDTX.h"

 #include <string>

 #include "absl/strings/match.h"
 #include "api/audio_codecs/audio_decoder_factory_template.h"
 #include "api/audio_codecs/audio_encoder_factory_template.h"
 #include "api/audio_codecs/ilbc/audio_decoder_ilbc.h"
 #include "api/audio_codecs/ilbc/audio_encoder_ilbc.h"
 #include "api/audio_codecs/isac/audio_decoder_isac_float.h"
 #include "api/audio_codecs/isac/audio_encoder_isac_float.h"
 #include "api/audio_codecs/opus/audio_decoder_opus.h"
 #include "api/audio_codecs/opus/audio_encoder_opus.h"
 #include "modules/audio_coding/codecs/cng/audio_encoder_cng.h"
 #include "modules/audio_coding/test/PCMFile.h"
 #include "rtc_base/strings/string_builder.h"
 #include "test/gtest.h"
 #include "test/testsupport/file_utils.h"

 namespace webrtc {

 MonitoringAudioPacketizationCallback::MonitoringAudioPacketizationCallback(
     AudioPacketizationCallback* next)
     : next_(next) {
   ResetStatistics();
 }

 int32_t MonitoringAudioPacketizationCallback::SendData(
     AudioFrameType frame_type,
     uint8_t payload_type,
     uint32_t timestamp,
     const uint8_t* payload_data,
     size_t payload_len_bytes,
     int64_t absolute_capture_timestamp_ms) {
   counter_[static_cast<int>(frame_type)]++;
   return next_->SendData(frame_type, payload_type, timestamp, payload_data,
                          payload_len_bytes, absolute_capture_timestamp_ms);
 }

 void MonitoringAudioPacketizationCallback::PrintStatistics() {
   printf("\n");
   printf("kEmptyFrame       %u\n",
          counter_[static_cast<int>(AudioFrameType::kEmptyFrame)]);
   printf("kAudioFrameSpeech %u\n",
          counter_[static_cast<int>(AudioFrameType::kAudioFrameSpeech)]);
   printf("kAudioFrameCN     %u\n",
          counter_[static_cast<int>(AudioFrameType::kAudioFrameCN)]);
   printf("\n\n");
 }

 void MonitoringAudioPacketizationCallback::ResetStatistics() {
   memset(counter_, 0, sizeof(counter_));
 }

 void MonitoringAudioPacketizationCallback::GetStatistics(uint32_t* counter) {
   memcpy(counter, counter_, sizeof(counter_));
 }

 TestVadDtx::TestVadDtx()
     : encoder_factory_(CreateAudioEncoderFactory<AudioEncoderIlbc,
                                                  AudioEncoderIsacFloat,
                                                  AudioEncoderOpus>()),
       decoder_factory_(CreateAudioDecoderFactory<AudioDecoderIlbc,
                                                  AudioDecoderIsacFloat,
                                                  AudioDecoderOpus>()),
       acm_send_(AudioCodingModule::Create(
           AudioCodingModule::Config(decoder_factory_))),
       acm_receive_(AudioCodingModule::Create(
           AudioCodingModule::Config(decoder_factory_))),
       channel_(std::make_unique<Channel>()),
       packetization_callback_(
           std::make_unique<MonitoringAudioPacketizationCallback>(
               channel_.get())) {
   EXPECT_EQ(
       0, acm_send_->RegisterTransportCallback(packetization_callback_.get()));
   channel_->RegisterReceiverACM(acm_receive_.get());
 }

 bool TestVadDtx::RegisterCodec(const SdpAudioFormat& codec_format,
                                absl::optional<Vad::Aggressiveness> vad_mode) {
   constexpr int payload_type = 17, cn_payload_type = 117;
   bool added_comfort_noise = false;

   auto encoder = encoder_factory_->MakeAudioEncoder(payload_type, codec_format,
                                                     absl::nullopt);
   if (vad_mode.has_value() &&
       !absl::EqualsIgnoreCase(codec_format.name, "opus")) {
     AudioEncoderCngConfig config;
     config.speech_encoder = std::move(encoder);
     config.num_channels = 1;
     config.payload_type = cn_payload_type;
     config.vad_mode = vad_mode.value();
     encoder = CreateComfortNoiseEncoder(std::move(config));
     added_comfort_noise = true;
   }
   channel_->SetIsStereo(encoder->NumChannels() > 1);
   acm_send_->SetEncoder(std::move(encoder));

   std::map<int, SdpAudioFormat> receive_codecs = {{payload_type, codec_format}};
   acm_receive_->SetReceiveCodecs(receive_codecs);

   return added_comfort_noise;
 }

 // Encoding a file and see if the numbers that various packets occur follow
 // the expectation.
 void TestVadDtx::Run(std::string in_filename,
                      int frequency,
                      int channels,
                      std::string out_filename,
                      bool append,
                      const int* expects) {
   packetization_callback_->ResetStatistics();

   PCMFile in_file;
   in_file.Open(in_filename, frequency, "rb");
   in_file.ReadStereo(channels > 1);
   // Set test length to 1000 ms (100 blocks of 10 ms each).
   in_file.SetNum10MsBlocksToRead(100);
   // Fast-forward both files 500 ms (50 blocks). The first second of the file is
   // silence, but we want to keep half of that to test silence periods.
   in_file.FastForward(50);

   PCMFile out_file;
   if (append) {
     out_file.Open(out_filename, kOutputFreqHz, "ab");
   } else {
     out_file.Open(out_filename, kOutputFreqHz, "wb");
   }

   uint16_t frame_size_samples = in_file.PayloadLength10Ms();
   AudioFrame audio_frame;
   while (!in_file.EndOfFile()) {
     in_file.Read10MsData(audio_frame);
     audio_frame.timestamp_ = time_stamp_;
     time_stamp_ += frame_size_samples;
     EXPECT_GE(acm_send_->Add10MsData(audio_frame), 0);
     bool muted;
     acm_receive_->PlayoutData10Ms(kOutputFreqHz, &audio_frame, &muted);
     ASSERT_FALSE(muted);
     out_file.Write10MsData(audio_frame);
   }

   in_file.Close();
   out_file.Close();

 #ifdef PRINT_STAT
   packetization_callback_->PrintStatistics();
 #endif

   uint32_t stats[3];
   packetization_callback_->GetStatistics(stats);
   packetization_callback_->ResetStatistics();

   for (const auto& st : stats) {
     int i = &st - stats;  // Calculate the current position in stats.
     switch (expects[i]) {
       case 0: {
         EXPECT_EQ(0u, st) << "stats[" << i << "] error.";
         break;
       }
       case 1: {
         EXPECT_GT(st, 0u) << "stats[" << i << "] error.";
         break;
       }
     }
   }
 }

 // Following is the implementation of TestWebRtcVadDtx.
 TestWebRtcVadDtx::TestWebRtcVadDtx() : output_file_num_(0) {}

 void TestWebRtcVadDtx::Perform() {
   RunTestCases({"ISAC", 16000, 1});
   RunTestCases({"ISAC", 32000, 1});
   RunTestCases({"ILBC", 8000, 1});
   RunTestCases({"opus", 48000, 2});
 }

 // Test various configurations on VAD/DTX.
 void TestWebRtcVadDtx::RunTestCases(const SdpAudioFormat& codec_format) {
   Test(/*new_outfile=*/true,
        /*expect_dtx_enabled=*/RegisterCodec(codec_format, absl::nullopt));

   Test(/*new_outfile=*/false,
        /*expect_dtx_enabled=*/RegisterCodec(codec_format, Vad::kVadAggressive));

   Test(/*new_outfile=*/false,
        /*expect_dtx_enabled=*/RegisterCodec(codec_format, Vad::kVadLowBitrate));

   Test(/*new_outfile=*/false, /*expect_dtx_enabled=*/RegisterCodec(
            codec_format, Vad::kVadVeryAggressive));

   Test(/*new_outfile=*/false,
        /*expect_dtx_enabled=*/RegisterCodec(codec_format, Vad::kVadNormal));
 }

 // Set the expectation and run the test.
 void TestWebRtcVadDtx::Test(bool new_outfile, bool expect_dtx_enabled) {
   int expects[] = {-1, 1, expect_dtx_enabled, 0, 0};
   if (new_outfile) {
     output_file_num_++;
   }
   rtc::StringBuilder out_filename;
   out_filename << webrtc::test::OutputPath() << "testWebRtcVadDtx_outFile_"
                << output_file_num_ << ".pcm";
   Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
       out_filename.str(), !new_outfile, expects);
 }

 // Following is the implementation of TestOpusDtx.
 void TestOpusDtx::Perform() {
   int expects[] = {0, 1, 0, 0, 0};

   // Register Opus as send codec
   std::string out_filename =
       webrtc::test::OutputPath() + "testOpusDtx_outFile_mono.pcm";
   RegisterCodec({"opus", 48000, 2}, absl::nullopt);
   acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
     (*encoder_ptr)->SetDtx(false);
   });

   Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
       out_filename, false, expects);

   acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
     (*encoder_ptr)->SetDtx(true);
   });
   expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 1;
   expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 1;
   Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
       out_filename, true, expects);

   // Register stereo Opus as send codec
   out_filename = webrtc::test::OutputPath() + "testOpusDtx_outFile_stereo.pcm";
   RegisterCodec({"opus", 48000, 2, {{"stereo", "1"}}}, absl::nullopt);
   acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
     (*encoder_ptr)->SetDtx(false);
   });
   expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 0;
   expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 0;
   Run(webrtc::test::ResourcePath("audio_coding/teststereo32kHz", "pcm"), 32000,
       2, out_filename, false, expects);

   acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
     (*encoder_ptr)->SetDtx(true);
     // The default bitrate will not generate frames recognized as CN on desktop
     // since the frames will be encoded as CELT. Set a low target bitrate to get
     // consistent behaviour across platforms.
     (*encoder_ptr)->OnReceivedTargetAudioBitrate(24000);
   });

   expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 1;
   expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 1;
   Run(webrtc::test::ResourcePath("audio_coding/teststereo32kHz", "pcm"), 32000,
       2, out_filename, true, expects);
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_coding/test/TestVADDTX.h"

	#include <string>

	#include "absl/strings/match.h"
	#include "api/audio_codecs/audio_decoder_factory_template.h"
	#include "api/audio_codecs/audio_encoder_factory_template.h"
	#include "api/audio_codecs/ilbc/audio_decoder_ilbc.h"
	#include "api/audio_codecs/ilbc/audio_encoder_ilbc.h"
	#include "api/audio_codecs/isac/audio_decoder_isac_float.h"
	#include "api/audio_codecs/isac/audio_encoder_isac_float.h"
	#include "api/audio_codecs/opus/audio_decoder_opus.h"
	#include "api/audio_codecs/opus/audio_encoder_opus.h"
	#include "modules/audio_coding/codecs/cng/audio_encoder_cng.h"
	#include "modules/audio_coding/test/PCMFile.h"
	#include "rtc_base/strings/string_builder.h"
	#include "test/gtest.h"
	#include "test/testsupport/file_utils.h"

	namespace webrtc {

	MonitoringAudioPacketizationCallback::MonitoringAudioPacketizationCallback(
	AudioPacketizationCallback* next)
	: next_(next) {
	ResetStatistics();
	}

	int32_t MonitoringAudioPacketizationCallback::SendData(
	AudioFrameType frame_type,
	uint8_t payload_type,
	uint32_t timestamp,
	const uint8_t* payload_data,
	size_t payload_len_bytes,
	int64_t absolute_capture_timestamp_ms) {
	counter_[static_cast<int>(frame_type)]++;
	return next_->SendData(frame_type, payload_type, timestamp, payload_data,
	payload_len_bytes, absolute_capture_timestamp_ms);
	}

	void MonitoringAudioPacketizationCallback::PrintStatistics() {
	printf("\n");
	printf("kEmptyFrame %u\n",
	counter_[static_cast<int>(AudioFrameType::kEmptyFrame)]);
	printf("kAudioFrameSpeech %u\n",
	counter_[static_cast<int>(AudioFrameType::kAudioFrameSpeech)]);
	printf("kAudioFrameCN %u\n",
	counter_[static_cast<int>(AudioFrameType::kAudioFrameCN)]);
	printf("\n\n");
	}

	void MonitoringAudioPacketizationCallback::ResetStatistics() {
	memset(counter_, 0, sizeof(counter_));
	}

	void MonitoringAudioPacketizationCallback::GetStatistics(uint32_t* counter) {
	memcpy(counter, counter_, sizeof(counter_));
	}

	TestVadDtx::TestVadDtx()
	: encoder_factory_(CreateAudioEncoderFactory<AudioEncoderIlbc,
	AudioEncoderIsacFloat,
	AudioEncoderOpus>()),
	decoder_factory_(CreateAudioDecoderFactory<AudioDecoderIlbc,
	AudioDecoderIsacFloat,
	AudioDecoderOpus>()),
	acm_send_(AudioCodingModule::Create(
	AudioCodingModule::Config(decoder_factory_))),
	acm_receive_(AudioCodingModule::Create(
	AudioCodingModule::Config(decoder_factory_))),
	channel_(std::make_unique<Channel>()),
	packetization_callback_(
	std::make_unique<MonitoringAudioPacketizationCallback>(
	channel_.get())) {
	EXPECT_EQ(
	0, acm_send_->RegisterTransportCallback(packetization_callback_.get()));
	channel_->RegisterReceiverACM(acm_receive_.get());
	}

	bool TestVadDtx::RegisterCodec(const SdpAudioFormat& codec_format,
	absl::optional<Vad::Aggressiveness> vad_mode) {
	constexpr int payload_type = 17, cn_payload_type = 117;
	bool added_comfort_noise = false;

	auto encoder = encoder_factory_->MakeAudioEncoder(payload_type, codec_format,
	absl::nullopt);
	if (vad_mode.has_value() &&
	!absl::EqualsIgnoreCase(codec_format.name, "opus")) {
	AudioEncoderCngConfig config;
	config.speech_encoder = std::move(encoder);
	config.num_channels = 1;
	config.payload_type = cn_payload_type;
	config.vad_mode = vad_mode.value();
	encoder = CreateComfortNoiseEncoder(std::move(config));
	added_comfort_noise = true;
	}
	channel_->SetIsStereo(encoder->NumChannels() > 1);
	acm_send_->SetEncoder(std::move(encoder));

	std::map<int, SdpAudioFormat> receive_codecs = {{payload_type, codec_format}};
	acm_receive_->SetReceiveCodecs(receive_codecs);

	return added_comfort_noise;
	}

	// Encoding a file and see if the numbers that various packets occur follow
	// the expectation.
	void TestVadDtx::Run(std::string in_filename,
	int frequency,
	int channels,
	std::string out_filename,
	bool append,
	const int* expects) {
	packetization_callback_->ResetStatistics();

	PCMFile in_file;
	in_file.Open(in_filename, frequency, "rb");
	in_file.ReadStereo(channels > 1);
	// Set test length to 1000 ms (100 blocks of 10 ms each).
	in_file.SetNum10MsBlocksToRead(100);
	// Fast-forward both files 500 ms (50 blocks). The first second of the file is
	// silence, but we want to keep half of that to test silence periods.
	in_file.FastForward(50);

	PCMFile out_file;
	if (append) {
	out_file.Open(out_filename, kOutputFreqHz, "ab");
	} else {
	out_file.Open(out_filename, kOutputFreqHz, "wb");
	}

	uint16_t frame_size_samples = in_file.PayloadLength10Ms();
	AudioFrame audio_frame;
	while (!in_file.EndOfFile()) {
	in_file.Read10MsData(audio_frame);
	audio_frame.timestamp_ = time_stamp_;
	time_stamp_ += frame_size_samples;
	EXPECT_GE(acm_send_->Add10MsData(audio_frame), 0);
	bool muted;
	acm_receive_->PlayoutData10Ms(kOutputFreqHz, &audio_frame, &muted);
	ASSERT_FALSE(muted);
	out_file.Write10MsData(audio_frame);
	}

	in_file.Close();
	out_file.Close();

	#ifdef PRINT_STAT
	packetization_callback_->PrintStatistics();
	#endif

	uint32_t stats[3];
	packetization_callback_->GetStatistics(stats);
	packetization_callback_->ResetStatistics();

	for (const auto& st : stats) {
	int i = &st - stats; // Calculate the current position in stats.
	switch (expects[i]) {
	case 0: {
	EXPECT_EQ(0u, st) << "stats[" << i << "] error.";
	break;
	}
	case 1: {
	EXPECT_GT(st, 0u) << "stats[" << i << "] error.";
	break;
	}
	}
	}
	}

	// Following is the implementation of TestWebRtcVadDtx.
	TestWebRtcVadDtx::TestWebRtcVadDtx() : output_file_num_(0) {}

	void TestWebRtcVadDtx::Perform() {
	RunTestCases({"ISAC", 16000, 1});
	RunTestCases({"ISAC", 32000, 1});
	RunTestCases({"ILBC", 8000, 1});
	RunTestCases({"opus", 48000, 2});
	}

	// Test various configurations on VAD/DTX.
	void TestWebRtcVadDtx::RunTestCases(const SdpAudioFormat& codec_format) {
	Test(/new_outfile=/true,
	/expect_dtx_enabled=/RegisterCodec(codec_format, absl::nullopt));

	Test(/new_outfile=/false,
	/expect_dtx_enabled=/RegisterCodec(codec_format, Vad::kVadAggressive));

	Test(/new_outfile=/false,
	/expect_dtx_enabled=/RegisterCodec(codec_format, Vad::kVadLowBitrate));

	Test(/new_outfile=/false, /expect_dtx_enabled=/RegisterCodec(
	codec_format, Vad::kVadVeryAggressive));

	Test(/new_outfile=/false,
	/expect_dtx_enabled=/RegisterCodec(codec_format, Vad::kVadNormal));
	}

	// Set the expectation and run the test.
	void TestWebRtcVadDtx::Test(bool new_outfile, bool expect_dtx_enabled) {
	int expects[] = {-1, 1, expect_dtx_enabled, 0, 0};
	if (new_outfile) {
	output_file_num_++;
	}
	rtc::StringBuilder out_filename;
	out_filename << webrtc::test::OutputPath() << "testWebRtcVadDtx_outFile_"
	<< output_file_num_ << ".pcm";
	Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
	out_filename.str(), !new_outfile, expects);
	}

	// Following is the implementation of TestOpusDtx.
	void TestOpusDtx::Perform() {
	int expects[] = {0, 1, 0, 0, 0};

	// Register Opus as send codec
	std::string out_filename =
	webrtc::test::OutputPath() + "testOpusDtx_outFile_mono.pcm";
	RegisterCodec({"opus", 48000, 2}, absl::nullopt);
	acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
	(*encoder_ptr)->SetDtx(false);
	});

	Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
	out_filename, false, expects);

	acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
	(*encoder_ptr)->SetDtx(true);
	});
	expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 1;
	expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 1;
	Run(webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"), 32000, 1,
	out_filename, true, expects);

	// Register stereo Opus as send codec
	out_filename = webrtc::test::OutputPath() + "testOpusDtx_outFile_stereo.pcm";
	RegisterCodec({"opus", 48000, 2, {{"stereo", "1"}}}, absl::nullopt);
	acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
	(*encoder_ptr)->SetDtx(false);
	});
	expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 0;
	expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 0;
	Run(webrtc::test::ResourcePath("audio_coding/teststereo32kHz", "pcm"), 32000,
	2, out_filename, false, expects);

	acm_send_->ModifyEncoder([](std::unique_ptr<AudioEncoder>* encoder_ptr) {
	(*encoder_ptr)->SetDtx(true);
	// The default bitrate will not generate frames recognized as CN on desktop
	// since the frames will be encoded as CELT. Set a low target bitrate to get
	// consistent behaviour across platforms.
	(*encoder_ptr)->OnReceivedTargetAudioBitrate(24000);
	});

	expects[static_cast<int>(AudioFrameType::kEmptyFrame)] = 1;
	expects[static_cast<int>(AudioFrameType::kAudioFrameCN)] = 1;
	Run(webrtc::test::ResourcePath("audio_coding/teststereo32kHz", "pcm"), 32000,
	2, out_filename, true, expects);
	}

	} // namespace webrtc