| /* |
| * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #include "modules/audio_coding/test/opus_test.h" |
| |
| #include <string> |
| |
| #include "api/audio_codecs/builtin_audio_decoder_factory.h" |
| #include "api/environment/environment_factory.h" |
| #include "api/neteq/default_neteq_factory.h" |
| #include "modules/audio_coding/codecs/opus/opus_interface.h" |
| #include "modules/audio_coding/include/audio_coding_module_typedefs.h" |
| #include "modules/audio_coding/test/TestStereo.h" |
| #include "test/gtest.h" |
| #include "test/testsupport/file_utils.h" |
| |
| namespace webrtc { |
| |
| OpusTest::OpusTest() |
| : neteq_(DefaultNetEqFactory().Create(CreateEnvironment(), |
| NetEq::Config(), |
| CreateBuiltinAudioDecoderFactory())), |
| channel_a2b_(NULL), |
| counter_(0), |
| payload_type_(255), |
| rtp_timestamp_(0) {} |
| |
| OpusTest::~OpusTest() { |
| if (channel_a2b_ != NULL) { |
| delete channel_a2b_; |
| channel_a2b_ = NULL; |
| } |
| if (opus_mono_encoder_ != NULL) { |
| WebRtcOpus_EncoderFree(opus_mono_encoder_); |
| opus_mono_encoder_ = NULL; |
| } |
| if (opus_stereo_encoder_ != NULL) { |
| WebRtcOpus_EncoderFree(opus_stereo_encoder_); |
| opus_stereo_encoder_ = NULL; |
| } |
| if (opus_mono_decoder_ != NULL) { |
| WebRtcOpus_DecoderFree(opus_mono_decoder_); |
| opus_mono_decoder_ = NULL; |
| } |
| if (opus_stereo_decoder_ != NULL) { |
| WebRtcOpus_DecoderFree(opus_stereo_decoder_); |
| opus_stereo_decoder_ = NULL; |
| } |
| } |
| |
| void OpusTest::Perform() { |
| #ifndef WEBRTC_CODEC_OPUS |
| // Opus isn't defined, exit. |
| return; |
| #else |
| uint16_t frequency_hz; |
| size_t audio_channels; |
| int16_t test_cntr = 0; |
| |
| // Open both mono and stereo test files in 32 kHz. |
| const std::string file_name_stereo = |
| webrtc::test::ResourcePath("audio_coding/teststereo32kHz", "pcm"); |
| const std::string file_name_mono = |
| webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"); |
| frequency_hz = 32000; |
| in_file_stereo_.Open(file_name_stereo, frequency_hz, "rb"); |
| in_file_stereo_.ReadStereo(true); |
| in_file_mono_.Open(file_name_mono, frequency_hz, "rb"); |
| in_file_mono_.ReadStereo(false); |
| |
| // Create Opus encoders for mono and stereo. |
| ASSERT_GT(WebRtcOpus_EncoderCreate(&opus_mono_encoder_, 1, 0, 48000), -1); |
| ASSERT_GT(WebRtcOpus_EncoderCreate(&opus_stereo_encoder_, 2, 1, 48000), -1); |
| |
| // Create Opus decoders for mono and stereo for stand-alone testing of Opus. |
| ASSERT_GT(WebRtcOpus_DecoderCreate(&opus_mono_decoder_, 1, 48000), -1); |
| ASSERT_GT(WebRtcOpus_DecoderCreate(&opus_stereo_decoder_, 2, 48000), -1); |
| WebRtcOpus_DecoderInit(opus_mono_decoder_); |
| WebRtcOpus_DecoderInit(opus_stereo_decoder_); |
| |
| ASSERT_TRUE(neteq_.get() != NULL); |
| neteq_->FlushBuffers(); |
| |
| // Register Opus stereo as receiving codec. |
| constexpr int kOpusPayloadType = 120; |
| const SdpAudioFormat kOpusFormatStereo("opus", 48000, 2, {{"stereo", "1"}}); |
| payload_type_ = kOpusPayloadType; |
| neteq_->SetCodecs({{kOpusPayloadType, kOpusFormatStereo}}); |
| |
| // Create and connect the channel. |
| channel_a2b_ = new TestPackStereo; |
| channel_a2b_->RegisterReceiverNetEq(neteq_.get()); |
| |
| // |
| // Test Stereo. |
| // |
| |
| channel_a2b_->set_codec_mode(kStereo); |
| audio_channels = 2; |
| test_cntr++; |
| OpenOutFile(test_cntr); |
| |
| // Run Opus with 2.5 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 120); |
| |
| // Run Opus with 5 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 240); |
| |
| // Run Opus with 10 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 480); |
| |
| // Run Opus with 20 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 960); |
| |
| // Run Opus with 40 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 1920); |
| |
| // Run Opus with 60 ms frame size. |
| Run(channel_a2b_, audio_channels, 64000, 2880); |
| |
| out_file_.Close(); |
| out_file_standalone_.Close(); |
| |
| // |
| // Test Opus stereo with packet-losses. |
| // |
| |
| test_cntr++; |
| OpenOutFile(test_cntr); |
| |
| // Run Opus with 20 ms frame size, 1% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 1); |
| |
| // Run Opus with 20 ms frame size, 5% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 5); |
| |
| // Run Opus with 20 ms frame size, 10% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 10); |
| |
| out_file_.Close(); |
| out_file_standalone_.Close(); |
| |
| // |
| // Test Mono. |
| // |
| channel_a2b_->set_codec_mode(kMono); |
| audio_channels = 1; |
| test_cntr++; |
| OpenOutFile(test_cntr); |
| |
| // Register Opus mono as receiving codec. |
| const SdpAudioFormat kOpusFormatMono("opus", 48000, 2); |
| neteq_->SetCodecs({{kOpusPayloadType, kOpusFormatMono}}); |
| |
| // Run Opus with 2.5 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 120); |
| |
| // Run Opus with 5 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 240); |
| |
| // Run Opus with 10 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 480); |
| |
| // Run Opus with 20 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 960); |
| |
| // Run Opus with 40 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 1920); |
| |
| // Run Opus with 60 ms frame size. |
| Run(channel_a2b_, audio_channels, 32000, 2880); |
| |
| out_file_.Close(); |
| out_file_standalone_.Close(); |
| |
| // |
| // Test Opus mono with packet-losses. |
| // |
| test_cntr++; |
| OpenOutFile(test_cntr); |
| |
| // Run Opus with 20 ms frame size, 1% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 1); |
| |
| // Run Opus with 20 ms frame size, 5% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 5); |
| |
| // Run Opus with 20 ms frame size, 10% packet loss. |
| Run(channel_a2b_, audio_channels, 64000, 960, 10); |
| |
| // Close the files. |
| in_file_stereo_.Close(); |
| in_file_mono_.Close(); |
| out_file_.Close(); |
| out_file_standalone_.Close(); |
| #endif |
| } |
| |
| void OpusTest::Run(TestPackStereo* channel, |
| size_t channels, |
| int bitrate, |
| size_t frame_length, |
| int percent_loss) { |
| AudioFrame audio_frame; |
| int32_t out_freq_hz_b = out_file_.SamplingFrequency(); |
| const size_t kBufferSizeSamples = 480 * 12 * 2; // 120 ms stereo audio. |
| int16_t audio[kBufferSizeSamples]; |
| int16_t out_audio[kBufferSizeSamples]; |
| int16_t audio_type; |
| size_t written_samples = 0; |
| size_t read_samples = 0; |
| size_t decoded_samples = 0; |
| bool first_packet = true; |
| uint32_t start_time_stamp = 0; |
| |
| channel->reset_payload_size(); |
| counter_ = 0; |
| |
| // Set encoder rate. |
| EXPECT_EQ(0, WebRtcOpus_SetBitRate(opus_mono_encoder_, bitrate)); |
| EXPECT_EQ(0, WebRtcOpus_SetBitRate(opus_stereo_encoder_, bitrate)); |
| |
| #if defined(WEBRTC_ANDROID) || defined(WEBRTC_IOS) || defined(WEBRTC_ARCH_ARM) |
| // If we are on Android, iOS and/or ARM, use a lower complexity setting as |
| // default. |
| const int kOpusComplexity5 = 5; |
| EXPECT_EQ(0, WebRtcOpus_SetComplexity(opus_mono_encoder_, kOpusComplexity5)); |
| EXPECT_EQ(0, |
| WebRtcOpus_SetComplexity(opus_stereo_encoder_, kOpusComplexity5)); |
| #endif |
| |
| // Fast-forward 1 second (100 blocks) since the files start with silence. |
| in_file_stereo_.FastForward(100); |
| in_file_mono_.FastForward(100); |
| |
| // Limit the runtime to 1000 blocks of 10 ms each. |
| for (size_t audio_length = 0; audio_length < 1000; audio_length += 10) { |
| bool lost_packet = false; |
| |
| // Get 10 msec of audio. |
| if (channels == 1) { |
| if (in_file_mono_.EndOfFile()) { |
| break; |
| } |
| in_file_mono_.Read10MsData(audio_frame); |
| } else { |
| if (in_file_stereo_.EndOfFile()) { |
| break; |
| } |
| in_file_stereo_.Read10MsData(audio_frame); |
| } |
| |
| // If input audio is sampled at 32 kHz, resampling to 48 kHz is required. |
| EXPECT_EQ(480, resampler_.Resample10Msec( |
| audio_frame.data(), audio_frame.sample_rate_hz_, 48000, |
| channels, kBufferSizeSamples - written_samples, |
| &audio[written_samples])); |
| written_samples += 480 * channels; |
| |
| // Sometimes we need to loop over the audio vector to produce the right |
| // number of packets. |
| size_t loop_encode = |
| (written_samples - read_samples) / (channels * frame_length); |
| |
| if (loop_encode > 0) { |
| const size_t kMaxBytes = 1000; // Maximum number of bytes for one packet. |
| size_t bitstream_len_byte; |
| uint8_t bitstream[kMaxBytes]; |
| for (size_t i = 0; i < loop_encode; i++) { |
| int bitstream_len_byte_int = WebRtcOpus_Encode( |
| (channels == 1) ? opus_mono_encoder_ : opus_stereo_encoder_, |
| &audio[read_samples], frame_length, kMaxBytes, bitstream); |
| ASSERT_GE(bitstream_len_byte_int, 0); |
| bitstream_len_byte = static_cast<size_t>(bitstream_len_byte_int); |
| |
| // Simulate packet loss by setting `packet_loss_` to "true" in |
| // `percent_loss` percent of the loops. |
| // TODO(tlegrand): Move handling of loss simulation to TestPackStereo. |
| if (percent_loss > 0) { |
| if (counter_ == floor((100 / percent_loss) + 0.5)) { |
| counter_ = 0; |
| lost_packet = true; |
| channel->set_lost_packet(true); |
| } else { |
| lost_packet = false; |
| channel->set_lost_packet(false); |
| } |
| counter_++; |
| } |
| |
| // Run stand-alone Opus decoder, or decode PLC. |
| if (channels == 1) { |
| if (!lost_packet) { |
| decoded_samples += WebRtcOpus_Decode( |
| opus_mono_decoder_, bitstream, bitstream_len_byte, |
| &out_audio[decoded_samples * channels], &audio_type); |
| } else { |
| // Call decoder PLC. |
| constexpr int kPlcDurationMs = 10; |
| constexpr int kPlcSamples = 48 * kPlcDurationMs; |
| size_t total_plc_samples = 0; |
| while (total_plc_samples < frame_length) { |
| int ret = WebRtcOpus_Decode( |
| opus_mono_decoder_, NULL, 0, |
| &out_audio[decoded_samples * channels], &audio_type); |
| EXPECT_EQ(ret, kPlcSamples); |
| decoded_samples += ret; |
| total_plc_samples += ret; |
| } |
| EXPECT_EQ(total_plc_samples, frame_length); |
| } |
| } else { |
| if (!lost_packet) { |
| decoded_samples += WebRtcOpus_Decode( |
| opus_stereo_decoder_, bitstream, bitstream_len_byte, |
| &out_audio[decoded_samples * channels], &audio_type); |
| } else { |
| // Call decoder PLC. |
| constexpr int kPlcDurationMs = 10; |
| constexpr int kPlcSamples = 48 * kPlcDurationMs; |
| size_t total_plc_samples = 0; |
| while (total_plc_samples < frame_length) { |
| int ret = WebRtcOpus_Decode( |
| opus_stereo_decoder_, NULL, 0, |
| &out_audio[decoded_samples * channels], &audio_type); |
| EXPECT_EQ(ret, kPlcSamples); |
| decoded_samples += ret; |
| total_plc_samples += ret; |
| } |
| EXPECT_EQ(total_plc_samples, frame_length); |
| } |
| } |
| |
| // Send data to the channel. "channel" will handle the loss simulation. |
| channel->SendData(AudioFrameType::kAudioFrameSpeech, payload_type_, |
| rtp_timestamp_, bitstream, bitstream_len_byte, 0); |
| if (first_packet) { |
| first_packet = false; |
| start_time_stamp = rtp_timestamp_; |
| } |
| rtp_timestamp_ += static_cast<uint32_t>(frame_length); |
| read_samples += frame_length * channels; |
| } |
| if (read_samples == written_samples) { |
| read_samples = 0; |
| written_samples = 0; |
| } |
| } |
| |
| // Run received side of ACM. |
| bool muted; |
| ASSERT_EQ(NetEq::kOK, neteq_->GetAudio(&audio_frame, &muted)); |
| ASSERT_TRUE(resampler_helper_.MaybeResample(out_freq_hz_b, &audio_frame)); |
| |
| // Write output speech to file. |
| out_file_.Write10MsData( |
| audio_frame.data(), |
| audio_frame.samples_per_channel_ * audio_frame.num_channels_); |
| |
| // Write stand-alone speech to file. |
| out_file_standalone_.Write10MsData(out_audio, decoded_samples * channels); |
| |
| if (audio_frame.timestamp_ > start_time_stamp) { |
| // Number of channels should be the same for both stand-alone and |
| // ACM-decoding. |
| EXPECT_EQ(audio_frame.num_channels_, channels); |
| } |
| |
| decoded_samples = 0; |
| } |
| |
| if (in_file_mono_.EndOfFile()) { |
| in_file_mono_.Rewind(); |
| } |
| if (in_file_stereo_.EndOfFile()) { |
| in_file_stereo_.Rewind(); |
| } |
| // Reset in case we ended with a lost packet. |
| channel->set_lost_packet(false); |
| } |
| |
| void OpusTest::OpenOutFile(int test_number) { |
| std::string file_name; |
| std::stringstream file_stream; |
| file_stream << webrtc::test::OutputPath() << "opustest_out_" << test_number |
| << ".pcm"; |
| file_name = file_stream.str(); |
| out_file_.Open(file_name, 48000, "wb"); |
| file_stream.str(""); |
| file_name = file_stream.str(); |
| file_stream << webrtc::test::OutputPath() << "opusstandalone_out_" |
| << test_number << ".pcm"; |
| file_name = file_stream.str(); |
| out_file_standalone_.Open(file_name, 48000, "wb"); |
| } |
| |
| } // namespace webrtc |