// common_audio/include/audio_util.h - src - Git at Google

 /*
  *  Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
 #define COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_

 #include <stdint.h>

 #include <algorithm>
 #include <cmath>
 #include <cstring>
 #include <limits>

 #include "api/audio/audio_view.h"
 #include "rtc_base/checks.h"

 namespace webrtc {

 // Shorthand for the numeric limits of a 16-bit signed PCM sample.
 using limits_int16 = std::numeric_limits<int16_t>;

 // TODO(tommi, peah): Move these constants to their own header, e.g.
 // `audio_constants.h`. Also consider if they should be in api/.

 // Absolute highest acceptable sample rate supported for audio processing,
 // capture and codecs. Note that some components apply a lower limit, which
 // is typically 48000 but in some cases is lower still.
 constexpr int kMaxSampleRateHz = 384000;

 // Number of samples per channel for 10ms of audio at the highest sample rate
 // (one hundredth of the samples in a second).
 constexpr size_t kMaxSamplesPerChannel10ms = kMaxSampleRateHz / 100u;

 // The conversion functions use the following naming convention:
 // S16:      int16_t [-32768, 32767]
 // Float:    float   [-1.0, 1.0]
 // FloatS16: float   [-32768.0, 32768.0]
 // Dbfs:     float   [-20.0*log10(32768), 0] = [-90.3, 0]
 // The ratio conversion functions use this naming convention:
 // Ratio:    float   (0, +inf)
 // Db:       float   (-inf, +inf)

 // Maps an S16 sample onto the Float range by scaling with 1/32768, so
 // -32768 becomes exactly -1.0 and 32767 lands just below 1.0.
 static inline float S16ToFloat(int16_t v) {
   constexpr float kInverseFullScale = 1.f / 32768.f;
   const float sample = static_cast<float>(v);
   return sample * kInverseFullScale;
 }

 // Converts a FloatS16 sample to S16. The input is saturated to
 // [-32768, 32767] and rounded to the nearest integer, with halves rounded
 // away from zero. NaN is mapped to 0: it would otherwise pass through both
 // clamps unchanged, and converting NaN to an integer type is undefined
 // behavior.
 static inline int16_t FloatS16ToS16(float v) {
   if (std::isnan(v)) {
     return 0;
   }
   v = std::min(v, 32767.f);
   v = std::max(v, -32768.f);
   // Adding +/-0.5 before the truncating cast rounds half away from zero.
   return static_cast<int16_t>(v + std::copysign(0.5f, v));
 }

 // Converts a Float sample to S16. The input is scaled by 32768, saturated to
 // [-32768, 32767] and rounded to the nearest integer, with halves rounded
 // away from zero. NaN is mapped to 0: it would otherwise pass through both
 // clamps unchanged, and converting NaN to an integer type is undefined
 // behavior.
 static inline int16_t FloatToS16(float v) {
   if (std::isnan(v)) {
     return 0;
   }
   v *= 32768.f;
   v = std::min(v, 32767.f);
   v = std::max(v, -32768.f);
   // Adding +/-0.5 before the truncating cast rounds half away from zero.
   return static_cast<int16_t>(v + std::copysign(0.5f, v));
 }

 // Converts a Float sample to FloatS16: the input is limited to [-1.0, 1.0]
 // and then multiplied by 32768.
 static inline float FloatToFloatS16(float v) {
   const float limited = std::max(std::min(v, 1.f), -1.f);
   return limited * 32768.f;
 }

 // Converts a FloatS16 sample to Float: the input is limited to
 // [-32768.0, 32768.0] and then scaled by 1/32768.
 static inline float FloatS16ToFloat(float v) {
   constexpr float kInverseFullScale = 1.f / 32768.f;
   const float limited = std::max(std::min(v, 32768.f), -32768.f);
   return limited * kInverseFullScale;
 }

 // Buffer overloads of the sample conversions. They are only declared here;
 // the definitions live outside this header. Presumably each one converts
 // `size` samples from `src` into `dest` element by element - confirm against
 // the implementation. Note that S16ToFloatS16 has no scalar counterpart in
 // this header.
 void FloatToS16(const float* src, size_t size, int16_t* dest);
 void S16ToFloat(const int16_t* src, size_t size, float* dest);
 void S16ToFloatS16(const int16_t* src, size_t size, float* dest);
 void FloatS16ToS16(const float* src, size_t size, int16_t* dest);
 void FloatToFloatS16(const float* src, size_t size, float* dest);
 void FloatS16ToFloat(const float* src, size_t size, float* dest);

 // Converts a level in decibels to a linear amplitude ratio: 10^(v / 20).
 inline float DbToRatio(float v) {
   const float exponent = v / 20.0f;
   return std::pow(10.0f, exponent);
 }

 // Converts a dBFS level to a FloatS16 amplitude. 0 dBFS corresponds to 32768,
 // the magnitude of the most negative int16_t value.
 inline float DbfsToFloatS16(float v) {
   constexpr float kFullScale = -limits_int16::min();
   const float ratio = DbToRatio(v);
   return ratio * kFullScale;
 }

 // Converts a non-negative FloatS16 amplitude to dBFS. Every amplitude of 1.0
 // or less reports the floor value kMinDbfs.
 inline float FloatS16ToDbfs(float v) {
   RTC_DCHECK_GE(v, 0);

   // Equals -20.0 * log10(-limits_int16::min()).
   constexpr float kMinDbfs = -90.30899869919436f;

   // Above the floor this is 20 * log10(v / (-limits_int16::min())).
   return (v <= 1.0f) ? kMinDbfs : 20.0f * std::log10(v) + kMinDbfs;
 }

 // Copies `num_frames` samples for each of the `num_channels` channels from
 // `src` to `dest`, skipping every channel whose source and destination
 // pointers are equal. Both arrays must hold `num_channels` channel pointers,
 // and each `dest` channel must have room for `num_frames` samples.
 // TODO: b/335805780 - Accept ArrayView.
 template <typename T>
 void CopyAudioIfNeeded(const T* const* src,
                        int num_frames,
                        int num_channels,
                        T* const* dest) {
   for (int ch = 0; ch < num_channels; ++ch) {
     const T* const from = src[ch];
     T* const to = dest[ch];
     if (from == to) {
       continue;  // Already in place; nothing to copy for this channel.
     }
     std::copy(from, from + num_frames, to);
   }
 }

 // Deinterleave audio from `interleaved` to the channel buffers pointed to
 // by `deinterleaved`. There must be sufficient space allocated in the
 // `deinterleaved` buffers (`num_channel` buffers with `samples_per_channel`
 // per buffer).
 template <typename T>
 void Deinterleave(const InterleavedView<const T>& interleaved,
                   const DeinterleavedView<T>& deinterleaved) {
   RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
   RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
                 SamplesPerChannel(deinterleaved));
   const auto num_channels = NumChannels(interleaved);
   const auto samples_per_channel = SamplesPerChannel(interleaved);
   for (size_t i = 0; i < num_channels; ++i) {
     MonoView<T> channel = deinterleaved[i];
     size_t interleaved_idx = i;
     for (size_t j = 0; j < samples_per_channel; ++j) {
       channel[j] = interleaved[interleaved_idx];
       interleaved_idx += num_channels;
     }
   }
 }

 // Merges the per-channel buffers of `deinterleaved` into `interleaved`. Both
 // views must agree on the channel count and on the number of samples per
 // channel (checked with RTC_DCHECK_EQ). Sample `frame` of channel `ch` is
 // written to interleaved index `frame * channels + ch`.
 template <typename T>
 void Interleave(const DeinterleavedView<const T>& deinterleaved,
                 const InterleavedView<T>& interleaved) {
   RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
   RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
                 SamplesPerChannel(deinterleaved));
   // Query the view dimensions once instead of on every loop iteration.
   const auto stride = deinterleaved.num_channels();
   const auto frames = deinterleaved.samples_per_channel();
   for (size_t ch = 0; ch < stride; ++ch) {
     const auto in = deinterleaved[ch];
     for (size_t frame = 0; frame < frames; ++frame) {
       interleaved[frame * stride + ch] = in[frame];
     }
   }
 }

 // Downmixes an interleaved multichannel signal to a single channel by
 // averaging all channels of each frame. The per-frame sum is accumulated in
 // `Intermediate`, divided by `num_channels`, and stored as `T` in
 // `deinterleaved`, which receives one sample per frame.
 // TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
 template <typename T, typename Intermediate>
 void DownmixInterleavedToMonoImpl(const T* interleaved,
                                   size_t num_frames,
                                   int num_channels,
                                   T* deinterleaved) {
   RTC_DCHECK_GT(num_channels, 0);
   RTC_DCHECK_GT(num_frames, 0);

   const T* const stop = interleaved + num_frames * num_channels;

   // Walk the input one frame (`num_channels` samples) at a time.
   for (const T* frame = interleaved; frame < stop; frame += num_channels) {
     Intermediate sum = frame[0];
     for (int ch = 1; ch < num_channels; ++ch) {
       sum += frame[ch];
     }
     *deinterleaved++ = sum / num_channels;
   }
 }

 // Primary template for the interleaved-to-mono downmix. It is only declared
 // in this header; no generic definition is visible here.
 // Parameters mirror DownmixInterleavedToMonoImpl: `interleaved` is the input,
 // `num_frames` and `num_channels` give its dimensions, and `deinterleaved`
 // is the output buffer.
 // TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
 template <typename T>
 void DownmixInterleavedToMono(const T* interleaved,
                               size_t num_frames,
                               int num_channels,
                               T* deinterleaved);

 // Explicit specialization for int16_t samples. Declared here so callers use
 // the specialization; its definition lives outside this header.
 // TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
 template <>
 void DownmixInterleavedToMono<int16_t>(const int16_t* interleaved,
                                        size_t num_frames,
                                        int num_channels,
                                        int16_t* deinterleaved);

 }  // namespace webrtc

 #endif  // COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
	/*
	* Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
	#define COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_

	#include <stdint.h>

	#include <algorithm>
	#include <cmath>
	#include <cstring>
	#include <limits>

	#include "api/audio/audio_view.h"
	#include "rtc_base/checks.h"

	namespace webrtc {

	// Shorthand for the numeric limits of a 16-bit signed PCM sample.
	using limits_int16 = std::numeric_limits<int16_t>;

	// TODO(tommi, peah): Move these constants to their own header, e.g.
	// `audio_constants.h`. Also consider if they should be in api/.

	// Absolute highest acceptable sample rate supported for audio processing,
	// capture and codecs. Note that some components apply a lower limit, which
	// is typically 48000 but in some cases is lower still.
	constexpr int kMaxSampleRateHz = 384000;

	// Number of samples per channel for 10ms of audio at the highest sample rate
	// (one hundredth of the samples in a second).
	constexpr size_t kMaxSamplesPerChannel10ms = kMaxSampleRateHz / 100u;

	// The conversion functions use the following naming convention:
	// S16:      int16_t [-32768, 32767]
	// Float:    float   [-1.0, 1.0]
	// FloatS16: float   [-32768.0, 32768.0]
	// Dbfs:     float   [-20.0*log10(32768), 0] = [-90.3, 0]
	// The ratio conversion functions use this naming convention:
	// Ratio:    float   (0, +inf)
	// Db:       float   (-inf, +inf)

	// Maps an S16 sample onto the Float range by scaling with 1/32768, so
	// -32768 becomes exactly -1.0 and 32767 lands just below 1.0.
	static inline float S16ToFloat(int16_t v) {
	  constexpr float kInverseFullScale = 1.f / 32768.f;
	  const float sample = static_cast<float>(v);
	  return sample * kInverseFullScale;
	}

	// Converts a FloatS16 sample to S16. The input is saturated to
	// [-32768, 32767] and rounded to the nearest integer, with halves rounded
	// away from zero. NaN is mapped to 0: it would otherwise pass through both
	// clamps unchanged, and converting NaN to an integer type is undefined
	// behavior.
	static inline int16_t FloatS16ToS16(float v) {
	  if (std::isnan(v)) {
	    return 0;
	  }
	  v = std::min(v, 32767.f);
	  v = std::max(v, -32768.f);
	  // Adding +/-0.5 before the truncating cast rounds half away from zero.
	  return static_cast<int16_t>(v + std::copysign(0.5f, v));
	}

	// Converts a Float sample to S16. The input is scaled by 32768, saturated to
	// [-32768, 32767] and rounded to the nearest integer, with halves rounded
	// away from zero. NaN is mapped to 0: it would otherwise pass through both
	// clamps unchanged, and converting NaN to an integer type is undefined
	// behavior.
	static inline int16_t FloatToS16(float v) {
	  if (std::isnan(v)) {
	    return 0;
	  }
	  v *= 32768.f;
	  v = std::min(v, 32767.f);
	  v = std::max(v, -32768.f);
	  // Adding +/-0.5 before the truncating cast rounds half away from zero.
	  return static_cast<int16_t>(v + std::copysign(0.5f, v));
	}

	// Converts a Float sample to FloatS16: the input is limited to [-1.0, 1.0]
	// and then multiplied by 32768.
	static inline float FloatToFloatS16(float v) {
	  const float limited = std::max(std::min(v, 1.f), -1.f);
	  return limited * 32768.f;
	}

	// Converts a FloatS16 sample to Float: the input is limited to
	// [-32768.0, 32768.0] and then scaled by 1/32768.
	static inline float FloatS16ToFloat(float v) {
	  constexpr float kInverseFullScale = 1.f / 32768.f;
	  const float limited = std::max(std::min(v, 32768.f), -32768.f);
	  return limited * kInverseFullScale;
	}

	// Buffer overloads of the sample conversions. They are only declared here;
	// the definitions live outside this header. Presumably each one converts
	// `size` samples from `src` into `dest` element by element - confirm against
	// the implementation. Note that S16ToFloatS16 has no scalar counterpart in
	// this header.
	void FloatToS16(const float* src, size_t size, int16_t* dest);
	void S16ToFloat(const int16_t* src, size_t size, float* dest);
	void S16ToFloatS16(const int16_t* src, size_t size, float* dest);
	void FloatS16ToS16(const float* src, size_t size, int16_t* dest);
	void FloatToFloatS16(const float* src, size_t size, float* dest);
	void FloatS16ToFloat(const float* src, size_t size, float* dest);

	// Converts a level in decibels to a linear amplitude ratio: 10^(v / 20).
	inline float DbToRatio(float v) {
	  const float exponent = v / 20.0f;
	  return std::pow(10.0f, exponent);
	}

	// Converts a dBFS level to a FloatS16 amplitude. 0 dBFS corresponds to 32768,
	// the magnitude of the most negative int16_t value.
	inline float DbfsToFloatS16(float v) {
	  constexpr float kFullScale = -limits_int16::min();
	  const float ratio = DbToRatio(v);
	  return ratio * kFullScale;
	}

	// Converts a non-negative FloatS16 amplitude to dBFS. Every amplitude of 1.0
	// or less reports the floor value kMinDbfs.
	inline float FloatS16ToDbfs(float v) {
	  RTC_DCHECK_GE(v, 0);

	  // Equals -20.0 * log10(-limits_int16::min()).
	  constexpr float kMinDbfs = -90.30899869919436f;

	  // Above the floor this is 20 * log10(v / (-limits_int16::min())).
	  return (v <= 1.0f) ? kMinDbfs : 20.0f * std::log10(v) + kMinDbfs;
	}

	// Copies `num_frames` samples for each of the `num_channels` channels from
	// `src` to `dest`, skipping every channel whose source and destination
	// pointers are equal. Both arrays must hold `num_channels` channel pointers,
	// and each `dest` channel must have room for `num_frames` samples.
	// TODO: b/335805780 - Accept ArrayView.
	template <typename T>
	void CopyAudioIfNeeded(const T* const* src,
	                       int num_frames,
	                       int num_channels,
	                       T* const* dest) {
	  for (int ch = 0; ch < num_channels; ++ch) {
	    const T* const from = src[ch];
	    T* const to = dest[ch];
	    if (from == to) {
	      continue;  // Already in place; nothing to copy for this channel.
	    }
	    std::copy(from, from + num_frames, to);
	  }
	}

	// Deinterleave audio from `interleaved` to the channel buffers pointed to
	// by `deinterleaved`. There must be sufficient space allocated in the
	// `deinterleaved` buffers (`num_channel` buffers with `samples_per_channel`
	// per buffer).
	template <typename T>
	void Deinterleave(const InterleavedView<const T>& interleaved,
	const DeinterleavedView<T>& deinterleaved) {
	RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
	RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
	SamplesPerChannel(deinterleaved));
	const auto num_channels = NumChannels(interleaved);
	const auto samples_per_channel = SamplesPerChannel(interleaved);
	for (size_t i = 0; i < num_channels; ++i) {
	MonoView<T> channel = deinterleaved[i];
	size_t interleaved_idx = i;
	for (size_t j = 0; j < samples_per_channel; ++j) {
	channel[j] = interleaved[interleaved_idx];
	interleaved_idx += num_channels;
	}
	}
	}

	// Merges the per-channel buffers of `deinterleaved` into `interleaved`. Both
	// views must agree on the channel count and on the number of samples per
	// channel (checked with RTC_DCHECK_EQ). Sample `frame` of channel `ch` is
	// written to interleaved index `frame * channels + ch`.
	template <typename T>
	void Interleave(const DeinterleavedView<const T>& deinterleaved,
	                const InterleavedView<T>& interleaved) {
	  RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
	  RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
	                SamplesPerChannel(deinterleaved));
	  // Query the view dimensions once instead of on every loop iteration.
	  const auto stride = deinterleaved.num_channels();
	  const auto frames = deinterleaved.samples_per_channel();
	  for (size_t ch = 0; ch < stride; ++ch) {
	    const auto in = deinterleaved[ch];
	    for (size_t frame = 0; frame < frames; ++frame) {
	      interleaved[frame * stride + ch] = in[frame];
	    }
	  }
	}

	// Downmixes an interleaved multichannel signal to a single channel by
	// averaging all channels of each frame. The per-frame sum is accumulated in
	// `Intermediate`, divided by `num_channels`, and stored as `T` in
	// `deinterleaved`, which receives one sample per frame.
	// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
	template <typename T, typename Intermediate>
	void DownmixInterleavedToMonoImpl(const T* interleaved,
	                                  size_t num_frames,
	                                  int num_channels,
	                                  T* deinterleaved) {
	  RTC_DCHECK_GT(num_channels, 0);
	  RTC_DCHECK_GT(num_frames, 0);

	  const T* const stop = interleaved + num_frames * num_channels;

	  // Walk the input one frame (`num_channels` samples) at a time.
	  for (const T* frame = interleaved; frame < stop; frame += num_channels) {
	    Intermediate sum = frame[0];
	    for (int ch = 1; ch < num_channels; ++ch) {
	      sum += frame[ch];
	    }
	    *deinterleaved++ = sum / num_channels;
	  }
	}

	// Primary template for the interleaved-to-mono downmix. It is only declared
	// in this header; no generic definition is visible here.
	// Parameters mirror DownmixInterleavedToMonoImpl: `interleaved` is the input,
	// `num_frames` and `num_channels` give its dimensions, and `deinterleaved`
	// is the output buffer.
	// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
	template <typename T>
	void DownmixInterleavedToMono(const T* interleaved,
	size_t num_frames,
	int num_channels,
	T* deinterleaved);

	// Explicit specialization for int16_t samples. Declared here so callers use
	// the specialization; its definition lives outside this header.
	// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
	template <>
	void DownmixInterleavedToMono<int16_t>(const int16_t* interleaved,
	size_t num_frames,
	int num_channels,
	int16_t* deinterleaved);

	} // namespace webrtc

	#endif // COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_