Source code
Revision control
Copy as Markdown
Other Tools
/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
/* vim: set ts=2 et sw=2 tw=80: */
/* This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this
 * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
#ifndef MOZILLA_AUDIOSAMPLEFORMAT_H_
#define MOZILLA_AUDIOSAMPLEFORMAT_H_
#include "mozilla/Assertions.h"
#include "mozilla/PodOperations.h"
#include <algorithm>
#include <cmath>
#include <cstdint>
#include <limits>
#include <type_traits>
namespace mozilla {
/**
 * Sample formats that MediaTracks and media elements can carry.
 *
 * AudioStream works with exactly one of them, fixed at compile time through
 * AUDIO_OUTPUT_FORMAT (FLOAT32 in this file). Media decoders produce that
 * format only; queued AudioData always uses that format.
 */
enum AudioSampleFormat {
  // No sample data: the concrete format is picked later.
  AUDIO_FORMAT_SILENCE = 0,
  // Signed 16-bit integer samples in native byte order.
  AUDIO_FORMAT_S16 = 1,
  // 32-bit floating-point samples.
  AUDIO_FORMAT_FLOAT32 = 2,
  // The format AudioStream uses for output.
  AUDIO_OUTPUT_FORMAT = AUDIO_FORMAT_FLOAT32
};
// Upper bound, in bytes, on the storage needed for a single audio sample:
// the size of a float.
enum {
  MAX_AUDIO_SAMPLE_SIZE = sizeof(float)
};
// Compile-time map from an AudioSampleFormat value to the C++ type that
// stores one sample in that format. The primary template is only declared,
// so using a format without a specialization below fails to compile.
template <AudioSampleFormat Format>
class AudioSampleTraits;

// AUDIO_FORMAT_S16 samples are stored as int16_t.
template <>
class AudioSampleTraits<AUDIO_FORMAT_S16> {
 public:
  using Type = int16_t;
};

// AUDIO_FORMAT_FLOAT32 samples are stored as float.
template <>
class AudioSampleTraits<AUDIO_FORMAT_FLOAT32> {
 public:
  using Type = float;
};

// Sample type that corresponds to AUDIO_OUTPUT_FORMAT.
using AudioDataValue = AudioSampleTraits<AUDIO_OUTPUT_FORMAT>::Type;
// Reverse of AudioSampleTraits: maps a C++ sample type to its
// AudioSampleFormat value, exposed as the static member `Format`. The primary
// template is only declared, so unsupported types fail to compile.
template <typename T>
class AudioSampleTypeToFormat;

// short samples are AUDIO_FORMAT_S16.
template <>
class AudioSampleTypeToFormat<short> {
 public:
  static const AudioSampleFormat Format = AUDIO_FORMAT_S16;
};

// float samples are AUDIO_FORMAT_FLOAT32.
template <>
class AudioSampleTypeToFormat<float> {
 public:
  static const AudioSampleFormat Format = AUDIO_FORMAT_FLOAT32;
};
// std::numeric_limits<T>::max() converted to float. The conversion rounds
// when float cannot hold the value exactly (e.g. the int32_t maximum).
template <typename T>
constexpr float MaxAsFloat() {
  using Limits = std::numeric_limits<T>;
  return static_cast<float>(Limits::max());
}
// std::numeric_limits<T>::lowest() converted to float.
template <typename T>
constexpr float LowestAsFloat() {
  using Limits = std::numeric_limits<T>;
  return static_cast<float>(Limits::lowest());
}
// The maximum value for an audio sample of type T: 1.0f for float, and
// std::numeric_limits<T>::max() for every other type. For a signed integer
// T, the absolute value of this number is smaller (by exactly 1) than that of
// Min<T>().
template <typename T>
constexpr T Max() {
  if constexpr (std::is_same_v<T, float>) {
    return 1.0f;
  } else {
    return std::numeric_limits<T>::max();
  }
}

// The minimum value for an audio sample of type T: -1.0f for float, and
// std::numeric_limits<T>::lowest() for every other type. For a signed integer
// T, the absolute value of this number is greater (by exactly 1) than that of
// Max<T>().
template <typename T>
constexpr T Min() {
  if constexpr (std::is_same_v<T, float>) {
    return -1.0f;
  } else {
    return std::numeric_limits<T>::lowest();
  }
}
// The bias value is the middle of the sample range: in linear PCM audio, a
// signal whose samples all equal the bias value is silent. It is 128 for
// uint8_t samples and 0 for every other sample type.
template <typename T>
constexpr T Bias() {
  if constexpr (std::is_same_v<T, uint8_t>) {
    return 128;
  } else {
    return 0;
  }
}
// Restrict a floating point audio sample to its nominal range [-1.0, 1.0].
// This is destructive, and is only used here for avoiding overflow in some
// edge cases, so it's not going to be generally audible.
inline float Clip(float aValue) {
  if (aValue < -1.0f) {
    return -1.0f;
  }
  if (1.0f < aValue) {
    return 1.0f;
  }
  return aValue;
}
// Converts a float sample, nominally in [-1.0, 1.0], to sample type T.
// T must be float, uint8_t, int16_t or int32_t; any other type is rejected at
// compile time.
//
// - float: the value is returned unchanged (no clipping).
// - integer types: the value is scaled to the range of T and saturated, so
//   inputs outside the nominal range (infinities included) clip rather than
//   wrap. NaN is converted as if it were 0.0f, i.e. silence.
template <typename T>
T FloatToAudioSample(float aValue) {
  static_assert(std::is_same_v<float, T> || std::is_same_v<uint8_t, T> ||
                    std::is_same_v<int16_t, T> || std::is_same_v<int32_t, T>,
                "FloatToAudioSample: unsupported destination sample type");
  if constexpr (std::is_same_v<float, T>) {
    return aValue;
  } else {
    // NaN compares false against every bound, so it would pass through the
    // clamping and range checks below untouched and reach a float -> integer
    // cast, which is undefined behaviour. Treat it as silence instead.
    const float sample = std::isnan(aValue) ? 0.0f : aValue;
    if constexpr (std::is_same_v<uint8_t, T>) {
      // Shift [-1, 1] to [0, 2], scale to [0, 256], saturate at 255.
      return static_cast<T>(std::clamp((sample + 1.0f) * 128.f,
                                       LowestAsFloat<T>(), MaxAsFloat<T>()));
    } else if constexpr (std::is_same_v<int16_t, T>) {
      // Scaling by 2^15 and saturating produces correct results across the
      // range.
      return static_cast<T>(std::clamp(sample * -LowestAsFloat<T>(),
                                       LowestAsFloat<T>(), MaxAsFloat<T>()));
    } else {
      // int32_t. We need to handle this differently because of rounding
      // between INT32_MAX and float 32-bits, to maximise precision.
      if (sample >= 0.) {
        // If the input sample is greater OR EQUAL to 1.0, then clip and
        // return the max value.
        if (sample >= 1.0) {
          return std::numeric_limits<T>::max();
        }
        // Otherwise do the multiplication in double and map to the positive
        // range: float 32-bits cannot represent INT32_MAX (but can represent
        // INT32_MIN).
        constexpr double magnitudePos = std::numeric_limits<int32_t>::max();
        return static_cast<int32_t>(sample * magnitudePos);
      }
      // Similarly for the negative range.
      if (sample <= -1.0) {
        return std::numeric_limits<T>::lowest();
      }
      constexpr double magnitudeNegative =
          -1.0 * std::numeric_limits<int32_t>::lowest();
      return static_cast<int32_t>(sample * magnitudeNegative);
    }
  }
}
template <typename T>
T UInt8bitToAudioSample(uint8_t aValue) {
if constexpr (std::is_same_v<uint8_t, T>) {
return aValue;
} else if constexpr (std::is_same_v<int16_t, T>) {
return (static_cast<int16_t>(aValue) << 8) - (1 << 15);
} else if constexpr (std::is_same_v<int32_t, T>) {
return (static_cast<int32_t>(aValue) << 24) - (1 << 31);
} else if constexpr (std::is_same_v<float, T>) {
float biased = static_cast<float>(aValue) - Bias<uint8_t>();
if (aValue >= Bias<uint8_t>()) {
return Clip(biased / MaxAsFloat<int8_t>());
}
return Clip(biased / -LowestAsFloat<int8_t>());
}
}
// Converts a signed 16-bit sample to sample type T, where T is uint8_t,
// int16_t, int32_t or float.
//
// - uint8_t: keeps the most significant byte and re-centres it on 128.
// - int32_t: moves the sample into the upper 16 bits.
// - float: maps -32768 to -1.0, 0 to 0.0 and 32767 to 1.0.
template <typename T>
T Int16ToAudioSample(int16_t aValue) {
  if constexpr (std::is_same_v<uint8_t, T>) {
    // (aValue >> 8) is in [-128, 127], so adding 128 lands in [0, 255].
    return static_cast<uint8_t>((aValue >> 8) + 128);
  } else if constexpr (std::is_same_v<int16_t, T>) {
    return aValue;
  } else if constexpr (std::is_same_v<int32_t, T>) {
    // Multiply instead of left-shifting: shifting a negative value left is
    // undefined behaviour before C++20. The product always fits in int32_t.
    return static_cast<int32_t>(aValue) * (1 << 16);
  } else if constexpr (std::is_same_v<float, T>) {
    // Positive and negative halves have different magnitudes (32767 vs
    // 32768); normalize each by its own extreme.
    if (aValue >= 0) {
      return Clip(static_cast<float>(aValue) / MaxAsFloat<int16_t>());
    }
    return Clip(static_cast<float>(aValue) / -LowestAsFloat<int16_t>());
  }
}
// Converts a signed 24-bit sample to sample type T, where T is uint8_t,
// int16_t, int32_t or float. 24-bits audio samples are stored in 32-bits
// variables; aValue is expected to lie in [-2^23, 2^23 - 1].
//
// - uint8_t: keeps the most significant byte and re-centres it on 128.
// - int16_t: keeps the 16 most significant bits.
// - int32_t: moves the sample into the upper 24 bits.
// - float: maps -2^23 to -1.0, 0 to 0.0 and 2^23 - 1 to 1.0, clipping
//   anything outside that range.
template <typename T>
T Int24ToAudioSample(int32_t aValue) {
  if constexpr (std::is_same_v<uint8_t, T>) {
    return static_cast<uint8_t>((aValue >> 16) + 128);
  } else if constexpr (std::is_same_v<int16_t, T>) {
    return static_cast<int16_t>(aValue >> 8);
  } else if constexpr (std::is_same_v<int32_t, T>) {
    // Multiply instead of left-shifting: shifting a negative value left is
    // undefined behaviour before C++20. In-range 24-bit input cannot
    // overflow.
    return aValue * (1 << 8);
  } else if constexpr (std::is_same_v<float, T>) {
    constexpr int32_t kMin24 = -(1 << 23);
    constexpr int32_t kMax24 = (1 << 23) - 1;
    // Positive and negative halves have different magnitudes; normalize each
    // by its own extreme.
    if (aValue >= 0) {
      return Clip(static_cast<float>(aValue) / static_cast<float>(kMax24));
    }
    return Clip(static_cast<float>(aValue) / -static_cast<float>(kMin24));
  }
}
template <typename T>
T Int32ToAudioSample(int32_t aValue) {
if constexpr (std::is_same_v<uint8_t, T>) {
return static_cast<uint8_t>(aValue >> 24) + 128;
} else if constexpr (std::is_same_v<int16_t, T>) {
return aValue >> 16;
} else if constexpr (std::is_same_v<int32_t, T>) {
return aValue;
} else if constexpr (std::is_same_v<float, T>) {
if (aValue >= 0) {
return Clip(static_cast<float>(aValue) / MaxAsFloat<int32_t>());
}
return Clip(static_cast<float>(aValue) / -LowestAsFloat<int32_t>());
}
}
// Converts one sample from type S to type D, picking the conversion routine
// from the source type. Identical types are returned as-is.
// This does not handle 24-bits audio, call Int24ToAudioSample explicitly when
// needed.
template <typename D, typename S>
inline D ConvertAudioSample(const S& aSource) {
  if constexpr (std::is_same_v<S, D>) {
    return aSource;
  } else if constexpr (std::is_same_v<S, float>) {
    return FloatToAudioSample<D>(aSource);
  } else if constexpr (std::is_same_v<S, int32_t>) {
    return Int32ToAudioSample<D>(aSource);
  } else if constexpr (std::is_same_v<S, int16_t>) {
    return Int16ToAudioSample<D>(aSource);
  } else if constexpr (std::is_same_v<S, uint8_t>) {
    return UInt8bitToAudioSample<D>(aSource);
  }
}
// Sample buffer conversion: writes aCount samples to aTo, each converted
// from the corresponding sample in aFrom. When both buffers hold the same
// type the samples are copied with PodCopy.
template <typename From, typename To>
inline void ConvertAudioSamples(const From* aFrom, To* aTo, int aCount) {
  if constexpr (std::is_same_v<From, To>) {
    PodCopy(aTo, aFrom, aCount);
  } else {
    int index = 0;
    while (index < aCount) {
      aTo[index] = ConvertAudioSample<To>(aFrom[index]);
      ++index;
    }
  }
}
// Sample buffer conversion with scale: every sample is converted to float,
// multiplied by aScale, then converted to the destination type. A scale of
// exactly 1.0f takes the plain conversion path.
template <typename From, typename To>
inline void ConvertAudioSamplesWithScale(const From* aFrom, To* aTo, int aCount,
                                         float aScale) {
  if (aScale != 1.0f) {
    for (int idx = 0; idx < aCount; ++idx) {
      const float scaled = ConvertAudioSample<float>(aFrom[idx]) * aScale;
      aTo[idx] = ConvertAudioSample<To>(scaled);
    }
    return;
  }
  ConvertAudioSamples(aFrom, aTo, aCount);
}
// int16_t to int16_t overload of the scaled conversion.
// - aScale == 1.0f: plain copy through ConvertAudioSamples.
// - 0 <= aScale < 1: integer-only path, using the scale as a 16.16
//   fixed-point factor.
// - any other scale: goes through float and FloatToAudioSample<int16_t>.
inline void ConvertAudioSamplesWithScale(const int16_t* aFrom, int16_t* aTo,
                                         int aCount, float aScale) {
  if (aScale == 1.0f) {
    ConvertAudioSamples(aFrom, aTo, aCount);
    return;
  }
  const bool useFixedPoint = aScale >= 0.0f && aScale < 1.0f;
  if (!useFixedPoint) {
    for (int idx = 0; idx < aCount; ++idx) {
      aTo[idx] = FloatToAudioSample<int16_t>(
          ConvertAudioSample<float>(aFrom[idx]) * aScale);
    }
    return;
  }
  const int32_t gain = static_cast<int32_t>((1 << 16) * aScale);
  for (int idx = 0; idx < aCount; ++idx) {
    const int32_t product = static_cast<int32_t>(aFrom[idx]) * gain;
    aTo[idx] = static_cast<int16_t>(product >> 16);
  }
}
// Mixes aFrom into aTo: each destination sample becomes its current value
// plus the matching source sample multiplied by aScale. The sum is computed
// in float and converted back to the destination type.
template <typename From, typename To>
inline void AddAudioSamplesWithScale(const From* aFrom, To* aTo, int aCount,
                                     float aScale) {
  for (int idx = 0; idx < aCount; ++idx) {
    const float current = ConvertAudioSample<float>(aTo[idx]);
    const float incoming = ConvertAudioSample<float>(aFrom[idx]);
    aTo[idx] = ConvertAudioSample<To>(current + incoming * aScale);
  }
}
// In place audio sample scaling: multiplies each of the first aCount float
// samples in aBuffer by aScale. Does nothing when aCount is not positive.
inline void ScaleAudioSamples(float* aBuffer, int aCount, float aScale) {
  float* cursor = aBuffer;
  for (int32_t remaining = aCount; remaining > 0; --remaining) {
    *cursor = *cursor * aScale;
    ++cursor;
  }
}
// In place scaling of 16-bit samples: multiplies each of the first aCount
// samples in aBuffer by aScale using a 16.16 fixed-point factor, and
// saturates the result to the range of short, so gains above 1 (or negative
// gains) clip instead of overflowing. aScale is assumed not to be NaN.
inline void ScaleAudioSamples(short* aBuffer, int aCount, float aScale) {
  // Converting an out-of-range float to int32_t is undefined behaviour, so
  // bound the factor first. Any factor this large already saturates every
  // non-zero sample, so the bound does not change results.
  constexpr float kMinFactor = -2147483648.0f;
  constexpr float kMaxFactor = 2147483520.0f;  // largest float below 2^31
  const int32_t volume = static_cast<int32_t>(
      std::clamp((1 << 16) * aScale, kMinFactor, kMaxFactor));
  constexpr int64_t kLowest = std::numeric_limits<short>::lowest();
  constexpr int64_t kHighest = std::numeric_limits<short>::max();
  for (int32_t i = 0; i < aCount; ++i) {
    // 64-bit product: sample * factor can exceed the int32_t range as soon
    // as the gain is greater than 1.
    const int64_t scaled = (static_cast<int64_t>(aBuffer[i]) * volume) >> 16;
    aBuffer[i] = static_cast<short>(std::clamp(scaled, kLowest, kHighest));
  }
}
// Returns aBase advanced by aOffset samples of format aFormat. The byte
// stride is derived from the enumerator value itself (format * 2), which the
// static_asserts below pin down: 2 bytes for S16, 4 bytes for FLOAT32.
inline const void* AddAudioSampleOffset(const void* aBase,
                                        AudioSampleFormat aFormat,
                                        int32_t aOffset) {
  static_assert(AUDIO_FORMAT_S16 == 1, "Bad constant");
  static_assert(AUDIO_FORMAT_FLOAT32 == 2, "Bad constant");
  MOZ_ASSERT(aFormat == AUDIO_FORMAT_S16 || aFormat == AUDIO_FORMAT_FLOAT32);
  const auto* bytes = static_cast<const uint8_t*>(aBase);
  const auto byteOffset = aFormat * 2 * aOffset;
  return bytes + byteOffset;
}
} // namespace mozilla
#endif /* MOZILLA_AUDIOSAMPLEFORMAT_H_ */