audio_encoder_copy_red.cc

mozilla-central/third_party/libwebrtc/modules/audio_coding/codecs/red/audio_encoder_copy_red.cc (file symbol)

Enable keyboard shortcuts

Source code

Revision control

Copy as Markdown

Other Tools

/*

 *  Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.

 *  Use of this source code is governed by a BSD-style license

 *  that can be found in the LICENSE file in the root of the source

 *  tree. An additional intellectual property rights grant can be found

 *  in the file PATENTS.  All contributing project authors may

 *  be found in the AUTHORS file in the root of the source tree.

*/

#include "modules/audio_coding/codecs/red/audio_encoder_copy_red.h"

#include <string.h>

#include <utility>

#include <vector>

#include "absl/strings/string_view.h"

#include "rtc_base/byte_order.h"

#include "rtc_base/checks.h"

#include "rtc_base/logging.h"

namespace webrtc {

static constexpr const int kRedMaxPacketSize =

    1 << 10;  // RED packets must be less than 1024 bytes to fit the 10 bit

              // block length.

static constexpr const size_t kRedMaxTimestampDelta =

    1 << 14;  // RED packets can encode a timestamp delta of 14 bits.

static constexpr const size_t kAudioMaxRtpPacketLen =

    1200;  // The typical MTU is 1200 bytes.

static constexpr size_t kRedHeaderLength = 4;  // 4 bytes RED header.

static constexpr size_t kRedLastHeaderLength =

    1;  // reduced size for last RED header.

static constexpr size_t kRedNumberOfRedundantEncodings =

    1;  // The level of redundancy we support.

AudioEncoderCopyRed::Config::Config() = default;

AudioEncoderCopyRed::Config::Config(Config&&) = default;

AudioEncoderCopyRed::Config::~Config() = default;

size_t GetMaxRedundancyFromFieldTrial(const FieldTrialsView& field_trials) {

  const std::string red_trial =

      field_trials.Lookup("WebRTC-Audio-Red-For-Opus");

  size_t redundancy = 0;

  if (sscanf(red_trial.c_str(), "Enabled-%zu", &redundancy) != 1 ||

      redundancy > 9) {

    return kRedNumberOfRedundantEncodings;

  return redundancy;

AudioEncoderCopyRed::AudioEncoderCopyRed(Config&& config,

                                         const FieldTrialsView& field_trials)

    : speech_encoder_(std::move(config.speech_encoder)),

      primary_encoded_(0, kAudioMaxRtpPacketLen),

      max_packet_length_(kAudioMaxRtpPacketLen),

      red_payload_type_(config.payload_type) {

  RTC_CHECK(speech_encoder_) << "Speech encoder not provided.";

  auto number_of_redundant_encodings =

      GetMaxRedundancyFromFieldTrial(field_trials);

  for (size_t i = 0; i < number_of_redundant_encodings; i++) {

    std::pair<EncodedInfo, rtc::Buffer> redundant;

    redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);

    redundant_encodings_.push_front(std::move(redundant));

AudioEncoderCopyRed::~AudioEncoderCopyRed() = default;

int AudioEncoderCopyRed::SampleRateHz() const {

  return speech_encoder_->SampleRateHz();

size_t AudioEncoderCopyRed::NumChannels() const {

  return speech_encoder_->NumChannels();

int AudioEncoderCopyRed::RtpTimestampRateHz() const {

  return speech_encoder_->RtpTimestampRateHz();

size_t AudioEncoderCopyRed::Num10MsFramesInNextPacket() const {

  return speech_encoder_->Num10MsFramesInNextPacket();

size_t AudioEncoderCopyRed::Max10MsFramesInAPacket() const {

  return speech_encoder_->Max10MsFramesInAPacket();

int AudioEncoderCopyRed::GetTargetBitrate() const {

  return speech_encoder_->GetTargetBitrate();

AudioEncoder::EncodedInfo AudioEncoderCopyRed::EncodeImpl(

    uint32_t rtp_timestamp,

    rtc::ArrayView<const int16_t> audio,

    rtc::Buffer* encoded) {

  primary_encoded_.Clear();

  EncodedInfo info =

      speech_encoder_->Encode(rtp_timestamp, audio, &primary_encoded_);

  RTC_CHECK(info.redundant.empty()) << "Cannot use nested redundant encoders.";

  RTC_DCHECK_EQ(primary_encoded_.size(), info.encoded_bytes);

  if (info.encoded_bytes == 0) {

    return info;

  if (info.encoded_bytes >= kRedMaxPacketSize) {

    // Fallback to the primary encoding if the encoded size is more than

    // what RED can encode as redundancy (1024 bytes). This can happen with

    // Opus stereo at the highest bitrate which consumes up to 1276 bytes.

    encoded->AppendData(primary_encoded_);

    return info;

  RTC_DCHECK_GT(max_packet_length_, info.encoded_bytes);

  size_t header_length_bytes = kRedLastHeaderLength;

  size_t bytes_available = max_packet_length_ - info.encoded_bytes;

  auto it = redundant_encodings_.begin();

  // Determine how much redundancy we can fit into our packet by

  // iterating forward. This is determined both by the length as well

  // as the timestamp difference. The latter can occur with opus DTX which

  // has timestamp gaps of 400ms which exceeds REDs timestamp delta field size.

  for (; it != redundant_encodings_.end(); it++) {

    if (bytes_available < kRedHeaderLength + it->first.encoded_bytes) {

      break;

    if (it->first.encoded_bytes == 0) {

      break;

    if (rtp_timestamp - it->first.encoded_timestamp >= kRedMaxTimestampDelta) {

      break;

    bytes_available -= kRedHeaderLength + it->first.encoded_bytes;

    header_length_bytes += kRedHeaderLength;

  // Allocate room for RFC 2198 header.

  encoded->SetSize(header_length_bytes);

  // Iterate backwards and append the data.

  size_t header_offset = 0;

  while (it-- != redundant_encodings_.begin()) {

    encoded->AppendData(it->second);

    const uint32_t timestamp_delta =

        info.encoded_timestamp - it->first.encoded_timestamp;

    encoded->data()[header_offset] = it->first.payload_type | 0x80;

    rtc::SetBE16(static_cast<uint8_t*>(encoded->data()) + header_offset + 1,

                 (timestamp_delta << 2) | (it->first.encoded_bytes >> 8));

    encoded->data()[header_offset + 3] = it->first.encoded_bytes & 0xff;

    header_offset += kRedHeaderLength;

    info.redundant.push_back(it->first);

  // `info` will be implicitly cast to an EncodedInfoLeaf struct, effectively

  // discarding the (empty) vector of redundant information. This is

  // intentional.

  if (header_length_bytes > kRedHeaderLength) {

    info.redundant.push_back(info);

    RTC_DCHECK_EQ(info.speech,

                  info.redundant[info.redundant.size() - 1].speech);

  encoded->AppendData(primary_encoded_);

  RTC_DCHECK_EQ(header_offset, header_length_bytes - 1);

  encoded->data()[header_offset] = info.payload_type;

  // Shift the redundant encodings.

  auto rit = redundant_encodings_.rbegin();

  for (auto next = std::next(rit); next != redundant_encodings_.rend();

       rit++, next = std::next(rit)) {

    rit->first = next->first;

    rit->second.SetData(next->second);

  it = redundant_encodings_.begin();

  if (it != redundant_encodings_.end()) {

    it->first = info;

    it->second.SetData(primary_encoded_);

  // Update main EncodedInfo.

  info.payload_type = red_payload_type_;

  info.encoded_bytes = encoded->size();

  return info;

void AudioEncoderCopyRed::Reset() {

  speech_encoder_->Reset();

  auto number_of_redundant_encodings = redundant_encodings_.size();

  redundant_encodings_.clear();

  for (size_t i = 0; i < number_of_redundant_encodings; i++) {

    std::pair<EncodedInfo, rtc::Buffer> redundant;

    redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);

    redundant_encodings_.push_front(std::move(redundant));

bool AudioEncoderCopyRed::SetFec(bool enable) {

  return speech_encoder_->SetFec(enable);

bool AudioEncoderCopyRed::SetDtx(bool enable) {

  return speech_encoder_->SetDtx(enable);

bool AudioEncoderCopyRed::GetDtx() const {

  return speech_encoder_->GetDtx();

bool AudioEncoderCopyRed::SetApplication(Application application) {

  return speech_encoder_->SetApplication(application);

void AudioEncoderCopyRed::SetMaxPlaybackRate(int frequency_hz) {

  speech_encoder_->SetMaxPlaybackRate(frequency_hz);

bool AudioEncoderCopyRed::EnableAudioNetworkAdaptor(

    const std::string& config_string,

    RtcEventLog* event_log) {

  return speech_encoder_->EnableAudioNetworkAdaptor(config_string, event_log);

void AudioEncoderCopyRed::DisableAudioNetworkAdaptor() {

  speech_encoder_->DisableAudioNetworkAdaptor();

void AudioEncoderCopyRed::OnReceivedUplinkPacketLossFraction(

    float uplink_packet_loss_fraction) {

  speech_encoder_->OnReceivedUplinkPacketLossFraction(

      uplink_packet_loss_fraction);

void AudioEncoderCopyRed::OnReceivedUplinkBandwidth(

    int target_audio_bitrate_bps,

    absl::optional<int64_t> bwe_period_ms) {

  speech_encoder_->OnReceivedUplinkBandwidth(target_audio_bitrate_bps,

                                             bwe_period_ms);

void AudioEncoderCopyRed::OnReceivedUplinkAllocation(

    BitrateAllocationUpdate update) {

  speech_encoder_->OnReceivedUplinkAllocation(update);

absl::optional<std::pair<TimeDelta, TimeDelta>>

AudioEncoderCopyRed::GetFrameLengthRange() const {

  return speech_encoder_->GetFrameLengthRange();

void AudioEncoderCopyRed::OnReceivedRtt(int rtt_ms) {

  speech_encoder_->OnReceivedRtt(rtt_ms);

void AudioEncoderCopyRed::OnReceivedOverhead(size_t overhead_bytes_per_packet) {

  max_packet_length_ = kAudioMaxRtpPacketLen - overhead_bytes_per_packet;

  return speech_encoder_->OnReceivedOverhead(overhead_bytes_per_packet);

void AudioEncoderCopyRed::SetReceiverFrameLengthRange(int min_frame_length_ms,

                                                      int max_frame_length_ms) {

  return speech_encoder_->SetReceiverFrameLengthRange(min_frame_length_ms,

                                                      max_frame_length_ms);

ANAStats AudioEncoderCopyRed::GetANAStats() const {

  return speech_encoder_->GetANAStats();

rtc::ArrayView<std::unique_ptr<AudioEncoder>>

AudioEncoderCopyRed::ReclaimContainedEncoders() {

  return rtc::ArrayView<std::unique_ptr<AudioEncoder>>(&speech_encoder_, 1);

}  // namespace webrtc