// audio_buffer.h

/*

 *  Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.

 *  Use of this source code is governed by a BSD-style license

 *  that can be found in the LICENSE file in the root of the source

 *  tree. An additional intellectual property rights grant can be found

 *  in the file PATENTS.  All contributing project authors may

 *  be found in the AUTHORS file in the root of the source tree.

*/

#ifndef MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_

#define MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_

#include <stddef.h>

#include <stdint.h>

#include <memory>

#include <vector>

#include "api/audio/audio_processing.h"

#include "api/audio/audio_view.h"

#include "common_audio/channel_buffer.h"

#include "common_audio/include/audio_util.h"

namespace webrtc {

// Forward declarations. Within this header, AudioBuffer refers to these types
// only through std::unique_ptr members.
class PushSincResampler;

class SplittingFilter;

// Band identifiers accepted by AudioBuffer::split_channels_const(). The
// numeric values are spelled out explicitly and must stay contiguous from 0.
enum Band {
  kBand0To8kHz = 0,
  kBand8To16kHz = 1,
  kBand16To24kHz = 2
};

// Stores any audio data in a way that allows the audio processing module to

// operate on it in a controlled manner.

class AudioBuffer {

 public:

  static const int kSplitBandSize = 160;

  // TODO(tommi): Remove this (`AudioBuffer::kMaxSampleRate`) constant.

  static const int kMaxSampleRate = webrtc::kMaxSampleRateHz;

  AudioBuffer(size_t input_rate,

              size_t input_num_channels,

              size_t buffer_rate,

              size_t buffer_num_channels,

              size_t output_rate,

              size_t output_num_channels);

  virtual ~AudioBuffer();

  AudioBuffer(const AudioBuffer&) = delete;

  AudioBuffer& operator=(const AudioBuffer&) = delete;

  // Specify that downmixing should be done by selecting a single channel.

  void set_downmixing_to_specific_channel(size_t channel);

  // Specify that downmixing should be done by averaging all channels,.

  void set_downmixing_by_averaging();

  // Set the number of channels in the buffer. The specified number of channels

  // cannot be larger than the specified buffer_num_channels. The number is also

  // reset at each call to CopyFrom or InterleaveFrom.

  void set_num_channels(size_t num_channels);

  // Returns a DeinterleavedView<> over the channel data.

  DeinterleavedView<float> view() {

    return DeinterleavedView<float>(

        num_channels_ && buffer_num_frames_ ? channels()[0] : nullptr,

        buffer_num_frames_, num_channels_);

  size_t num_channels() const { return num_channels_; }

  size_t num_frames() const { return buffer_num_frames_; }

  size_t num_frames_per_band() const { return num_split_frames_; }

  size_t num_bands() const { return num_bands_; }

  // Returns pointer arrays to the full-band channels.

  // Usage:

  // channels()[channel][sample].

  // Where:

  // 0 <= channel < `buffer_num_channels_`

  // 0 <= sample < `buffer_num_frames_`

  float* const* channels() { return data_->channels(); }

  const float* const* channels_const() const { return data_->channels(); }

  // Returns pointer arrays to the bands for a specific channel.

  // Usage:

  // split_bands(channel)[band][sample].

  // Where:

  // 0 <= channel < `buffer_num_channels_`

  // 0 <= band < `num_bands_`

  // 0 <= sample < `num_split_frames_`

  const float* const* split_bands_const(size_t channel) const {

    return split_data_.get() ? split_data_->bands(channel)

                             : data_->bands(channel);

  float* const* split_bands(size_t channel) {

    return split_data_.get() ? split_data_->bands(channel)

                             : data_->bands(channel);

  // Returns a pointer array to the channels for a specific band.

  // Usage:

  // split_channels(band)[channel][sample].

  // Where:

  // 0 <= band < `num_bands_`

  // 0 <= channel < `buffer_num_channels_`

  // 0 <= sample < `num_split_frames_`

  const float* const* split_channels_const(Band band) const {

    if (split_data_.get()) {

      return split_data_->channels(band);

    } else {

      return band == kBand0To8kHz ? data_->channels() : nullptr;

  // Copies data into the buffer.

  void CopyFrom(const int16_t* const interleaved_data,

                const StreamConfig& stream_config);

  void CopyFrom(const float* const* stacked_data,

                const StreamConfig& stream_config);

  // Copies data from the buffer.

  void CopyTo(const StreamConfig& stream_config,

              int16_t* const interleaved_data);

  void CopyTo(const StreamConfig& stream_config, float* const* stacked_data);

  void CopyTo(AudioBuffer* buffer) const;

  // Splits the buffer data into frequency bands.

  void SplitIntoFrequencyBands();

  // Recombines the frequency bands into a full-band signal.

  void MergeFrequencyBands();

  // Copies the split bands data into the integer two-dimensional array.

  void ExportSplitChannelData(size_t channel,

                              int16_t* const* split_band_data) const;

  // Copies the data in the integer two-dimensional array into the split_bands

  // data.

  void ImportSplitChannelData(size_t channel,

                              const int16_t* const* split_band_data);

  static const size_t kMaxSplitFrameLength = 160;

  static const size_t kMaxNumBands = 3;

  // Deprecated methods, will be removed soon.

  float* const* channels_f() { return channels(); }

  const float* const* channels_const_f() const { return channels_const(); }

  const float* const* split_bands_const_f(size_t channel) const {

    return split_bands_const(channel);

  float* const* split_bands_f(size_t channel) { return split_bands(channel); }

  const float* const* split_channels_const_f(Band band) const {

    return split_channels_const(band);

 private:

  FRIEND_TEST_ALL_PREFIXES(AudioBufferTest,

                           SetNumChannelsSetsChannelBuffersNumChannels);

  void RestoreNumChannels();

  const size_t input_num_frames_;

  const size_t input_num_channels_;

  const size_t buffer_num_frames_;

  const size_t buffer_num_channels_;

  const size_t output_num_frames_;

  const size_t output_num_channels_;

  size_t num_channels_;

  size_t num_bands_;

  size_t num_split_frames_;

  std::unique_ptr<ChannelBuffer<float>> data_;

  std::unique_ptr<ChannelBuffer<float>> split_data_;

  std::unique_ptr<SplittingFilter> splitting_filter_;

  std::vector<std::unique_ptr<PushSincResampler>> input_resamplers_;

  std::vector<std::unique_ptr<PushSincResampler>> output_resamplers_;

  bool downmix_by_averaging_ = true;

  size_t channel_for_downmixing_ = 0;

};

}  // namespace webrtc

#endif  // MODULES_AUDIO_PROCESSING_AUDIO_BUFFER_H_