arduino-audio-tools/_m4_a_common_demuxer_8h_source.html

#pragma once


#include <cstdint>

#include <functional>

#include <string>


#include "AudioTools/AudioCodecs/MP4Parser.h"

#include "AudioTools/CoreAudio/Buffers.h"

#include "MP4Parser.h"


namespace audio_tools {


/// Element type used to store the per-sample sizes of the stsz table.
/// NOTE(review): onStsz() reads every table entry as a 32 bit value and
/// narrows it to this 16 bit type, so sizes above 65535 do not fit - confirm
/// that this limit is intended.
using stsz_sample_size_t = uint16_t;


class M4ACommonDemuxer {

 public:

  /// Audio codecs that can be reported for an extracted frame.
  enum class Codec { Unknown, AAC, ALAC, MP3 };

  /**
   * @brief A single extracted audio frame that is handed to the frame
   * callback.
   *
   * All members have defaults so that a default constructed Frame is in a
   * well defined "empty" state instead of carrying indeterminate values.
   */
  struct Frame {
    /// Codec of the frame data.
    Codec codec = Codec::Unknown;
    /// Mime type string for the codec; nullptr when unknown.
    const char* mime = nullptr;
    /// Start of the frame bytes (not owned by the Frame).
    const uint8_t* data = nullptr;
    /// Number of bytes available at data.
    size_t size = 0;
  };

  struct Frame {…};


  /**
   * @brief Codec settings of the audio track: the detected codec, the AAC
   * parameters that are used to build ADTS headers and the ALAC magic cookie.
   */
  struct M4AAudioConfig {
    /// Detected codec; Unknown until a sample entry has been processed.
    Codec codec = Codec::Unknown;

    // AAC values as passed to the ADTS header writer
    int aacProfile = 2;
    int sampleRateIdx = 4;
    int channelCfg = 2;

    /// ALAC magic cookie bytes as copied from the alac box.
    Vector<uint8_t> alacMagicCookie;
  };

  struct M4AAudioConfig {…};


  /**
   * @brief Parser for the payload of an esds box. It walks the ES_Descriptor
   * (tag 0x03), the DecoderConfigDescriptor (tag 0x04) and the
   * DecoderSpecificInfo (tag 0x05) and extracts the first two bytes of the
   * AudioSpecificConfig.
   *
   * All skips are validated against the remaining number of bytes, so that no
   * pointer is ever moved behind the end of the input.
   */
  struct ESDSParser {
    /// 5 bit audio object type (upper bits of the first config byte).
    uint8_t audioObjectType = 0;
    /// 4 bit sampling frequency index.
    uint8_t samplingRateIndex = 0;
    /// 4 bit channel configuration.
    uint8_t channelConfiguration = 0;

    /**
     * @brief Parses the esds content.
     * @param data start of the esds payload (beginning with version + flags)
     * @param size number of bytes available at data
     * @return true if all three descriptors were found and the result members
     * were updated; false if the data is missing, truncated or has unexpected
     * tags (the result members are left untouched in this case).
     */
    bool parse(const uint8_t* data, size_t size) {
      if (data == nullptr) return false;
      const uint8_t* ptr = data;
      const uint8_t* end = data + size;

      // version (1 byte) + flags (3 bytes)
      if (!skip(ptr, end, 4)) return false;

      // ES_Descriptor
      if (!expect_tag(ptr, end, 0x03)) return false;
      const size_t es_len = parse_descriptor_length(ptr, end);
      if (es_len > remaining(ptr, end)) return false;

      if (!skip(ptr, end, 2)) return false;  // ES_ID
      if (ptr >= end) return false;
      const uint8_t es_flags = *ptr++;
      // optional fields which are announced by the flag bits
      if ((es_flags & 0x80) != 0) {  // streamDependenceFlag: dependsOn_ES_ID
        if (!skip(ptr, end, 2)) return false;
      }
      if ((es_flags & 0x40) != 0) {  // URL_Flag: URLlength + URLstring
        if (ptr >= end) return false;
        const size_t url_len = *ptr++;
        if (!skip(ptr, end, url_len)) return false;
      }
      if ((es_flags & 0x20) != 0) {  // OCRstreamFlag: OCR_ES_Id
        if (!skip(ptr, end, 2)) return false;
      }

      // DecoderConfigDescriptor
      if (!expect_tag(ptr, end, 0x04)) return false;
      const size_t dec_len = parse_descriptor_length(ptr, end);
      if (dec_len > remaining(ptr, end)) return false;

      // skip objectTypeIndication, streamType, bufferSizeDB, maxBitrate,
      // avgBitrate
      if (!skip(ptr, end, 13)) return false;

      // DecoderSpecificInfo (AudioSpecificConfig)
      if (!expect_tag(ptr, end, 0x05)) return false;
      const size_t dsi_len = parse_descriptor_length(ptr, end);
      if (dsi_len < 2 || dsi_len > remaining(ptr, end)) return false;

      const uint8_t byte1 = ptr[0];
      const uint8_t byte2 = ptr[1];

      audioObjectType = (byte1 >> 3) & 0x1F;
      samplingRateIndex = ((byte1 & 0x07) << 1) | ((byte2 >> 7) & 0x01);
      channelConfiguration = (byte2 >> 3) & 0x0F;
      return true;
    }

   protected:
    /// Number of bytes between ptr and end.
    static size_t remaining(const uint8_t* ptr, const uint8_t* end) {
      return static_cast<size_t>(end - ptr);
    }

    /// Advances ptr by n bytes; returns false (ptr unchanged) if fewer than n
    /// bytes are left.
    static bool skip(const uint8_t*& ptr, const uint8_t* end, size_t n) {
      if (n > remaining(ptr, end)) return false;
      ptr += n;
      return true;
    }

    /// Consumes one byte and checks that it is the expected descriptor tag.
    static bool expect_tag(const uint8_t*& ptr, const uint8_t* end,
                           uint8_t tag) {
      if (ptr >= end) return false;
      return *ptr++ == tag;
    }

    /// Helper to decode variable-length descriptor lengths (e.g. 0x80 80 80
    /// 05): 7 payload bits per byte, at most 4 bytes, the top bit marks that
    /// another byte follows. Stops early when end is reached.
    inline size_t parse_descriptor_length(const uint8_t*& ptr,
                                          const uint8_t* end) {
      size_t len = 0;
      for (int i = 0; i < 4 && ptr < end; ++i) {
        const uint8_t b = *ptr++;
        len = (len << 7) | (b & 0x7F);
        if ((b & 0x80) == 0) break;
      }
      return len;
    }
  };

  struct ESDSParser {…};


  class SampleExtractor {

   public:

    using Frame = M4ACommonDemuxer::Frame;

    using Codec = M4ACommonDemuxer::Codec;

    using M4AAudioConfig = M4ACommonDemuxer::M4AAudioConfig;

    using FrameCallback = std::function<void(const Frame&, void*)>;


    SampleExtractor(M4AAudioConfig& cfg) : audio_config{cfg} { begin(); }


    void begin() {

      sampleIndex = 0;

      buffer.clear();

      p_chunk_offsets->clear();

      p_sample_sizes->clear();

      buffer.resize(1024);

      current_size = 0;

      box_pos = 0;

      box_size = 0;

    }

    void begin() {…}


    void setCallback(FrameCallback cb) { callback = cb; }


    void setReference(void* r) { ref = r; }


    void setMaxSize(size_t size) {

      box_size = size;

    }

    void setMaxSize(size_t size) {…}


    size_t write(const uint8_t* data, size_t len, bool is_final) {

      // Resize buffer to the current sample size

      size_t currentSize = currentSampleSize();

      if (currentSize == 0) {

        LOGE("No sample size defined: e.g. mdat before stsz!");

        return 0;

      }

      resize(currentSize);


      for (int j = 0; j < len; j++) {

        assert(buffer.write(data[j]));

        if (buffer.available() >= currentSize) {

          LOGI("Sample# %zu: size %zu bytes", sampleIndex, currentSize);

          executeCallback(currentSize);

          buffer.clear();

          box_pos += currentSize;

          ++sampleIndex;

          currentSize = currentSampleSize();

          if (box_pos >= box_size) {

            LOGI("Reached end of box: %s write",

                 is_final ? "final" : "not final");

            return j;

          }

          if (currentSize == 0) {

            LOGE("No sample size defined, cannot write data");

            return j;

          }

        }

      }

      return len;

    }

    size_t write(const uint8_t* data, size_t len, bool is_final) {…}


    BaseBuffer<stsz_sample_size_t>& getSampleSizesBuffer() {

      return *p_sample_sizes;

    }

    BaseBuffer<stsz_sample_size_t>& getSampleSizesBuffer() {…}


    void setSampleSizesBuffer(BaseBuffer<stsz_sample_size_t>& buffer) {

      p_sample_sizes = &buffer;

    }

    void setSampleSizesBuffer(BaseBuffer<stsz_sample_size_t>& buffer) {…}


    BaseBuffer<uint32_t>& getChunkOffsetsBuffer() { return *p_chunk_offsets; }


    void setChunkOffsetsBuffer(BaseBuffer<uint32_t>& buffer) {

      p_chunk_offsets = &buffer;

    }

    void setChunkOffsetsBuffer(BaseBuffer<uint32_t>& buffer) {…}


    void setFixedSampleCount(uint32_t sampleSize, uint32_t sampleCount) {

      fixed_sample_size = sampleSize;

      fixed_sample_count = sampleCount;

    }

    void setFixedSampleCount(uint32_t sampleSize, uint32_t sampleCount) {…}


    Frame getFrame(size_t size, SingleBuffer<uint8_t>& buffer) {

      Frame frame;

      frame.codec = audio_config.codec;

      frame.data = buffer.data();

      frame.size = size;

      switch (audio_config.codec) {

        case Codec::AAC: {

          // Prepare ADTS header + AAC frame

          tmp.resize(size + 7);

          writeAdtsHeader(tmp.data(), audio_config.aacProfile,

                          audio_config.sampleRateIdx, audio_config.channelCfg,

                          size);

          memcpy(tmp.data() + 7, buffer.data(), size);

          frame.data = tmp.data();

          frame.size = size + 7;

          frame.mime = "audio/aac";

          break;

        }

        case Codec::ALAC:

          frame.mime = "audio/alac";

          break;

        case Codec::MP3:

          frame.mime = "audio/mpeg";

          break;

        default:

          frame.mime = nullptr;

          break;

      }

      return frame;

    }

    Frame getFrame(size_t size, SingleBuffer<uint8_t>& buffer) {…}


   protected:

    M4AAudioConfig& audio_config;

    SingleBuffer<stsz_sample_size_t>

        defaultSampleSizes;

    SingleBuffer<uint32_t> defaultChunkOffsets;

    BaseBuffer<stsz_sample_size_t>* p_sample_sizes = &defaultSampleSizes;

    BaseBuffer<uint32_t>* p_chunk_offsets = &defaultChunkOffsets;

    Vector<uint8_t> tmp;

    FrameCallback callback = nullptr;

    void* ref = nullptr;

    size_t sampleIndex = 0;

    SingleBuffer<uint8_t> buffer;

    uint32_t fixed_sample_size = 0;

    uint32_t fixed_sample_count = 0;

    size_t current_size = 0;

    size_t box_size = 0;

    size_t box_pos = 0;


    void executeCallback(size_t size) {

      Frame frame = getFrame(size, buffer);

      if (callback)

        callback(frame, ref);

      else

        LOGE("No callback defined for audio frame extraction");

    }

    void executeCallback(size_t size) {…}


    void resize(size_t newSize) {

      if (buffer.size() < newSize) {

        buffer.resize(newSize);

      }

    }

    void resize(size_t newSize) {…}


    size_t currentSampleSize() {

      static size_t last_index = -1;

      static size_t last_size = -1;


      // Return cached size

      if (sampleIndex == last_index) {

        return last_size;

      }


      // using fixed sizes w/o table

      if (fixed_sample_size > 0 && fixed_sample_count > 0 &&

          sampleIndex < fixed_sample_count) {

        return fixed_sample_size;

      }

      stsz_sample_size_t nextSize = 0;

      if (p_sample_sizes->read(nextSize)) {

        last_index = sampleIndex;

        last_size = nextSize;

        return nextSize;

      }

      return 0;

    }

    size_t currentSampleSize() {…}


    static void writeAdtsHeader(uint8_t* adts, int aacProfile,

                                int sampleRateIdx, int channelCfg,

                                int frameLen) {

      adts[0] = 0xFF;

      adts[1] = 0xF1;

      adts[2] = ((aacProfile - 1) << 6) | (sampleRateIdx << 2) |

                ((channelCfg >> 2) & 0x1);

      adts[3] = ((channelCfg & 0x3) << 6) | ((frameLen + 7) >> 11);

      adts[4] = ((frameLen + 7) >> 3) & 0xFF;

      adts[5] = (((frameLen + 7) & 0x7) << 5) | 0x1F;

      adts[6] = 0xFC;

    }

    static void writeAdtsHeader(uint8_t* adts, int aacProfile, {…}

  };

  class SampleExtractor {…};


  /// Callback type for extracted frames: receives the frame and a
  /// caller-defined reference pointer.
  using FrameCallback = std::function<void(const Frame&, void* ref)>;


  /// Default constructor.
  M4ACommonDemuxer() = default;

  /// Virtual destructor: the class is used as polymorphic base class.
  virtual ~M4ACommonDemuxer() = default;


  /// Stores the callback in frame_callback; subclasses may override this.
  virtual void setCallback(FrameCallback cb) { frame_callback = cb; }


  /// Defines the buffer that is used to store the sample sizes: forwards the
  /// reference to the sample extractor, which keeps a pointer to it.
  void setSampleSizesBuffer(BaseBuffer<stsz_sample_size_t>& buffer) {

    sampleExtractor.setSampleSizesBuffer(buffer);

  }

  void setSampleSizesBuffer(BaseBuffer<stsz_sample_size_t>& buffer) {…}


  /// Defines the buffer that is used to store the chunk offsets: forwards the
  /// reference to the sample extractor, which keeps a pointer to it.
  void setChunkOffsetsBuffer(BaseBuffer<uint32_t>& buffer) {

    sampleExtractor.setChunkOffsetsBuffer(buffer);

  }

  void setChunkOffsetsBuffer(BaseBuffer<uint32_t>& buffer) {…}


  void begin() {

    stsz_processed = false;

    stco_processed = false;

    audio_config.alacMagicCookie.clear();

    audio_config.codec = Codec::Unknown;

    parser.begin();

    sampleExtractor.begin();

    chunk_offsets_count = 0;

    sample_count = 0;

  }


  /// Stores the AAC parameters in audio_config; the sample extractor passes
  /// them to the ADTS header writer.
  /// @param profile value stored as aacProfile
  /// @param srIdx value stored as sampleRateIdx
  /// @param chCfg value stored as channelCfg
  void setAACConfig(int profile, int srIdx, int chCfg) {

    audio_config.aacProfile = profile;

    audio_config.sampleRateIdx = srIdx;

    audio_config.channelCfg = chCfg;

  }

  void setAACConfig(int profile, int srIdx, int chCfg) {…}


  /// Replaces the complete audio configuration with a copy of cfg.
  void setM4AAudioConfig(M4AAudioConfig cfg) { audio_config = cfg; }


  /// Returns a copy of the current audio configuration.
  M4AAudioConfig getM4AAudioConfig() { return audio_config; }


  void resize(int size) {

    default_size = size;

    if (buffer.size() < size) {

      buffer.resize(size);

    }

  }


  /// Returns the file offset that was recorded for the stsz box (set in
  /// onStsz() from box.file_offset when the stsz header is read).
  uint32_t getStszFileOffset() const {

    return stsz_offset;

  }

  uint32_t getStszFileOffset() const  {…}


  /// Returns the number of samples as read from the stsz header; 0 until the
  /// header has been processed.
  uint32_t getSampleCount() const {

    return sample_count;

  }

  uint32_t getSampleCount() const  {…}


  /// Must be implemented by the subclasses.
  /// NOTE(review): presumably registers the box handlers (onStsd, onStsz,
  /// ...) with the parser - confirm against the implementations.
  virtual void setupParser() = 0;


 protected:

  /// Callback for extracted frames as defined by setCallback().
  FrameCallback frame_callback = nullptr;


  /// Extractor for the audio samples. It stores a reference to audio_config,
  /// which is declared further down and therefore constructed later; the
  /// extractor constructor only keeps the reference and calls begin(), which
  /// does not access the configuration.
  SampleExtractor sampleExtractor{

      audio_config};

  SampleExtractor sampleExtractor {…};

  /// MP4 box parser; reset in begin() and used by the box handlers to parse
  /// nested data.
  MP4Parser parser;

  /// Set by onStsz() when the stsz box is complete; further calls are ignored.
  bool stsz_processed = false;

  /// Reset in begin(); the only visible writer is the commented-out onStco().
  bool stco_processed = false;

  /// NOTE(review): never written in the visible code - presumably maintained
  /// by a subclass; confirm.
  bool stsd_processed = false;

  /// Codec settings which are filled by the box handlers.
  M4AAudioConfig audio_config;

  /// Work buffer shared by onStsd() and onStsz() to collect box data.
  SingleBuffer<uint8_t> buffer;

  /// Sample count read from the stsz header.
  uint32_t sample_count = 0;

  /// File offset of the stsz box as reported by the parser.
  uint32_t stsz_offset = 0;

  /// Reset in begin(); only used by the commented-out onStco().
  uint32_t chunk_offsets_count = 0;

  /// Last size that was requested via resize(int).
  size_t default_size = 2 * 1024;


  /**
   * @brief Reads a 32 bit big-endian unsigned integer.
   * @param p pointer to at least 4 readable bytes
   * @return the decoded value
   */
  static uint32_t readU32(const uint8_t* p) {
    // widen before shifting: shifting the promoted int would overflow the
    // sign bit for bytes >= 0x80 (and is wrong when int has only 16 bits)
    return (static_cast<uint32_t>(p[0]) << 24) |
           (static_cast<uint32_t>(p[1]) << 16) |
           (static_cast<uint32_t>(p[2]) << 8) | static_cast<uint32_t>(p[3]);
  }

  static uint32_t readU32(const uint8_t* p) {…}


  /**
   * @brief Interprets the bytes of num - in the order in which they are
   * stored in memory - as 32 bit big-endian unsigned integer.
   * @param num value that holds 4 raw bytes copied from the file
   * @return the decoded value
   */
  static uint32_t readU32(const uint32_t num) {
    const uint8_t* p = reinterpret_cast<const uint8_t*>(&num);
    // widen before shifting to avoid shifting into the sign bit of an int
    return (static_cast<uint32_t>(p[0]) << 24) |
           (static_cast<uint32_t>(p[1]) << 16) |
           (static_cast<uint32_t>(p[2]) << 8) | static_cast<uint32_t>(p[3]);
  }


   /// Consumes up to 4 bytes from the work buffer and decodes them as 32 bit
   /// big-endian value. The result of readArray() is not checked: the bytes
   /// that could not be read stay 0.
   uint32_t readU32Buffer() {
     uint32_t raw = 0;
     uint8_t* target = (uint8_t*)&raw;
     buffer.readArray(target, 4);
     return readU32(raw);
   }


  /**
   * @brief Checks if the 4 bytes at buffer + offset match the 4 character box
   * type.
   *
   * The type characters are compared as unsigned bytes, so that types which
   * contain bytes >= 0x80 also match when char is a signed type.
   * @param buffer data to check; at least offset + 4 bytes must be readable
   * @param type box type with at least 4 characters
   * @param offset position of the type in buffer
   * @return true on match; false on mismatch, null pointers or a negative
   * offset
   */
  bool checkType(uint8_t* buffer, const char* type, int offset) {
    if (buffer == nullptr || type == nullptr || offset < 0) return false;
    for (int i = 0; i < 4; ++i) {
      if (buffer[offset + i] != static_cast<uint8_t>(type[i])) return false;
    }
    return true;
  }

  bool checkType(uint8_t* buffer, const char* type, int offset) {…}


  /**
   * @brief Handles the stsd box: the box data is collected in the work
   * buffer and, once the box is complete, the sample entries which follow
   * the 8 byte header (version/flags + entry count) are parsed as nested
   * boxes.
   * @param box stsd box or a part of it
   */
  void onStsd(const MP4Parser::Box& box) {
    LOGI("Box: %s, size: %u bytes", box.type, (unsigned)box.available);
    if (box.seq == 0) {
      resize(box.size);
      buffer.clear();
    }

    buffer.writeArray(box.data, box.data_size);

    if (box.is_complete && buffer.available() >= 8) {
      // One or more sample entry boxes (e.g. mp4a, .mp3, alac): the length is
      // taken from what has really been buffered so that we never parse
      // beyond the collected data
      const int entries_len = buffer.available() - 8;
      parser.parseString(buffer.data() + 8, entries_len,
                         box.file_offset + 8 + 8, box.level + 1);
      buffer.clear();
    }
  }


  /**
   * @brief Handles the mp4a sample entry: selects AAC with the default
   * configuration (profile 2, sample rate index 4, channel configuration 2)
   * and parses the child boxes which start 28 bytes into the payload.
   *
   * The nested parse receives the file offset and the nesting level in the
   * proper argument positions (file offset first, then level), like it is
   * done for the stsd box.
   * @param box mp4a box; ignored until it is complete
   */
  void onMp4a(const MP4Parser::Box& box) {
    LOGI("onMp4a: %s, size: %zu bytes", box.type, box.data_size);
    if (!box.is_complete) return;

    // use default configuration: AAC LC, 44100 Hz, stereo
    setAACConfig(2, 4, 2);
    audio_config.codec = Codec::AAC;

    // the child boxes follow the fixed part of the sample entry
    const size_t pos = 36 - 8;
    if (box.data == nullptr || box.data_size <= pos) {
      LOGE("mp4a box too small: %zu bytes", box.data_size);
      return;
    }
    parser.parseString(box.data + pos, static_cast<int>(box.data_size - pos),
                       static_cast<int>(box.file_offset + 8 + pos),
                       box.level + 1);
  }

  void onMp4a(const MP4Parser::Box& box) {…}


  /**
   * @brief Handles the esds box: the AAC parameters are extracted with the
   * ESDSParser and stored via setAACConfig(). A parse failure is only
   * logged and leaves the configuration unchanged.
   * @param box esds box
   */
  void onEsds(const MP4Parser::Box& box) {
    LOGI("onEsds: %s, size: %zu bytes", box.type, box.data_size);

    ESDSParser esds;
    const bool parsed = esds.parse(box.data, box.data_size);
    if (parsed) {
      LOGI(
          "-> esds: AAC objectType: %u, samplingRateIdx: %u, "
          "channelCfg: %u",
          esds.audioObjectType, esds.samplingRateIndex,
          esds.channelConfiguration);
      setAACConfig(esds.audioObjectType, esds.samplingRateIndex,
                   esds.channelConfiguration);
    } else {
      LOGE("Failed to parse esds box");
    }
  }

  void onEsds(const MP4Parser::Box& box) {…}


  // void fixALACMagicCookie(uint8_t* cookie, size_t len) {

  //   if (len < 28) {

  //     return;

  //   }


  //   // Helper to read/write big-endian

  //   auto read32 = [](uint8_t* p) -> uint32_t {

  //     return (p[0] << 24) | (p[1] << 16) | (p[2] << 8) | p[3];

  //   };

  //   auto write32 = [](uint8_t* p, uint32_t val) {

  //     p[0] = (val >> 24) & 0xFF;

  //     p[1] = (val >> 16) & 0xFF;

  //     p[2] = (val >> 8) & 0xFF;

  //     p[3] = val & 0xFF;

  //   };

  //   auto read16 = [](uint8_t* p) -> uint16_t { return (p[0] << 8) | p[1]; };

  //   auto write16 = [](uint8_t* p, uint16_t val) {

  //     p[0] = (val >> 8) & 0xFF;

  //     p[1] = val & 0xFF;

  //   };


  //   // Fix values if zero or invalid

  //   if (read32(cookie + 0) == 0) write32(cookie + 0, 4096);    // frameLength

  //   if (cookie[6] == 0) cookie[6] = 16;                        // bitDepth

  //   if (cookie[7] == 0 || cookie[7] > 32) cookie[7] = 10;      // pb

  //   if (cookie[8] == 0 || cookie[8] > 32) cookie[8] = 14;      // mb

  //   if (cookie[9] == 0 || cookie[9] > 32) cookie[9] = 10;      // kb

  //   if (cookie[10] == 0 || cookie[10] > 8) cookie[10] = 2;     // numChannels

  //   if (read16(cookie + 11) == 0) write16(cookie + 11, 255);   // maxRun

  //   if (read32(cookie + 13) == 0) write32(cookie + 13, 8192);  // maxFrameBytes

  //   if (read32(cookie + 17) == 0) write32(cookie + 17, 512000);  // avgBitRate

  //   if (read32(cookie + 21) == 0) write32(cookie + 21, 44100);   // sampleRate

  // }


  /**
   * @brief Handles the alac sample entry: selects ALAC as codec and copies
   * the magic cookie from the nested alac box (its payload without the first
   * 4 bytes) into the audio configuration.
   * @param box outer alac box
   */
  void onAlac(const MP4Parser::Box& box) {
    LOGI("onAlac: %s, size: %zu bytes", box.type, box.data_size);
    audio_config.codec = Codec::ALAC;

    // only alac box in alac contains magic cookie
    MP4Parser::Box alac;
    if (!parser.findBox("alac", box.data, box.data_size, alac)) return;

    // data_size - 4 must not wrap around for short boxes
    if (alac.data == nullptr || alac.data_size < 4) {
      LOGE("alac box too small: %zu bytes", alac.data_size);
      return;
    }
    const size_t cookie_size = alac.data_size - 4;
    audio_config.alacMagicCookie.resize(cookie_size);
    if (cookie_size > 0) {
      std::memcpy(audio_config.alacMagicCookie.data(), alac.data + 4,
                  cookie_size);
    }
  }

  void onAlac(const MP4Parser::Box& box) {…}


  /**
   * @brief Handles the stsz box. The box may arrive in several parts: the
   * data is collected in the work buffer, the 12 byte header (version/flags,
   * sample size, sample count) is evaluated as soon as it is complete and
   * the following 32 bit table entries are written to the sample size
   * buffer of the extractor. Bytes of an incomplete entry stay in the work
   * buffer for the next call.
   *
   * sample_count == 0 is used as marker for "header not processed yet".
   * @param box stsz box or a part of it
   */
  void onStsz(MP4Parser::Box& box) {
    MP4Parser::defaultCallback(box, nullptr);
    LOGI("onStsz #%u: %s, size: %u of %u bytes", (unsigned) box.seq, box.type, (unsigned) box.available, (unsigned) box.data_size);
    if (stsz_processed) return;
    BaseBuffer<stsz_sample_size_t>& sampleSizes =
        sampleExtractor.getSampleSizesBuffer();

    // provide space for the bytes left from the last call plus the new data
    buffer.resize(buffer.available() + box.available);
    const size_t written = buffer.writeArray(box.data, box.available);
    if (written != static_cast<size_t>(box.available)) {
      LOGE("stsz: only %u of %u bytes buffered", (unsigned)written,
           (unsigned)box.available);
    }

    // get sample count and size from the box
    if (sample_count == 0) {
      if (buffer.available() < 12) {
        // header incomplete: wait for more data instead of reading the
        // header words as table entries
        if (box.is_complete) stsz_processed = true;
        return;
      }
      readU32Buffer();  // skip version + flags
      const uint32_t sampleSize = readU32Buffer();
      const uint32_t sampleCount = readU32Buffer();
      sample_count = sampleCount;
      stsz_offset = box.file_offset;

      sampleSizes.resize(sample_count);
      if (sampleSize != 0) {
        sampleExtractor.setFixedSampleCount(sampleSize, sampleCount);
      }
    }

    // incrementally process the table entries
    bool write_failed = false;
    while (buffer.available() >= 4) {
      const uint32_t entry = readU32Buffer();
      const stsz_sample_size_t sampleSize =
          static_cast<stsz_sample_size_t>(entry);
      if (sampleSize != entry) {
        LOGE("stsz: sample size %u does not fit into the table",
             (unsigned)entry);
      }
      // the write must not live inside an assert: it would be compiled out
      // with NDEBUG
      if (!sampleSizes.write(sampleSize)) write_failed = true;
    }
    if (write_failed) {
      LOGE("stsz: sample size buffer is full");
    }
    // Remove processed data
    buffer.trim();

    if (box.is_complete) {
      stsz_processed = true;
    }
  }

  void onStsz(MP4Parser::Box& box) {…}


  // /**

  //  * @brief Handles the stco (Chunk Offset) box.

  //  * @param box MP4 box.

  //  */

  // void onStco(MP4Parser::Box& box) {

  //   LOGI("onStco: %s, size: %zu bytes", box.type, box.data_size);

  //   if (stco_processed) return;

  //   BaseBuffer<uint32_t>& chunkOffsets =

  //       sampleExtractor.getChunkOffsetsBuffer();


  //   buffer.resize(box.available);

  //   buffer.writeArray(box.data, box.available);


  //   // get chunk_offsets_count from the box

  //   if (chunk_offsets_count == 0 && buffer.available() > 12) {

  //     chunk_offsets_count = readU32(buffer.data());

  //     buffer.clearArray(4);  // clear version + flags

  //   }


  //   // incrementally process sampleSize

  //   int j = 0;

  //   for (j = 0; j < buffer.available(); j += 4) {

  //     uint32_t sampleSize = readU32(buffer.data() + j);

  //     chunkOffsets.write(sampleSize);

  //   }

  //   buffer.clearArray(j);


  //   if (box.is_complete) {

  //     stco_processed = true;

  //   }

  // }


  /**
   * @brief Logs the payload of the box as hex dump: 16 bytes per line with
   * the offset, the hex values and the printable ASCII characters (all other
   * bytes are shown as '.').
   * @param box box that provides data and data_size
   */
  void printHexDump(const MP4Parser::Box& box) {
    const uint8_t* bytes = box.data;
    const size_t total = box.data_size;
    LOGI("===========================");
    size_t row = 0;
    while (row < total) {
      char hex[49] = {0};
      char ascii[17] = {0};
      for (size_t col = 0; col < 16 && row + col < total; ++col) {
        const uint8_t value = bytes[row + col];
        sprintf(hex + col * 3, "%02X ", value);
        const bool printable = value >= 32 && value < 127;
        ascii[col] = printable ? value : '.';
      }
      ascii[16] = 0;
      LOGI("%04zx: %-48s |%s|", row, hex, ascii);
      row += 16;
    }
    LOGI("===========================");
  }

};

class M4ACommonDemuxer {…};


}  // namespace audio_tools

audio_tools::BaseBuffer
Shared functionality of all buffers.
Definition Buffers.h:22

audio_tools::BaseBuffer::read
virtual bool read(T &result)=0
reads a single value

audio_tools::BaseBuffer::readArray
virtual int readArray(T data[], int len)
reads multiple values
Definition Buffers.h:33

audio_tools::BaseBuffer::clear
void clear()
same as reset
Definition Buffers.h:95

audio_tools::BaseBuffer::write
virtual bool write(T data)=0
write add an entry to the buffer

audio_tools::BaseBuffer::resize
virtual bool resize(int bytes)
Resizes the buffer if supported: returns false if not supported.
Definition Buffers.h:117

audio_tools::M4ACommonDemuxer::SampleExtractor
Extracts audio data based on the sample sizes defined in the stsz box. It collects the data from the ...
Definition M4ACommonDemuxer.h:107

audio_tools::M4ACommonDemuxer::SampleExtractor::write
size_t write(const uint8_t *data, size_t len, bool is_final)
Writes data to the extractor, extracting frames as sample sizes are met. Provides the data via the ca...
Definition M4ACommonDemuxer.h:163

audio_tools::M4ACommonDemuxer::SampleExtractor::setFixedSampleCount
void setFixedSampleCount(uint32_t sampleSize, uint32_t sampleCount)
Sets a fixed sample size/count instead of using the sampleSizes table.
Definition M4ACommonDemuxer.h:232

audio_tools::M4ACommonDemuxer::SampleExtractor::ref
void * ref
Reference pointer for callback.
Definition M4ACommonDemuxer.h:283

audio_tools::M4ACommonDemuxer::SampleExtractor::callback
FrameCallback callback
Frame callback.
Definition M4ACommonDemuxer.h:282

audio_tools::M4ACommonDemuxer::SampleExtractor::executeCallback
void executeCallback(size_t size)
Executes the callback for a completed frame.
Definition M4ACommonDemuxer.h:296

audio_tools::M4ACommonDemuxer::SampleExtractor::setSampleSizesBuffer
void setSampleSizesBuffer(BaseBuffer< stsz_sample_size_t > &buffer)
Sets the buffer to use for sample sizes.
Definition M4ACommonDemuxer.h:208

audio_tools::M4ACommonDemuxer::SampleExtractor::writeAdtsHeader
static void writeAdtsHeader(uint8_t *adts, int aacProfile, int sampleRateIdx, int channelCfg, int frameLen)
Writes an ADTS header for an AAC frame.
Definition M4ACommonDemuxer.h:349

audio_tools::M4ACommonDemuxer::SampleExtractor::currentSampleSize
size_t currentSampleSize()
Returns the current sample size.
Definition M4ACommonDemuxer.h:318

audio_tools::M4ACommonDemuxer::SampleExtractor::SampleExtractor
SampleExtractor(M4AAudioConfig &cfg)
Constructor. Initializes the extractor.
Definition M4ACommonDemuxer.h:117

audio_tools::M4ACommonDemuxer::SampleExtractor::sampleIndex
size_t sampleIndex
Current sample index.
Definition M4ACommonDemuxer.h:284

audio_tools::M4ACommonDemuxer::SampleExtractor::box_pos
size_t box_pos
Current position in the box.
Definition M4ACommonDemuxer.h:290

audio_tools::M4ACommonDemuxer::SampleExtractor::resize
void resize(size_t newSize)
Resizes the internal buffer if needed.
Definition M4ACommonDemuxer.h:308

audio_tools::M4ACommonDemuxer::SampleExtractor::defaultChunkOffsets
SingleBuffer< uint32_t > defaultChunkOffsets
Table of chunk offsets.
Definition M4ACommonDemuxer.h:278

audio_tools::M4ACommonDemuxer::SampleExtractor::defaultSampleSizes
SingleBuffer< stsz_sample_size_t > defaultSampleSizes
Table of sample sizes.
Definition M4ACommonDemuxer.h:277

audio_tools::M4ACommonDemuxer::SampleExtractor::getChunkOffsetsBuffer
BaseBuffer< uint32_t > & getChunkOffsetsBuffer()
Returns the buffer of chunk offsets.
Definition M4ACommonDemuxer.h:216

audio_tools::M4ACommonDemuxer::SampleExtractor::current_size
size_t current_size
Current sample size.
Definition M4ACommonDemuxer.h:288

audio_tools::M4ACommonDemuxer::SampleExtractor::buffer
SingleBuffer< uint8_t > buffer
Buffer for accumulating sample data.
Definition M4ACommonDemuxer.h:285

audio_tools::M4ACommonDemuxer::SampleExtractor::begin
void begin()
Resets the extractor state.
Definition M4ACommonDemuxer.h:122

audio_tools::M4ACommonDemuxer::SampleExtractor::box_size
size_t box_size
Size of the box that is currently processed (e.g. mdat), as set via setMaxSize().
Definition M4ACommonDemuxer.h:289

audio_tools::M4ACommonDemuxer::SampleExtractor::getSampleSizesBuffer
BaseBuffer< stsz_sample_size_t > & getSampleSizesBuffer()
Returns the buffer of sample sizes.
Definition M4ACommonDemuxer.h:200

audio_tools::M4ACommonDemuxer::SampleExtractor::setCallback
void setCallback(FrameCallback cb)
Sets the callback to be called for each extracted frame.
Definition M4ACommonDemuxer.h:137

audio_tools::M4ACommonDemuxer::SampleExtractor::getFrame
Frame getFrame(size_t size, SingleBuffer< uint8_t > &buffer)
Constructs a Frame object for the current codec.
Definition M4ACommonDemuxer.h:243

audio_tools::M4ACommonDemuxer::SampleExtractor::setReference
void setReference(void *r)
Sets a reference pointer passed to the callback.
Definition M4ACommonDemuxer.h:143

audio_tools::M4ACommonDemuxer::SampleExtractor::fixed_sample_size
uint32_t fixed_sample_size
Fixed sample size (if used).
Definition M4ACommonDemuxer.h:286

audio_tools::M4ACommonDemuxer::SampleExtractor::setChunkOffsetsBuffer
void setChunkOffsetsBuffer(BaseBuffer< uint32_t > &buffer)
Sets the buffer to use for chunk offsets.
Definition M4ACommonDemuxer.h:222

audio_tools::M4ACommonDemuxer::SampleExtractor::fixed_sample_count
uint32_t fixed_sample_count
Fixed sample count (if used).
Definition M4ACommonDemuxer.h:287

audio_tools::M4ACommonDemuxer::SampleExtractor::setMaxSize
void setMaxSize(size_t size)
Sets the maximum box size (e.g., for mdat). This is called before the mdat data is posted....
Definition M4ACommonDemuxer.h:151

audio_tools::M4ACommonDemuxer
Abstract base class for M4A/MP4 demuxers. Provides shared functionality for both file-based and strea...
Definition M4ACommonDemuxer.h:23

audio_tools::M4ACommonDemuxer::parser
MP4Parser parser
Underlying MP4 parser.
Definition M4ACommonDemuxer.h:437

audio_tools::M4ACommonDemuxer::setAACConfig
void setAACConfig(int profile, int srIdx, int chCfg)
Sets the AAC configuration for ADTS header generation.
Definition M4ACommonDemuxer.h:404

audio_tools::M4ACommonDemuxer::sample_count
uint32_t sample_count
Number of samples in stsz.
Definition M4ACommonDemuxer.h:443

audio_tools::M4ACommonDemuxer::onEsds
void onEsds(const MP4Parser::Box &box)
Handles the esds (Elementary Stream Descriptor) box.
Definition M4ACommonDemuxer.h:530

audio_tools::M4ACommonDemuxer::setCallback
virtual void setCallback(FrameCallback cb)
Sets the callback for extracted audio frames.
Definition M4ACommonDemuxer.h:372

audio_tools::M4ACommonDemuxer::sampleExtractor
SampleExtractor sampleExtractor
Extractor for audio samples.
Definition M4ACommonDemuxer.h:435

audio_tools::M4ACommonDemuxer::setSampleSizesBuffer
void setSampleSizesBuffer(BaseBuffer< stsz_sample_size_t > &buffer)
Sets the buffer to use for sample sizes.
Definition M4ACommonDemuxer.h:377

audio_tools::M4ACommonDemuxer::getSampleCount
uint32_t getSampleCount() const
samples in stsz
Definition M4ACommonDemuxer.h:427

audio_tools::M4ACommonDemuxer::onAlac
void onAlac(const MP4Parser::Box &box)
Handles the alac box.
Definition M4ACommonDemuxer.h:585

audio_tools::M4ACommonDemuxer::onStsz
void onStsz(MP4Parser::Box &box)
Handles the stsz (Sample Size) box.
Definition M4ACommonDemuxer.h:603

audio_tools::M4ACommonDemuxer::onMp4a
void onMp4a(const MP4Parser::Box &box)
Handles the mp4a box.
Definition M4ACommonDemuxer.h:507

audio_tools::M4ACommonDemuxer::readU32
static uint32_t readU32(const uint8_t *p)
Reads a 32-bit big-endian unsigned integer from a buffer.
Definition M4ACommonDemuxer.h:453

audio_tools::M4ACommonDemuxer::buffer
SingleBuffer< uint8_t > buffer
Buffer for incremental data.
Definition M4ACommonDemuxer.h:442

audio_tools::M4ACommonDemuxer::default_size
size_t default_size
Default buffer size.
Definition M4ACommonDemuxer.h:446

audio_tools::M4ACommonDemuxer::stsz_processed
bool stsz_processed
Marks the stsz table as processed.
Definition M4ACommonDemuxer.h:438

audio_tools::M4ACommonDemuxer::checkType
bool checkType(uint8_t *buffer, const char *type, int offset)
Checks if the buffer at the given offset matches the specified type.
Definition M4ACommonDemuxer.h:476

audio_tools::M4ACommonDemuxer::getStszFileOffset
uint32_t getStszFileOffset() const
File offset of stsz box.
Definition M4ACommonDemuxer.h:422

audio_tools::M4ACommonDemuxer::setChunkOffsetsBuffer
void setChunkOffsetsBuffer(BaseBuffer< uint32_t > &buffer)
Sets the buffer to use for chunk offsets.
Definition M4ACommonDemuxer.h:384

audio_tools::M4ACommonDemuxer::stco_processed
bool stco_processed
Marks the stco table as processed.
Definition M4ACommonDemuxer.h:439

audio_tools::MP4Parser
MP4Parser is a class that parses MP4 container files and extracts boxes (atoms). It provides a callba...
Definition MP4Parser.h:28

audio_tools::MP4Parser::defaultCallback
static void defaultCallback(const Box &box, void *ref)
Default callback that prints box information to Serial.
Definition MP4Parser.h:223

audio_tools::MP4Parser::begin
bool begin()
Initializes the parser.
Definition MP4Parser.h:107

audio_tools::MP4Parser::parseString
int parseString(const uint8_t *str, int len, int fileOffset=0, int level=0)
Trigger separate parsing (and callbacks) on the indicated string.
Definition MP4Parser.h:170

audio_tools::MP4Parser::findBox
bool findBox(const char *name, const uint8_t *data, size_t len, Box &result)
find box in box
Definition MP4Parser.h:197

audio_tools::SingleBuffer
A simple Buffer implementation which just uses a (dynamically sized) array.
Definition Buffers.h:172

audio_tools::SingleBuffer::trim
void trim()
Moves the unprocessed data to the beginning of the buffer.
Definition Buffers.h:260

audio_tools::SingleBuffer::write
bool write(T sample) override
write add an entry to the buffer
Definition Buffers.h:202

audio_tools::SingleBuffer::available
int available() override
provides the number of entries that are available to read
Definition Buffers.h:229

audio_tools::SingleBuffer::resize
bool resize(int size)
Resizes the buffer if supported: returns false if not supported.
Definition Buffers.h:292

audio_tools::SingleBuffer::writeArray
int writeArray(const T data[], int len) override
Fills the buffer data.
Definition Buffers.h:197

audio_tools::SingleBuffer::data
T * data()
Provides address of actual data.
Definition Buffers.h:271

audio_tools::Vector
Vector implementation which provides the most important methods as defined by std::vector....
Definition Vector.h:21

audio_tools
Generic Implementation of sound input and output for desktop environments using portaudio.
Definition AudioCodecsBase.h:10

audio_tools::stsz_sample_size_t
uint16_t stsz_sample_size_t
Definition M4ACommonDemuxer.h:17

audio_tools::M4ACommonDemuxer::ESDSParser
A parser for the ESDS segment to extract the relevant aac information.
Definition M4ACommonDemuxer.h:47

audio_tools::M4ACommonDemuxer::Frame
Definition M4ACommonDemuxer.h:27

audio_tools::M4ACommonDemuxer::M4AAudioConfig
Definition M4ACommonDemuxer.h:34

audio_tools::M4ACommonDemuxer::M4AAudioConfig::alacMagicCookie
Vector< uint8_t > alacMagicCookie
ALAC codec config.
Definition M4ACommonDemuxer.h:39

audio_tools::M4ACommonDemuxer::M4AAudioConfig::channelCfg
int channelCfg
AAC config.
Definition M4ACommonDemuxer.h:37

audio_tools::M4ACommonDemuxer::M4AAudioConfig::codec
Codec codec
Current codec.
Definition M4ACommonDemuxer.h:35

audio_tools::MP4Parser::Box
Represents an individual box in the MP4 file.
Definition MP4Parser.h:33

audio_tools::MP4Parser::Box::data
const uint8_t * data
Pointer to box payload (not including header)
Definition MP4Parser.h:40

audio_tools::MP4Parser::Box::available
int available
Number of bytes available as data.
Definition MP4Parser.h:47

audio_tools::MP4Parser::Box::file_offset
uint64_t file_offset
File offset where box starts.
Definition MP4Parser.h:46

audio_tools::MP4Parser::Box::size
size_t size
Size of payload including subboxes (not including header)
Definition MP4Parser.h:43

audio_tools::MP4Parser::Box::is_complete
bool is_complete
True if the box data is complete.
Definition MP4Parser.h:48

audio_tools::MP4Parser::Box::seq
size_t seq
Sequence number for the box per id.
Definition MP4Parser.h:38

audio_tools::MP4Parser::Box::type
char type[5]
4-character box type (null-terminated)
Definition MP4Parser.h:39

audio_tools::MP4Parser::Box::level
int level
Nesting depth.
Definition MP4Parser.h:45

audio_tools::MP4Parser::Box::data_size
size_t data_size
Size of payload (not including header)
Definition MP4Parser.h:42