packetizer: mpeg4: move audio configs parsing to header

1 year ago · 50a4eb3d42
3 changed files with 575 additions and 573 deletions
--- a/modules/codec/faad.c
+++ b/modules/codec/faad.c
@ -157,7 +157,7 @@ static int Open( vlc_object_t *p_this )
        p_dec->fmt_out.audio.i_rate = i_rate;
        p_dec->fmt_out.audio.i_channels = i_channels;
        p_dec->fmt_out.audio.i_physical_channels
-            = mpeg4_asc_channelsbyindex[i_channels];
+            = MPEG4_asc_channelsbyindex[i_channels];
        date_Init( &p_sys->date, i_rate, 1 );
    }
    else
@ -328,7 +328,7 @@ static int DecodeBlock( decoder_t *p_dec, block_t *p_block )
        p_dec->fmt_out.audio.i_rate = i_rate;
        p_dec->fmt_out.audio.i_channels = i_channels;
        p_dec->fmt_out.audio.i_physical_channels
-            = mpeg4_asc_channelsbyindex[i_channels];
+            = MPEG4_asc_channelsbyindex[i_channels];
        date_Init( &p_sys->date, i_rate, 1 );
    }

@ -399,7 +399,7 @@ static int DecodeBlock( decoder_t *p_dec, block_t *p_block )
                    p_dec->fmt_out.audio.i_rate = i_rate;
                    p_dec->fmt_out.audio.i_channels = i_channels;
                    p_dec->fmt_out.audio.i_physical_channels
-                        = mpeg4_asc_channelsbyindex[i_channels];
+                        = MPEG4_asc_channelsbyindex[i_channels];
                    date_Init( &p_sys->date, i_rate, 1 );
                }
            }
--- a/modules/packetizer/mpeg4audio.c
+++ b/modules/packetizer/mpeg4audio.c
@ -57,62 +57,6 @@
 /*****************************************************************************
 * decoder_sys_t : decoder descriptor
 *****************************************************************************/
-typedef struct
-{
-    enum mpeg4_audioObjectType i_object_type;
-    unsigned i_samplerate;
-    uint8_t i_channel_configuration;
-    int8_t i_sbr;          // 0: no sbr, 1: sbr, -1: unknown
-    int8_t i_ps;           // 0: no ps,  1: ps,  -1: unknown
-
-    struct
-    {
-        enum mpeg4_audioObjectType i_object_type;
-        unsigned i_samplerate;
-        uint8_t i_channel_configuration;
-    } extension;
-
-    /* GASpecific */
-    unsigned i_frame_length;   // 1024 or 960
-
-} mpeg4_asc_t;
-
-#define LATM_MAX_EXTRA_SIZE 64
-typedef struct
-{
-    uint8_t i_program;
-    uint8_t i_layer;
-
-    unsigned i_frame_length;         // type 1
-    uint8_t i_frame_length_type;
-    uint8_t i_frame_length_index;   // type 3 4 5 6 7
-
-    mpeg4_asc_t cfg;
-
-    /* Raw configuration */
-    size_t i_extra;
-    uint8_t extra[LATM_MAX_EXTRA_SIZE];
-
-} latm_stream_t;
-
-#define LATM_MAX_LAYER (8)
-#define LATM_MAX_PROGRAM (16)
-typedef struct
-{
-    bool b_same_time_framing;
-    uint8_t i_sub_frames;
-    uint8_t i_programs;
-
-    uint8_t pi_layers[LATM_MAX_PROGRAM];
-
-    uint8_t pi_stream[LATM_MAX_PROGRAM][LATM_MAX_LAYER];
-
-    uint8_t i_streams;
-    latm_stream_t stream[LATM_MAX_PROGRAM*LATM_MAX_LAYER];
-
-    uint32_t i_other_data;
-    int16_t  i_crc;  /* -1 if not set */
-} latm_mux_t;

 typedef struct
 {
@ -140,7 +84,7 @@ typedef struct

    /* LOAS */
    bool b_latm_cfg;
-    latm_mux_t latm;
+    MPEG4_streammux_config_t latm;

    int i_warnings;
 } decoder_sys_t;
@ -167,13 +111,6 @@ enum {
    TYPE_LOAS
 };

-static const int pi_sample_rates[16] =
-{
-    96000, 88200, 64000, 48000, 44100, 32000, 24000, 22050,
-    16000, 12000, 11025, 8000,  7350,  0,     0,     0
-};
-
-
 static int ChannelConfigurationToVLC(uint8_t i_channel)
 {
    if (i_channel == 7)
@ -187,17 +124,17 @@ static int AOTtoAACProfile(uint8_t i_object_type)
 {
    switch(i_object_type)
    {
-        case AOT_AAC_MAIN:
-        case AOT_AAC_LC:
-        case AOT_AAC_SSR:
-        case AOT_AAC_LTP:
-        case AOT_AAC_SBR:
-        case AOT_AAC_SC:
-        case AOT_ER_AAC_LD:
-        case AOT_AAC_PS:
-        case AOT_ER_AAC_ELD:
+        case MPEG4_AOT_AAC_MAIN:
+        case MPEG4_AOT_AAC_LC:
+        case MPEG4_AOT_AAC_SSR:
+        case MPEG4_AOT_AAC_LTP:
+        case MPEG4_AOT_AAC_SBR:
+        case MPEG4_AOT_AAC_SC:
+        case MPEG4_AOT_ER_AAC_LD:
+        case MPEG4_AOT_AAC_PS:
+        case MPEG4_AOT_ER_AAC_ELD:
            {
-            static_assert(AOT_AAC_MAIN == AAC_PROFILE_MAIN + 1,
+            static_assert(MPEG4_AOT_AAC_MAIN == AAC_PROFILE_MAIN + 1,
                          "invalid profile to object mapping");
            return i_object_type - 1;
            }
@ -218,8 +155,6 @@ static void ClosePacketizer(vlc_object_t *);
 static block_t *Packetize    (decoder_t *, block_t **);
 static void     Flush( decoder_t * );

-static int Mpeg4ReadAudioSpecificConfig(bs_t *s, mpeg4_asc_t *p_cfg, bool);
-
 /*****************************************************************************
 * Module descriptor
 *****************************************************************************/
@ -299,10 +234,10 @@ static int OpenPacketizer(vlc_object_t *p_this)

    if(p_dec->fmt_in->i_extra)
    {
-        mpeg4_asc_t asc;
+        MPEG4_asc_t asc;
        bs_t s;
        bs_init(&s, p_dec->fmt_in->p_extra, p_dec->fmt_in->i_extra);
-        if(Mpeg4ReadAudioSpecificConfig(&s, &asc, true) == VLC_SUCCESS)
+        if(MPEG4_read_AudioSpecificConfig(&s, &asc, true) == VLC_SUCCESS)
        {
            p_dec->fmt_out.audio.i_rate = asc.i_samplerate;
            p_dec->fmt_out.audio.i_frame_length = asc.i_frame_length;
@ -493,443 +428,6 @@ static int LOASSyncInfo(uint8_t p_header[LOAS_HEADER_SIZE], unsigned int *pi_hea
    return ((p_header[1] & 0x1f) << 8) + p_header[2];
 }

-static int Mpeg4GAProgramConfigElement(bs_t *s)
-{
-    /* TODO compute channels count ? */
-    int i_tag = bs_read(s, 4);
-    if (i_tag != 0x05)
-        return -1;
-    bs_skip(s, 2 + 4); // object type + sampling index
-    int i_num_front = bs_read(s, 4);
-    int i_num_side = bs_read(s, 4);
-    int i_num_back = bs_read(s, 4);
-    int i_num_lfe = bs_read(s, 2);
-    int i_num_assoc_data = bs_read(s, 3);
-    int i_num_valid_cc = bs_read(s, 4);
-
-    if (bs_read1(s))
-        bs_skip(s, 4); // mono downmix
-    if (bs_read1(s))
-        bs_skip(s, 4); // stereo downmix
-    if (bs_read1(s))
-        bs_skip(s, 2+1); // matrix downmix + pseudo_surround
-
-    bs_skip(s, i_num_front * (1+4));
-    bs_skip(s, i_num_side * (1+4));
-    bs_skip(s, i_num_back * (1+4));
-    bs_skip(s, i_num_lfe * (4));
-    bs_skip(s, i_num_assoc_data * (4));
-    bs_skip(s, i_num_valid_cc * (5));
-    bs_align(s);
-    int i_comment = bs_read(s, 8);
-    bs_skip(s, i_comment * 8);
-    return 0;
-}
-
-static int Mpeg4GASpecificConfig(mpeg4_asc_t *p_cfg, bs_t *s)
-{
-    p_cfg->i_frame_length = bs_read1(s) ? 960 : 1024;
-    if(p_cfg->i_object_type == AOT_ER_AAC_LD) /* 14496-3 4.5.1.1 */
-        p_cfg->i_frame_length >>= 1;
-    else if(p_cfg->i_object_type == AOT_AAC_SSR)
-        p_cfg->i_frame_length = 256;
-
-    if (bs_read1(s))     // depend on core coder
-        bs_skip(s, 14);   // core coder delay
-
-    int i_extension_flag = bs_read1(s);
-    if (p_cfg->i_channel_configuration == 0)
-        Mpeg4GAProgramConfigElement(s);
-    if (p_cfg->i_object_type == AOT_AAC_SC ||
-        p_cfg->i_object_type == AOT_ER_AAC_SC)
-        bs_skip(s, 3);    // layer
-
-    if (i_extension_flag) {
-        if (p_cfg->i_object_type == AOT_ER_BSAC)
-            bs_skip(s, 5 + 11);   // numOfSubFrame + layer length
-        if (p_cfg->i_object_type == AOT_ER_AAC_LC ||
-            p_cfg->i_object_type == AOT_ER_AAC_LTP ||
-            p_cfg->i_object_type == AOT_ER_AAC_SC ||
-            p_cfg->i_object_type == AOT_ER_AAC_LD)
-            bs_skip(s, 1+1+1);    // ER data : section scale spectral */
-        if (bs_read1(s))     // extension 3
-            fprintf(stderr, "Mpeg4GASpecificConfig: error 1\n");
-    }
-    return 0;
-}
-
-static int Mpeg4ELDSpecificConfig(mpeg4_asc_t *p_cfg, bs_t *s)
-{
-    p_cfg->i_frame_length = bs_read1(s) ? 480 : 512;
-
-    /* ELDSpecificConfig Table 4.180 */
-
-    bs_skip(s, 3);
-    if(bs_read1(s)) /* ldSbrPresentFlag */
-    {
-        bs_skip(s, 2);
-        /* ld_sbr_header(channelConfiguration) Table 4.181 */
-        unsigned numSbrHeader;
-        switch(p_cfg->i_channel_configuration)
-        {
-            case 1: case 2:
-                numSbrHeader = 1;
-                break;
-            case 3:
-                numSbrHeader = 2;
-                break;
-            case 4: case 5: case 6:
-                numSbrHeader = 3;
-                break;
-            case 7:
-                numSbrHeader = 4;
-                break;
-            default:
-                numSbrHeader = 0;
-                break;
-        }
-        for( ; numSbrHeader; numSbrHeader-- )
-        {
-            /* sbr_header() Table 4.63 */
-            bs_read(s, 14);
-            bool header_extra_1 = bs_read1(s);
-            bool header_extra_2 = bs_read1(s);
-            if(header_extra_1)
-                bs_read(s, 5);
-            if(header_extra_2)
-                bs_read(s, 6);
-        }
-    }
-
-    for(unsigned eldExtType = bs_read(s, 4);
-        eldExtType != 0x0 /* ELDEXT_TERM */;
-        eldExtType = bs_read(s, 4))
-    {
-        unsigned eldExtLen = bs_read(s, 4);
-        unsigned eldExtLenAdd = 0;
-        if(eldExtLen == 15)
-        {
-            eldExtLenAdd = bs_read(s, 8);
-            eldExtLen += eldExtLenAdd;
-        }
-        if(eldExtLenAdd == 255)
-            eldExtLen += bs_read(s, 16);
-        /* reserved extensions */
-        for(; eldExtLen; eldExtLen--)
-            bs_skip(s, 8);
-    }
-
-    return 0;
-}
-
-static enum mpeg4_audioObjectType Mpeg4ReadAudioObjectType(bs_t *s)
-{
-    int i_type = bs_read(s, 5);
-    if (i_type == 31)
-        i_type = 32 + bs_read(s, 6);
-    return i_type;
-}
-
-static unsigned Mpeg4ReadAudioSamplerate(bs_t *s)
-{
-    int i_index = bs_read(s, 4);
-    if (i_index != 0x0f)
-        return pi_sample_rates[i_index];
-    return bs_read(s, 24);
-}
-
-static int Mpeg4ReadAudioSpecificConfig(bs_t *s, mpeg4_asc_t *p_cfg, bool b_withext)
-{
-    p_cfg->i_object_type = Mpeg4ReadAudioObjectType(s);
-    p_cfg->i_samplerate = Mpeg4ReadAudioSamplerate(s);
-    p_cfg->i_channel_configuration = bs_read(s, 4);
-
-    p_cfg->i_sbr = -1;
-    p_cfg->i_ps  = -1;
-    p_cfg->extension.i_object_type = 0;
-    p_cfg->extension.i_samplerate = 0;
-    p_cfg->extension.i_channel_configuration = 0;
-    p_cfg->i_frame_length = 0;
-
-    if (p_cfg->i_object_type == AOT_AAC_SBR ||
-        p_cfg->i_object_type == AOT_AAC_PS) {
-        p_cfg->i_sbr = 1;
-        if (p_cfg->i_object_type == AOT_AAC_PS)
-           p_cfg->i_ps = 1;
-        p_cfg->extension.i_object_type = AOT_AAC_SBR;
-        p_cfg->extension.i_samplerate = Mpeg4ReadAudioSamplerate(s);
-
-        p_cfg->i_object_type = Mpeg4ReadAudioObjectType(s);
-        if(p_cfg->i_object_type == AOT_ER_BSAC)
-            p_cfg->extension.i_channel_configuration = bs_read(s, 4);
-    }
-
-    switch(p_cfg->i_object_type)
-    {
-    case AOT_AAC_MAIN:
-    case AOT_AAC_LC:
-    case AOT_AAC_SSR:
-    case AOT_AAC_LTP:
-    case AOT_AAC_SC:
-    case AOT_TWINVQ:
-    case AOT_ER_AAC_LC:
-    case AOT_ER_AAC_LTP:
-    case AOT_ER_AAC_SC:
-    case AOT_ER_TWINVQ:
-    case AOT_ER_BSAC:
-    case AOT_ER_AAC_LD:
-        Mpeg4GASpecificConfig(p_cfg, s);
-        break;
-    case AOT_CELP:
-        // CelpSpecificConfig();
-    case AOT_HVXC:
-        // HvxcSpecificConfig();
-    case AOT_TTSI:
-        // TTSSSpecificConfig();
-    case AOT_MAIN_SYNTHETIC:
-    case AOT_WAVETABLES:
-    case AOT_GENERAL_MIDI:
-    case AOT_ALGORITHMIC:
-        // StructuredAudioSpecificConfig();
-    case AOT_ER_CELP:
-        // ERCelpSpecificConfig();
-    case AOT_ER_HXVC:
-        // ERHvxcSpecificConfig();
-    case AOT_ER_HILN:
-    case AOT_ER_Parametric:
-        // ParametricSpecificConfig();
-    case AOT_SSC:
-        // SSCSpecificConfig();
-    case AOT_LAYER1:
-    case AOT_LAYER2:
-    case AOT_LAYER3:
-        // MPEG_1_2_SpecificConfig();
-    case AOT_DST:
-        // DSTSpecificConfig();
-    case AOT_ALS:
-        // ALSSpecificConfig();
-    case AOT_SLS:
-    case AOT_SLS_NON_CORE:
-        // SLSSpecificConfig();
-    case AOT_ER_AAC_ELD:
-        Mpeg4ELDSpecificConfig(p_cfg, s);
-        break;
-    case AOT_SMR_SIMPLE:
-    case AOT_SMR_MAIN:
-        // SymbolicMusicSpecificConfig();
-    default:
-        // error
-        return VLC_EGENERIC;
-    }
-
-    switch(p_cfg->i_object_type)
-    {
-    case AOT_ER_AAC_LC:
-    case AOT_ER_AAC_LTP:
-    case AOT_ER_AAC_SC:
-    case AOT_ER_TWINVQ:
-    case AOT_ER_BSAC:
-    case AOT_ER_AAC_LD:
-    case AOT_ER_CELP:
-    case AOT_ER_HXVC:
-    case AOT_ER_HILN:
-    case AOT_ER_Parametric:
-    case AOT_ER_AAC_ELD:
-    {
-        int epConfig = bs_read(s, 2);
-        if (epConfig == 2 || epConfig == 3)
-            //ErrorProtectionSpecificConfig();
-        if (epConfig == 3)
-            if (bs_read1(s)) {
-                // TODO : directMapping
-            }
-        break;
-    }
-    default:
-        break;
-    }
-
-    if (b_withext && p_cfg->extension.i_object_type != AOT_AAC_SBR &&
-        !bs_eof(s) && bs_read(s, 11) == 0x2b7)
-    {
-        p_cfg->extension.i_object_type = Mpeg4ReadAudioObjectType(s);
-        if (p_cfg->extension.i_object_type == AOT_AAC_SBR)
-        {
-            p_cfg->i_sbr  = bs_read1(s);
-            if (p_cfg->i_sbr == 1) {
-                p_cfg->extension.i_samplerate = Mpeg4ReadAudioSamplerate(s);
-                if (bs_read(s, 11) == 0x548)
-                   p_cfg->i_ps = bs_read1(s);
-            }
-        }
-        else if (p_cfg->extension.i_object_type == AOT_ER_BSAC)
-        {
-            p_cfg->i_sbr  = bs_read1(s);
-            if(p_cfg->i_sbr)
-                p_cfg->extension.i_samplerate = Mpeg4ReadAudioSamplerate(s);
-            p_cfg->extension.i_channel_configuration = bs_read(s, 4);
-        }
-    }
-
-#if 0
-    static const char *ppsz_otype[] = {
-        "NULL",
-        "AAC Main", "AAC LC", "AAC SSR", "AAC LTP", "SBR", "AAC Scalable",
-        "TwinVQ",
-        "CELP", "HVXC",
-        "Reserved", "Reserved",
-        "TTSI",
-        "Main Synthetic", "Wavetables Synthesis", "General MIDI",
-        "Algorithmic Synthesis and Audio FX",
-        "ER AAC LC",
-        "Reserved",
-        "ER AAC LTP", "ER AAC Scalable", "ER TwinVQ", "ER BSAC", "ER AAC LD",
-        "ER CELP", "ER HVXC", "ER HILN", "ER Parametric",
-        "SSC",
-        "PS", "MPEG Surround", "Escape",
-        "Layer 1", "Layer 2", "Layer 3",
-        "DST", "ALS", "SLS", "SLS non-core", "ELD",
-        "SMR Simple", "SMR Main",
-    };
-
-    fprintf(stderr, "Mpeg4ReadAudioSpecificInfo: t=%s(%d)f=%d c=%d sbr=%d\n",
-            ppsz_otype[p_cfg->i_object_type], p_cfg->i_object_type,
-            p_cfg->i_samplerate, p_cfg->i_channel, p_cfg->i_sbr);
-#endif
-    return bs_error(s) ? VLC_EGENERIC : VLC_SUCCESS;
-}
-
-static uint32_t LatmGetValue(bs_t *s)
-{
-    uint32_t v = 0;
-    for (int i = 1 + bs_read(s, 2); i > 0; i--)
-        v = (v << 8) + bs_read(s, 8);
-    return v;
-}
-
-static size_t AudioSpecificConfigBitsToBytes(bs_t *s, uint32_t i_bits, uint8_t *p_data)
-{
-    size_t i_extra = __MIN((i_bits + 7) / 8, LATM_MAX_EXTRA_SIZE);
-    for (size_t i = 0; i < i_extra; i++) {
-        const uint32_t i_read = __MIN(8, i_bits - 8*i);
-        p_data[i] = bs_read(s, i_read) << (8-i_read);
-    }
-    return i_extra;
-}
-
-static int LatmReadStreamMuxConfiguration(latm_mux_t *m, bs_t *s)
-{
-    int i_mux_version;
-    int i_mux_versionA;
-
-    i_mux_version = bs_read(s, 1);
-    i_mux_versionA = 0;
-    if (i_mux_version)
-        i_mux_versionA = bs_read(s, 1);
-
-    if (i_mux_versionA != 0) /* support only A=0 */
-        return -1;
-
-    memset(m, 0, sizeof(*m));
-
-    if (i_mux_versionA == 0)
-        if (i_mux_version == 1)
-            LatmGetValue(s); /* taraBufferFullness */
-
-    if(bs_eof(s))
-        return -1;
-
-    m->b_same_time_framing = bs_read1(s);
-    m->i_sub_frames = 1 + bs_read(s, 6);
-    m->i_programs = 1 + bs_read(s, 4);
-
-    for (uint8_t i_program = 0; i_program < m->i_programs; i_program++) {
-        if(bs_eof(s))
-            return -1;
-        m->pi_layers[i_program] = 1+bs_read(s, 3);
-
-        for (uint8_t i_layer = 0; i_layer < m->pi_layers[i_program]; i_layer++) {
-            latm_stream_t *st = &m->stream[m->i_streams];
-            bool b_previous_cfg;
-
-            m->pi_stream[i_program][i_layer] = m->i_streams;
-            st->i_program = i_program;
-            st->i_layer = i_layer;
-
-            b_previous_cfg = false;
-            if (i_program != 0 || i_layer != 0)
-                b_previous_cfg = bs_read1(s);
-
-            if (b_previous_cfg) {
-                assert(m->i_streams > 0);
-                st->cfg = m->stream[m->i_streams-1].cfg;
-            } else {
-                uint32_t asc_size = 0;
-                if(i_mux_version > 0)
-                    asc_size = LatmGetValue(s);
-                bs_t asc_bs = *s;
-                Mpeg4ReadAudioSpecificConfig(&asc_bs, &st->cfg, i_mux_version > 0);
-                if (i_mux_version == 0)
-                    asc_size = bs_pos(&asc_bs) - bs_pos(s);
-                asc_bs = *s;
-                st->i_extra = AudioSpecificConfigBitsToBytes(&asc_bs, asc_size, st->extra);
-                bs_skip(s, asc_size);
-            }
-
-            st->i_frame_length_type = bs_read(s, 3);
-            switch(st->i_frame_length_type)
-            {
-            case 0:
-            {
-                bs_skip(s, 8); /* latmBufferFullnes */
-                if (!m->b_same_time_framing)
-                    if (st->cfg.i_object_type == AOT_AAC_SC ||
-                        st->cfg.i_object_type == AOT_CELP ||
-                        st->cfg.i_object_type == AOT_ER_AAC_SC ||
-                        st->cfg.i_object_type == AOT_ER_CELP)
-                        bs_skip(s, 6); /* eFrameOffset */
-                break;
-            }
-            case 1:
-                st->i_frame_length = bs_read(s, 9);
-                break;
-            case 3: case 4: case 5:
-                st->i_frame_length_index = bs_read(s, 6); // celp
-                break;
-            case 6: case 7:
-                st->i_frame_length_index = bs_read(s, 1); // hvxc
-            default:
-                break;
-            }
-            /* Next stream */
-            m->i_streams++;
-        }
-    }
-
-    if(bs_error(s) || bs_eof(s))
-        return -1;
-
-    /* other data */
-    if (bs_read1(s)) {
-        if (i_mux_version == 1)
-            m->i_other_data = LatmGetValue(s);
-        else {
-            int b_continue;
-            do {
-                b_continue = bs_read1(s);
-                m->i_other_data = (m->i_other_data << 8) + bs_read(s, 8);
-            } while (b_continue);
-        }
-    }
-
-    /* crc */
-    m->i_crc = -1;
-    if (bs_read1(s))
-        m->i_crc = bs_read(s, 8);
-
-    return bs_error(s) ? -1 : 0;
-}
-
 static int LOASParse(decoder_t *p_dec, uint8_t *p_buffer, int i_buffer)
 {
    decoder_sys_t *p_sys = p_dec->p_sys;
@ -939,9 +437,9 @@ static int LOASParse(decoder_t *p_dec, uint8_t *p_buffer, int i_buffer)
    bs_init(&s, p_buffer, i_buffer);

    /* Read the stream mux configuration if present */
-    if (!bs_read1(&s) && !LatmReadStreamMuxConfiguration(&p_sys->latm, &s) &&
+    if (!bs_read1(&s) && !MPEG4_parse_StreamMuxConfig(&s, &p_sys->latm) &&
            p_sys->latm.i_streams > 0) {
-        const latm_stream_t *st = &p_sys->latm.stream[0];
+        const MPEG4_audio_stream_t *st = &p_sys->latm.stream[0];

        if(st->cfg.i_samplerate == 0 || st->cfg.i_frame_length == 0 ||
           ChannelConfigurationToVLC(st->cfg.i_channel_configuration) == 0)
@ -996,12 +494,12 @@ static int LOASParse(decoder_t *p_dec, uint8_t *p_buffer, int i_buffer)
        msg_Err(p_dec, "latm sub frames not yet supported, please send a sample");

    for (uint8_t i_sub = 0; i_sub < p_sys->latm.i_sub_frames; i_sub++) {
-        unsigned pi_payload[LATM_MAX_PROGRAM][LATM_MAX_LAYER];
+        unsigned pi_payload[MPEG4_STREAMMUX_MAX_PROGRAM][MPEG4_STREAMMUX_MAX_LAYER];
        if (p_sys->latm.b_same_time_framing) {
            /* Payload length */
            for (uint8_t i_program = 0; i_program < p_sys->latm.i_programs; i_program++) {
                for (uint8_t i_layer = 0; i_layer < p_sys->latm.pi_layers[i_program]; i_layer++) {
-                    latm_stream_t *st = &p_sys->latm.stream[p_sys->latm.pi_stream[i_program][i_layer]];
+                    MPEG4_audio_stream_t *st = &p_sys->latm.stream[p_sys->latm.pi_stream[i_program][i_layer]];
                    if (st->i_frame_length_type == 0) {
                        unsigned i_payload = 0;
                        for (;;) {
@ -1055,7 +553,7 @@ static int LOASParse(decoder_t *p_dec, uint8_t *p_buffer, int i_buffer)

            for (int i_chunk = 0; i_chunk < i_chunks; i_chunk++) {
                const int streamIndex = bs_read(&s, 4);
-                latm_stream_t *st = &p_sys->latm.stream[streamIndex];
+                MPEG4_audio_stream_t *st = &p_sys->latm.stream[streamIndex];
                const int i_program = st->i_program;
                const int i_layer = st->i_layer;

--- a/modules/packetizer/mpeg4audio.h
+++ b/modules/packetizer/mpeg4audio.h
@ -1,7 +1,7 @@
 /*****************************************************************************
- * mpeg4audio.h: MPEG 4 audio definitions
+ * mpeg4audio.h: ISO/IEC 14496-3 audio definitions
 *****************************************************************************
- * Copyright (C) 2001-2017 VLC authors and VideoLAN
+ * Copyright (C) 2001-2024 VLC authors, VideoLAN and VideoLabs
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms of the GNU Lesser General Public License as published by
@ -17,68 +17,71 @@
 * along with this program; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin Street, Fifth Floor, Boston MA 02110-1301, USA.
 *****************************************************************************/
-enum mpeg4_audioObjectType /* ISO/IEC 14496-3:2009 1.5.1 */
+#include <vlc_bits.h>
+
+enum MPEG4_audioObjectType /* ISO/IEC 14496-3:2009 1.5.1 */
 {
-    AOT_AAC_MAIN        = 1,
-    AOT_AAC_LC          = 2,
-    AOT_AAC_SSR         = 3,
-    AOT_AAC_LTP         = 4,
-    AOT_AAC_SBR         = 5,
-    AOT_AAC_SC          = 6,
-    AOT_TWINVQ          = 7,
-    AOT_CELP            = 8,
-    AOT_HVXC            = 9,
-    AOT_RESERVED10      = 10,
-    AOT_RESERVED11      = 11,
-    AOT_TTSI            = 12,
-    AOT_MAIN_SYNTHETIC  = 13,
-    AOT_WAVETABLES      = 14,
-    AOT_GENERAL_MIDI    = 15,
-    AOT_ALGORITHMIC     = 16,
-    AOT_ER_AAC_LC       = 17,
-    AOT_RESERVED18      = 18,
-    AOT_ER_AAC_LTP      = 19,
-    AOT_ER_AAC_SC       = 20,
-    AOT_ER_TWINVQ       = 21,
-    AOT_ER_BSAC         = 22,
-    AOT_ER_AAC_LD       = 23,
-    AOT_ER_CELP         = 24,
-    AOT_ER_HXVC         = 25,
-    AOT_ER_HILN         = 26,
-    AOT_ER_Parametric   = 27,
-    AOT_SSC             = 28,
-    AOT_AAC_PS          = 29,
-    AOT_MPEG_SURROUND   = 30,
-    AOT_ESCAPE          = 31,
-    AOT_LAYER1          = 32,
-    AOT_LAYER2          = 33,
-    AOT_LAYER3          = 34,
-    AOT_DST             = 35,
-    AOT_ALS             = 36,
-    AOT_SLS             = 37,
-    AOT_SLS_NON_CORE    = 38,
-    AOT_ER_AAC_ELD      = 39,
-    AOT_SMR_SIMPLE      = 40,
-    AOT_SMR_MAIN        = 41,
+    MPEG4_AOT_NULL            = 0,
+    MPEG4_AOT_AAC_MAIN        = 1,
+    MPEG4_AOT_AAC_LC          = 2,
+    MPEG4_AOT_AAC_SSR         = 3,
+    MPEG4_AOT_AAC_LTP         = 4,
+    MPEG4_AOT_AAC_SBR         = 5,
+    MPEG4_AOT_AAC_SC          = 6,
+    MPEG4_AOT_TWINVQ          = 7,
+    MPEG4_AOT_CELP            = 8,
+    MPEG4_AOT_HVXC            = 9,
+    MPEG4_AOT_RESERVED10      = 10,
+    MPEG4_AOT_RESERVED11      = 11,
+    MPEG4_AOT_TTSI            = 12,
+    MPEG4_AOT_MAIN_SYNTHETIC  = 13,
+    MPEG4_AOT_WAVETABLES      = 14,
+    MPEG4_AOT_GENERAL_MIDI    = 15,
+    MPEG4_AOT_ALGORITHMIC     = 16,
+    MPEG4_AOT_ER_AAC_LC       = 17,
+    MPEG4_AOT_RESERVED18      = 18,
+    MPEG4_AOT_ER_AAC_LTP      = 19,
+    MPEG4_AOT_ER_AAC_SC       = 20,
+    MPEG4_AOT_ER_TWINVQ       = 21,
+    MPEG4_AOT_ER_BSAC         = 22,
+    MPEG4_AOT_ER_AAC_LD       = 23,
+    MPEG4_AOT_ER_CELP         = 24,
+    MPEG4_AOT_ER_HXVC         = 25,
+    MPEG4_AOT_ER_HILN         = 26,
+    MPEG4_AOT_ER_Parametric   = 27,
+    MPEG4_AOT_SSC             = 28,
+    MPEG4_AOT_AAC_PS          = 29,
+    MPEG4_AOT_MPEG_SURROUND   = 30,
+    MPEG4_AOT_ESCAPE          = 31,
+    MPEG4_AOT_LAYER1          = 32,
+    MPEG4_AOT_LAYER2          = 33,
+    MPEG4_AOT_LAYER3          = 34,
+    MPEG4_AOT_DST             = 35,
+    MPEG4_AOT_ALS             = 36,
+    MPEG4_AOT_SLS             = 37,
+    MPEG4_AOT_SLS_NON_CORE    = 38,
+    MPEG4_AOT_ER_AAC_ELD      = 39,
+    MPEG4_AOT_SMR_SIMPLE      = 40,
+    MPEG4_AOT_SMR_MAIN        = 41,
 };

 enum
 {
-    AAC_PROFILE_MAIN = AOT_AAC_MAIN - 1,
+    AAC_PROFILE_MAIN = MPEG4_AOT_AAC_MAIN - 1,
    AAC_PROFILE_LC,
    AAC_PROFILE_SSR,
    AAC_PROFILE_LTP,
    AAC_PROFILE_HE,
-    AAC_PROFILE_LD   = AOT_ER_AAC_LD - 1,
-    AAC_PROFILE_HEv2 = AOT_AAC_PS - 1,
-    AAC_PROFILE_ELD  = AOT_ER_AAC_ELD - 1,
+    AAC_PROFILE_LD   = MPEG4_AOT_ER_AAC_LD - 1,
+    AAC_PROFILE_HEv2 = MPEG4_AOT_AAC_PS - 1,
+    AAC_PROFILE_ELD  = MPEG4_AOT_ER_AAC_ELD - 1,
    /* Similar shift signaling as avcodec, as signaling should have been
       done in ADTS header. Values defaults to MPEG4 */
    AAC_PROFILE_MPEG2_LC = AAC_PROFILE_LC + 128,
    AAC_PROFILE_MPEG2_HE = AAC_PROFILE_HE + 128,
 };

-static const uint32_t mpeg4_asc_channelsbyindex[] =
+static const uint32_t MPEG4_asc_channelsbyindex[] =
 {
    [0] = 0, /* Set later */

@ -110,4 +113,505 @@ static const uint32_t mpeg4_asc_channelsbyindex[] =
    [8] = 0,
 };

-#define MPEG4_ASC_MAX_INDEXEDPOS ARRAY_SIZE(mpeg4_asc_channelsbyindex)
+#define MPEG4_ASC_MAX_INDEXEDPOS ARRAY_SIZE(MPEG4_asc_channelsbyindex) /* number of entries in MPEG4_asc_channelsbyindex */
+/**
+ * Fields extracted from an AudioSpecificConfig by
+ * MPEG4_read_AudioSpecificConfig().
+ */
+typedef struct
+{
+    enum MPEG4_audioObjectType i_object_type; // when SBR or PS is signalled as the object type, this is the object type read after it
+    unsigned i_samplerate;                    // from the sample rate table, or the explicit 24-bit value
+    uint8_t i_channel_configuration;          // raw 4-bit channel configuration
+    int8_t i_sbr;          // 0: no sbr, 1: sbr, -1: unknown
+    int8_t i_ps;           // 0: no ps,  1: ps,  -1: unknown
+
+    struct
+    {
+        enum MPEG4_audioObjectType i_object_type; // MPEG4_AOT_NULL when no extension was read
+        unsigned i_samplerate;                    // 0 when not read
+        uint8_t i_channel_configuration;          // only read for MPEG4_AOT_ER_BSAC, 0 otherwise
+    } extension;
+
+    /* Set by the GASpecificConfig and ELDSpecificConfig readers, 0 otherwise */
+    unsigned i_frame_length;   // GA: 1024 or 960, halved for ER AAC LD, 256 for AAC SSR; ELD: 512 or 480
+
+} MPEG4_asc_t;
+
+/**
+ * Skips over the program config element of a GASpecificConfig.
+ *
+ * Nothing is stored: the element counts are only used to work out how many
+ * bits have to be skipped.
+ *
+ * Returns -1 when the leading 4-bit tag is not 0x05, 0 otherwise.
+ */
+static inline int MPEG4_read_GAProgramConfigElement(bs_t *s)
+{
+    /* TODO compute channels count ? */
+    if (bs_read(s, 4) != 0x05)
+        return -1;
+
+    bs_skip(s, 2 + 4); /* object type + sampling index */
+
+    /* Element counts, in bitstream order */
+    const int n_front = bs_read(s, 4);
+    const int n_side  = bs_read(s, 4);
+    const int n_back  = bs_read(s, 4);
+    const int n_lfe   = bs_read(s, 2);
+    const int n_assoc = bs_read(s, 3);
+    const int n_cc    = bs_read(s, 4);
+
+    /* mono downmix, stereo downmix, matrix downmix + pseudo_surround:
+     * each one is preceded by a presence bit */
+    const int downmix_bits[] = { 4, 4, 2 + 1 };
+    for (unsigned i = 0; i < sizeof(downmix_bits) / sizeof(downmix_bits[0]); i++)
+    {
+        if (bs_read1(s))
+            bs_skip(s, downmix_bits[i]);
+    }
+
+    /* Per-element descriptors, skipped list by list */
+    const int list_bits[] = {
+        n_front * (1 + 4),
+        n_side  * (1 + 4),
+        n_back  * (1 + 4),
+        n_lfe   * 4,
+        n_assoc * 4,
+        n_cc    * 5,
+    };
+    for (unsigned i = 0; i < sizeof(list_bits) / sizeof(list_bits[0]); i++)
+        bs_skip(s, list_bits[i]);
+
+    /* Byte-aligned comment field: 8-bit length, then that many bytes */
+    bs_align(s);
+    const int comment_bytes = bs_read(s, 8);
+    bs_skip(s, comment_bytes * 8);
+
+    return 0;
+}
+
+/**
+ * Reads a GASpecificConfig for the object type already stored in p_cfg.
+ *
+ * Only p_cfg->i_frame_length is written; every other field of the
+ * configuration is consumed from the bitstream and discarded.
+ * Always returns 0.
+ */
+static inline int MPEG4_read_GASpecificConfig(MPEG4_asc_t *p_cfg, bs_t *s)
+{
+    const enum MPEG4_audioObjectType aot = p_cfg->i_object_type;
+
+    /* Frame length flag, then per-object-type adjustment */
+    unsigned frame_length = bs_read1(s) ? 960 : 1024;
+    switch (aot)
+    {
+    case MPEG4_AOT_ER_AAC_LD: /* 14496-3 4.5.1.1 */
+        frame_length /= 2;
+        break;
+    case MPEG4_AOT_AAC_SSR:
+        frame_length = 256;
+        break;
+    default:
+        break;
+    }
+    p_cfg->i_frame_length = frame_length;
+
+    const int depends_on_core_coder = bs_read1(s);
+    if (depends_on_core_coder)
+        bs_skip(s, 14); /* core coder delay */
+
+    const int has_extension = bs_read1(s);
+
+    if (p_cfg->i_channel_configuration == 0)
+        MPEG4_read_GAProgramConfigElement(s);
+
+    switch (aot)
+    {
+    case MPEG4_AOT_AAC_SC:
+    case MPEG4_AOT_ER_AAC_SC:
+        bs_skip(s, 3); /* layer */
+        break;
+    default:
+        break;
+    }
+
+    if (!has_extension)
+        return 0;
+
+    switch (aot)
+    {
+    case MPEG4_AOT_ER_BSAC:
+        bs_skip(s, 5 + 11); /* numOfSubFrame + layer length */
+        break;
+    case MPEG4_AOT_ER_AAC_LC:
+    case MPEG4_AOT_ER_AAC_LTP:
+    case MPEG4_AOT_ER_AAC_SC:
+    case MPEG4_AOT_ER_AAC_LD:
+        bs_skip(s, 1 + 1 + 1); /* ER data: section, scale, spectral */
+        break;
+    default:
+        break;
+    }
+
+    if (bs_read1(s)) /* extension 3 */
+        fprintf(stderr, "MPEG4GASpecificConfig: error 1\n");
+
+    return 0;
+}
+
+/**
+ * Reads an ELDSpecificConfig (Table 4.180).
+ *
+ * Only p_cfg->i_frame_length (480 or 512) is stored; the low delay SBR
+ * headers and the extension list are consumed and discarded.
+ * Always returns 0.
+ */
+static inline int MPEG4_read_ELDSpecificConfig(MPEG4_asc_t *p_cfg, bs_t *s)
+{
+    /* ld_sbr_header(channelConfiguration) Table 4.181: number of
+     * sbr_header() for channel configurations 0 to 7, none above */
+    const unsigned char sbr_header_count[] = { 0, 1, 1, 2, 3, 3, 3, 4 };
+
+    p_cfg->i_frame_length = bs_read1(s) ? 480 : 512;
+
+    bs_skip(s, 3);
+
+    if (bs_read1(s)) /* ldSbrPresentFlag */
+    {
+        bs_skip(s, 2);
+
+        const uint8_t channel_cfg = p_cfg->i_channel_configuration;
+        unsigned remaining = 0;
+        if (channel_cfg < sizeof(sbr_header_count))
+            remaining = sbr_header_count[channel_cfg];
+
+        while (remaining > 0)
+        {
+            /* sbr_header() Table 4.63 */
+            bs_read(s, 14);
+            const bool has_extra_1 = bs_read1(s);
+            const bool has_extra_2 = bs_read1(s);
+            if (has_extra_1)
+                bs_read(s, 5);
+            if (has_extra_2)
+                bs_read(s, 6);
+            remaining--;
+        }
+    }
+
+    /* Extension list, closed by a zero type (ELDEXT_TERM) */
+    for (;;)
+    {
+        const unsigned ext_type = bs_read(s, 4);
+        if (ext_type == 0x0)
+            break;
+
+        /* 4-bit length, extended by 8 more bits when it reads 15, and by
+         * a further 16 bits when those 8 bits read 255 */
+        unsigned ext_len = bs_read(s, 4);
+        if (ext_len == 15)
+        {
+            const unsigned ext_len_add = bs_read(s, 8);
+            ext_len += ext_len_add;
+            if (ext_len_add == 255)
+                ext_len += bs_read(s, 16);
+        }
+
+        /* reserved extensions: payload is skipped byte by byte */
+        for (unsigned i = 0; i < ext_len; i++)
+            bs_skip(s, 8);
+    }
+
+    return 0;
+}
+
+/**
+ * Reads an audio object type: a 5-bit value, or, when that value is the
+ * escape code 31, 32 plus the following 6-bit value.
+ */
+static inline enum MPEG4_audioObjectType MPEG4_read_AudioObjectType(bs_t *s)
+{
+    const int i_short = bs_read(s, 5);
+    if (i_short != 31)
+        return (enum MPEG4_audioObjectType) i_short;
+
+    const int i_escaped = 32 + bs_read(s, 6);
+    return (enum MPEG4_audioObjectType) i_escaped;
+}
+/* Sample rates looked up by MPEG4_read_AudioSamplerate() from the 4-bit
+ * index it reads. Entries 13 to 15 are 0; index 15 is never looked up,
+ * as that function reads an explicit 24-bit rate instead. */
+static const int pi_sample_rates[16] =
+    {
+        96000, 88200, 64000, 48000, 44100, 32000, 24000, 22050,
+        16000, 12000, 11025, 8000,  7350,  0,     0,     0
+};
+
+/**
+ * Reads a sample rate: a 4-bit index into pi_sample_rates, or, when the
+ * index is 0x0f, an explicit 24-bit value.
+ */
+static inline unsigned MPEG4_read_AudioSamplerate(bs_t *s)
+{
+    const int i_rate_index = bs_read(s, 4);
+
+    if (i_rate_index == 0x0f)
+        return bs_read(s, 24); /* escape: explicit rate follows */
+
+    return pi_sample_rates[i_rate_index];
+}
+/**
+ * Reads an AudioSpecificConfig from s and stores the parsed fields in p_cfg.
+ *
+ * The object type, sample rate and channel configuration are read first and
+ * the SBR, PS, extension and frame length fields are reset. When the object
+ * type is SBR or PS, the extension sample rate and the object type that
+ * follows are read next. The object type specific configuration is then read
+ * (GASpecificConfig or ELDSpecificConfig), followed by epConfig for the ER
+ * object types and, when requested, the 0x2b7 sync extension.
+ *
+ * s          bit reader positioned at the start of the configuration
+ * p_cfg      output, all of its fields are overwritten
+ * b_withext  true to look for the 0x2b7 sync extension after the configuration
+ *
+ * Returns VLC_EGENERIC when the object type ends up in the default label of
+ * the first switch, or when bs_error(s) is set at the end; VLC_SUCCESS
+ * otherwise. The return values of the specific config readers are ignored.
+ */
+static inline int MPEG4_read_AudioSpecificConfig(bs_t *s, MPEG4_asc_t *p_cfg, bool b_withext)
+{
+    p_cfg->i_object_type = MPEG4_read_AudioObjectType(s);
+    p_cfg->i_samplerate = MPEG4_read_AudioSamplerate(s);
+    p_cfg->i_channel_configuration = bs_read(s, 4);
+
+    p_cfg->i_sbr = -1; /* unknown until signalled */
+    p_cfg->i_ps  = -1; /* unknown until signalled */
+    p_cfg->extension.i_object_type = MPEG4_AOT_NULL;
+    p_cfg->extension.i_samplerate = 0;
+    p_cfg->extension.i_channel_configuration = 0;
+    p_cfg->i_frame_length = 0;
+
+    if (p_cfg->i_object_type == MPEG4_AOT_AAC_SBR ||
+        p_cfg->i_object_type == MPEG4_AOT_AAC_PS) { /* SBR/PS signalled through the object type itself */
+        p_cfg->i_sbr = 1;
+        if (p_cfg->i_object_type == MPEG4_AOT_AAC_PS)
+            p_cfg->i_ps = 1;
+        p_cfg->extension.i_object_type = MPEG4_AOT_AAC_SBR;
+        p_cfg->extension.i_samplerate = MPEG4_read_AudioSamplerate(s);
+
+        p_cfg->i_object_type = MPEG4_read_AudioObjectType(s); /* replaces the SBR/PS type read above */
+        if(p_cfg->i_object_type == MPEG4_AOT_ER_BSAC)
+            p_cfg->extension.i_channel_configuration = bs_read(s, 4);
+    }
+
+    switch(p_cfg->i_object_type) /* object type specific configuration */
+    {
+    case MPEG4_AOT_AAC_MAIN:
+    case MPEG4_AOT_AAC_LC:
+    case MPEG4_AOT_AAC_SSR:
+    case MPEG4_AOT_AAC_LTP:
+    case MPEG4_AOT_AAC_SC:
+    case MPEG4_AOT_TWINVQ:
+    case MPEG4_AOT_ER_AAC_LC:
+    case MPEG4_AOT_ER_AAC_LTP:
+    case MPEG4_AOT_ER_AAC_SC:
+    case MPEG4_AOT_ER_TWINVQ:
+    case MPEG4_AOT_ER_BSAC:
+    case MPEG4_AOT_ER_AAC_LD:
+        MPEG4_read_GASpecificConfig(p_cfg, s);
+        break;
+    case MPEG4_AOT_CELP:
+        // CelpSpecificConfig();
+    case MPEG4_AOT_HVXC:
+        // HvxcSpecificConfig();
+    case MPEG4_AOT_TTSI:
+        // TTSSSpecificConfig();
+    case MPEG4_AOT_MAIN_SYNTHETIC:
+    case MPEG4_AOT_WAVETABLES:
+    case MPEG4_AOT_GENERAL_MIDI:
+    case MPEG4_AOT_ALGORITHMIC:
+        // StructuredAudioSpecificConfig();
+    case MPEG4_AOT_ER_CELP:
+        // ERCelpSpecificConfig();
+    case MPEG4_AOT_ER_HXVC:
+        // ERHvxcSpecificConfig();
+    case MPEG4_AOT_ER_HILN:
+    case MPEG4_AOT_ER_Parametric:
+        // ParametricSpecificConfig();
+    case MPEG4_AOT_SSC:
+        // SSCSpecificConfig();
+    case MPEG4_AOT_LAYER1:
+    case MPEG4_AOT_LAYER2:
+    case MPEG4_AOT_LAYER3:
+        // MPEG_1_2_SpecificConfig();
+    case MPEG4_AOT_DST:
+        // DSTSpecificConfig();
+    case MPEG4_AOT_ALS:
+        // ALSSpecificConfig();
+    case MPEG4_AOT_SLS:
+    case MPEG4_AOT_SLS_NON_CORE:
+        // SLSSpecificConfig();
+    case MPEG4_AOT_ER_AAC_ELD: /* NOTE(review): every case from MPEG4_AOT_CELP down to here has no break, so those types are also parsed as ELD - confirm this is intended */
+        MPEG4_read_ELDSpecificConfig(p_cfg, s);
+        break;
+    case MPEG4_AOT_SMR_SIMPLE:
+    case MPEG4_AOT_SMR_MAIN:
+        // SymbolicMusicSpecificConfig();
+    default:
+        // error
+        return VLC_EGENERIC;
+    }
+
+    switch(p_cfg->i_object_type) /* epConfig, ER object types only */
+    {
+    case MPEG4_AOT_ER_AAC_LC:
+    case MPEG4_AOT_ER_AAC_LTP:
+    case MPEG4_AOT_ER_AAC_SC:
+    case MPEG4_AOT_ER_TWINVQ:
+    case MPEG4_AOT_ER_BSAC:
+    case MPEG4_AOT_ER_AAC_LD:
+    case MPEG4_AOT_ER_CELP:
+    case MPEG4_AOT_ER_HXVC:
+    case MPEG4_AOT_ER_HILN:
+    case MPEG4_AOT_ER_Parametric:
+    case MPEG4_AOT_ER_AAC_ELD:
+    {
+        int epConfig = bs_read(s, 2);
+        if (epConfig == 2 || epConfig == 3)
+            //ErrorProtectionSpecificConfig(); (not parsed: the nested if below is the body of this if)
+            if (epConfig == 3)
+                if (bs_read1(s)) {
+                    // TODO : directMapping
+                }
+        break;
+    }
+    default:
+        break;
+    }
+
+    if (b_withext && p_cfg->extension.i_object_type != MPEG4_AOT_AAC_SBR &&
+        !bs_eof(s) && bs_read(s, 11) == 0x2b7) /* the 11 bits are consumed even when they do not match */
+    {
+        p_cfg->extension.i_object_type = MPEG4_read_AudioObjectType(s);
+        if (p_cfg->extension.i_object_type == MPEG4_AOT_AAC_SBR)
+        {
+            p_cfg->i_sbr  = bs_read1(s);
+            if (p_cfg->i_sbr == 1) {
+                p_cfg->extension.i_samplerate = MPEG4_read_AudioSamplerate(s);
+                if (bs_read(s, 11) == 0x548) /* second sync word, followed by the PS flag */
+                    p_cfg->i_ps = bs_read1(s);
+            }
+        }
+        else if (p_cfg->extension.i_object_type == MPEG4_AOT_ER_BSAC)
+        {
+            p_cfg->i_sbr  = bs_read1(s);
+            if(p_cfg->i_sbr)
+                p_cfg->extension.i_samplerate = MPEG4_read_AudioSamplerate(s);
+            p_cfg->extension.i_channel_configuration = bs_read(s, 4);
+        }
+    }
+
+#if 0
+    static const char *ppsz_otype[] = {
+        "NULL",
+        "AAC Main", "AAC LC", "AAC SSR", "AAC LTP", "SBR", "AAC Scalable",
+        "TwinVQ",
+        "CELP", "HVXC",
+        "Reserved", "Reserved",
+        "TTSI",
+        "Main Synthetic", "Wavetables Synthesis", "General MIDI",
+        "Algorithmic Synthesis and Audio FX",
+        "ER AAC LC",
+        "Reserved",
+        "ER AAC LTP", "ER AAC Scalable", "ER TwinVQ", "ER BSAC", "ER AAC LD",
+        "ER CELP", "ER HVXC", "ER HILN", "ER Parametric",
+        "SSC",
+        "PS", "MPEG Surround", "Escape",
+        "Layer 1", "Layer 2", "Layer 3",
+        "DST", "ALS", "SLS", "SLS non-core", "ELD",
+        "SMR Simple", "SMR Main",
+    };
+
+    fprintf(stderr, "MPEG4ReadAudioSpecificInfo: t=%s(%d)f=%d c=%d sbr=%d\n",
+            ppsz_otype[p_cfg->i_object_type], p_cfg->i_object_type,
+            p_cfg->i_samplerate, p_cfg->i_channel, p_cfg->i_sbr); /* NOTE(review): MPEG4_asc_t has no i_channel member, this disabled code would not compile as is */
+#endif
+    return bs_error(s) ? VLC_EGENERIC : VLC_SUCCESS;
+}
+/**
+ * One stream (program and layer pair) described by a StreamMuxConfig, as
+ * filled in by MPEG4_parse_StreamMuxConfig(). At most
+ * MPEG4_STREAM_MAX_EXTRADATA bytes of raw configuration are kept in extra.
+ */
+#define MPEG4_STREAM_MAX_EXTRADATA 64
+typedef struct
+{
+    uint8_t i_program;              // program index of this stream
+    uint8_t i_layer;                // layer index within the program
+
+    unsigned i_frame_length;         // 9-bit value, read when i_frame_length_type is 1
+    uint8_t i_frame_length_type;    // 3-bit value selecting which of the fields around it is read
+    uint8_t i_frame_length_index;   // read when i_frame_length_type is 3 4 5 (celp) or 6 7 (hvxc)
+
+    MPEG4_asc_t cfg;                // parsed configuration, or a copy of the previous stream's one
+
+    /* Raw configuration */
+    size_t i_extra;                 // number of valid bytes in extra
+    uint8_t extra[MPEG4_STREAM_MAX_EXTRADATA];
+
+} MPEG4_audio_stream_t;
+/**
+ * Parsed StreamMuxConfig, as filled in by MPEG4_parse_StreamMuxConfig().
+ * The two limits below match the field widths read by the parser: 1 + 3 bits
+ * for the layer count and 1 + 4 bits for the program count.
+ */
+#define MPEG4_STREAMMUX_MAX_LAYER   8
+#define MPEG4_STREAMMUX_MAX_PROGRAM 16
+typedef struct
+{
+    bool b_same_time_framing;
+    uint8_t i_sub_frames;   // 1 + the 6-bit value read from the stream
+    uint8_t i_programs;     // 1 + the 4-bit value read from the stream
+
+    uint8_t pi_layers[MPEG4_STREAMMUX_MAX_PROGRAM]; // layer count of each program
+
+    uint8_t pi_stream[MPEG4_STREAMMUX_MAX_PROGRAM][MPEG4_STREAMMUX_MAX_LAYER]; // index into stream[] for each program/layer
+
+    uint8_t i_streams;      // number of entries used in stream[]
+    MPEG4_audio_stream_t stream[MPEG4_STREAMMUX_MAX_PROGRAM*MPEG4_STREAMMUX_MAX_LAYER];
+
+    uint32_t i_other_data;  // other data length value, 0 when the presence bit is not set
+    int16_t  i_crc;  /* -1 if not set */
+} MPEG4_streammux_config_t;
+
+/**
+ * Reads a variable length value: a 2-bit field gives the number of bytes
+ * minus one, then that many bytes follow, most significant first.
+ */
+static inline uint32_t MPEG4_LatmGetValue(bs_t *s)
+{
+    unsigned bytes_left = 1 + bs_read(s, 2);
+    uint32_t value = 0;
+
+    while (bytes_left > 0)
+    {
+        value = (value << 8) + bs_read(s, 8);
+        bytes_left--;
+    }
+
+    return value;
+}
+
+/**
+ * Copies i_bits bits from s into p_data, one byte at a time.
+ *
+ * At most MPEG4_STREAM_MAX_EXTRADATA bytes are written. When i_bits is not
+ * a multiple of 8, the last byte holds the remaining bits in its most
+ * significant positions and zeroes below.
+ *
+ * Returns the number of bytes written to p_data.
+ */
+static inline size_t AudioSpecificConfigBitsToBytes(bs_t *s, uint32_t i_bits, uint8_t *p_data)
+{
+    size_t byte_count = (i_bits + 7) / 8;
+    if (byte_count > MPEG4_STREAM_MAX_EXTRADATA)
+        byte_count = MPEG4_STREAM_MAX_EXTRADATA;
+
+    uint32_t bits_left = i_bits;
+    for (size_t pos = 0; pos < byte_count; pos++)
+    {
+        /* full byte, except possibly for the very last one */
+        const uint32_t take = (bits_left < 8) ? bits_left : 8;
+        p_data[pos] = bs_read(s, take) << (8 - take);
+        bits_left -= take;
+    }
+
+    return byte_count;
+}
+/**
+ * Parses a LATM StreamMuxConfig from s into m.
+ *
+ * Only audioMuxVersionA 0 is handled. m is zeroed once the version bits have
+ * been accepted. For every program and layer, the stream either reuses the
+ * parsed configuration of the previous stream or reads a new
+ * AudioSpecificConfig, of which a raw copy is kept in the stream's extra
+ * buffer. The frame length information of the stream is read next. The other
+ * data length and the CRC close the structure.
+ *
+ * s  bit reader positioned at the start of the StreamMuxConfig
+ * m  output, overwritten
+ *
+ * Returns 0 on success, -1 when the version is not supported, when the end of
+ * the data is reached early, or when bs_error(s) is set.
+ */
+static inline int MPEG4_parse_StreamMuxConfig(bs_t *s, MPEG4_streammux_config_t *m)
+{
+    int i_mux_version;
+    int i_mux_versionA;
+
+    i_mux_version = bs_read(s, 1);
+    i_mux_versionA = 0;
+    if (i_mux_version)
+        i_mux_versionA = bs_read(s, 1);
+
+    if (i_mux_versionA != 0) /* support only A=0 */
+        return -1;
+
+    memset(m, 0, sizeof(*m)); /* m is left untouched by the early return above */
+
+    if (i_mux_versionA == 0) /* always true here, see the early return above */
+        if (i_mux_version == 1)
+            MPEG4_LatmGetValue(s); /* taraBufferFullness */
+
+    if(bs_eof(s))
+        return -1;
+
+    m->b_same_time_framing = bs_read1(s);
+    m->i_sub_frames = 1 + bs_read(s, 6);
+    m->i_programs = 1 + bs_read(s, 4);
+
+    for (uint8_t i_program = 0; i_program < m->i_programs; i_program++) {
+        if(bs_eof(s))
+            return -1;
+        m->pi_layers[i_program] = 1+bs_read(s, 3);
+
+        for (uint8_t i_layer = 0; i_layer < m->pi_layers[i_program]; i_layer++) {
+            MPEG4_audio_stream_t *st = &m->stream[m->i_streams];
+            bool b_previous_cfg;
+
+            m->pi_stream[i_program][i_layer] = m->i_streams;
+            st->i_program = i_program;
+            st->i_layer = i_layer;
+
+            b_previous_cfg = false;
+            if (i_program != 0 || i_layer != 0) /* the very first stream always carries its own config */
+                b_previous_cfg = bs_read1(s);
+
+            if (b_previous_cfg) {
+                assert(m->i_streams > 0);
+                st->cfg = m->stream[m->i_streams-1].cfg; /* NOTE(review): only cfg is copied, extra and i_extra stay zeroed - confirm this is intended */
+            } else {
+                uint32_t asc_size = 0; /* size of the config in bits */
+                if(i_mux_version > 0)
+                    asc_size = MPEG4_LatmGetValue(s);
+                bs_t asc_bs = *s; /* parse on a copy so that s stays at the start of the config */
+                MPEG4_read_AudioSpecificConfig(&asc_bs, &st->cfg, i_mux_version > 0); /* NOTE(review): return value is not checked */
+                if (i_mux_version == 0)
+                    asc_size = bs_pos(&asc_bs) - bs_pos(s); /* no explicit size: use what the parser consumed */
+                asc_bs = *s; /* rewind the copy to extract the raw bytes */
+                st->i_extra = AudioSpecificConfigBitsToBytes(&asc_bs, asc_size, st->extra);
+                bs_skip(s, asc_size);
+            }
+
+            st->i_frame_length_type = bs_read(s, 3);
+            switch(st->i_frame_length_type)
+            {
+            case 0:
+            {
+                bs_skip(s, 8); /* latmBufferFullnes */
+                if (!m->b_same_time_framing)
+                    if (st->cfg.i_object_type == MPEG4_AOT_AAC_SC ||
+                        st->cfg.i_object_type == MPEG4_AOT_CELP ||
+                        st->cfg.i_object_type == MPEG4_AOT_ER_AAC_SC ||
+                        st->cfg.i_object_type == MPEG4_AOT_ER_CELP)
+                        bs_skip(s, 6); /* eFrameOffset */
+                break;
+            }
+            case 1:
+                st->i_frame_length = bs_read(s, 9);
+                break;
+            case 3: case 4: case 5:
+                st->i_frame_length_index = bs_read(s, 6); // celp
+                break;
+            case 6: case 7:
+                st->i_frame_length_index = bs_read(s, 1); // hvxc, falls through to default which only breaks
+            default:
+                break;
+            }
+            /* Next stream */
+            m->i_streams++;
+        }
+    }
+
+    if(bs_error(s) || bs_eof(s))
+        return -1;
+
+    /* other data */
+    if (bs_read1(s)) {
+        if (i_mux_version == 1)
+            m->i_other_data = MPEG4_LatmGetValue(s);
+        else {
+            int b_continue;
+            do { /* escape bit followed by 8 more length bits, repeated while the escape bit is set */
+                b_continue = bs_read1(s);
+                m->i_other_data = (m->i_other_data << 8) + bs_read(s, 8);
+            } while (b_continue);
+        }
+    }
+
+    /* crc */
+    m->i_crc = -1;
+    if (bs_read1(s))
+        m->i_crc = bs_read(s, 8);
+
+    return bs_error(s) ? -1 : 0;
+}
+