[FFmpeg-devel] [PATCH] avformat: add Limitless Audio Format demuxer

Mon Sep 12 13:56:11 EEST 2022

Paul B Mahol:
> +static int laf_read_header(AVFormatContext *ctx)
> +{
> +    LAFContext *s = ctx->priv_data;
> +    AVIOContext *pb = ctx->pb;
> +    unsigned st_count, mode;
> +    unsigned sample_rate;
> +    int64_t duration;
> +    int codec_id;
> +    int quality;
> +    int bpp;
> +
> +    avio_skip(pb, 9);
> +    if (avio_rb32(pb) != MKBETAG('H','E','A','D'))
> +        return AVERROR_INVALIDDATA;
> +
> +    quality = avio_r8(pb);
> +    if (quality > 3)
> +        return AVERROR_INVALIDDATA;
> +    mode = avio_r8(pb);
> +    if (mode > 1)
> +        return AVERROR_INVALIDDATA;
> +    st_count = avio_rl32(pb);
> +    if (st_count == 0 || st_count > 1024)

I don't know whether the limit of 1024 is arbitrary or something from
some spec. If it is the latter, you should use a #define for it and also
for the size of the StreamParams array in the ctx. If it is the former,
you might just use FF_ARRAY_ELEMS(s->p) instead of 1024 here. Or a
define, as you prefer.

> +        return AVERROR_INVALIDDATA;
> +
> +    for (int i = 0; i < st_count; i++) {
> +        StreamParams *stp = &s->p[i];
> +
> +        stp->vertical = av_int2float(avio_rl32(pb));
> +        stp->horizontal = av_int2float(avio_rl32(pb));
> +        stp->lfe = avio_r8(pb);
> +        if (stp->lfe) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_LOW_FREQUENCY));
> +        } else if (stp->vertical == 0.f &&
> +                   stp->horizontal == 0.f) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_FRONT_CENTER));
> +        } else if (stp->vertical == 0.f &&
> +                   stp->horizontal == -30.f) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_FRONT_LEFT));
> +        } else if (stp->vertical == 0.f &&
> +                   stp->horizontal == 30.f) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_FRONT_RIGHT));
> +        } else if (stp->vertical == 0.f &&
> +                   stp->horizontal == -110.f) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_SIDE_LEFT));
> +        } else if (stp->vertical == 0.f &&
> +                   stp->horizontal == 110.f) {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MASK(1, (AV_CH_SIDE_RIGHT));
> +        } else {
> +            stp->layout = (AVChannelLayout)AV_CHANNEL_LAYOUT_MONO;
> +        }
> +    }
> +
> +    sample_rate = avio_rl32(pb);
> +    duration = avio_rl64(pb) / st_count;
> +    switch (quality) {
> +    case 0:
> +        codec_id = AV_CODEC_ID_PCM_U8;
> +        bpp = 1;
> +        break;
> +    case 1:
> +        codec_id = AV_CODEC_ID_PCM_S16LE;
> +        bpp = 2;
> +        break;
> +    case 2:
> +        codec_id = AV_CODEC_ID_PCM_F32LE;
> +        bpp = 4;
> +        break;
> +    case 3:
> +        codec_id = AV_CODEC_ID_PCM_S24LE;
> +        bpp = 3;
> +        break;
> +    }
> +
> +    s->index = 0;
> +    s->stored_index = 0;
> +    s->bpp = bpp;
> +    s->data = av_mallocz(st_count * sample_rate * bpp);

sample_rate is read via avio_rl32() and therefore the multiplication on
the right can overflow (it's performed in 32bits, so this can happen
even on 64bit systems). Maybe use av_calloc(sample_rate, st_count *
bpp). But you also need to ensure that sample_rate actually fits into an
int and that st_count * sample_rate * bpp performed in the avio_read()
below also fits into an int, so you should probably just ensure this here.

> +    if (!s->data)
> +        return AVERROR(ENOMEM);
> +
> +    for (int st = 0; st < st_count; st++) {
> +        StreamParams *stp = &s->p[st];
> +        LAFStream *lafst;
> +        AVCodecParameters *par;
> +        AVStream *st = avformat_new_stream(ctx, NULL);
> +        if (!st)
> +            return AVERROR(ENOMEM);
> +
> +        par = st->codecpar;
> +        par->codec_id = codec_id;
> +        par->codec_type = AVMEDIA_TYPE_AUDIO;
> +        par->ch_layout.nb_channels = 1;
> +        par->ch_layout = stp->layout;
> +        par->sample_rate = sample_rate;
> +        st->duration = duration;
> +        st->priv_data = lafst = av_mallocz(sizeof(LAFStream));

lafst is set-but-unused. And given that you are already imposing a
hardcoded limit on the number of streams you could just add an array of
1024 uint8_t to your context.

> +        if (!st->priv_data)
> +            return AVERROR(ENOMEM);
> +
> +        avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
> +    }
> +
> +    return 0;
> +}
> +
> +static int laf_read_packet(AVFormatContext *ctx, AVPacket *pkt)
> +{
> +    AVIOContext *pb = ctx->pb;
> +    LAFContext *s = ctx->priv_data;
> +    AVStream *st = ctx->streams[0];
> +    LAFStream *lafst = st->priv_data;
> +    const int bpp = s->bpp;
> +    int header_len = (ctx->nb_streams / 8) + !!(ctx->nb_streams & 7);

(ctx->nb_streams + 7) / 8.

> +    int64_t pos;
> +    int ret;
> +
> +again:
> +    if (avio_feof(pb))
> +        return AVERROR_EOF;
> +
> +    pos = avio_tell(pb);
> +
> +    if (s->index >= ctx->nb_streams) {
> +        int cur_st = 0, st_count = 0, st_index = 0;
> +
> +        for (int i = 0; i < header_len; i++) {
> +            uint8_t val = avio_r8(pb);

Given that you impose a limit of 1024 for the number of streams, you can
actually put an uint8_t [128] on the stack in this loop and read all the
values at once. This would allow to remove the outer loop.
(If you used an array of uint8_t instead of the st->priv_data for
stored, you could also use that array.)

> +
> +            for (int j = 0; j < 8 && cur_st < ctx->nb_streams; j++, cur_st++) {
> +                AVStream *st = ctx->streams[st_index];
> +                LAFStream *lafst = st->priv_data;
> +
> +                lafst->stored = 0;
> +                if (val & 1) {
> +                    lafst->stored = 1;
> +                    st_count++;
> +                }
> +                val >>= 1;
> +                st_index++;
> +            }
> +        }
> +
> +        s->index = s->stored_index = 0;
> +        s->nb_stored = st_count;
> +        if (!st_count)
> +            return AVERROR_INVALIDDATA;
> +        ret = avio_read(pb, s->data, st_count * st->codecpar->sample_rate * bpp);
> +        if (ret < 0)
> +            return ret;
> +    }
> +
> +    st = ctx->streams[s->index];
> +    lafst = st->priv_data;
> +    while (!lafst->stored) {
> +        s->index++;
> +        if (s->index >= ctx->nb_streams)
> +            goto again;
> +        lafst = ctx->streams[s->index]->priv_data;
> +    }
> +    st = ctx->streams[s->index];
> +
> +    ret = av_new_packet(pkt, st->codecpar->sample_rate * bpp);
> +    if (ret < 0)
> +        return ret;
> +
> +    for (int n = 0; n < st->codecpar->sample_rate; n++)
> +        memcpy(pkt->data + n * bpp, s->data + n * s->nb_stored * bpp + s->stored_index * bpp, bpp);

This looks like something that can easily trigger a timeout.

> +
> +    pkt->stream_index = s->index;
> +    pkt->pos = pos;

If you have data from multiple streams interleaved, then the first
stream will get the position from before reading header_len bytes, but
all the other streams will get the position from after reading the
common data. IMO all packets should get the position of the common data.

> +    s->index++;
> +    s->stored_index++;
> +
> +    return ret;

return 0 -- it is not really defined what happens in case read_packet
callbacks return positive values (it is currently ignored and some
demuxers return the size of the packet, but that is a remnant of an
earlier API) which could happen if av_new_packet() were changed to allow
to return positive values.

> +}
> +
> +static int laf_read_seek(AVFormatContext *ctx, int stream_index,
> +                         int64_t timestamp, int flags)
> +{
> +    LAFContext *s = ctx->priv_data;
> +
> +    s->stored_index = s->index = 0;
> +
> +    return -1;
> +}
> +
> +const AVInputFormat ff_laf_demuxer = {
> +    .name           = "laf",
> +    .long_name      = NULL_IF_CONFIG_SMALL("LAF (Limitless Audio Format)"),
> +    .priv_data_size = sizeof(LAFContext),
> +    .read_probe     = laf_probe,
> +    .read_header    = laf_read_header,
> +    .read_packet    = laf_read_packet,
> +    .read_seek      = laf_read_seek,
> +    .extensions     = "laf",
> +    .flags          = AVFMT_GENERIC_INDEX,
> +};