[FFmpeg-devel] [PATCH 2/2] avcodec/mjpegdec: add support for frame threading

Andreas Rheinhardt andreas.rheinhardt at outlook.com
Mon Dec 5 16:15:29 EET 2022


Timo Rothenpieler:
> In my tests, this led to a notable speed increase that scales with the
> number of threads used. Decoding a 720p sample gave the following results:
> 
> 1 Thread: 1428 FPS
> 2 Threads: 2501 FPS
> 8 Threads: 7575 FPS
> Automatic: 11326 FPS (On a 16 Core/32 Threads system)
> ---
>  libavcodec/jpeglsdec.c |  2 +-
>  libavcodec/mjpegdec.c  | 13 +++++++------
>  libavcodec/sp5xdec.c   |  4 ++--
>  3 files changed, 10 insertions(+), 9 deletions(-)
> 
> diff --git a/libavcodec/jpeglsdec.c b/libavcodec/jpeglsdec.c
> index 2e6d018ea6..c0642e8e30 100644
> --- a/libavcodec/jpeglsdec.c
> +++ b/libavcodec/jpeglsdec.c
> @@ -559,7 +559,7 @@ const FFCodec ff_jpegls_decoder = {
>      .init           = ff_mjpeg_decode_init,
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP |
>                        FF_CODEC_CAP_SETS_PKT_DTS,
>  };
> diff --git a/libavcodec/mjpegdec.c b/libavcodec/mjpegdec.c
> index 9b7465abe7..d30d722398 100644
> --- a/libavcodec/mjpegdec.c
> +++ b/libavcodec/mjpegdec.c
> @@ -54,6 +54,7 @@
>  #include "exif.h"
>  #include "bytestream.h"
>  #include "tiff_common.h"
> +#include "thread.h"
>  
>  
>  static int init_default_huffman_tables(MJpegDecodeContext *s)
> @@ -713,7 +714,7 @@ int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
>                  s->avctx->pix_fmt,
>                  AV_PIX_FMT_NONE,
>              };
> -            s->hwaccel_pix_fmt = ff_get_format(s->avctx, pix_fmts);
> +            s->hwaccel_pix_fmt = ff_thread_get_format(s->avctx, pix_fmts);
>              if (s->hwaccel_pix_fmt < 0)
>                  return AVERROR(EINVAL);
>  
> @@ -729,7 +730,7 @@ int ff_mjpeg_decode_sof(MJpegDecodeContext *s)
>          }
>  
>          av_frame_unref(s->picture_ptr);
> -        if (ff_get_buffer(s->avctx, s->picture_ptr, AV_GET_BUFFER_FLAG_REF) < 0)
> +        if (ff_thread_get_buffer(s->avctx, s->picture_ptr, AV_GET_BUFFER_FLAG_REF) < 0)
>              return -1;
>          s->picture_ptr->pict_type = AV_PICTURE_TYPE_I;
>          s->picture_ptr->key_frame = 1;
> @@ -2388,7 +2389,7 @@ static int mjpeg_get_packet(AVCodecContext *avctx)
>      int ret;
>  
>      av_packet_unref(s->pkt);
> -    ret = ff_decode_get_packet(avctx, s->pkt);
> +    ret = ff_thread_decode_get_packet(avctx, s->pkt);
>      if (ret < 0)
>          return ret;
>  
> @@ -3020,7 +3021,7 @@ const FFCodec ff_mjpeg_decoder = {
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
>      .flush          = decode_flush,
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .p.max_lowres   = 3,
>      .p.priv_class   = &mjpegdec_class,
>      .p.profiles     = NULL_IF_CONFIG_SMALL(ff_mjpeg_profiles),
> @@ -3050,7 +3051,7 @@ const FFCodec ff_thp_decoder = {
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
>      .flush          = decode_flush,
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .p.max_lowres   = 3,
>      .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP |
>                        FF_CODEC_CAP_SETS_PKT_DTS,
> @@ -3068,7 +3069,7 @@ const FFCodec ff_smvjpeg_decoder = {
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
>      .flush          = decode_flush,
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .caps_internal  = FF_CODEC_CAP_EXPORTS_CROPPING |
>                        FF_CODEC_CAP_SETS_PKT_DTS | FF_CODEC_CAP_INIT_CLEANUP,
>  };
> diff --git a/libavcodec/sp5xdec.c b/libavcodec/sp5xdec.c
> index 394448c5a9..8b08dc672a 100644
> --- a/libavcodec/sp5xdec.c
> +++ b/libavcodec/sp5xdec.c
> @@ -101,7 +101,7 @@ const FFCodec ff_sp5x_decoder = {
>      .init           = ff_mjpeg_decode_init,
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .p.max_lowres   = 3,
>      .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP |
>                        FF_CODEC_CAP_SETS_PKT_DTS,
> @@ -118,7 +118,7 @@ const FFCodec ff_amv_decoder = {
>      .close          = ff_mjpeg_decode_end,
>      FF_CODEC_RECEIVE_FRAME_CB(ff_mjpeg_receive_frame),
>      .p.max_lowres   = 3,
> -    .p.capabilities = AV_CODEC_CAP_DR1,
> +    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
>      .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP |
>                        FF_CODEC_CAP_SETS_PKT_DTS,
>  };

Can you test the sample that Michael mentioned here?
https://patchwork.ffmpeg.org/project/ffmpeg/patch/AS8PR01MB7944E105BE990A5D01EF89208FEF9@AS8PR01MB7944.eurprd01.prod.exchangelabs.com/
(I never got around to analyzing this, but if I am not mistaken, it
shows that this decoder is not a simple one-in, one-out decoder, so
making it multithreaded will be more complicated than just adding the
flag and using ff_thread_get_buffer/ff_thread_get_format.)

- Andreas



More information about the ffmpeg-devel mailing list