[FFmpeg-devel] [PATCH] avcodec/libx265: add support for ROI-based encoding
Guo, Yejun
yejun.guo at intel.com
Fri Jan 18 17:53:37 EET 2019
Signed-off-by: Guo, Yejun <yejun.guo at intel.com>
---
libavcodec/libx265.c | 74 ++++++++++++++++++++++++++++++++++++++++++++++++++++
1 file changed, 74 insertions(+)
diff --git a/libavcodec/libx265.c b/libavcodec/libx265.c
index 27c90b3..6b1cc74 100644
--- a/libavcodec/libx265.c
+++ b/libavcodec/libx265.c
@@ -285,6 +285,70 @@ static av_cold int libx265_encode_init(AVCodecContext *avctx)
return 0;
}
+/**
+ * Translate a frame's AV_FRAME_DATA_REGIONS_OF_INTEREST side data into x265 quantizer offsets.
+ * When ROI data is present and adaptive quantization is enabled, pic->quantOffsets is set to a
+ * newly allocated array with one float per quantization group; the caller must av_free() it
+ * after encoder_encode(). Returns 0 on success (including "no ROI") or a negative AVERROR code.
+ */
+static int libx265_encode_set_roi(libx265Context *ctx, const AVFrame *frame, x265_picture *pic)
+{
+    AVFrameSideData *sd = av_frame_get_side_data(frame, AV_FRAME_DATA_REGIONS_OF_INTEREST);
+    const AVRegionOfInterest *roi;
+    int mb_size, mbx, mby, nb_rois;
+    uint32_t roi_size;
+    float *qoffsets;
+
+    if (!sd || !sd->size)
+        return 0;
+    // Per x265.h, quantOffsets are only applied when adaptive quantization is enabled.
+    if (ctx->params->rc.aqMode == X265_AQ_NONE) {
+        av_log(ctx, AV_LOG_WARNING, "Adaptive quantization must be enabled to use ROI encoding, skipping ROI.\n");
+        return 0;
+    }
+    // Per x265.h, one offset is given per 16x16 block (8x8 block when qg-size is 8).
+    mb_size = (ctx->params->rc.qgSize == 8) ? 8 : 16;
+    mbx     = (frame->width  + mb_size - 1) / mb_size;
+    mby     = (frame->height + mb_size - 1) / mb_size;
+
+    // Entries are self_size bytes apart; validate that stride before counting or reading them.
+    roi      = (const AVRegionOfInterest *)sd->data;
+    roi_size = sd->size < sizeof(*roi) ? 0 : roi->self_size;
+    if (roi_size < sizeof(*roi) || sd->size % roi_size != 0) {
+        av_log(ctx, AV_LOG_ERROR, "AVRegionOfInterest.self_size should be set to sizeof(AVRegionOfInterest).\n");
+        return AVERROR(EINVAL);
+    }
+    nb_rois = sd->size / roi_size;
+
+    qoffsets = av_mallocz_array(mbx * mby, sizeof(*qoffsets));
+    if (!qoffsets)
+        return AVERROR(ENOMEM);
+
+    for (int i = 0; i < nb_rois; i++) {
+        int starty, endy, startx, endx;
+        float qoffset;
+
+        roi = (const AVRegionOfInterest *)(sd->data + (size_t)roi_size * i);
+        if (roi->qoffset.den == 0) {
+            av_free(qoffsets);
+            av_log(ctx, AV_LOG_ERROR, "AVRegionOfInterest.qoffset.den should not be zero.\n");
+            return AVERROR(EINVAL);
+        }
+        // Clamp on both sides so negative or oversized coordinates cannot index outside qoffsets.
+        starty = av_clip(roi->top / mb_size, 0, mby);
+        endy   = av_clip((roi->bottom + mb_size - 1) / mb_size, 0, mby);
+        startx = av_clip(roi->left / mb_size, 0, mbx);
+        endx   = av_clip((roi->right + mb_size - 1) / mb_size, 0, mbx);
+        // Normalize to [-1, 1], then scale by 25 (the patch author's tentative scale factor).
+        qoffset = av_clipf(roi->qoffset.num * 1.0f / roi->qoffset.den, -1.0f, 1.0f) * 25;
+        for (int y = starty; y < endy; y++)
+            for (int x = startx; x < endx; x++)
+                qoffsets[x + y * mbx] = qoffset;
+    }
+    pic->quantOffsets = qoffsets;
+    return 0;
+}
+
static int libx265_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
const AVFrame *pic, int *got_packet)
{
@@ -314,10 +378,20 @@ static int libx265_encode_frame(AVCodecContext *avctx, AVPacket *pkt,
pic->pict_type == AV_PICTURE_TYPE_P ? X265_TYPE_P :
pic->pict_type == AV_PICTURE_TYPE_B ? X265_TYPE_B :
X265_TYPE_AUTO;
+
+ ret = libx265_encode_set_roi(ctx, pic, &x265pic);
+ if (ret < 0)
+ return ret;
}
ret = ctx->api->encoder_encode(ctx->encoder, &nal, &nnal,
pic ? &x265pic : NULL, &x265pic_out);
+
+ if (x265pic.quantOffsets) {
+ av_free(x265pic.quantOffsets);
+ x265pic.quantOffsets = NULL;
+ }
+
if (ret < 0)
return AVERROR_EXTERNAL;
--
2.7.4
More information about the ffmpeg-devel
mailing list