[FFmpeg-devel] [PATCH v2 3/3] hwcontext_vaapi: Use PRIME_2 memory type for modifiers.
Mark Thompson
sw at jkqxz.net
Thu Jan 14 01:21:34 EET 2021
On 13/11/2020 23:15, Bas Nieuwenhuizen wrote:
> This way we can pass explicit modifiers in. Sometimes the
> modifier matters for the number of memory planes that
> libva accepts, in particular when dealing with
> driver-compressed textures. Furthermore the driver might
> not actually be able to determine the implicit modifier
> if all the buffer-passing has used explicit modifier.
> All these issues should be resolved by passing in the
> modifier, and for that we switch to using the PRIME_2
> memory type.
>
> Tested with experimental radeonsi patches for modifiers
> and kmsgrab. Also tested with radeonsi without the
> patches to double-check it works without PRIME_2 support.
>
> v2:
> Cache PRIME_2 support to avoid doing two calls every time on
> libva drivers that do not support it.
> ---
> libavutil/hwcontext_vaapi.c | 158 ++++++++++++++++++++++++++----------
> 1 file changed, 115 insertions(+), 43 deletions(-)
>
> diff --git a/libavutil/hwcontext_vaapi.c b/libavutil/hwcontext_vaapi.c
> index 2227d6ed69..62b5a163ee 100644
> --- a/libavutil/hwcontext_vaapi.c
> +++ b/libavutil/hwcontext_vaapi.c
> @@ -79,6 +79,9 @@ typedef struct VAAPIFramesContext {
> unsigned int rt_format;
> // Whether vaDeriveImage works.
> int derive_works;
> + // Caches whether VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME_2 is unsupported for
> + // surface imports.
> + int prime_2_import_unsupported;
> } VAAPIFramesContext;
>
> typedef struct VAAPIMapping {
> @@ -1022,6 +1025,7 @@ static void vaapi_unmap_from_drm(AVHWFramesContext *dst_fc,
> static int vaapi_map_from_drm(AVHWFramesContext *src_fc, AVFrame *dst,
> const AVFrame *src, int flags)
> {
> + VAAPIFramesContext *src_vafc = src_fc->internal->priv;
> AVHWFramesContext *dst_fc =
> (AVHWFramesContext*)dst->hw_frames_ctx->data;
> AVVAAPIDeviceContext *dst_dev = dst_fc->device_ctx->hwctx;
> @@ -1029,25 +1033,10 @@ static int vaapi_map_from_drm(AVHWFramesContext *src_fc, AVFrame *dst,
> const VAAPIFormatDescriptor *format_desc;
> VASurfaceID surface_id;
> VAStatus vas;
> + VAStatus prime2_vas = VA_STATUS_SUCCESS;
> + int use_prime2;
> uint32_t va_fourcc;
> - int err, i, j, k;
> -
> - unsigned long buffer_handle;
> - VASurfaceAttribExternalBuffers buffer_desc;
> - VASurfaceAttrib attrs[2] = {
> - {
> - .type = VASurfaceAttribMemoryType,
> - .flags = VA_SURFACE_ATTRIB_SETTABLE,
> - .value.type = VAGenericValueTypeInteger,
> - .value.value.i = VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME,
> - },
> - {
> - .type = VASurfaceAttribExternalBufferDescriptor,
> - .flags = VA_SURFACE_ATTRIB_SETTABLE,
> - .value.type = VAGenericValueTypePointer,
> - .value.value.p = &buffer_desc,
> - }
> - };
> + int err, i, j;
>
> desc = (AVDRMFrameDescriptor*)src->data[0];
>
> @@ -1083,35 +1072,115 @@ static int vaapi_map_from_drm(AVHWFramesContext *src_fc, AVFrame *dst,
> format_desc = vaapi_format_from_fourcc(va_fourcc);
> av_assert0(format_desc);
>
> - buffer_handle = desc->objects[0].fd;
> - buffer_desc.pixel_format = va_fourcc;
> - buffer_desc.width = src_fc->width;
> - buffer_desc.height = src_fc->height;
> - buffer_desc.data_size = desc->objects[0].size;
> - buffer_desc.buffers = &buffer_handle;
> - buffer_desc.num_buffers = 1;
> - buffer_desc.flags = 0;
> -
> - k = 0;
> - for (i = 0; i < desc->nb_layers; i++) {
> - for (j = 0; j < desc->layers[i].nb_planes; j++) {
> - buffer_desc.pitches[k] = desc->layers[i].planes[j].pitch;
> - buffer_desc.offsets[k] = desc->layers[i].planes[j].offset;
> - ++k;
> + use_prime2 = !src_vafc->prime_2_import_unsupported &&
> + desc->objects[0].format_modifier != DRM_FORMAT_MOD_INVALID;
> + if (use_prime2) {
> + VADRMPRIMESurfaceDescriptor prime_desc;
> + VASurfaceAttrib prime_attrs[2] = {
> + {
> + .type = VASurfaceAttribMemoryType,
> + .flags = VA_SURFACE_ATTRIB_SETTABLE,
> + .value.type = VAGenericValueTypeInteger,
> + .value.value.i = VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME_2,
> + },
> + {
> + .type = VASurfaceAttribExternalBufferDescriptor,
> + .flags = VA_SURFACE_ATTRIB_SETTABLE,
> + .value.type = VAGenericValueTypePointer,
> + .value.value.p = &prime_desc,
> + }
> + };
> + prime_desc.fourcc = va_fourcc;
> + prime_desc.width = src_fc->width;
> + prime_desc.height = src_fc->height;
> + prime_desc.num_objects = desc->nb_objects;
> + for (i = 0; i < desc->nb_objects; ++i) {
> + prime_desc.objects[i].fd = desc->objects[i].fd;
> + prime_desc.objects[i].size = desc->objects[i].size;
> + prime_desc.objects[i].drm_format_modifier =
> + desc->objects[i].format_modifier;
> + }
> +
> + prime_desc.num_layers = desc->nb_layers;
> + for (i = 0; i < desc->nb_layers; ++i) {
> + prime_desc.layers[i].drm_format = desc->layers[i].format;
> + prime_desc.layers[i].num_planes = desc->layers[i].nb_planes;
> + for (j = 0; j < desc->layers[i].nb_planes; ++j) {
> + prime_desc.layers[i].object_index[j] =
> + desc->layers[i].planes[j].object_index;
> + prime_desc.layers[i].offset[j] = desc->layers[i].planes[j].offset;
> + prime_desc.layers[i].pitch[j] = desc->layers[i].planes[j].pitch;
> + }
> +
> + if (format_desc->chroma_planes_swapped &&
> + desc->layers[i].nb_planes == 3) {
> + FFSWAP(uint32_t, prime_desc.layers[i].pitch[1],
> + prime_desc.layers[i].pitch[2]);
> + FFSWAP(uint32_t, prime_desc.layers[i].offset[1],
> + prime_desc.layers[i].offset[2]);
> + }
> }
> - }
> - buffer_desc.num_planes = k;
>
> - if (format_desc->chroma_planes_swapped &&
> - buffer_desc.num_planes == 3) {
> - FFSWAP(uint32_t, buffer_desc.pitches[1], buffer_desc.pitches[2]);
> - FFSWAP(uint32_t, buffer_desc.offsets[1], buffer_desc.offsets[2]);
> + /*
> + * We can query for PRIME_2 support with vaQuerySurfaceAttributes, but that
> + * that needs the config_id which we don't have here . Both Intel and
> + * Gallium seem to do the correct error checks, so lets just try the
> + * PRIME_2 import first.
> + */
> + prime2_vas = vaCreateSurfaces(dst_dev->display, format_desc->rt_format,
> + src->width, src->height, &surface_id, 1,
> + prime_attrs, FF_ARRAY_ELEMS(prime_attrs));
> }
>
> - vas = vaCreateSurfaces(dst_dev->display, format_desc->rt_format,
> - src->width, src->height,
> - &surface_id, 1,
> - attrs, FF_ARRAY_ELEMS(attrs));
> + if (prime2_vas != VA_STATUS_SUCCESS || !use_prime2) {
> + int k;
> + unsigned long buffer_handle;
> + VASurfaceAttribExternalBuffers buffer_desc;
> + VASurfaceAttrib buffer_attrs[2] = {
> + {
> + .type = VASurfaceAttribMemoryType,
> + .flags = VA_SURFACE_ATTRIB_SETTABLE,
> + .value.type = VAGenericValueTypeInteger,
> + .value.value.i = VA_SURFACE_ATTRIB_MEM_TYPE_DRM_PRIME,
> + },
> + {
> + .type = VASurfaceAttribExternalBufferDescriptor,
> + .flags = VA_SURFACE_ATTRIB_SETTABLE,
> + .value.type = VAGenericValueTypePointer,
> + .value.value.p = &buffer_desc,
> + }
> + };
> +
> + buffer_handle = desc->objects[0].fd;
> + buffer_desc.pixel_format = va_fourcc;
> + buffer_desc.width = src_fc->width;
> + buffer_desc.height = src_fc->height;
> + buffer_desc.data_size = desc->objects[0].size;
> + buffer_desc.buffers = &buffer_handle;
> + buffer_desc.num_buffers = 1;
> + buffer_desc.flags = 0;
> +
> + k = 0;
> + for (i = 0; i < desc->nb_layers; i++) {
> + for (j = 0; j < desc->layers[i].nb_planes; j++) {
> + buffer_desc.pitches[k] = desc->layers[i].planes[j].pitch;
> + buffer_desc.offsets[k] = desc->layers[i].planes[j].offset;
> + ++k;
> + }
> + }
> + buffer_desc.num_planes = k;
> +
> + if (format_desc->chroma_planes_swapped &&
> + buffer_desc.num_planes == 3) {
> + FFSWAP(uint32_t, buffer_desc.pitches[1], buffer_desc.pitches[2]);
> + FFSWAP(uint32_t, buffer_desc.offsets[1], buffer_desc.offsets[2]);
> + }
> +
> + vas = vaCreateSurfaces(dst_dev->display, format_desc->rt_format,
> + src->width, src->height,
> + &surface_id, 1,
> + buffer_attrs, FF_ARRAY_ELEMS(buffer_attrs));
> + }
> if (vas != VA_STATUS_SUCCESS) {
The status variables are confused here - vas is uninitialised if PRIME_2 import succeeded, giving random error results.
Maybe it would be cleaner to use vas everywhere ...
> av_log(dst_fc, AV_LOG_ERROR, "Failed to create surface from DRM "
> "object: %d (%s).\n", vas, vaErrorStr(vas));
> @@ -1119,6 +1188,9 @@ static int vaapi_map_from_drm(AVHWFramesContext *src_fc, AVFrame *dst,
> }
> av_log(dst_fc, AV_LOG_DEBUG, "Create surface %#x.\n", surface_id);
>
> + if (prime2_vas != VA_STATUS_SUCCESS)
> + src_vafc->prime_2_import_unsupported = 1;
... while moving this test to immediately after the PRIME_2 vaCreateSurfaces() call.
> +
> err = ff_hwframe_map_create(dst->hw_frames_ctx, dst, src,
> &vaapi_unmap_from_drm,
> (void*)(uintptr_t)surface_id);
>
Thanks,
- Mark
More information about the ffmpeg-devel
mailing list