[FFmpeg-devel] [PATCHv2 3/4] mkv: Export bounds and padding from spherical metadata
James Almer
jamrial at gmail.com
Thu Feb 16 02:20:55 EET 2017
On 2/15/2017 1:29 PM, Vittorio Giovara wrote:
> ---
> Updated according to James' review.
> Please CC.
> Vittorio
>
> libavformat/matroskadec.c | 69 ++++++++++++++++++++++++++++++++--
> tests/ref/fate/matroska-spherical-mono | 6 ++-
> 2 files changed, 71 insertions(+), 4 deletions(-)
>
> diff --git a/libavformat/matroskadec.c b/libavformat/matroskadec.c
> index 7223e94..6fa961e 100644
> --- a/libavformat/matroskadec.c
> +++ b/libavformat/matroskadec.c
> @@ -1913,16 +1913,65 @@ static int mkv_parse_video_projection(AVStream *st, const MatroskaTrack *track)
> AVSphericalMapping *spherical;
> enum AVSphericalProjection projection;
> size_t spherical_size;
> + size_t l, t, r, b;
> + size_t padding = 0;
> int ret;
> + GetByteContext gb;
> +
> + bytestream2_init(&gb, track->video.projection.private.data,
> + track->video.projection.private.size);
> +
> + if (bytestream2_get_byte(&gb) != 0) {
> + av_log(NULL, AV_LOG_WARNING, "Unknown spherical metadata\n");
> + return 0;
> + }
> +
> + bytestream2_skip(&gb, 3); // flags
>
> switch (track->video.projection.type) {
> case MATROSKA_VIDEO_PROJECTION_TYPE_EQUIRECTANGULAR:
> - projection = AV_SPHERICAL_EQUIRECTANGULAR;
> + if (track->video.projection.private.size == 0)
> + projection = AV_SPHERICAL_EQUIRECTANGULAR;
> + else if (track->video.projection.private.size == 20) {
> + t = bytestream2_get_be32(&gb);
> + b = bytestream2_get_be32(&gb);
> + l = bytestream2_get_be32(&gb);
> + r = bytestream2_get_be32(&gb);
> +
> + if (b >= UINT_MAX - t || r >= UINT_MAX - l) {
> + av_log(NULL, AV_LOG_ERROR,
> + "Invalid bounding rectangle coordinates "
> + "%zu,%zu,%zu,%zu\n", l, t, r, b);
> + return AVERROR_INVALIDDATA;
> + }
> +
> + if (l || t || r || b)
> + projection = AV_SPHERICAL_EQUIRECTANGULAR_TILE;
> + else
> + projection = AV_SPHERICAL_EQUIRECTANGULAR;
> + } else {
> + av_log(NULL, AV_LOG_ERROR, "Unknown spherical metadata\n");
> + return AVERROR_INVALIDDATA;
> + }
I think this'll look better as
case MATROSKA_VIDEO_PROJECTION_TYPE_EQUIRECTANGULAR:
projection = AV_SPHERICAL_EQUIRECTANGULAR;
if (track->video.projection.private.size == 20) {
[...]
if (l || t || r || b)
projection = AV_SPHERICAL_EQUIRECTANGULAR_TILE;
} else if (track->video.projection.private.size != 0) {
// return error
}
break;
But it's cosmetic. If you change it then don't sent a new patch just for it.
> break;
> case MATROSKA_VIDEO_PROJECTION_TYPE_CUBEMAP:
> - if (track->video.projection.private.size < 4)
> + if (track->video.projection.private.size < 4) {
> + av_log(NULL, AV_LOG_ERROR, "Missing projection private properties\n");
> + return AVERROR_INVALIDDATA;
> + } else if (track->video.projection.private.size == 12) {
> + uint32_t layout = bytestream2_get_be32(&gb);
> + if (layout == 0) {
> + projection = AV_SPHERICAL_CUBEMAP;
> + } else {
> + av_log(NULL, AV_LOG_WARNING,
> + "Unknown spherical cubemap layout %"PRIu32"\n", layout);
> + return 0;
> + }
> + padding = bytestream2_get_be32(&gb);
> + } else {
> + av_log(NULL, AV_LOG_ERROR, "Unknown spherical metadata\n");
> return AVERROR_INVALIDDATA;
> - projection = AV_SPHERICAL_CUBEMAP;
> + }
> break;
> default:
> return 0;
> @@ -1937,6 +1986,20 @@ static int mkv_parse_video_projection(AVStream *st, const MatroskaTrack *track)
> spherical->pitch = (int32_t)(track->video.projection.pitch * (1 << 16));
> spherical->roll = (int32_t)(track->video.projection.roll * (1 << 16));
>
> + spherical->padding = padding;
> +
> + if (spherical->projection == AV_SPHERICAL_EQUIRECTANGULAR_TILE) {
> + /* conversion from 0.32 coordinates to pixels */
> + size_t orig_width = (size_t) track->video.pixel_width * UINT32_MAX / (UINT32_MAX - r - l);
> + size_t orig_height = (size_t) track->video.pixel_height * UINT32_MAX / (UINT32_MAX - b - t);
> +
> + /* add a (UINT32_MAX - 1) to round up integer division */
> + spherical->bound_left = (orig_width * l + UINT32_MAX - 1) / UINT32_MAX;
> + spherical->bound_top = (orig_height * t + UINT32_MAX - 1) / UINT32_MAX;
> + spherical->bound_right = orig_width - track->video.pixel_width - spherical->bound_left;
> + spherical->bound_bottom = orig_height - track->video.pixel_height - spherical->bound_top;
> + }
> +
> ret = av_stream_add_side_data(st, AV_PKT_DATA_SPHERICAL, (uint8_t *)spherical,
> spherical_size);
> if (ret < 0) {
> diff --git a/tests/ref/fate/matroska-spherical-mono b/tests/ref/fate/matroska-spherical-mono
> index 8048aff..a70d879 100644
> --- a/tests/ref/fate/matroska-spherical-mono
> +++ b/tests/ref/fate/matroska-spherical-mono
> @@ -8,7 +8,11 @@ inverted=0
> [SIDE_DATA]
> side_data_type=Spherical Mapping
> side_data_size=56
> -projection=equirectangular
> +projection=tiled equirectangular
> +bound_left=148
> +bound_top=73
> +bound_right=147
> +bound_bottom=72
> yaw=45
> pitch=30
> roll=15
The element parsing code lgtm. No comments about all the added math.
More information about the ffmpeg-devel
mailing list