[FFmpeg-devel] [GSOC][PATCH] lavc/cfhd:IP frame decoding (inverse 3d transform) introduced
Kieran Kunhya
kieran618 at googlemail.com
Thu May 31 23:38:57 EEST 2018
Hi
On Thu, 31 May 2018 at 12:25 Gagandeep Singh <deepgagan231197 at gmail.com>
wrote:
> ---
> libavcodec/cfhd.c | 462
> ++++++++++++++++++++++++++++++++++++++++++++++--------
> libavcodec/cfhd.h | 15 +-
> 2 files changed, 411 insertions(+), 66 deletions(-)
>
> diff --git a/libavcodec/cfhd.c b/libavcodec/cfhd.c
> index 051d210355..c0cd25a95e 100644
> --- a/libavcodec/cfhd.c
> +++ b/libavcodec/cfhd.c
> @@ -41,12 +41,15 @@
> #define ALPHA_COMPAND_GAIN 9400
>
> enum CFHDParam {
> + TransformType = 10,
> ChannelCount = 12,
> SubbandCount = 14,
> + Pframe = 19,
>
PFrame (capital F, like the other enum names)
> ImageWidth = 20,
> ImageHeight = 21,
> LowpassPrecision = 35,
> SubbandNumber = 48,
> + EncodingMethod = 52,
> Quantization = 53,
> ChannelNumber = 62,
> SampleFlags = 68,
> @@ -84,6 +87,11 @@ static void init_peak_table_defaults(CFHDContext *s)
>
> static void init_frame_defaults(CFHDContext *s)
> {
> + s->sample_type = 0;
> + s->transform_type = 0;
> + s->num_frames = 0;
> + s->Pframe = 0;
> + s->first_wavelet = 0;
> s->coded_width = 0;
> s->coded_height = 0;
> s->cropped_height = 0;
> @@ -103,8 +111,10 @@ static void init_frame_defaults(CFHDContext *s)
> }
>
> /* TODO: merge with VLC tables or use LUT */
> -static inline int dequant_and_decompand(int level, int quantisation, int
> codebook)
> +static inline int dequant_and_decompand(int level, int quantisation, int
> codebook, int lossless)
> {
> + if (lossless)
> + return level;
> if (codebook == 0 || codebook == 1) {
> int64_t abslevel = abs(level);
> if (level < 264)
> @@ -193,16 +203,21 @@ static inline void filter(int16_t *output, ptrdiff_t
> out_stride,
> }
> }
>
> -static inline void interlaced_vertical_filter(int16_t *output, int16_t
> *low, int16_t *high,
> - int width, int linesize, int plane)
> +static inline void temporal_inverse_filter(int16_t *output, int16_t *low,
> int16_t *high,
> + int width, int linesize, int
> temporal_for_highpass)
> {
> int i;
> int16_t even, odd;
> for (i = 0; i < width; i++) {
> even = (low[i] - high[i])/2;
> odd = (low[i] + high[i])/2;
> - output[i] = av_clip_uintp2(even, 10);
> - output[i + linesize] = av_clip_uintp2(odd, 10);
> + if (!temporal_for_highpass) {
> + output[i] = av_clip_uintp2(even, 10);
> + output[i + linesize] = av_clip_uintp2(odd, 10);
> + } else {
> + low[i] = even;
> + high[i] = odd;
> + }
> }
> }
> static void horiz_filter(int16_t *output, int16_t *low, int16_t *high,
> @@ -261,6 +276,7 @@ static int alloc_buffers(AVCodecContext *avctx)
>
> for (i = 0; i < planes; i++) {
> int w8, h8, w4, h4, w2, h2;
> + int16_t *frame2;
> int width = i ? avctx->width >> chroma_x_shift : avctx->width;
> int height = i ? avctx->height >> chroma_y_shift : avctx->height;
> ptrdiff_t stride = FFALIGN(width / 8, 8) * 8;
> @@ -277,28 +293,85 @@ static int alloc_buffers(AVCodecContext *avctx)
> w2 = w4 * 2;
> h2 = h4 * 2;
>
> - s->plane[i].idwt_buf =
> - av_mallocz_array(height * stride,
> sizeof(*s->plane[i].idwt_buf));
> - s->plane[i].idwt_tmp =
> - av_malloc_array(height * stride,
> sizeof(*s->plane[i].idwt_tmp));
> - if (!s->plane[i].idwt_buf || !s->plane[i].idwt_tmp)
> - return AVERROR(ENOMEM);
> -
> - s->plane[i].subband[0] = s->plane[i].idwt_buf;
> - s->plane[i].subband[1] = s->plane[i].idwt_buf + 2 * w8 * h8;
> - s->plane[i].subband[2] = s->plane[i].idwt_buf + 1 * w8 * h8;
> - s->plane[i].subband[3] = s->plane[i].idwt_buf + 3 * w8 * h8;
> - s->plane[i].subband[4] = s->plane[i].idwt_buf + 2 * w4 * h4;
> - s->plane[i].subband[5] = s->plane[i].idwt_buf + 1 * w4 * h4;
> - s->plane[i].subband[6] = s->plane[i].idwt_buf + 3 * w4 * h4;
> - s->plane[i].subband[7] = s->plane[i].idwt_buf + 2 * w2 * h2;
> - s->plane[i].subband[8] = s->plane[i].idwt_buf + 1 * w2 * h2;
> - s->plane[i].subband[9] = s->plane[i].idwt_buf + 3 * w2 * h2;
> -
> - for (j = 0; j < DWT_LEVELS; j++) {
> - for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[j]); k++) {
> - s->plane[i].band[j][k].a_width = w8 << j;
> - s->plane[i].band[j][k].a_height = h8 << j;
> + if (s->transform_type == 0) {
> + s->plane[i].idwt_buf =
> + av_mallocz_array(height * stride,
> sizeof(*s->plane[i].idwt_buf));
> + s->plane[i].idwt_tmp =
> + av_malloc_array(height * stride,
> sizeof(*s->plane[i].idwt_tmp));
> + if (!s->plane[i].idwt_buf || !s->plane[i].idwt_tmp)
> + return AVERROR(ENOMEM);
> + } else if (s->transform_type == 2) {
> + s->plane[i].idwt_buf =
> + av_mallocz_array(2 * height * stride,
> sizeof(*s->plane[i].idwt_buf));
> + s->plane[i].idwt_tmp =
> + av_malloc_array(height * stride,
> sizeof(*s->plane[i].idwt_tmp));
> + if (!s->plane[i].idwt_buf || !s->plane[i].idwt_tmp)
> + return AVERROR(ENOMEM);
> + }
> +
> + if (s->transform_type == 0) {
> + s->plane[i].subband[0] = s->plane[i].idwt_buf;
> + s->plane[i].subband[1] = s->plane[i].idwt_buf + 2 * w8 * h8;
> + s->plane[i].subband[2] = s->plane[i].idwt_buf + 1 * w8 * h8;
> + s->plane[i].subband[3] = s->plane[i].idwt_buf + 3 * w8 * h8;
> + s->plane[i].subband[4] = s->plane[i].idwt_buf + 2 * w4 * h4;
> + s->plane[i].subband[5] = s->plane[i].idwt_buf + 1 * w4 * h4;
> + s->plane[i].subband[6] = s->plane[i].idwt_buf + 3 * w4 * h4;
> + s->plane[i].subband[7] = s->plane[i].idwt_buf + 2 * w2 * h2;
> + s->plane[i].subband[8] = s->plane[i].idwt_buf + 1 * w2 * h2;
> + s->plane[i].subband[9] = s->plane[i].idwt_buf + 3 * w2 * h2;
> + } else if (s->transform_type == 2) {
> + s->plane[i].subband[0] = s->plane[i].idwt_buf;
> + s->plane[i].subband[1] = s->plane[i].idwt_buf + 2 * w8 * h8;
> + s->plane[i].subband[2] = s->plane[i].idwt_buf + 1 * w8 * h8;
> + s->plane[i].subband[3] = s->plane[i].idwt_buf + 3 * w8 * h8;
> + s->plane[i].subband[4] = s->plane[i].idwt_buf + 2 * w4 * h4;
> + s->plane[i].subband[5] = s->plane[i].idwt_buf + 1 * w4 * h4;
> + s->plane[i].subband[6] = s->plane[i].idwt_buf + 3 * w4 * h4;
> + frame2 =
> + s->plane[i].subband[7] = s->plane[i].idwt_buf + 4 * w2 * h2;
> + s->plane[i].subband[8] = frame2 + 2 * w4 * h4;
> + s->plane[i].subband[9] = frame2 + 1 * w4 * h4;
> + s->plane[i].subband[10] = frame2 + 3 * w4 * h4;
> + s->plane[i].subband[11] = s->plane[i].idwt_buf + 2 * w2 * h2;
> + s->plane[i].subband[12] = s->plane[i].idwt_buf + 1 * w2 * h2;
> + s->plane[i].subband[13] = s->plane[i].idwt_buf + 3 * w2 * h2;
> + s->plane[i].subband[14] = frame2 + 2 * w2 * h2;
> + s->plane[i].subband[15] = frame2 + 1 * w2 * h2;
> + s->plane[i].subband[16] = frame2 + 3 * w2 * h2;
> + }
> +
> + if (s->transform_type == 0) {
> + for (j = 0; j < DWT_LEVELS - 3; j++) {
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[j]); k++)
> {
> + s->plane[i].band[j][k].a_width = w8 << j;
> + s->plane[i].band[j][k].a_height = h8 << j;
> + }
> + }
> + } else if(s->transform_type == 2) {
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[0]); k++) {
> + s->plane[i].band[0][k].a_width = w8;
> + s->plane[i].band[0][k].a_height = h8;
> + }
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[1]); k++) {
> + s->plane[i].band[1][k].a_width = w8 * 2;
> + s->plane[i].band[1][k].a_height = h8 * 2;
> + }
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[2]); k++) {
> + s->plane[i].band[2][k].a_width = w8 * 2;
> + s->plane[i].band[2][k].a_height = h8 * 2;
> + }
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[3]); k++) {
> + s->plane[i].band[3][k].a_width = w8 * 4;
> + s->plane[i].band[3][k].a_height = h8 * 4;
> + }
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[4]); k++) {
> + s->plane[i].band[4][k].a_width = w8 * 4;
> + s->plane[i].band[4][k].a_height = h8 * 4;
> + }
> + for (k = 0; k < FF_ARRAY_ELEMS(s->plane[i].band[5]); k++) {
> + s->plane[i].band[5][k].a_width = w8 * 4;
> + s->plane[i].band[5][k].a_height = h8 * 4;
> }
> }
>
> @@ -327,6 +400,7 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> GetByteContext gb;
> ThreadFrame frame = { .f = data };
> AVFrame *pic = data;
> + s->next_frame = av_frame_alloc();
> int ret = 0, i, j, planes, plane, got_buffer = 0;
> int16_t *coeff_data;
>
> @@ -349,6 +423,9 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> } else if (tag == SampleFlags) {
> av_log(avctx, AV_LOG_DEBUG, "Progressive?%"PRIu16"\n", data);
> s->progressive = data & 0x0001;
> + } else if (tag == Pframe) {
> + s->Pframe = 1;
> + av_log(avctx, AV_LOG_DEBUG, "Frame type %"PRIu16"\n", data);
>
Remove the CamelCase in the struct (s->Pframe).
> } else if (tag == ImageWidth) {
> av_log(avctx, AV_LOG_DEBUG, "Width %"PRIu16"\n", data);
> s->coded_width = data;
> @@ -373,7 +450,7 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> }
> } else if (tag == SubbandCount) {
> av_log(avctx, AV_LOG_DEBUG, "Subband Count: %"PRIu16"\n",
> data);
> - if (data != SUBBAND_COUNT) {
> + if (data != 10 && data != 17) {
> av_log(avctx, AV_LOG_ERROR, "Subband Count of %"PRIu16"
> is unsupported\n", data);
> ret = AVERROR_PATCHWELCOME;
> break;
> @@ -405,7 +482,7 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> } else if (tag == 51) {
> av_log(avctx, AV_LOG_DEBUG, "Subband number actual
> %"PRIu16"\n", data);
> s->subband_num_actual = data;
> - if (s->subband_num_actual >= 10) {
> + if (s->subband_num_actual >= 17 && s->subband_num_actual !=
> 255) {
> av_log(avctx, AV_LOG_ERROR, "Invalid subband number
> actual\n");
> ret = AVERROR(EINVAL);
> break;
> @@ -420,9 +497,15 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> s->prescale_shift[1] = (data >> 3) & 0x7;
> s->prescale_shift[2] = (data >> 6) & 0x7;
> av_log(avctx, AV_LOG_DEBUG, "Prescale shift (VC-5): %x\n",
> data);
> + } else if (tag == EncodingMethod) {
> + s->encode_method = data;
> + av_log(avctx, AV_LOG_DEBUG, "Encode Method for Subband %d :
> %x\n",s->subband_num_actual, data);
> } else if (tag == 27) {
> av_log(avctx, AV_LOG_DEBUG, "Lowpass width %"PRIu16"\n",
> data);
> - if (data < 3 || data >
> s->plane[s->channel_num].band[0][0].a_width) {
> + if (s->coded_width == 0){
> + s->coded_width = data << 3;
> + }
> + if (data < 3) {
> av_log(avctx, AV_LOG_ERROR, "Invalid lowpass width\n");
> ret = AVERROR(EINVAL);
> break;
> @@ -431,20 +514,21 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> s->plane[s->channel_num].band[0][0].stride = data;
> } else if (tag == 28) {
> av_log(avctx, AV_LOG_DEBUG, "Lowpass height %"PRIu16"\n",
> data);
> - if (data < 3 || data >
> s->plane[s->channel_num].band[0][0].a_height) {
> + if (s->coded_height == 0)
> + s->coded_height = data << 3;
> + if (data < 3) {
> av_log(avctx, AV_LOG_ERROR, "Invalid lowpass height\n");
> ret = AVERROR(EINVAL);
> break;
> }
> s->plane[s->channel_num].band[0][0].height = data;
> - } else if (tag == 1)
> + } else if (tag == 1) {
> + s->sample_type = data;
> + if (data == 2)
> + s->Pframe = 1;
> av_log(avctx, AV_LOG_DEBUG, "Sample type? %"PRIu16"\n", data);
> - else if (tag == 10) {
> - if (data != 0) {
> - avpriv_report_missing_feature(avctx, "Transform type of
> %"PRIu16, data);
> - ret = AVERROR_PATCHWELCOME;
> - break;
> - }
> + } else if (tag == 10) {
> + s->transform_type = data;
> av_log(avctx, AV_LOG_DEBUG, "Transform-type? %"PRIu16"\n",
> data);
> } else if (abstag >= 0x4000 && abstag <= 0x40ff) {
> if (abstag == 0x4001)
> @@ -502,9 +586,8 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> break;
> }
>
> s->plane[s->channel_num].band[s->level][s->subband_num].height = data;
> - } else if (tag == 71) {
> - s->codebook = data;
> - av_log(avctx, AV_LOG_DEBUG, "Codebook %i\n", s->codebook);
> + } else if (tag == -71) {
> + av_log(avctx, AV_LOG_DEBUG, "color format %d\n", data);
> } else if (tag == 72) {
>
This hunk should be a separate patch
> s->codebook = data & 0xf;
> s->difference_coding = (data >> 4) & 1;
> @@ -547,12 +630,14 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> } else if (tag == -74 && s->peak.offset) {
> s->peak.level = data;
> s->peak.base += s->peak.offset / 2 - 2;
> - } else
> + } else if (tag == 82);
> + else
> av_log(avctx, AV_LOG_DEBUG, "Unknown tag %i data %x\n", tag,
> data);
>
> /* Some kind of end of header tag */
> - if (tag == 4 && data == 0x1a4a && s->coded_width &&
> s->coded_height &&
> + if ((tag == 4 && (data == 0x1a4a || data == 0xf0f) ||
> s->sample_type == 6 || s->sample_type == 1) && s->coded_width &&
> s->coded_height &&
> s->coded_format != AV_PIX_FMT_NONE) {
> + av_log(avctx, AV_LOG_DEBUG, "this summers's gonna hurt\n");
> if (s->a_width != s->coded_width || s->a_height !=
> s->coded_height ||
> s->a_format != s->coded_format) {
> free_buffers(s);
> @@ -620,7 +705,7 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> av_log(avctx, AV_LOG_DEBUG, "Lowpass coefficients %d\n",
> lowpass_width * lowpass_height);
> }
>
> - if (tag == 55 && s->subband_num_actual != 255 && s->a_width &&
> s->a_height) {
> + if ((tag == 55 || tag == 82) && s->a_width && s->a_height) {
> int highpass_height =
> s->plane[s->channel_num].band[s->level][s->subband_num].height;
> int highpass_width =
> s->plane[s->channel_num].band[s->level][s->subband_num].width;
> int highpass_a_width =
> s->plane[s->channel_num].band[s->level][s->subband_num].a_width;
> @@ -638,9 +723,11 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> }
>
> if (highpass_height > highpass_a_height || highpass_width >
> highpass_a_width || a_expected < highpass_height *
> (uint64_t)highpass_stride) {
> - av_log(avctx, AV_LOG_ERROR, "Too many highpass
> coefficients\n");
> - ret = AVERROR(EINVAL);
> - goto end;
> + if (s->subband_num_actual != 255) {
> + av_log(avctx, AV_LOG_ERROR, "Too many highpass
> coefficients\n");
> + ret = AVERROR(EINVAL);
> + goto end;
> + }
> }
> expected = highpass_height * highpass_stride;
>
> @@ -648,8 +735,13 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
>
> init_get_bits(&s->gb, gb.buffer,
> bytestream2_get_bytes_left(&gb) * 8);
> {
> + if(s->subband_num_actual == 255){
> + expected = 0;
> + goto finish;
> + }
> +
> OPEN_READER(re, &s->gb);
> - if (!s->codebook) {
> + if (!s->codebook && !(s->transform_type == 2 &&
> s->subband_num_actual == 7)) {
> while (1) {
> UPDATE_CACHE(re, &s->gb);
> GET_RL_VLC(level, run, re, &s->gb,
> s->table_9_rl_vlc,
> @@ -664,9 +756,14 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> if (count > expected)
> break;
>
> - coeff = dequant_and_decompand(level,
> s->quantisation, 0);
> + coeff = dequant_and_decompand(level,
> s->quantisation, 0, (s->sample_type == 2 || s->sample_type == 3) &&
> s->Pframe && s->subband_num_actual == 7);
> for (i = 0; i < run; i++)
> - *coeff_data++ = coeff;
> + if (tag != 82)
> + *coeff_data++ = coeff;
> + else {
> + *coeff_data |= coeff << 8;
> + *coeff_data++ *= s->quantisation;
> + }
> }
> if (s->peak.level)
> peak_table(coeff_data - expected, &s->peak,
> expected);
> @@ -688,9 +785,14 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> if (count > expected)
> break;
>
> - coeff = dequant_and_decompand(level,
> s->quantisation, s->codebook);
> + coeff = dequant_and_decompand(level,
> s->quantisation, s->codebook, (s->sample_type == 2 || s->sample_type == 3)
> && s->Pframe && s->subband_num_actual == 7);
> for (i = 0; i < run; i++)
> - *coeff_data++ = coeff;
> + if (tag != 82)
> + *coeff_data++ = coeff;
> + else {
> + *coeff_data |= coeff << 8;
> + *coeff_data++ *= s->quantisation;
> + }
> }
> if (s->peak.level)
> peak_table(coeff_data - expected, &s->peak,
> expected);
> @@ -701,12 +803,12 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> CLOSE_READER(re, &s->gb);
> }
>
> - if (count > expected) {
> + if (count > expected && s->subband_num_actual != 255) {
> av_log(avctx, AV_LOG_ERROR, "Escape codeword not found,
> probably corrupt data\n");
> ret = AVERROR(EINVAL);
> goto end;
> }
> -
> + finish:
> bytes = FFALIGN(AV_CEIL_RSHIFT(get_bits_count(&s->gb), 3), 4);
> if (bytes > bytestream2_get_bytes_left(&gb)) {
> av_log(avctx, AV_LOG_ERROR, "Bitstream overread error\n");
> @@ -726,14 +828,14 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> }
> }
> }
> -
> - if (!s->a_width || !s->a_height || s->a_format == AV_PIX_FMT_NONE ||
> - s->coded_width || s->coded_height || s->coded_format !=
> AV_PIX_FMT_NONE) {
> +#if 0
> + if ((!s->a_width || !s->a_height || s->a_format == AV_PIX_FMT_NONE ||
> + s->coded_width || s->coded_height || s->coded_format !=
> AV_PIX_FMT_NONE) && s->sample_type != 1) {
> av_log(avctx, AV_LOG_ERROR, "Invalid dimensions\n");
> ret = AVERROR(EINVAL);
> goto end;
> }
> -
> +#endif
> if (!got_buffer) {
> av_log(avctx, AV_LOG_ERROR, "No end of header tag found\n");
> ret = AVERROR(EINVAL);
> @@ -741,8 +843,9 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> }
>
> planes = av_pix_fmt_count_planes(avctx->pix_fmt);
> + if (s->transform_type == 0 && s->sample_type != 1) {
> for (plane = 0; plane < planes && !ret; plane++) {
> - /* level 1 */
> + /* level 1 */
> int lowpass_height = s->plane[plane].band[0][0].height;
> int lowpass_width = s->plane[plane].band[0][0].width;
> int highpass_stride = s->plane[plane].band[0][1].stride;
> @@ -921,14 +1024,249 @@ static int cfhd_decode(AVCodecContext *avctx, void
> *data, int *got_frame,
> low = s->plane[plane].l_h[6];
> high = s->plane[plane].l_h[7];
> for (i = 0; i < lowpass_height; i++) {
> - interlaced_vertical_filter(dst, low, high, lowpass_width
> * 2, pic->linesize[act_plane]/2, act_plane);
> + temporal_inverse_filter(dst, low, high, lowpass_width *
> 2, pic->linesize[act_plane]/2, 0);
> low += lowpass_width * 2;
> high += lowpass_width * 2;
> dst += pic->linesize[act_plane];
> }
> }
> }
> + } else if (s->transform_type == 2 && s->sample_type != 1) {
> + for (plane = 0; plane < planes && !ret; plane++) {
> + /* level 1 */
> + int lowpass_height = s->plane[plane].band[0][0].height;
> + int lowpass_width = s->plane[plane].band[0][0].width;
> + int highpass_stride = s->plane[plane].band[0][1].stride;
> + int act_plane = plane == 1 ? 2 : plane == 2 ? 1 : plane;
> + int16_t *low, *high, *output, *dst;
> +
> + if (lowpass_height > s->plane[plane].band[0][0].a_height ||
> lowpass_width > s->plane[plane].band[0][0].a_width ||
> + !highpass_stride || s->plane[plane].band[0][1].width >
> s->plane[plane].band[0][1].a_width) {
> + av_log(avctx, AV_LOG_ERROR, "Invalid plane
> dimensions\n");
> + ret = AVERROR(EINVAL);
> + goto end;
> + }
> +
> + av_log(avctx, AV_LOG_DEBUG, "Decoding level 1 plane %i %i
> %i %i\n", plane, lowpass_height, lowpass_width, highpass_stride);
> +
> + low = s->plane[plane].subband[0];
> + high = s->plane[plane].subband[2];
> + output = s->plane[plane].l_h[0];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low, lowpass_width,
> high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].subband[1];
> + high = s->plane[plane].subband[3];
> + output = s->plane[plane].l_h[1];
> +
> + for (i = 0; i < lowpass_width; i++) {
> + // note the stride of "low" is highpass_stride
> + vert_filter(output, lowpass_width, low,
> highpass_stride, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].l_h[0];
> + high = s->plane[plane].l_h[1];
> + output = s->plane[plane].subband[0];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + horiz_filter(output, low, high, lowpass_width);
> + low += lowpass_width;
> + high += lowpass_width;
> + output += lowpass_width * 2;
> + }
> + if (s->bpc == 12) {
> + output = s->plane[plane].subband[0];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + for (j = 0; j < lowpass_width * 2; j++)
> + output[j] *= 4;
> +
> + output += lowpass_width * 2;
> + }
> + }
> +
> + /* level 2 */
> + lowpass_height = s->plane[plane].band[1][1].height;
> + lowpass_width = s->plane[plane].band[1][1].width;
> + highpass_stride = s->plane[plane].band[1][1].stride;
> +
> + if (lowpass_height > s->plane[plane].band[1][1].a_height ||
> lowpass_width > s->plane[plane].band[1][1].a_width ||
> + !highpass_stride || s->plane[plane].band[1][1].width >
> s->plane[plane].band[1][1].a_width) {
> + av_log(avctx, AV_LOG_ERROR, "Invalid plane
> dimensions\n");
> + ret = AVERROR(EINVAL);
> + goto end;
> + }
> +
> + av_log(avctx, AV_LOG_DEBUG, "Level 2 plane %i %i %i %i\n",
> plane, lowpass_height, lowpass_width, highpass_stride);
> +
> + low = s->plane[plane].subband[0];
> + high = s->plane[plane].subband[5];
> + output = s->plane[plane].l_h[3];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low, lowpass_width,
> high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].subband[4];
> + high = s->plane[plane].subband[6];
> + output = s->plane[plane].l_h[4];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> highpass_stride, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].l_h[3];
> + high = s->plane[plane].l_h[4];
> + output = s->plane[plane].subband[0];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + horiz_filter(output, low, high, lowpass_width);
> + low += lowpass_width;
> + high += lowpass_width;
> + output += lowpass_width * 2;
> + }
> +
> + output = s->plane[plane].subband[0];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + for (j = 0; j < lowpass_width * 2; j++)
> + output[j] *= 4;
> +
> + output += lowpass_width * 2;
> + }
> +
> + lowpass_height = s->plane[plane].band[2][1].height;
> + lowpass_width = s->plane[plane].band[2][1].width;
> + highpass_stride = s->plane[plane].band[2][1].stride;
> + av_log(avctx, AV_LOG_DEBUG, "Level 2 plane %i %i %i %i\n",
> plane, lowpass_height, lowpass_width, highpass_stride);
> +
> + low = s->plane[plane].subband[7];
> + high = s->plane[plane].subband[9];
> + output = s->plane[plane].l_h[3];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low, lowpass_width,
> high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].subband[8];
> + high = s->plane[plane].subband[10];
> + output = s->plane[plane].l_h[4];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> highpass_stride, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].l_h[3];
> + high = s->plane[plane].l_h[4];
> + output = s->plane[plane].subband[7];
> + for (i = 0; i < lowpass_height; i++) {
> + horiz_filter(output, low, high, lowpass_width);
> + low += lowpass_width;
> + high += lowpass_width;
> + output += lowpass_width * 2;
> + }
> +
> + lowpass_height = s->plane[plane].band[3][1].height;
> + lowpass_width = s->plane[plane].band[3][1].width;
> + highpass_stride = s->plane[plane].band[3][1].stride;
> + av_log(avctx, AV_LOG_DEBUG, "temporal level %i %i %i %i\n",
> plane, lowpass_height, lowpass_width, highpass_stride);
> +
> + if (lowpass_height > s->plane[plane].band[3][1].a_height ||
> lowpass_width > s->plane[plane].band[3][1].a_width ||
> + !highpass_stride || s->plane[plane].band[3][1].width >
> s->plane[plane].band[3][1].a_width) {
> + av_log(avctx, AV_LOG_ERROR, "Invalid plane
> dimensions\n");
> + ret = AVERROR(EINVAL);
> + goto end;
> + }
> +
> + low = s->plane[plane].subband[0];
> + high = s->plane[plane].subband[7];
> + output = s->plane[plane].subband[0];
> + for (i = 0; i < lowpass_height; i++) {
> + temporal_inverse_filter(output, low, high,
> lowpass_width, 4 * lowpass_width * lowpass_height, 1);
> + low += lowpass_width;
> + high += lowpass_width;
> + output += lowpass_width;
> + }
> +
> + av_log(avctx, AV_LOG_DEBUG, "Level 3 plane %i %i %i %i\n",
> plane, lowpass_height, lowpass_width, highpass_stride);
> + if (s->progressive) {
> + low = s->plane[plane].subband[0];
> + high = s->plane[plane].subband[12];
> + output = s->plane[plane].l_h[6];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> lowpass_width, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].subband[11];
> + high = s->plane[plane].subband[13];
> + output = s->plane[plane].l_h[7];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> highpass_stride, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + dst = (int16_t *)pic->data[act_plane];
> + low = s->plane[plane].l_h[6];
> + high = s->plane[plane].l_h[7];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + horiz_filter_clip(dst, low, high, lowpass_width,
> s->bpc);
> + low += lowpass_width;
> + high += lowpass_width;
> + dst += pic->linesize[act_plane] / 2;
> + }
> +
> + low = s->plane[plane].subband[7];
> + high = s->plane[plane].subband[15];
> + output = s->plane[plane].l_h[6];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> lowpass_width, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].subband[14];
> + high = s->plane[plane].subband[16];
> + output = s->plane[plane].l_h[7];
> + for (i = 0; i < lowpass_width; i++) {
> + vert_filter(output, lowpass_width, low,
> highpass_stride, high, highpass_stride, lowpass_height);
> + low++;
> + high++;
> + output++;
> + }
> +
> + low = s->plane[plane].l_h[6];
> + high = s->plane[plane].l_h[7];
> + output = s->plane[plane].subband[7];
> + for (i = 0; i < lowpass_height * 2; i++) {
> + horiz_filter_clip(output, low, high, lowpass_width,
> s->bpc);
> + low += lowpass_width;
> + high += lowpass_width;
> + output += lowpass_width;
> + }
> + s->next_frame->data[act_plane] = output;
>
> + }
> + }
> + } else if (s->transform_type == 2 && s->sample_type == 1) {
> + av_frame_ref(pic, s->next_frame);
> + }
>
This needs unreffing when you are done with it.
But I don't fully understand the code: you reference the frame but never
use it?
>
> end:
> if (ret < 0)
> @@ -961,6 +1299,6 @@ AVCodec ff_cfhd_decoder = {
> .init = cfhd_init,
> .close = cfhd_close,
> .decode = cfhd_decode,
> - .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_FRAME_THREADS,
> - .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE |
> FF_CODEC_CAP_INIT_CLEANUP,
> + .capabilities = AV_CODEC_CAP_DR1,
> + .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
> };
> diff --git a/libavcodec/cfhd.h b/libavcodec/cfhd.h
> index 7cd251fca7..0126bd4052 100644
> --- a/libavcodec/cfhd.h
> +++ b/libavcodec/cfhd.h
> @@ -30,15 +30,15 @@
> #include "vlc.h"
>
> #define VLC_BITS 9
> -#define SUBBAND_COUNT 10
> -
> +#define SUBBAND_COUNT 17
> +#define BAND_END_TRAILER (1 << 15) - 1
>
Maybe use something more descriptive for these #defines, to explain the old mode vs. the new one.
> typedef struct CFHD_RL_VLC_ELEM {
> int16_t level;
> int8_t len;
> uint16_t run;
> } CFHD_RL_VLC_ELEM;
>
> -#define DWT_LEVELS 3
> +#define DWT_LEVELS 6
>
> typedef struct SubBand {
> int level;
> @@ -82,9 +82,16 @@ typedef struct CFHDContext {
>
> CFHD_RL_VLC_ELEM table_18_rl_vlc[4572];
> VLC vlc_18;
> -
> + AVFrame * next_frame;
> GetBitContext gb;
>
> + int sample_type;
> + int transform_type;
> + int num_spatial;
> + int num_frames;
> + int encode_method;
> + int first_wavelet;
> + int Pframe;
> int coded_width;
> int coded_height;
> int cropped_height;
> --
> 2.14.
>
Kieran
More information about the ffmpeg-devel
mailing list