[FFmpeg-devel] [PATCH 1/2] avformat: add hash and framehash muxers
James Almer
jamrial at gmail.com
Sun Apr 10 23:22:52 CEST 2016
From: Moritz Barsnick <barsnick at gmx.net>
Signed-off-by: Moritz Barsnick <barsnick at gmx.net>
Signed-off-by: James Almer <jamrial at gmail.com>
---
Here's the previously sent patchset as a single, easy-to-read patch.
I changed the default from sha512 to sha256 since the former is slow
on 32-bit architectures.
Changelog | 1 +
doc/muxers.texi | 125 ++++++++++++++++++++++++++------
libavformat/Makefile | 6 +-
libavformat/allformats.c | 2 +
libavformat/{md5enc.c => hashenc.c} | 140 +++++++++++++++++++++++++-----------
libavformat/version.h | 2 +-
6 files changed, 211 insertions(+), 65 deletions(-)
rename libavformat/{md5enc.c => hashenc.c} (52%)
diff --git a/Changelog b/Changelog
index b4a4dd7..b976dbb 100644
--- a/Changelog
+++ b/Changelog
@@ -22,6 +22,7 @@ version <next>:
- musx demuxer
- aix demuxer
- remap filter
+- hash and framehash muxers
version 3.0:
- Common Encryption (CENC) MP4 encoding and decoding support
diff --git a/doc/muxers.texi b/doc/muxers.texi
index 2aafbad..042efce 100644
--- a/doc/muxers.texi
+++ b/doc/muxers.texi
@@ -174,30 +174,70 @@ ffmpeg -i INPUT -c:a pcm_u8 -c:v mpeg2video -f framecrc -
See also the @ref{crc} muxer.
-@anchor{framemd5}
-@section framemd5
+@anchor{framehash}
+@section framehash
-Per-packet MD5 testing format.
+Per-packet hash testing format.
-This muxer computes and prints the MD5 hash for each audio
-and video packet. By default audio frames are converted to signed
-16-bit raw audio and video frames to raw video before computing the
-hash.
+This muxer computes and prints a cryptographic hash for each audio
+and video packet. This can be used for packet-by-packet equality
+checks without having to individually do a binary comparison on each.
+
+By default audio frames are converted to signed 16-bit raw audio and
+video frames to raw video before computing the hash, but the output
+of explicit conversions to other codecs can also be used. It uses the
+SHA-256 cryptographic hash function by default, but supports several
+other algorithms.
The output of the muxer consists of a line for each audio and video
packet of the form:
@example
-@var{stream_index}, @var{packet_dts}, @var{packet_pts}, @var{packet_duration}, @var{packet_size}, @var{MD5}
+@var{stream_index}, @var{packet_dts}, @var{packet_pts}, @var{packet_duration}, @var{packet_size}, @var{hash}
@end example
-@var{MD5} is a hexadecimal number representing the computed MD5 hash
+@var{hash} is a hexadecimal number representing the computed hash
for the packet.
+@table @option
+@item hash @var{algorithm}
+Use the cryptographic hash function specified by the string @var{algorithm}.
+Supported values include @code{MD5}, @code{murmur3}, @code{RIPEMD128},
+@code{RIPEMD160}, @code{RIPEMD256}, @code{RIPEMD320}, @code{SHA160},
+@code{SHA224}, @code{SHA256} (default), @code{SHA512/224}, @code{SHA512/256},
+@code{SHA384}, @code{SHA512}, @code{CRC32} and @code{adler32}.
+
+@end table
+
@subsection Examples
-For example to compute the MD5 of the audio and video frames in
-@file{INPUT}, converted to raw audio and video packets, and store it
-in the file @file{out.md5}:
+To compute the SHA-256 hash of the audio and video frames in @file{INPUT},
+converted to raw audio and video packets, and store it in the file
+@file{out.sha256}:
+@example
+ffmpeg -i INPUT -f framehash out.sha256
+@end example
+
+To print the information to stdout, using the MD5 hash function, use
+the command:
+@example
+ffmpeg -i INPUT -f framehash -hash md5 -
+@end example
+
+See also the @ref{hash} muxer.
+
+@anchor{framemd5}
+@section framemd5
+
+Per-packet MD5 testing format.
+
+This is a variant of the @ref{framehash} muxer. Unlike that muxer,
+it defaults to using the MD5 hash function.
+
+@subsection Examples
+
+To compute the MD5 hash of the audio and video frames in @file{INPUT},
+converted to raw audio and video packets, and store it in the file
+@file{out.md5}:
@example
ffmpeg -i INPUT -f framemd5 out.md5
@end example
@@ -207,7 +247,7 @@ To print the information to stdout, use the command:
ffmpeg -i INPUT -f framemd5 -
@end example
-See also the @ref{md5} muxer.
+See also the @ref{framehash} and @ref{md5} muxers.
@anchor{gif}
@section gif
@@ -243,6 +283,51 @@ ffmpeg -i INPUT -c:v gif -f image2 "out%d.gif"
Note 2: the GIF format has a very small time base: the delay between two frames
can not be smaller than one centi second.
+@anchor{hash}
+@section hash
+
+Hash testing format.
+
+This muxer computes and prints a cryptographic hash of all the input
+audio and video frames. This can be used for equality checks without
+having to do a complete binary comparison.
+
+By default audio frames are converted to signed 16-bit raw audio and
+video frames to raw video before computing the hash, but the output
+of explicit conversions to other codecs can also be used. Timestamps
+are ignored. It uses the SHA-256 cryptographic hash function by default,
+but supports several other algorithms.
+
+The output of the muxer consists of a single line of the form:
+@var{algo}=@var{hash}, where @var{algo} is a short string representing
+the hash function used, and @var{hash} is a hexadecimal number
+representing the computed hash.
+
+@table @option
+@item hash @var{algorithm}
+Use the cryptographic hash function specified by the string @var{algorithm}.
+Supported values include @code{MD5}, @code{murmur3}, @code{RIPEMD128},
+@code{RIPEMD160}, @code{RIPEMD256}, @code{RIPEMD320}, @code{SHA160},
+@code{SHA224}, @code{SHA256} (default), @code{SHA512/224}, @code{SHA512/256},
+@code{SHA384}, @code{SHA512}, @code{CRC32} and @code{adler32}.
+
+@end table
+
+@subsection Examples
+
+To compute the SHA-256 hash of the input converted to raw audio and
+video, and store it in the file @file{out.sha256}:
+@example
+ffmpeg -i INPUT -f hash out.sha256
+@end example
+
+To print an MD5 hash to stdout use the command:
+@example
+ffmpeg -i INPUT -f hash -hash md5 -
+@end example
+
+See also the @ref{framehash} muxer.
+
@anchor{hls}
@section hls
@@ -629,16 +714,12 @@ have no effect if it is not.
MD5 testing format.
-This muxer computes and prints the MD5 hash of all the input audio
-and video frames. By default audio frames are converted to signed
-16-bit raw audio and video frames to raw video before computing the
-hash. Timestamps are ignored.
+This is a variant of the @ref{hash} muxer. Unlike that muxer, it
+defaults to using the MD5 hash function.
-The output of the muxer consists of a single line of the form:
-MD5=@var{MD5}, where @var{MD5} is a hexadecimal number representing
-the computed MD5 hash.
+@subsection Examples
-For example to compute the MD5 hash of the input converted to raw
+To compute the MD5 hash of the input converted to raw
audio and video, and store it in the file @file{out.md5}:
@example
ffmpeg -i INPUT -f md5 out.md5
@@ -649,7 +730,7 @@ You can print the MD5 to stdout with the command:
ffmpeg -i INPUT -f md5 -
@end example
-See also the @ref{framemd5} muxer.
+See also the @ref{hash} and @ref{framemd5} muxers.
@section mov, mp4, ismv
diff --git a/libavformat/Makefile b/libavformat/Makefile
index 5921368..4bae3b7 100644
--- a/libavformat/Makefile
+++ b/libavformat/Makefile
@@ -175,7 +175,8 @@ OBJS-$(CONFIG_LIVE_FLV_DEMUXER) += flvdec.o
OBJS-$(CONFIG_FLV_MUXER) += flvenc.o avc.o
OBJS-$(CONFIG_FOURXM_DEMUXER) += 4xm.o
OBJS-$(CONFIG_FRAMECRC_MUXER) += framecrcenc.o framehash.o
-OBJS-$(CONFIG_FRAMEMD5_MUXER) += md5enc.o framehash.o
+OBJS-$(CONFIG_FRAMEHASH_MUXER) += hashenc.o framehash.o
+OBJS-$(CONFIG_FRAMEMD5_MUXER) += hashenc.o framehash.o
OBJS-$(CONFIG_FRM_DEMUXER) += frmdec.o
OBJS-$(CONFIG_FSB_DEMUXER) += fsb.o
OBJS-$(CONFIG_GIF_MUXER) += gif.o
@@ -196,6 +197,7 @@ OBJS-$(CONFIG_H263_DEMUXER) += h263dec.o rawdec.o
OBJS-$(CONFIG_H263_MUXER) += rawenc.o
OBJS-$(CONFIG_H264_DEMUXER) += h264dec.o rawdec.o
OBJS-$(CONFIG_H264_MUXER) += rawenc.o
+OBJS-$(CONFIG_HASH_MUXER) += hashenc.o
OBJS-$(CONFIG_HDS_MUXER) += hdsenc.o
OBJS-$(CONFIG_HEVC_DEMUXER) += hevcdec.o rawdec.o
OBJS-$(CONFIG_HEVC_MUXER) += rawenc.o
@@ -259,7 +261,7 @@ OBJS-$(CONFIG_MATROSKA_MUXER) += matroskaenc.o matroska.o \
avc.o hevc.o \
flacenc_header.o avlanguage.o vorbiscomment.o wv.o \
webmdashenc.o webm_chunk.o
-OBJS-$(CONFIG_MD5_MUXER) += md5enc.o
+OBJS-$(CONFIG_MD5_MUXER) += hashenc.o
OBJS-$(CONFIG_MGSTS_DEMUXER) += mgsts.o
OBJS-$(CONFIG_MICRODVD_DEMUXER) += microdvddec.o subtitles.o
OBJS-$(CONFIG_MICRODVD_MUXER) += microdvdenc.o
diff --git a/libavformat/allformats.c b/libavformat/allformats.c
index d7023ea..dbf2737 100644
--- a/libavformat/allformats.c
+++ b/libavformat/allformats.c
@@ -131,6 +131,7 @@ void av_register_all(void)
REGISTER_DEMUXER (LIVE_FLV, live_flv);
REGISTER_DEMUXER (FOURXM, fourxm);
REGISTER_MUXER (FRAMECRC, framecrc);
+ REGISTER_MUXER (FRAMEHASH, framehash);
REGISTER_MUXER (FRAMEMD5, framemd5);
REGISTER_DEMUXER (FRM, frm);
REGISTER_DEMUXER (FSB, fsb);
@@ -144,6 +145,7 @@ void av_register_all(void)
REGISTER_MUXDEMUX(H261, h261);
REGISTER_MUXDEMUX(H263, h263);
REGISTER_MUXDEMUX(H264, h264);
+ REGISTER_MUXER (HASH, hash);
REGISTER_MUXER (HDS, hds);
REGISTER_MUXDEMUX(HEVC, hevc);
REGISTER_MUXDEMUX(HLS, hls);
diff --git a/libavformat/md5enc.c b/libavformat/hashenc.c
similarity index 52%
rename from libavformat/md5enc.c
rename to libavformat/hashenc.c
index 8433be4..ef886a0 100644
--- a/libavformat/md5enc.c
+++ b/libavformat/hashenc.c
@@ -1,5 +1,5 @@
/*
- * MD5 encoder (for codec/format testing)
+ * Hash/MD5 encoder (for codec/format testing)
* Copyright (c) 2009 Reimar Döffinger, based on crcenc (c) 2002 Fabrice Bellard
*
* This file is part of FFmpeg.
@@ -26,23 +26,23 @@
#include "avformat.h"
#include "internal.h"
-struct MD5Context {
+struct HashContext {
const AVClass *avclass;
struct AVHashContext *hash;
char *hash_name;
int format_version;
};
-static void md5_finish(struct AVFormatContext *s, char *buf)
+static void hash_finish(struct AVFormatContext *s, char *buf)
{
- struct MD5Context *c = s->priv_data;
- uint8_t md5[AV_HASH_MAX_SIZE];
+ struct HashContext *c = s->priv_data;
+ uint8_t hash[AV_HASH_MAX_SIZE];
int i, offset = strlen(buf);
int len = av_hash_get_size(c->hash);
- av_assert0(len > 0 && len <= sizeof(md5));
- av_hash_final(c->hash, md5);
+ av_assert0(len > 0 && len <= sizeof(hash));
+ av_hash_final(c->hash, hash);
for (i = 0; i < len; i++) {
- snprintf(buf + offset, 3, "%02"PRIx8, md5[i]);
+ snprintf(buf + offset, 3, "%02"PRIx8, hash[i]);
offset += 2;
}
buf[offset] = '\n';
@@ -52,25 +52,28 @@ static void md5_finish(struct AVFormatContext *s, char *buf)
avio_flush(s->pb);
}
-#define OFFSET(x) offsetof(struct MD5Context, x)
+#define OFFSET(x) offsetof(struct HashContext, x)
#define ENC AV_OPT_FLAG_ENCODING_PARAM
+#if CONFIG_HASH_MUXER || CONFIG_FRAMEHASH_MUXER
static const AVOption hash_options[] = {
- { "hash", "set hash to use", OFFSET(hash_name), AV_OPT_TYPE_STRING, {.str = "md5"}, 0, 0, ENC },
+ { "hash", "set hash to use", OFFSET(hash_name), AV_OPT_TYPE_STRING, {.str = "sha256"}, 0, 0, ENC },
{ "format_version", "file format version", OFFSET(format_version), AV_OPT_TYPE_INT, {.i64 = 1}, 1, 1, ENC },
{ NULL },
};
+#endif
-static const AVClass md5enc_class = {
- .class_name = "hash encoder class",
- .item_name = av_default_item_name,
- .option = hash_options,
- .version = LIBAVUTIL_VERSION_INT,
+#if CONFIG_MD5_MUXER || CONFIG_FRAMEMD5_MUXER
+static const AVOption md5_options[] = {
+ { "hash", "set hash to use", OFFSET(hash_name), AV_OPT_TYPE_STRING, {.str = "md5"}, 0, 0, ENC },
+ { "format_version", "file format version", OFFSET(format_version), AV_OPT_TYPE_INT, {.i64 = 1}, 1, 1, ENC },
+ { NULL },
};
+#endif
-#if CONFIG_MD5_MUXER
-static int write_header(struct AVFormatContext *s)
+#if CONFIG_HASH_MUXER || CONFIG_MD5_MUXER
+static int hash_write_header(struct AVFormatContext *s)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
int res = av_hash_alloc(&c->hash, c->hash_name);
if (res < 0)
return res;
@@ -78,45 +81,77 @@ static int write_header(struct AVFormatContext *s)
return 0;
}
-static int write_packet(struct AVFormatContext *s, AVPacket *pkt)
+static int hash_write_packet(struct AVFormatContext *s, AVPacket *pkt)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
av_hash_update(c->hash, pkt->data, pkt->size);
return 0;
}
-static int write_trailer(struct AVFormatContext *s)
+static int hash_write_trailer(struct AVFormatContext *s)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
char buf[256];
av_strlcpy(buf, av_hash_get_name(c->hash), sizeof(buf) - 200);
av_strlcat(buf, "=", sizeof(buf) - 200);
- md5_finish(s, buf);
+ hash_finish(s, buf);
av_hash_freep(&c->hash);
return 0;
}
+#endif
+
+#if CONFIG_HASH_MUXER
+static const AVClass hashenc_class = {
+ .class_name = "hash encoder class",
+ .item_name = av_default_item_name,
+ .option = hash_options,
+ .version = LIBAVUTIL_VERSION_INT,
+};
+
+AVOutputFormat ff_hash_muxer = {
+ .name = "hash",
+ .long_name = NULL_IF_CONFIG_SMALL("Hash testing"),
+ .priv_data_size = sizeof(struct HashContext),
+ .audio_codec = AV_CODEC_ID_PCM_S16LE,
+ .video_codec = AV_CODEC_ID_RAWVIDEO,
+ .write_header = hash_write_header,
+ .write_packet = hash_write_packet,
+ .write_trailer = hash_write_trailer,
+ .flags = AVFMT_VARIABLE_FPS | AVFMT_TS_NONSTRICT |
+ AVFMT_TS_NEGATIVE,
+ .priv_class = &hashenc_class,
+};
+#endif
+
+#if CONFIG_MD5_MUXER
+static const AVClass md5enc_class = {
+ .class_name = "MD5 encoder class",
+ .item_name = av_default_item_name,
+ .option = md5_options,
+ .version = LIBAVUTIL_VERSION_INT,
+};
AVOutputFormat ff_md5_muxer = {
.name = "md5",
.long_name = NULL_IF_CONFIG_SMALL("MD5 testing"),
- .priv_data_size = sizeof(struct MD5Context),
+ .priv_data_size = sizeof(struct HashContext),
.audio_codec = AV_CODEC_ID_PCM_S16LE,
.video_codec = AV_CODEC_ID_RAWVIDEO,
- .write_header = write_header,
- .write_packet = write_packet,
- .write_trailer = write_trailer,
+ .write_header = hash_write_header,
+ .write_packet = hash_write_packet,
+ .write_trailer = hash_write_trailer,
.flags = AVFMT_VARIABLE_FPS | AVFMT_TS_NONSTRICT |
AVFMT_TS_NEGATIVE,
.priv_class = &md5enc_class,
};
#endif
-#if CONFIG_FRAMEMD5_MUXER
-static int framemd5_write_header(struct AVFormatContext *s)
+#if CONFIG_FRAMEHASH_MUXER || CONFIG_FRAMEMD5_MUXER
+static int framehash_write_header(struct AVFormatContext *s)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
int res = av_hash_alloc(&c->hash, c->hash_name);
if (res < 0)
return res;
@@ -128,42 +163,67 @@ static int framemd5_write_header(struct AVFormatContext *s)
return 0;
}
-static int framemd5_write_packet(struct AVFormatContext *s, AVPacket *pkt)
+static int framehash_write_packet(struct AVFormatContext *s, AVPacket *pkt)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
char buf[256];
av_hash_init(c->hash);
av_hash_update(c->hash, pkt->data, pkt->size);
snprintf(buf, sizeof(buf) - 64, "%d, %10"PRId64", %10"PRId64", %8"PRId64", %8d, ",
pkt->stream_index, pkt->dts, pkt->pts, pkt->duration, pkt->size);
- md5_finish(s, buf);
+ hash_finish(s, buf);
return 0;
}
-static int framemd5_write_trailer(struct AVFormatContext *s)
+static int framehash_write_trailer(struct AVFormatContext *s)
{
- struct MD5Context *c = s->priv_data;
+ struct HashContext *c = s->priv_data;
av_hash_freep(&c->hash);
return 0;
}
+#endif
-static const AVClass framemd5_class = {
+#if CONFIG_FRAMEHASH_MUXER
+static const AVClass framehash_class = {
.class_name = "frame hash encoder class",
.item_name = av_default_item_name,
.option = hash_options,
.version = LIBAVUTIL_VERSION_INT,
};
+AVOutputFormat ff_framehash_muxer = {
+ .name = "framehash",
+ .long_name = NULL_IF_CONFIG_SMALL("Per-frame hash testing"),
+ .priv_data_size = sizeof(struct HashContext),
+ .audio_codec = AV_CODEC_ID_PCM_S16LE,
+ .video_codec = AV_CODEC_ID_RAWVIDEO,
+ .write_header = framehash_write_header,
+ .write_packet = framehash_write_packet,
+ .write_trailer = framehash_write_trailer,
+ .flags = AVFMT_VARIABLE_FPS | AVFMT_TS_NONSTRICT |
+ AVFMT_TS_NEGATIVE,
+ .priv_class = &framehash_class,
+};
+#endif
+
+#if CONFIG_FRAMEMD5_MUXER
+static const AVClass framemd5_class = {
+ .class_name = "frame hash encoder class",
+ .item_name = av_default_item_name,
+ .option = md5_options,
+ .version = LIBAVUTIL_VERSION_INT,
+};
+
AVOutputFormat ff_framemd5_muxer = {
.name = "framemd5",
.long_name = NULL_IF_CONFIG_SMALL("Per-frame MD5 testing"),
- .priv_data_size = sizeof(struct MD5Context),
+ .priv_data_size = sizeof(struct HashContext),
.audio_codec = AV_CODEC_ID_PCM_S16LE,
.video_codec = AV_CODEC_ID_RAWVIDEO,
- .write_header = framemd5_write_header,
- .write_packet = framemd5_write_packet,
- .write_trailer = framemd5_write_trailer,
+ .write_header = framehash_write_header,
+ .write_packet = framehash_write_packet,
+ .write_trailer = framehash_write_trailer,
.flags = AVFMT_VARIABLE_FPS | AVFMT_TS_NONSTRICT |
AVFMT_TS_NEGATIVE,
.priv_class = &framemd5_class,
diff --git a/libavformat/version.h b/libavformat/version.h
index d3408eb..3575c5a 100644
--- a/libavformat/version.h
+++ b/libavformat/version.h
@@ -30,7 +30,7 @@
#include "libavutil/version.h"
#define LIBAVFORMAT_VERSION_MAJOR 57
-#define LIBAVFORMAT_VERSION_MINOR 32
+#define LIBAVFORMAT_VERSION_MINOR 33
#define LIBAVFORMAT_VERSION_MICRO 100
#define LIBAVFORMAT_VERSION_INT AV_VERSION_INT(LIBAVFORMAT_VERSION_MAJOR, \
--
2.8.1
More information about the ffmpeg-devel
mailing list