From a9b34ca3f27ed0b3c10effd3fb884936d9b02485 Mon Sep 17 00:00:00 2001
From: Přemysl Eric Janouch
Date: Mon, 5 Jun 2023 17:52:58 +0200
Subject: Unite most info tools into just one binary
Turn this into more of an fq alternative, when used with jq.
Also don't say that TIFF files are Exif.
---
meson.build | 3 +-
tools/bmffinfo.c | 142 ---------------------------------
tools/info.c | 237 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
tools/info.h | 25 ++++++
tools/jpeginfo.c | 80 -------------------
tools/rawinfo.c | 2 +-
tools/tiffinfo.c | 79 -------------------
tools/webpinfo.c | 133 -------------------------------
8 files changed, 264 insertions(+), 437 deletions(-)
delete mode 100644 tools/bmffinfo.c
create mode 100644 tools/info.c
delete mode 100644 tools/jpeginfo.c
delete mode 100644 tools/tiffinfo.c
delete mode 100644 tools/webpinfo.c
diff --git a/meson.build b/meson.build
index 86d4f41..32ee8e6 100644
--- a/meson.build
+++ b/meson.build
@@ -189,8 +189,7 @@ if get_option('tools').enabled()
cc.find_library('jq'), dependency('libpng'), dependency('libraw')]
tools_c_args = cc.get_supported_arguments(
'-Wno-unused-function', '-Wno-unused-parameter')
- foreach tool : [
- 'pnginfo', 'rawinfo', 'jpeginfo', 'tiffinfo', 'webpinfo', 'bmffinfo']
+ foreach tool : ['info', 'pnginfo', 'rawinfo']
executable(tool, 'tools/' + tool + '.c', tiff_tables,
dependencies : tools_dependencies,
c_args: tools_c_args)
diff --git a/tools/bmffinfo.c b/tools/bmffinfo.c
deleted file mode 100644
index f0c6ff1..0000000
--- a/tools/bmffinfo.c
+++ /dev/null
@@ -1,142 +0,0 @@
-//
-// bmffinfo.c: acquire information about BMFF files in JSON format
-//
-// Copyright (c) 2021, Přemysl Eric Janouch
-//
-// Permission to use, copy, modify, and/or distribute this software for any
-// purpose with or without fee is hereby granted.
-//
-// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
-// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
-// SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
-// OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
-// CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
-//
-
-#include "info.h"
-
-#include
-
-#include
-#include
-#include
-#include
-
-// --- ISO/IEC base media file format ------------------------------------------
-// ISO/IEC 14496-12:2015(E), used to be publicly available, now there's only:
-// https://mpeg.chiariglione.org/standards/mpeg-4/iso-base-media-file-format/text-isoiec-14496-12-5th-edition
-// but people have managed to archive the final version as well:
-// https://b.goeswhere.com/ISO_IEC_14496-12_2015.pdf
-//
-// ISO/IEC 23008-12:2017 Information technology -
-// High efficiency coding and media delivery in heterogeneous environments -
-// Part 12: Image File Format + Cor 1:2020 Technical Corrigendum 1
-// https://standards.iso.org/ittf/PubliclyAvailableStandards/
-
-static jv
-parse_bmff_box(jv o, const char *type, const uint8_t *data, size_t len)
-{
- // TODO(p): Parse out "uuid"'s uint8_t[16] initial field, present as hex.
- // TODO(p): Parse out "ftyp" contents: 14496-12:2015 4.3
- // TODO(p): Parse out other important boxes: 14496-12:2015 8+
- return add_to_subarray(o, "boxes", jv_string(type));
-}
-
-static jv
-parse_bmff(jv o, const uint8_t *p, size_t len)
-{
- // 4.2 Object Structure--this box need not be present, nor at the beginning
- // TODO(p): What does `aligned(8)` mean? It's probably in bits.
- if (len < 8 || memcmp(p + 4, "ftyp", 4))
- return add_error(o, "not BMFF at all or unsupported");
-
- const uint8_t *end = p + len;
- while (p < end) {
- if (end - p < 8) {
- o = add_warning(o, "box framing mismatch");
- break;
- }
-
- char type[5] = "";
- memcpy(type, p + 4, 4);
-
- uint64_t box_size = u32be(p);
- const uint8_t *data = p + 8;
- if (box_size == 1) {
- if (end - p < 16) {
- o = add_warning(o, "unexpected EOF");
- break;
- }
- box_size = u64be(data);
- data += 8;
- } else if (!box_size)
- box_size = end - p;
-
- if (box_size > (uint64_t) (end - p)) {
- o = add_warning(o, "unexpected EOF");
- break;
- }
-
- size_t data_len = box_size - (data - p);
- o = parse_bmff_box(o, type, data, data_len);
- p += box_size;
- }
- return o;
-}
-
-// --- I/O ---------------------------------------------------------------------
-
-static jv
-do_file(const char *filename, jv o)
-{
- const char *err = NULL;
- FILE *fp = fopen(filename, "rb");
- if (!fp) {
- err = strerror(errno);
- goto error;
- }
-
- uint8_t *data = NULL, buf[256 << 10];
- size_t n, len = 0;
- while ((n = fread(buf, sizeof *buf, sizeof buf / sizeof *buf, fp))) {
- data = realloc(data, len + n);
- memcpy(data + len, buf, n);
- len += n;
- }
- if (ferror(fp)) {
- err = strerror(errno);
- goto error_read;
- }
-
- o = parse_bmff(o, data, len);
-error_read:
- fclose(fp);
- free(data);
-error:
- if (err)
- o = add_error(o, err);
- return o;
-}
-
-int
-main(int argc, char *argv[])
-{
- (void) parse_icc;
- (void) parse_exif;
- (void) parse_psir;
-
- // XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
- // Usage: find . -iname *.png -print0 | xargs -0 ./pnginfo
- for (int i = 1; i < argc; i++) {
- const char *filename = argv[i];
-
- jv o = jv_object();
- o = jv_object_set(o, jv_string("filename"), jv_string(filename));
- o = do_file(filename, o);
- jv_dumpf(o, stdout, 0 /* Might consider JV_PRINT_SORTED. */);
- fputc('\n', stdout);
- }
- return 0;
-}
diff --git a/tools/info.c b/tools/info.c
new file mode 100644
index 0000000..03da252
--- /dev/null
+++ b/tools/info.c
@@ -0,0 +1,237 @@
+//
+// info.c: acquire information about JPEG/TIFF/BMFF/WebP files in JSON format
+//
+// Copyright (c) 2021 - 2023, Přemysl Eric Janouch
+//
+// Permission to use, copy, modify, and/or distribute this software for any
+// purpose with or without fee is hereby granted.
+//
+// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
+// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
+// SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
+// OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
+// CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+//
+
+#include "info.h"
+
+#include
+
+#include
+#include
+#include
+#include
+
+// --- ISO/IEC base media file format ------------------------------------------
+// ISO/IEC 14496-12:2015(E), used to be publicly available, now there's only:
+// https://mpeg.chiariglione.org/standards/mpeg-4/iso-base-media-file-format/text-isoiec-14496-12-5th-edition
+// but people have managed to archive the final version as well:
+// https://b.goeswhere.com/ISO_IEC_14496-12_2015.pdf
+//
+// ISO/IEC 23008-12:2017 Information technology -
+// High efficiency coding and media delivery in heterogeneous environments -
+// Part 12: Image File Format + Cor 1:2020 Technical Corrigendum 1
+// https://standards.iso.org/ittf/PubliclyAvailableStandards/
+
+static jv
+parse_bmff_box(jv o, const char *type, const uint8_t *data, size_t len)
+{
+ // TODO(p): Parse out "uuid"'s uint8_t[16] initial field, present as hex.
+ // TODO(p): Parse out "ftyp" contents: 14496-12:2015 4.3
+ // TODO(p): Parse out other important boxes: 14496-12:2015 8+
+ return add_to_subarray(o, "boxes", jv_string(type));
+}
+
+static bool
+detect_bmff(const uint8_t *p, size_t len)
+{
+ // 4.2 Object Structure--this box need not be present, nor at the beginning
+ // TODO(p): What does `aligned(8)` mean? It's probably in bits.
+ return len >= 8 && !memcmp(p + 4, "ftyp", 4);
+}
+
+static jv
+parse_bmff(jv o, const uint8_t *p, size_t len)
+{
+ if (!detect_bmff(p, len))
+ return add_error(o, "not BMFF at all or unsupported");
+
+ const uint8_t *end = p + len;
+ while (p < end) {
+ if (end - p < 8) {
+ o = add_warning(o, "box framing mismatch");
+ break;
+ }
+
+ char type[5] = "";
+ memcpy(type, p + 4, 4);
+
+ uint64_t box_size = u32be(p);
+ const uint8_t *data = p + 8;
+ if (box_size == 1) {
+ if (end - p < 16) {
+ o = add_warning(o, "unexpected EOF");
+ break;
+ }
+ box_size = u64be(data);
+ data += 8;
+ } else if (!box_size)
+ box_size = end - p;
+
+ if (box_size > (uint64_t) (end - p)) {
+ o = add_warning(o, "unexpected EOF");
+ break;
+ }
+
+ size_t data_len = box_size - (data - p);
+ o = parse_bmff_box(o, type, data, data_len);
+ p += box_size;
+ }
+ return o;
+}
+
+// --- WebP --------------------------------------------------------------------
+// libwebp won't let us simply iterate over all chunks, so handroll it.
+//
+// https://github.com/webmproject/libwebp/blob/master/doc/webp-container-spec.txt
+// https://github.com/webmproject/libwebp/blob/master/doc/webp-lossless-bitstream-spec.txt
+// https://datatracker.ietf.org/doc/html/rfc6386
+//
+// Pretty versions, hopefully not outdated:
+// https://developers.google.com/speed/webp/docs/riff_container
+// https://developers.google.com/speed/webp/docs/webp_lossless_bitstream_specification
+
+static bool
+detect_webp(const uint8_t *p, size_t len)
+{
+ return len >= 12 && !memcmp(p, "RIFF", 4) && !memcmp(p + 8, "WEBP", 4);
+}
+
+static jv
+parse_webp(jv o, const uint8_t *p, size_t len)
+{
+ if (!detect_webp(p, len))
+ return add_error(o, "not a WEBP file");
+
+ // TODO(p): This can still be parseable.
+ // TODO(p): Warn on trailing data.
+ uint32_t size = u32le(p + 4);
+ if (8 + size < len)
+ return add_error(o, "truncated file");
+
+ const uint8_t *end = p + 8 + size;
+ p += 12;
+
+ jv chunks = jv_array();
+ while (p < end) {
+ if (end - p < 8) {
+ o = add_warning(o, "framing mismatch");
+ printf("%ld", end - p);
+ break;
+ }
+
+ uint32_t chunk_size = u32le(p + 4);
+ uint32_t chunk_advance = (chunk_size + 1) & ~1;
+ if (p + 8 + chunk_advance > end) {
+ o = add_warning(o, "runaway chunk payload");
+ break;
+ }
+
+ char fourcc[5] = "";
+ memcpy(fourcc, p, 4);
+ chunks = jv_array_append(chunks, jv_string(fourcc));
+ p += 8;
+
+ // TODO(p): Decode VP8 and VP8L chunk metadata.
+ if (!strcmp(fourcc, "EXIF"))
+ o = parse_exif(o, p, chunk_size);
+ if (!strcmp(fourcc, "ICCP"))
+ o = parse_icc(o, p, chunk_size);
+ p += chunk_advance;
+ }
+ return jv_set(o, jv_string("chunks"), chunks);
+}
+
+// --- I/O ---------------------------------------------------------------------
+
+static struct {
+ const char *name;
+ bool (*detect) (const uint8_t *, size_t);
+ jv (*parse) (jv, const uint8_t *, size_t);
+} formats[] = {
+ {"JPEG", detect_jpeg, parse_jpeg},
+ {"TIFF", detect_tiff, parse_tiff},
+ {"BMFF", detect_bmff, parse_bmff},
+ {"WebP", detect_webp, parse_webp},
+};
+
+static jv
+parse_any(jv o, const uint8_t *p, size_t len)
+{
+ // TODO(p): Also see if the file extension is appropriate.
+ for (size_t i = 0; i < sizeof formats / sizeof *formats; i++) {
+ if (!formats[i].detect(p, len))
+ continue;
+ if (getenv("INFO_IDENTIFY"))
+ o = jv_set(o, jv_string("format"), jv_string(formats[i].name));
+ return formats[i].parse(o, p, len);
+ }
+ return add_error(o, "unsupported file format");
+}
+
+static jv
+do_file(const char *filename, jv o)
+{
+ const char *err = NULL;
+ FILE *fp = fopen(filename, "rb");
+ if (!fp) {
+ err = strerror(errno);
+ goto error;
+ }
+
+ uint8_t *data = NULL, buf[256 << 10];
+ size_t n, len = 0;
+ while ((n = fread(buf, sizeof *buf, sizeof buf / sizeof *buf, fp))) {
+ data = realloc(data, len + n);
+ memcpy(data + len, buf, n);
+ len += n;
+ }
+ if (ferror(fp)) {
+ err = strerror(errno);
+ goto error_read;
+ }
+
+#if 0
+ // Not sure if I want to ensure their existence...
+ o = jv_object_set(o, jv_string("info"), jv_array());
+ o = jv_object_set(o, jv_string("warnings"), jv_array());
+#endif
+
+ o = parse_any(o, data, len);
+error_read:
+ fclose(fp);
+ free(data);
+error:
+ if (err)
+ o = add_error(o, err);
+ return o;
+}
+
+int
+main(int argc, char *argv[])
+{
+ // XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
+ // Usage: find . -print0 | xargs -0 ./info
+ for (int i = 1; i < argc; i++) {
+ const char *filename = argv[i];
+
+ jv o = jv_object();
+ o = jv_object_set(o, jv_string("filename"), jv_string(filename));
+ o = do_file(filename, o);
+ jv_dumpf(o, stdout, 0 /* JV_PRINT_SORTED would discard information. */);
+ fputc('\n', stdout);
+ }
+ return 0;
+}
diff --git a/tools/info.h b/tools/info.h
index 0d7a699..d640f35 100644
--- a/tools/info.h
+++ b/tools/info.h
@@ -278,6 +278,25 @@ parse_exif(jv o, const uint8_t *p, size_t len)
return o;
}
+static bool
+detect_tiff(const uint8_t *p, size_t len)
+{
+ return tiffer_init(&(struct tiffer) {}, p, len);
+}
+
+// TODO(p): Photoshop data and ICC profiles also have their tag in TIFF,
+// they're not currently processed.
+static jv
+parse_tiff(jv o, const uint8_t *p, size_t len)
+{
+ struct tiffer T = {};
+ if (!tiffer_init(&T, p, len))
+ return add_warning(o, "invalid TIFF");
+ while (tiffer_next_ifd(&T))
+ o = add_to_subarray(o, "TIFF", parse_exif_ifd(&T, tiff_entries));
+ return o;
+}
+
// --- Photoshop Image Resources -----------------------------------------------
// Adobe XMP Specification Part 3: Storage in Files, 2020/1, 1.1.3 + 3.1.3
// https://www.adobe.com/devnet-apps/photoshop/fileformatashtml/
@@ -1084,6 +1103,12 @@ parse_marker(uint8_t marker, const uint8_t *p, const uint8_t *end,
return p;
}
+static bool
+detect_jpeg(const uint8_t *p, size_t len)
+{
+ return len >= 2 && p[0] == 0xff && p[1] == SOI;
+}
+
static jv
parse_jpeg(jv o, const uint8_t *p, size_t len)
{
diff --git a/tools/jpeginfo.c b/tools/jpeginfo.c
deleted file mode 100644
index 2793764..0000000
--- a/tools/jpeginfo.c
+++ /dev/null
@@ -1,80 +0,0 @@
-//
-// jpeginfo.c: acquire information about JPEG files in JSON format
-//
-// Copyright (c) 2021, Přemysl Eric Janouch
-//
-// Permission to use, copy, modify, and/or distribute this software for any
-// purpose with or without fee is hereby granted.
-//
-// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
-// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
-// SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
-// OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
-// CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
-//
-
-#include "info.h"
-
-#include
-
-#include
-#include
-#include
-#include
-
-static jv
-do_file(const char *filename, jv o)
-{
- const char *err = NULL;
- FILE *fp = fopen(filename, "rb");
- if (!fp) {
- err = strerror(errno);
- goto error;
- }
-
- uint8_t *data = NULL, buf[256 << 10];
- size_t n, len = 0;
- while ((n = fread(buf, sizeof *buf, sizeof buf / sizeof *buf, fp))) {
- data = realloc(data, len + n);
- memcpy(data + len, buf, n);
- len += n;
- }
- if (ferror(fp)) {
- err = strerror(errno);
- goto error_read;
- }
-
-#if 0
- // Not sure if I want to ensure their existence...
- o = jv_object_set(o, jv_string("info"), jv_array());
- o = jv_object_set(o, jv_string("warnings"), jv_array());
-#endif
-
- o = parse_jpeg(o, data, len);
-error_read:
- fclose(fp);
- free(data);
-error:
- if (err)
- o = add_error(o, err);
- return o;
-}
-
-int
-main(int argc, char *argv[])
-{
- // XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
- // Usage: find . -iname *.png -print0 | xargs -0 ./pnginfo
- for (int i = 1; i < argc; i++) {
- const char *filename = argv[i];
-
- jv o = jv_object();
- o = jv_object_set(o, jv_string("filename"), jv_string(filename));
- o = do_file(filename, o);
- jv_dumpf(o, stdout, 0 /* Might consider JV_PRINT_SORTED. */);
- fputc('\n', stdout);
- }
- return 0;
-}
diff --git a/tools/rawinfo.c b/tools/rawinfo.c
index 60f8482..6409d33 100644
--- a/tools/rawinfo.c
+++ b/tools/rawinfo.c
@@ -161,7 +161,7 @@ int
main(int argc, char *argv[])
{
// XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
- // Usage: find . -iname *.png -print0 | xargs -0 ./rawinfo
+ // Usage: find . -print0 | xargs -0 ./rawinfo
for (int i = 1; i < argc; i++) {
const char *filename = argv[i];
diff --git a/tools/tiffinfo.c b/tools/tiffinfo.c
deleted file mode 100644
index 97f2309..0000000
--- a/tools/tiffinfo.c
+++ /dev/null
@@ -1,79 +0,0 @@
-//
-// tiffinfo.c: acquire information about TIFF files in JSON format
-//
-// Copyright (c) 2021, Přemysl Eric Janouch
-//
-// Permission to use, copy, modify, and/or distribute this software for any
-// purpose with or without fee is hereby granted.
-//
-// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
-// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
-// SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
-// OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
-// CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
-//
-
-#include "info.h"
-
-#include
-
-#include
-#include
-#include
-#include
-
-// This is essentially the same as jpeginfo.c, but we only have an Exif segment.
-// TODO(p): Photoshop data and ICC profiles also have their tag,
-// they're not currently processed.
-
-static jv
-do_file(const char *filename, jv o)
-{
- const char *err = NULL;
- FILE *fp = fopen(filename, "rb");
- if (!fp) {
- err = strerror(errno);
- goto error;
- }
-
- uint8_t *data = NULL, buf[256 << 10];
- size_t n, len = 0;
- while ((n = fread(buf, sizeof *buf, sizeof buf / sizeof *buf, fp))) {
- data = realloc(data, len + n);
- memcpy(data + len, buf, n);
- len += n;
- }
- if (ferror(fp)) {
- err = strerror(errno);
- goto error_read;
- }
-
- o = parse_exif(o, data, len);
-
-error_read:
- fclose(fp);
- free(data);
-error:
- if (err)
- o = add_error(o, err);
- return o;
-}
-
-int
-main(int argc, char *argv[])
-{
- // XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
- // Usage: find . -iname *.png -print0 | xargs -0 ./pnginfo
- for (int i = 1; i < argc; i++) {
- const char *filename = argv[i];
-
- jv o = jv_object();
- o = jv_object_set(o, jv_string("filename"), jv_string(filename));
- o = do_file(filename, o);
- jv_dumpf(o, stdout, 0 /* Might consider JV_PRINT_SORTED. */);
- fputc('\n', stdout);
- }
- return 0;
-}
diff --git a/tools/webpinfo.c b/tools/webpinfo.c
deleted file mode 100644
index f3417f9..0000000
--- a/tools/webpinfo.c
+++ /dev/null
@@ -1,133 +0,0 @@
-//
-// webpinfo.c: acquire information about WebP files in JSON format
-//
-// Copyright (c) 2021, Přemysl Eric Janouch
-//
-// Permission to use, copy, modify, and/or distribute this software for any
-// purpose with or without fee is hereby granted.
-//
-// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
-// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
-// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
-// SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
-// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
-// OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
-// CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
-//
-
-#include "info.h"
-
-#include
-
-#include
-#include
-#include
-#include
-
-// --- WebP --------------------------------------------------------------------
-// https://github.com/webmproject/libwebp/blob/master/doc/webp-container-spec.txt
-// https://github.com/webmproject/libwebp/blob/master/doc/webp-lossless-bitstream-spec.txt
-// https://datatracker.ietf.org/doc/html/rfc6386
-//
-// Pretty versions, hopefully not outdated:
-// https://developers.google.com/speed/webp/docs/riff_container
-// https://developers.google.com/speed/webp/docs/webp_lossless_bitstream_specification
-
-static jv
-parse_webp(jv o, const uint8_t *p, size_t len)
-{
- // libwebp won't let us simply iterate over all chunks, so handroll it.
- if (len < 12 || memcmp(p, "RIFF", 4) || memcmp(p + 8, "WEBP", 4))
- return add_error(o, "not a WEBP file");
-
- // TODO(p): This can still be parseable.
- // TODO(p): Warn on trailing data.
- uint32_t size = u32le(p + 4);
- if (8 + size < len)
- return add_error(o, "truncated file");
-
- const uint8_t *end = p + 8 + size;
- p += 12;
-
- jv chunks = jv_array();
- while (p < end) {
- if (end - p < 8) {
- o = add_warning(o, "framing mismatch");
- printf("%ld", end - p);
- break;
- }
-
- uint32_t chunk_size = u32le(p + 4);
- uint32_t chunk_advance = (chunk_size + 1) & ~1;
- if (p + 8 + chunk_advance > end) {
- o = add_warning(o, "runaway chunk payload");
- break;
- }
-
- char fourcc[5] = "";
- memcpy(fourcc, p, 4);
- chunks = jv_array_append(chunks, jv_string(fourcc));
- p += 8;
-
- // TODO(p): Decode VP8 and VP8L chunk metadata.
- if (!strcmp(fourcc, "EXIF"))
- o = parse_exif(o, p, chunk_size);
- if (!strcmp(fourcc, "ICCP"))
- o = parse_icc(o, p, chunk_size);
- p += chunk_advance;
- }
- return jv_set(o, jv_string("chunks"), chunks);
-}
-
-// --- I/O ---------------------------------------------------------------------
-
-static jv
-do_file(const char *filename, jv o)
-{
- const char *err = NULL;
- FILE *fp = fopen(filename, "rb");
- if (!fp) {
- err = strerror(errno);
- goto error;
- }
-
- uint8_t *data = NULL, buf[256 << 10];
- size_t n, len = 0;
- while ((n = fread(buf, sizeof *buf, sizeof buf / sizeof *buf, fp))) {
- data = realloc(data, len + n);
- memcpy(data + len, buf, n);
- len += n;
- }
- if (ferror(fp)) {
- err = strerror(errno);
- goto error_read;
- }
-
- o = parse_webp(o, data, len);
-error_read:
- fclose(fp);
- free(data);
-error:
- if (err)
- o = add_error(o, err);
- return o;
-}
-
-int
-main(int argc, char *argv[])
-{
- (void) parse_psir;
-
- // XXX: Can't use `xargs -P0`, there's a risk of non-atomic writes.
- // Usage: find . -iname *.png -print0 | xargs -0 ./pnginfo
- for (int i = 1; i < argc; i++) {
- const char *filename = argv[i];
-
- jv o = jv_object();
- o = jv_object_set(o, jv_string("filename"), jv_string(filename));
- o = do_file(filename, o);
- jv_dumpf(o, stdout, 0 /* Might consider JV_PRINT_SORTED. */);
- fputc('\n', stdout);
- }
- return 0;
-}
--
cgit v1.2.3-70-g09d2