Mercurial > hgrepos > Python2 > PyMuPDF

diff mupdf-source/thirdparty/zint/backend/common.c @ 2:b50eed0cc0ef upstream
ADD: MuPDF v1.26.7: the MuPDF source as downloaded by a default build of PyMuPDF 1.26.4. The directory name has changed: no version number in the expanded directory now.
author: Franz Glasner <fzglas.hg@dom66.de>
date: Mon, 15 Sep 2025 11:43:07 +0200
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/mupdf-source/thirdparty/zint/backend/common.c	Mon Sep 15 11:43:07 2025 +0200
@@ -0,0 +1,968 @@
+/* common.c - Contains functions needed for a number of barcodes */
+/*
+    libzint - the open source barcode library
+    Copyright (C) 2008-2024 Robin Stuart <rstuart114@gmail.com>
+
+    Redistribution and use in source and binary forms, with or without
+    modification, are permitted provided that the following conditions
+    are met:
+
+    1. Redistributions of source code must retain the above copyright
+       notice, this list of conditions and the following disclaimer.
+    2. Redistributions in binary form must reproduce the above copyright
+       notice, this list of conditions and the following disclaimer in the
+       documentation and/or other materials provided with the distribution.
+    3. Neither the name of the project nor the names of its contributors
+       may be used to endorse or promote products derived from this software
+       without specific prior written permission.
+
+    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
+    ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+    IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
+    ARE DISCLAIMED.  IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
+    FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
+    DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
+    OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
+    HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
+    LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
+    OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
+    SUCH DAMAGE.
+ */
+/* SPDX-License-Identifier: BSD-3-Clause */
+
+#include <assert.h>
+#include <stdarg.h>
+#include <stdio.h>
+#include "common.h"
+
+/* Maps a hexadecimal digit character ('0'-'9', 'A'-'F' or 'a'-'f') to its integer value 0-15.
+   Returns -1 for any other character */
+INTERNAL int ctoi(const char source) {
+    int val = -1;
+
+    if (z_isdigit(source)) {
+        val = source - '0';
+    } else if (source >= 'A' && source <= 'F') {
+        val = source - 'A' + 10;
+    } else if (source >= 'a' && source <= 'f') {
+        val = source - 'a' + 10;
+    }
+
+    return val;
+}
+
+/* Converts decimal string `source` of `length` <= 9 to its integer value. Returns -1 if any character is not a
+   digit. A zero `length` gives 0 */
+INTERNAL int to_int(const unsigned char source[], const int length) {
+    int val = 0;
+    int i;
+
+    for (i = 0; i < length; i++) {
+        if (!z_isdigit(source[i])) {
+            /* Stop here rather than keep accumulating non-digit bytes, which could overflow `val`
+               (signed overflow is undefined behaviour) before the -1 was eventually returned */
+            return -1;
+        }
+        val = val * 10 + (source[i] - '0');
+    }
+
+    return val;
+}
+
+/* Upper-cases, in place, every lower case character in the first `length` bytes of `source` */
+INTERNAL void to_upper(unsigned char source[], const int length) {
+    int idx = 0;
+
+    while (idx < length) {
+        if (z_islower(source[idx])) {
+            source[idx] &= 0x5F; /* Mask turns ASCII 'a'-'z' into 'A'-'Z' */
+        }
+        idx++;
+    }
+}
+
+/* Counts how many of the first `length` bytes of `source` are equal to `c` */
+INTERNAL int chr_cnt(const unsigned char source[], const int length, const unsigned char c) {
+    int matches = 0;
+    int idx = length;
+
+    /* Order of traversal does not affect the tally, so walk backwards */
+    while (idx-- > 0) {
+        if (source[idx] == c) {
+            matches++;
+        }
+    }
+    return matches;
+}
+
+/* Flag table for `is_chr()` and `not_sane()`: one entry per byte value 0x00-0xFF, each the OR of the `IS_*_F`
+   character class flags that byte belongs to. Control characters (0x00-0x1F), DEL (0x7F) and all bytes >= 0x80
+   have no flags set */
+#define IS_CLS_F    (IS_CLI_F | IS_SIL_F) /* Shorthand for entries that carry both flags */
+static const unsigned short flgs[256] = {
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /*00-1F*/
+               IS_SPC_F,            IS_C82_F,            IS_C82_F,            IS_HSH_F, /*20-23*/ /*  !"# */
+               IS_CLS_F, IS_SIL_F | IS_C82_F,            IS_C82_F,            IS_C82_F, /*24-27*/ /* $%&' */
+               IS_C82_F,            IS_C82_F,            IS_AST_F,            IS_PLS_F, /*28-2B*/ /* ()*+ */
+               IS_C82_F,            IS_MNS_F, IS_CLS_F | IS_C82_F, IS_CLS_F | IS_C82_F, /*2C-2F*/ /* ,-./ */
+               IS_NUM_F,            IS_NUM_F,            IS_NUM_F,            IS_NUM_F, /*30-33*/ /* 0123 */
+               IS_NUM_F,            IS_NUM_F,            IS_NUM_F,            IS_NUM_F, /*34-37*/ /* 4567 */
+               IS_NUM_F,            IS_NUM_F, IS_CLI_F | IS_C82_F,            IS_C82_F, /*38-3B*/ /* 89:; */
+               IS_C82_F,            IS_C82_F,            IS_C82_F,            IS_C82_F, /*3C-3F*/ /* <=>? */
+                      0, IS_UHX_F | IS_ARS_F, IS_UHX_F | IS_ARS_F, IS_UHX_F | IS_ARS_F, /*40-43*/ /* @ABC */
+    IS_UHX_F | IS_ARS_F, IS_UHX_F | IS_ARS_F, IS_UHX_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, /*44-47*/ /* DEFG */
+    IS_UPO_F | IS_ARS_F,            IS_UPO_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, /*48-4B*/ /* HIJK */
+    IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F,            IS_UPO_F, /*4C-4F*/ /* LMNO */
+    IS_UPO_F | IS_ARS_F,            IS_UPO_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, /*50-53*/ /* PQRS */
+    IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F, /*54-57*/ /* TUVW */
+    IS_UX__F | IS_ARS_F, IS_UPO_F | IS_ARS_F, IS_UPO_F | IS_ARS_F,                   0, /*58-5B*/ /* XYZ[ */
+                      0,                   0,                   0,            IS_C82_F, /*5C-5F*/ /* \]^_ */
+                      0,            IS_LHX_F,            IS_LHX_F,            IS_LHX_F, /*60-63*/ /* `abc */
+               IS_LHX_F,            IS_LHX_F,            IS_LHX_F,            IS_LWO_F, /*64-67*/ /* defg */
+               IS_LWO_F,            IS_LWO_F,            IS_LWO_F,            IS_LWO_F, /*68-6B*/ /* hijk */
+               IS_LWO_F,            IS_LWO_F,            IS_LWO_F,            IS_LWO_F, /*6C-6F*/ /* lmno */
+               IS_LWO_F,            IS_LWO_F,            IS_LWO_F,            IS_LWO_F, /*70-73*/ /* pqrs */
+               IS_LWO_F,            IS_LWO_F,            IS_LWO_F,            IS_LWO_F, /*74-77*/ /* tuvw */
+               IS_LX__F,            IS_LWO_F,            IS_LWO_F,                   0, /*78-7B*/ /* xyz{ */
+                      0,                   0,                   0,                   0, /*7C-7F*/ /* |}~ DEL */
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /*80-9F*/
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /*A0-BF*/
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /*C0-DF*/
+    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /*E0-FF*/
+};
+
+/* Returns 1 if character `c` is below 0x80 and has any of the `flg` bits set in the `flgs` table, else 0 */
+INTERNAL int is_chr(const unsigned int flg, const unsigned int c) {
+    if (c >= 0x80) {
+        return 0; /* Only 7-bit characters can match */
+    }
+    return (flgs[c] & flg) ? 1 : 0;
+}
+
+/* Checks that every one of the first `length` bytes of `source` has at least one of the `flg` bits set in the
+   `flgs` table. Returns 0 if so, otherwise the 1-based position of the first offending byte */
+INTERNAL int not_sane(const unsigned int flg, const unsigned char source[], const int length) {
+    int pos = 0;
+
+    while (pos < length) {
+        const unsigned char ch = source[pos++]; /* `pos` is now the 1-based position of `ch` */
+        if ((flgs[ch] & flg) == 0) {
+            return pos;
+        }
+    }
+    return 0;
+}
+
+/* Table lookup replacement for huge switch statements: for each of the first `length` bytes of `source`, stores
+   in `posns` the index of its first occurrence in `test_string` (of `test_length`). Returns 0 if every byte was
+   found, otherwise the 1-based position in `source` of the first byte not found (its `posns` entry is -1 and
+   later entries are left untouched) */
+INTERNAL int not_sane_lookup(const char test_string[], const int test_length, const unsigned char source[],
+                const int length, int *posns) {
+    int src_idx, tst_idx;
+
+    for (src_idx = 0; src_idx < length; src_idx++) {
+        int found = -1;
+
+        for (tst_idx = 0; tst_idx < test_length && found == -1; tst_idx++) {
+            if (source[src_idx] == test_string[tst_idx]) {
+                found = tst_idx;
+            }
+        }
+        posns[src_idx] = found;
+        if (found == -1) {
+            return src_idx + 1;
+        }
+    }
+
+    return 0;
+}
+
+/* Returns the index of the first occurrence of `data` in NUL-terminated `set_string`, or -1 if it does not
+   occur (the terminating NUL itself is never matched) */
+INTERNAL int posn(const char set_string[], const char data) {
+    int idx;
+
+    for (idx = 0; set_string[idx] != '\0'; idx++) {
+        if (set_string[idx] == data) {
+            return idx;
+        }
+    }
+    return -1;
+}
+
+/* Writes the low `length` bits of `arg`, most significant first, as '0'/'1' characters into `binary` starting at
+   `bin_posn` (no NUL terminator is added). Returns `bin_posn` + `length` */
+INTERNAL int bin_append_posn(const int arg, const int length, char *binary, const int bin_posn) {
+    int out = bin_posn;
+    int shift;
+
+    for (shift = length - 1; shift >= 0; shift--) {
+        binary[out++] = '0' + ((arg >> shift) & 1);
+    }
+    return bin_posn + length;
+}
+
+#ifndef Z_COMMON_INLINE
+
+/* Returns 1 if the module at row `y_coord`, column `x_coord` is dark/black, else 0. Modules are packed 8 per
+   `encoded_data` entry, least significant bit first */
+INTERNAL int module_is_set(const struct zint_symbol *symbol, const int y_coord, const int x_coord) {
+    const int byte_idx = x_coord >> 3;
+    const int bit_idx = x_coord & 0x07;
+
+    return (symbol->encoded_data[y_coord][byte_idx] >> bit_idx) & 1;
+}
+
+/* Marks the module at row `y_coord`, column `x_coord` as dark/black by setting its bit in `encoded_data` */
+INTERNAL void set_module(struct zint_symbol *symbol, const int y_coord, const int x_coord) {
+    const int byte_idx = x_coord >> 3;
+    const int bit_idx = x_coord & 0x07;
+
+    symbol->encoded_data[y_coord][byte_idx] |= 1 << bit_idx;
+}
+
+/* Returns true (1-8) if a module is colour, otherwise false (0). The value is read directly from
+   `encoded_data[y_coord][x_coord]`, i.e. one whole entry per module (no bit packing as in `module_is_set()`) */
+INTERNAL int module_colour_is_set(const struct zint_symbol *symbol, const int y_coord, const int x_coord) {
+    return symbol->encoded_data[y_coord][x_coord];
+}
+
+/* Sets a module to a colour by storing `colour` directly in `encoded_data[y_coord][x_coord]`, i.e. one whole
+   entry per module (no bit packing as in `set_module()`) */
+INTERNAL void set_module_colour(struct zint_symbol *symbol, const int y_coord, const int x_coord, const int colour) {
+    symbol->encoded_data[y_coord][x_coord] = colour;
+}
+
+/* Clears the bit in `encoded_data` for the module at row `y_coord`, column `x_coord`, making it white */
+INTERNAL void unset_module(struct zint_symbol *symbol, const int y_coord, const int x_coord) {
+    const int byte_idx = x_coord >> 3;
+    const int bit_idx = x_coord & 0x07;
+
+    symbol->encoded_data[y_coord][byte_idx] &= ~(1 << bit_idx);
+}
+
+#endif /* Z_COMMON_INLINE */
+
+/* Expands width pattern `data` (`length` digit characters, each the width of a run of modules, alternating
+   dark/light and starting with dark) into a new row of `symbol`. Increments `symbol->rows` and widens
+   `symbol->width` if the new row is wider */
+INTERNAL void expand(struct zint_symbol *symbol, const char data[], const int length) {
+    const int row = symbol->rows;
+    int col = 0;
+    int dark = 1; /* First run is dark */
+    int idx;
+
+    symbol->rows = row + 1;
+
+    for (idx = 0; idx < length; idx++, dark = !dark) {
+        int run = data[idx] - '0';
+        assert(run >= 0);
+        for (; run > 0; run--, col++) {
+            if (dark) {
+                set_module(symbol, row, col);
+            }
+        }
+    }
+
+    if (symbol->width < col) {
+        symbol->width = col;
+    }
+}
+
+/* Helper for `errtxt()` & `errtxtf()`: writes the "err_id: " prefix for `num` at the start of `errtxt`, returning
+   the number of characters written (no NUL is appended). The id is written with at least 3 digits; anything
+   outside 0-9999 is written as 9999. If `num` is -1 no prefix is written: `errtxt` is made empty and 0 returned */
+static int errtxt_id_str(char *errtxt, int num) {
+    char *out = errtxt;
+    int divisor;
+
+    if (num == -1) {
+        *out = '\0';
+        return 0;
+    }
+    if (num < 0 || num > 9999) { /* Restrict to 4 digits */
+        num = 9999;
+    }
+    /* Thousands digit only appears when non-zero; hundreds, tens and units always do */
+    for (divisor = num >= 1000 ? 1000 : 100; divisor > 0; divisor /= 10) {
+        *out++ = '0' + (num / divisor);
+        num %= divisor;
+    }
+    *out++ = ':';
+    *out++ = ' ';
+
+    return (int) (out - errtxt);
+}
+
+/* Stores "err_id: msg" in `symbol->errtxt` and returns `error_number` unchanged. An `err_id` of -1 omits the
+   "err_id: " prefix. A message too long for `symbol->errtxt` is truncated to fit (asserting first, unless the
+   ZINT_DEBUG_TEST debug flag is set) */
+INTERNAL int errtxt(const int error_number, struct zint_symbol *symbol, const int err_id, const char *msg) {
+    const int capacity = (int) sizeof(symbol->errtxt) - 1; /* Leave room for NUL */
+    const int prefix_len = errtxt_id_str(symbol->errtxt, err_id);
+    const int room = capacity - prefix_len;
+    int copy_len = (int) strlen(msg);
+    char *dest = symbol->errtxt + prefix_len;
+
+    if (copy_len > room) {
+        if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0); /* Catch truncations */
+        copy_len = room;
+    }
+    memcpy(dest, msg, copy_len);
+    dest[copy_len] = '\0';
+
+    return error_number;
+}
+
+static int errtxtf_dpad(const char *fmt); /* Forward reference */
+
+/* Helper for `errtxtf()` to parse numbered specifier "n$" (where "n" 1-9), returning `fmt` advance increment:
+   2 if `fmt` starts with a digit that is not the start of a "%d" zero-pad, else 0. If `p_arg` is given it is
+   set to the zero-based argument index ("n" - 1), to -1 if the digit is not followed by '$', or to -2 if there
+   is no leading digit to parse */
+static int errtxtf_num_arg(const char *fmt, int *p_arg) {
+    int advance = 0;
+    int arg_idx = -2;
+
+    if (z_isdigit(fmt[0]) && !errtxtf_dpad(fmt)) {
+        if (fmt[1] == '$') {
+            arg_idx = fmt[0] - '0' - 1;
+        } else {
+            arg_idx = -1;
+        }
+        advance = 2;
+    }
+    if (p_arg) {
+        *p_arg = arg_idx;
+    }
+    return advance;
+}
+
+/* Helper for `errtxtf()` to parse length precision, returning `fmt` advance increment (0 if `fmt` does not start
+   with '.'). If `p_len` is given, `*p_len` is set to the literal precision for ".<p>s", to 0 for an accepted ".*s"
+   or ".*<n>$s" (length is to be taken from the arguments), and to -1 otherwise (no precision, or invalid). `arg`
+   is the zero-based numbered argument index of the specifier being parsed, or negative if none/unknown. If
+   `p_arg_cnt` is given, `*p_arg_cnt` is incremented for an accepted ".*<n>$s" */
+static int errtxtf_slen(const char *fmt, const int arg, int *p_arg_cnt, int *p_len) {
+    int ret = 0;
+    int len = -1;
+    if (fmt[0] == '.') {
+        if (z_isdigit(fmt[1]) && fmt[1] != '0') { /* ".<p>": literal precision, no leading zero */
+            len = fmt[1] - '0';
+            for (ret = 2; z_isdigit(fmt[ret]); ret++) {
+                len = len * 10 + fmt[ret] - '0';
+            }
+            if (fmt[ret] != 's') { /* Precision only allowed on "%s" */
+                len = -1;
+            }
+        } else if (fmt[1] == '*' && fmt[2] == 's' && arg < 0) { /* ".*s": only if specifier is unnumbered */
+            len = 0;
+            ret = 2;
+        } else if (fmt[1] == '*' && z_isdigit(fmt[2]) && fmt[3] == '$' && fmt[4] == 's') { /* ".*<n>$s" */
+            if (arg == -1 || arg == fmt[2] - '0') { /* "<n>" must be one less than the 1-based string argument */
+                len = 0;
+                if (p_arg_cnt) {
+                    (*p_arg_cnt)++;
+                }
+            }
+            ret = 4;
+        } else { /* Unrecognized: `len` stays -1 and the non-zero return lets caller report it */
+            ret = 1;
+        }
+    }
+    if (p_len) {
+        *p_len = len;
+    }
+    return ret;
+}
+
+/* Helper for `errtxtf()` to parse zero-padded minimum field length for "%d", returning `fmt` advance increment:
+   2 for "0<m>d" with one digit, 3 for "0<mm>d" with two digits (first digit of the length non-zero in both
+   cases), else 0 */
+static int errtxtf_dpad(const char *fmt) {
+    /* Must be a single leading zero followed by a non-zero digit */
+    if (fmt[0] != '0' || !z_isdigit(fmt[1]) || fmt[1] == '0') {
+        return 0;
+    }
+    if (fmt[2] == 'd') {
+        return 2;
+    }
+    if (z_isdigit(fmt[2]) && fmt[3] == 'd') {
+        return 3;
+    }
+    return 0;
+}
+
+/* Set `symbol->errtxt` to "err_id: msg" with restricted subset of `printf()` formatting, returning `error_number`.
+   If `err_id` is -1, the "err_id: " prefix is omitted. Only the following specifiers are supported: "c", "d", "f",
+   "g" and "s", with no modifiers apart from "<n>$" numbering for l10n ("<n>" 1-9), in which case all specifiers must
+   be numbered, "%s" with length precisions: "%.*s", "%<n+1>$.*<n>$s", "%.<p>s" and "%<n>$.<p>s", and "%d" with
+   zero-padded minimum field lengths: "%0<m>d" or "%<n>$0<m>d" ("<m>" 1-99).
+   Works in three passes: `fmt` is parsed to record each specifier and its argument index, the variadic arguments
+   are then fetched in argument order, and finally `fmt` is walked again to build the message. Output that does
+   not fit is truncated (asserting unless the ZINT_DEBUG_TEST debug flag is set). If `fmt` itself is unsupported,
+   an "Internal error" message is set instead and ZINT_ERROR_ENCODING_PROBLEM returned (again after asserting
+   unless ZINT_DEBUG_TEST is set) */
+INTERNAL int errtxtf(const int error_number, struct zint_symbol *symbol, const int err_id, const char *fmt, ...) {
+    const int max_len = (int) sizeof(symbol->errtxt) - 1;
+    int p = errtxt_id_str(symbol->errtxt, err_id); /* Write position in `symbol->errtxt`, after any id prefix */
+    const char *f;
+    int i;
+    int arg_cnt = 0;
+    int have_num_arg = 0, have_unnum_arg = 0;
+    va_list ap;
+    int idxs[9] = {0}; /* Argument order */
+    char specs[9] = {0}; /* Format specifiers */
+    const char *ss[9] = { NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL, NULL }; /* "%s" */
+    int slens[9] = {0}; /* "%s" length precisions */
+    int have_slens[9] = {0}; /* Bools for if "%s" has length precision */
+    char dpads[9][3] = {{0}}; /* 2-digit minimum field length */
+    char dfgs[9][100] = {{0}}; /* "%d", "%f" and "%g", allowing for padding up to 99 */
+    int cs[9] = {0}; /* "%c" */
+
+    /* Get argument order and specifiers */
+    for (f = fmt, i = 0; *f; f++) {
+        if (*f == '%') {
+            int inc, arg, len;
+            if (*++f == '%') { /* "%%" is a literal percent, not a specifier */
+                continue;
+            }
+            if ((inc = errtxtf_num_arg(f, &arg))) {
+                if (arg == -1) { /* Digit not followed by '$' */
+                    if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+                    return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0,
+                                    "Internal error: invalid numbered format specifer");
+                }
+                if (i >= 9) {
+                    if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+                    return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0,
+                                    "Internal error: too many format specifiers (9 maximum)");
+                }
+                f += inc;
+                have_num_arg = 1;
+                idxs[i] = arg;
+            } else {
+                if (i >= 9) {
+                    if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+                    return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0,
+                                    "Internal error: too many format specifiers (9 maximum)");
+                }
+                have_unnum_arg = 1;
+                idxs[i] = i; /* Unnumbered: argument order is order of appearance */
+            }
+            if ((inc = errtxtf_slen(f, arg, &arg_cnt, &len))) {
+                if (len == -1) {
+                    if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+                    return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0, "Internal error: invalid length precision");
+                }
+                slens[idxs[i]] = len == 0 ? -1 : len; /* TODO: keep `slens` separate else last mentioned trumps */
+                have_slens[idxs[i]] = 1;
+                f += inc;
+            }
+            if ((inc = errtxtf_dpad(f))) {
+                memcpy(dpads[idxs[i]], f + 1, inc - 1); /* TODO: keep `dpads` separate else last mentioned trumps */
+                dpads[idxs[i]][inc - 1] = '\0';
+                f += inc;
+            }
+            if (*f != 'c' && *f != 'd' && *f != 'f' && *f != 'g' && *f != 's') {
+                if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+                return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0,
+                                "Internal error: unknown format specifier ('%c','%d','%f','%g','%s' only)");
+            }
+            specs[idxs[i++]] = *f;
+            arg_cnt++;
+        }
+    }
+    if (have_num_arg && have_unnum_arg) {
+        if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0);
+        return errtxt(ZINT_ERROR_ENCODING_PROBLEM, symbol, 0,
+                        "Internal error: mixed numbered and unnumbered format specifiers");
+    }
+
+    /* Get arguments */
+    va_start(ap, fmt);
+    for (i = 0; i < arg_cnt; i++) {
+        if (specs[i] == 'c') {
+            cs[i] = va_arg(ap, int);
+        } else if (specs[i] == 'd') {
+            if (dpads[i][0]) {
+                char dpad_fmt[30]; /* Make 30 to suppress gcc 14 "-Wformat-overflow=" false positive */
+                sprintf(dpad_fmt, "%%0%sd", dpads[i]); /* TODO: keep `dpads` separate else last mentioned trumps */
+                sprintf(dfgs[i], dpad_fmt, va_arg(ap, int));
+            } else {
+                sprintf(dfgs[i], "%d", va_arg(ap, int));
+            }
+        } else if (specs[i] == 'f' || specs[i] == 'g') {
+            sprintf(dfgs[i], specs[i] == 'f' ? "%f" : "%g", va_arg(ap, double));
+        } else if (specs[i] == 's') {
+            if (have_slens[i] && slens[i] == -1) { /* "*" precision: length argument precedes the string */
+                slens[i] = va_arg(ap, int); /* TODO: keep `slens` separate else last mentioned trumps */
+            }
+            ss[i] = va_arg(ap, char *);
+        }
+    }
+    va_end(ap);
+
+    /* Populate `errtxt` */
+    for (f = fmt, i = 0; *f && p < max_len; f++) {
+        if (*f == '%') {
+            int idx;
+            if (*++f == '%') {
+                symbol->errtxt[p++] = '%';
+                continue;
+            }
+            f += errtxtf_num_arg(f, NULL /*p_arg*/); /* Skip over what the first pass already parsed */
+            f += errtxtf_slen(f, -1 /*arg*/, NULL /*arg_cnt*/, NULL /*p_len*/);
+            f += errtxtf_dpad(f);
+            idx = idxs[i];
+            if (specs[idx] == 'c') {
+                symbol->errtxt[p++] = cs[idx];
+            } else {
+                int len;
+                if (specs[idx] == 's') {
+                    if (have_slens[idx]) {
+                        const char *si = ss[idx];
+                        for (len = 0; len < slens[idx] && si[len]; len++); /* Precision, or less if NUL first */
+                    } else {
+                        len = (int) strlen(ss[idx]);
+                    }
+                } else {
+                    len = (int) strlen(dfgs[idx]);
+                }
+                if (len) {
+                    if (p + len > max_len) {
+                        if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0); /* Catch truncations */
+                        len = max_len - p;
+                    }
+                    memcpy(symbol->errtxt + p, specs[idx] == 's' ? ss[idx] : dfgs[idx], len);
+                    p += len;
+                }
+            }
+            i++;
+        } else {
+            symbol->errtxt[p++] = *f;
+        }
+    }
+    if (*f) { /* Loop stopped on `max_len` with format left over */
+        if (!(symbol->debug & ZINT_DEBUG_TEST)) assert(0); /* Catch truncations */
+    }
+
+    symbol->errtxt[p] = '\0';
+
+    return error_number;
+}
+
+/* Helper to prepend/append to existing `symbol->errtxt` by calling `errtxtf(fmt)` with 2 arguments (copy of `errtxt`
+   & `msg`) if `msg` not NULL, or 1 argument (just copy of `errtxt`) if `msg` NULL, returning `error_number`.
+   The copy is needed because `errtxtf()` writes its output into `symbol->errtxt` itself. No "err_id: " prefix is
+   added (`err_id` passed as -1) and the return value of `errtxtf()` is ignored */
+INTERNAL int errtxt_adj(const int error_number, struct zint_symbol *symbol, const char *fmt, const char *msg) {
+    char err_buf[sizeof(symbol->errtxt)];
+
+    err_buf[0] = '\0'; /* `strncat()` below needs a terminated destination */
+
+/* Suppress gcc 14 warning output may be truncated */
+#if defined(__GNUC__) && !defined(__clang__) && __GNUC__ >= 14
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wstringop-truncation"
+#endif
+
+    strncat(err_buf, symbol->errtxt, sizeof(symbol->errtxt) - 1); /* Always NUL-terminates `err_buf` */
+
+#if defined(__GNUC__) && !defined(__clang__) && __GNUC__ >= 14
+#pragma GCC diagnostic pop
+#endif
+
+    if (msg) {
+        errtxtf(0, symbol, -1, fmt, err_buf, msg);
+    } else {
+        errtxtf(0, symbol, -1, fmt, err_buf);
+    }
+
+    return error_number;
+}
+
+/* Returns 1 if `symbology` can have row binding (i.e. is stackable), else 0 */
+INTERNAL int is_stackable(const int symbology) {
+    int stackable = 0;
+
+    if (symbology < BARCODE_PHARMA_TWO) {
+        /* Everything below PHARMA_TWO qualifies except POSTNET */
+        stackable = symbology != BARCODE_POSTNET;
+    } else {
+        switch (symbology) {
+            case BARCODE_CODE128AB:
+            case BARCODE_ISBNX:
+            case BARCODE_EAN14:
+            case BARCODE_NVE18:
+            case BARCODE_KOREAPOST:
+            case BARCODE_PLESSEY:
+            case BARCODE_TELEPEN_NUM:
+            case BARCODE_ITF14:
+            case BARCODE_CODE32:
+            case BARCODE_CODABLOCKF:
+            case BARCODE_HIBC_BLOCKF:
+                stackable = 1;
+                break;
+            default:
+                break;
+        }
+    }
+
+    return stackable;
+}
+
+/* Returns 1 if `symbology` is one of the EAN/UPC family (including ISBNX and the EAN/UPC composites), else 0 */
+INTERNAL int is_upcean(const int symbology) {
+    int upcean = 0;
+
+    switch (symbology) {
+        case BARCODE_EANX:
+        case BARCODE_EANX_CHK:
+        case BARCODE_UPCA:
+        case BARCODE_UPCA_CHK:
+        case BARCODE_UPCE:
+        case BARCODE_UPCE_CHK:
+        case BARCODE_ISBNX:
+        case BARCODE_EANX_CC:
+        case BARCODE_UPCA_CC:
+        case BARCODE_UPCE_CC:
+            upcean = 1;
+            break;
+        default:
+            break;
+    }
+
+    return upcean;
+}
+
+/* Returns 1 if `symbology` can have composite 2D component data, i.e. lies in the range BARCODE_EANX_CC to
+   BARCODE_DBAR_EXPSTK_CC inclusive, else 0 */
+INTERNAL int is_composite(const int symbology) {
+    if (symbology < BARCODE_EANX_CC) {
+        return 0;
+    }
+    return symbology <= BARCODE_DBAR_EXPSTK_CC;
+}
+
+/* Returns 1 if `symbology` is a matrix design that can be rendered as dots, else 0 */
+INTERNAL int is_dotty(const int symbology) {
+    int dotty = 0;
+
+    switch (symbology) {
+        /* Note MAXICODE and ULTRA absent */
+        case BARCODE_QRCODE:
+        case BARCODE_DATAMATRIX:
+        case BARCODE_MICROQR:
+        case BARCODE_HIBC_DM:
+        case BARCODE_AZTEC:
+        case BARCODE_HIBC_QR:
+        case BARCODE_HIBC_AZTEC:
+        case BARCODE_AZRUNE:
+        case BARCODE_CODEONE:
+        case BARCODE_GRIDMATRIX:
+        case BARCODE_HANXIN:
+        case BARCODE_MAILMARK_2D:
+        case BARCODE_DOTCODE:
+        case BARCODE_UPNQR:
+        case BARCODE_RMQR:
+            dotty = 1;
+            break;
+        default:
+            break;
+    }
+
+    return dotty;
+}
+
+/* Returns 1 if `symbology` has a fixed aspect ratio (matrix design), else 0: that is every symbology
+   `is_dotty()` accepts, plus MAXICODE and ULTRA */
+INTERNAL int is_fixed_ratio(const int symbology) {
+    return is_dotty(symbology) || symbology == BARCODE_MAXICODE || symbology == BARCODE_ULTRA;
+}
+
+/* Returns 1 if `source` has at least two characters left at `position` and both are digits, else 0 */
+INTERNAL int is_twodigits(const unsigned char source[], const int length, const int position) {
+    if (position + 1 >= length) {
+        return 0; /* Fewer than two characters remain */
+    }
+    return z_isdigit(source[position]) && z_isdigit(source[position + 1]);
+}
+
+/* Counts the consecutive digits in `source` starting at `position`, looking at no more than `max` characters
+   (or as far as `length` if `max` is -1 or would run past the end) */
+INTERNAL int cnt_digits(const unsigned char source[], const int length, const int position, const int max) {
+    int stop = length;
+    int idx = position;
+
+    if (max != -1 && position + max <= length) {
+        stop = position + max;
+    }
+    while (idx < stop && z_isdigit(source[idx])) {
+        idx++;
+    }
+
+    return idx - position;
+}
+
+/* State machine to decode UTF-8 to Unicode codepoints (state 0 means done, state 12 means error).
+   Feeds one `byte` to the decoder, updating `*state` and `*codep` in place and returning the new `*state`.
+   `*state` should be 0 before the first byte of a sequence; while it is non-zero, the low 6 bits of each `byte`
+   are appended to `*codep` */
+INTERNAL unsigned int decode_utf8(unsigned int *state, unsigned int *codep, const unsigned char byte) {
+    /*
+        Copyright (c) 2008-2009 Bjoern Hoehrmann <bjoern@hoehrmann.de>
+
+        Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated
+        documentation files (the "Software"), to deal in the Software without restriction, including without
+        limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the
+        Software, and to permit persons to whom the Software is furnished to do so, subject to the following
+        conditions:
+
+        The above copyright notice and this permission notice shall be included in all copies or substantial portions
+        of the Software.
+
+        See https://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.
+     */
+
+    static const unsigned char utf8d[] = {
+        /* The first part of the table maps bytes to character classes that
+         * reduce the size of the transition table and create bitmasks. */
+         0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
+         0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
+         0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
+         0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,  0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,
+         1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,  9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,
+         7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,  7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,
+         8,8,2,2,2,2,2,2,2,2,2,2,2,2,2,2,  2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,
+        10,3,3,3,3,3,3,3,3,3,3,3,3,4,3,3, 11,6,6,6,5,8,8,8,8,8,8,8,8,8,8,8,
+
+        /* The second part is a transition table that maps a combination
+         * of a state of the automaton and a character class to a state. */
+         0,12,24,36,60,96,84,12,12,12,48,72, 12,12,12,12,12,12,12,12,12,12,12,12,
+        12, 0,12,12,12,12,12, 0,12, 0,12,12, 12,24,12,12,12,12,12,24,12,24,12,12,
+        12,12,12,12,12,12,12,24,12,12,12,12, 12,24,12,12,12,12,12,12,12,24,12,12,
+        12,12,12,12,12,12,12,36,12,36,12,12, 12,36,12,12,12,12,12,36,12,36,12,12,
+        12,36,12,12,12,12,12,12,12,12,12,12,
+    };
+
+    const unsigned int type = utf8d[byte]; /* Character class of `byte`, from first 256 entries */
+
+    *codep = *state != 0 ? (byte & 0x3fu) | (*codep << 6) : (0xff >> type) & byte; /* Continue, or start afresh */
+
+    *state = utf8d[256 + *state + type]; /* Transition table follows the 256 class entries */
+
+    return *state;
+}
+
+/* Returns 1 if the first `length` bytes of `source` decode as complete, valid UTF-8, else 0 */
+INTERNAL int is_valid_utf8(const unsigned char source[], const int length) {
+    unsigned int state = 0;
+    unsigned int codepoint;
+    int idx = 0;
+
+    while (idx < length) {
+        if (decode_utf8(&state, &codepoint, source[idx++]) == 12) { /* Error state */
+            return 0;
+        }
+    }
+
+    /* Non-zero here means the data ended part-way through a sequence */
+    return state == 0;
+}
+
+/* Converts UTF-8 to Unicode. If `disallow_4byte` unset, allows all values (UTF-32). If `disallow_4byte` set,
+ * only allows codepoints <= U+FFFF (ie four-byte sequences not allowed) (UTF-16, no surrogates).
+ * On entry `*length` is the number of bytes in `source`; on success it is replaced by the number of codepoints
+ * stored in `vals` and 0 is returned. At most one value is stored per input byte, so `vals` with room for the
+ * incoming `*length` entries suffices. On failure `symbol->errtxt` is set, ZINT_ERROR_INVALID_DATA is returned
+ * and `*length` is left unchanged */
+INTERNAL int utf8_to_unicode(struct zint_symbol *symbol, const unsigned char source[], unsigned int vals[],
+                int *length, const int disallow_4byte) {
+    int bpos = 0; /* Read position in `source` */
+    int jpos = 0; /* Write position in `vals` */
+    unsigned int codepoint, state = 0;
+
+    while (bpos < *length) {
+        /* Consume bytes until a codepoint completes (state 0), an error occurs (state 12) or data runs out */
+        do {
+            decode_utf8(&state, &codepoint, source[bpos++]);
+        } while (bpos < *length && state != 0 && state != 12);
+
+        if (state != 0) {
+            /* Use the bounded `errtxt()` helper rather than a raw `strcpy()`; resulting text is the same */
+            return errtxt(ZINT_ERROR_INVALID_DATA, symbol, 240, "Corrupt Unicode data");
+        }
+        if (disallow_4byte && codepoint > 0xffff) {
+            return errtxt(ZINT_ERROR_INVALID_DATA, symbol, 242,
+                            "Unicode sequences of more than 3 bytes not supported");
+        }
+
+        vals[jpos] = codepoint;
+        jpos++;
+    }
+
+    *length = jpos;
+
+    return 0;
+}
+
+/* Copies `source`, taken to be ISO/IEC 8859-1, into `symbol->text` as UTF-8. Control characters (including DEL)
+   and the bytes 0x80-0x9F, which are not valid ISO/IEC 8859-1, become spaces. If the text does not fit, it is
+   cut short, `symbol->errtxt` is set and ZINT_WARN_HRT_TRUNCATED returned; otherwise returns 0 */
+INTERNAL int hrt_cpy_iso8859_1(struct zint_symbol *symbol, const unsigned char source[], const int length) {
+    const int text_size = (int) sizeof(symbol->text);
+    int warn_number = 0;
+    int i, j;
+
+    for (i = 0, j = 0; i < length && j < text_size; i++) {
+        const unsigned char ch = source[i];
+
+        if (ch < 0x20 || ch == 0x7F || (ch >= 0x80 && ch < 0xA0)) {
+            symbol->text[j++] = ' ';
+        } else if (ch < 0x80) {
+            symbol->text[j++] = ch;
+        } else {
+            /* 0xA0-0xFF need two UTF-8 bytes, and room must remain for the terminating NUL */
+            if (j + 2 >= text_size) {
+                warn_number = ZINT_WARN_HRT_TRUNCATED;
+                break;
+            }
+            symbol->text[j++] = ch < 0xC0 ? 0xC2 : 0xC3;
+            symbol->text[j++] = ch < 0xC0 ? ch : ch - 0x40;
+        }
+    }
+    if (j == text_size) { /* Buffer filled by single bytes: give up the last one for the NUL */
+        warn_number = ZINT_WARN_HRT_TRUNCATED;
+        j--;
+    }
+    symbol->text[j] = '\0';
+
+    if (warn_number) {
+        errtxt(0, symbol, 249, "Human Readable Text truncated");
+    }
+    return warn_number;
+}
+
+/* Sets symbol height, returning a warning if not within minimum and/or maximum if given.
+   `default_height` does not include height of fixed-height rows (i.e. separators/composite data).
+   Rows whose `row_height` is already non-zero are treated as fixed; the remaining (zero) rows share one computed
+   row height, which is never less than 0.5. `min_row_height` and `max_height` are only checked if non-zero.
+   Returns 0, or ZINT_WARN_NONCOMPLIANT if a check fails, in which case `symbol->errtxt` is also set unless
+   `no_errtxt` is set. Note the individual `row_height` entries are not modified here, only `symbol->height` */
+INTERNAL int set_height(struct zint_symbol *symbol, const float min_row_height, const float default_height,
+                const float max_height, const int no_errtxt) {
+    int error_number = 0;
+    float fixed_height = 0.0f; /* Sum of heights of rows that already have one */
+    int zero_count = 0; /* Number of rows without a height */
+    float row_height;
+    int i;
+    const int rows = symbol->rows ? symbol->rows : 1; /* Sometimes called before expand() */
+
+    for (i = 0; i < rows; i++) {
+        if (symbol->row_height[i]) {
+            fixed_height += symbol->row_height[i];
+        } else {
+            zero_count++;
+        }
+    }
+
+    if (zero_count) {
+        if (symbol->height) {
+            if (symbol->input_mode & HEIGHTPERROW_MODE) { /* Given height applies to each row */
+                row_height = stripf(symbol->height);
+            } else { /* Given height is for whole symbol: split what is left between the unset rows */
+                row_height = stripf((symbol->height - fixed_height) / zero_count);
+            }
+        } else if (default_height) {
+            row_height = stripf(default_height / zero_count);
+        } else {
+            row_height = stripf(min_row_height);
+        }
+        if (row_height < 0.5f) { /* Absolute minimum */
+            row_height = 0.5f;
+        }
+        if (min_row_height) {
+            if (stripf(row_height) < stripf(min_row_height)) {
+                error_number = ZINT_WARN_NONCOMPLIANT;
+                if (!no_errtxt) {
+                    errtxt(0, symbol, 247, "Height not compliant with standards");
+                }
+            }
+        }
+        symbol->height = stripf(row_height * zero_count + fixed_height);
+    } else {
+        symbol->height = stripf(fixed_height); /* Ignore any given height */
+    }
+    if (max_height) {
+        if (stripf(symbol->height) > stripf(max_height)) {
+            error_number = ZINT_WARN_NONCOMPLIANT;
+            if (!no_errtxt) {
+                errtxt(0, symbol, 248, "Height not compliant with standards");
+            }
+        }
+    }
+
+    return error_number;
+}
+
+/* Prevent inlining of `stripf()` which can optimize away its effect.
+   `ZINT_NOINLINE` expands to a compiler-specific "noinline" function attribute when one of the compilers
+   tested for below is detected, and to nothing otherwise */
+/* Compilers defining `__GNUC__` with version 3.1 or later */
+#if defined(__GNUC__) && (__GNUC__ >= 4 || (__GNUC__ == 3 && __GNUC_MINOR__ >= 1))
+#define ZINT_NOINLINE __attribute__((__noinline__))
+#elif defined(_MSC_VER) && _MSC_VER >= 1310 /* MSVC 2003 (VC++ 7.1) */
+#define ZINT_NOINLINE __declspec(noinline)
+#else
+/* No attribute selected - macro is empty */
+#define ZINT_NOINLINE
+#endif
+
+/* Strips excess precision from a float by reading the argument back through a pointer to volatile -
+   see https://stackoverflow.com/q/503436 */
+INTERNAL ZINT_NOINLINE float stripf(const float arg) {
+    volatile const float *const stored = &arg;
+
+    return *stored;
+}
+
+/* Sums the lengths of the first `seg_count` segments, using `ustrlen()` of the segment's source for any
+   segment whose length is -1 */
+INTERNAL int segs_length(const struct zint_seg segs[], const int seg_count) {
+    int sum = 0;
+    int n;
+
+    for (n = 0; n < seg_count; n++) {
+        if (segs[n].length == -1) {
+            sum += (int) ustrlen(segs[n].source);
+        } else {
+            sum += segs[n].length;
+        }
+    }
+
+    return sum;
+}
+
+/* Makes a shallow copy of `segs` into `local_segs`, filling in the symbology's default ECI (29 for Grid Matrix,
+   4 for UPNQR, otherwise 3) for any segment with no ECI that follows a segment with a non-default ECI */
+INTERNAL void segs_cpy(const struct zint_symbol *symbol, const struct zint_seg segs[], const int seg_count,
+                struct zint_seg local_segs[]) {
+    int fallback_eci;
+    int n;
+
+    if (symbol->symbology == BARCODE_GRIDMATRIX) {
+        fallback_eci = 29;
+    } else if (symbol->symbology == BARCODE_UPNQR) {
+        fallback_eci = 4;
+    } else {
+        fallback_eci = 3;
+    }
+
+    /* First segment is copied as-is, having no predecessor */
+    local_segs[0] = segs[0];
+
+    for (n = 1; n < seg_count; n++) {
+        struct zint_seg *const cur = &local_segs[n];
+        const struct zint_seg *const prev = &local_segs[n - 1];
+
+        *cur = segs[n];
+        /* Ensure default ECI set if follows non-default ECI */
+        if (cur->eci != 0) {
+            continue;
+        }
+        if (prev->eci != 0 && prev->eci != fallback_eci) {
+            cur->eci = fallback_eci;
+        }
+    }
+}
+
+/* Helper for ZINT_DEBUG_PRINT: emits the first `first_len` bytes of `source`, writing any byte below 32 or
+   from 127 upwards as a `\xNN` hex escape and all others unchanged. Output goes to `buf` (NUL-terminated) if
+   non-NULL, else to stdout. Returns `buf`. Note `buf` is not bounds-checked here */
+INTERNAL char *debug_print_escape(const unsigned char *source, const int first_len, char *buf) {
+    int out = 0; /* Write position in `buf` (unused when printing to stdout) */
+    int pos;
+
+    for (pos = 0; pos < first_len; pos++) {
+        const unsigned char byte = source[pos];
+        const int needs_escape = byte < 32 || byte >= 127;
+
+        if (buf) {
+            if (needs_escape) {
+                out += sprintf(buf + out, "\\x%02X", byte & 0xFF);
+            } else {
+                buf[out++] = byte;
+            }
+        } else if (needs_escape) {
+            printf("\\x%02X", byte & 0xFF);
+        } else {
+            fputc(byte, stdout);
+        }
+    }
+
+    if (buf) {
+        buf[out] = '\0';
+    }
+    return buf;
+}
+
+#ifdef ZINT_TEST
+/* Suppress gcc warning null destination pointer [-Wformat-overflow=] false-positive */
+#if defined(__GNUC__) && !defined(__clang__) && __GNUC__ >= 7
+#pragma GCC diagnostic push
+#pragma GCC diagnostic ignored "-Wformat-overflow="
+#endif
+/* Dumps hex-formatted codewords in symbol->errtxt (for use in testing).
+   Each codeword is written as two uppercase hex digits, separated by single spaces. If there are more than 30
+   codewords the text is prefixed with "(length) " and only as many codewords as fit are dumped.
+   If `length` is zero or less, `errtxt` is set to the empty string */
+INTERNAL void debug_test_codeword_dump(struct zint_symbol *symbol, const unsigned char *codewords, const int length) {
+    int i, max = length, cnt_len = 0;
+    assert(sizeof(symbol->errtxt) >= 100);
+    if (length > 30) { /* 30*3 < errtxt 92 (100 - "Warning ") chars */
+        /* Place the number of codewords at the front; sprintf() returns the prefix length */
+        cnt_len = sprintf(symbol->errtxt, "(%d) ", length);
+        max = 30 - (cnt_len + 2) / 3; /* Drop enough codewords to make room for the prefix */
+    }
+    for (i = 0; i < max; i++) {
+        /* Each "%02X " of an unsigned char is exactly 3 chars */
+        sprintf(symbol->errtxt + cnt_len + i * 3, "%02X ", codewords[i]);
+    }
+    if (max > 0) {
+        symbol->errtxt[cnt_len + max * 3 - 1] = '\0'; /* Zap last space */
+    } else {
+        /* Nothing was written: don't index before the start of (or trim stale text in) `errtxt` */
+        symbol->errtxt[0] = '\0';
+    }
+}
+
+/* Dumps decimal-formatted `short` codewords in symbol->errtxt (for use in testing).
+   The text starts with "(length) " followed by space-separated codewords, stopping before the first codeword
+   that would take the text (including its trailing space) past 92 chars */
+INTERNAL void debug_test_codeword_dump_short(struct zint_symbol *symbol, const short *codewords, const int length) {
+    char scratch[20]; /* Only used to measure the next codeword */
+    int used;
+    int idx;
+    assert(sizeof(symbol->errtxt) >= 100);
+
+    used = sprintf(symbol->errtxt, "(%d) ", length); /* Place the number of codewords at the front */
+
+    for (idx = 0; idx < length; idx++) {
+        const int piece_len = sprintf(scratch, "%d ", codewords[idx]);
+        if (used + piece_len > 92) {
+            break;
+        }
+        used += sprintf(symbol->errtxt + used, "%d ", codewords[idx]);
+    }
+
+    symbol->errtxt[used - 1] = '\0'; /* Zap last space */
+}
+
+/* Dumps decimal-formatted `int` codewords in symbol->errtxt (for use in testing).
+   The text starts with "(length) " followed by space-separated codewords, stopping before the first codeword
+   that would take the text (including its trailing space) past 92 chars */
+INTERNAL void debug_test_codeword_dump_int(struct zint_symbol *symbol, const int *codewords, const int length) {
+    char scratch[20]; /* Only used to measure the next codeword */
+    int used;
+    int idx;
+    assert(sizeof(symbol->errtxt) >= 100);
+
+    used = sprintf(symbol->errtxt, "(%d) ", length); /* Place the number of codewords at the front */
+
+    for (idx = 0; idx < length; idx++) {
+        const int piece_len = sprintf(scratch, "%d ", codewords[idx]);
+        if (used + piece_len > 92) {
+            break;
+        }
+        used += sprintf(symbol->errtxt + used, "%d ", codewords[idx]);
+    }
+
+    symbol->errtxt[used - 1] = '\0'; /* Zap last space */
+}
+#if defined(__GNUC__) && !defined(__clang__) && __GNUC__ >= 7
+#pragma GCC diagnostic pop
+#endif
+#endif /* ZINT_TEST */
+
+/* vim: set ts=4 sw=4 et : */
author	Franz Glasner <fzglas.hg@dom66.de>
date	Mon, 15 Sep 2025 11:43:07 +0200
parents
children