diff options
Diffstat (limited to 'source/t/texlive/patches/texlive-20190410-source-upstream_fixes-1.patch')
-rw-r--r-- | source/t/texlive/patches/texlive-20190410-source-upstream_fixes-1.patch | 4096 |
1 files changed, 4096 insertions, 0 deletions
diff --git a/source/t/texlive/patches/texlive-20190410-source-upstream_fixes-1.patch b/source/t/texlive/patches/texlive-20190410-source-upstream_fixes-1.patch new file mode 100644 index 00000000..8e29d492 --- /dev/null +++ b/source/t/texlive/patches/texlive-20190410-source-upstream_fixes-1.patch @@ -0,0 +1,4096 @@ +Submitted By: Ken Moffat <ken at linuxfromscratch dot org> +Date: 2019-05-31 +Initial Package Version: 2019 +Upstream Status: Applied +Origin: Upstream +Description: Fixes from branch2019 up to svn r51236, and fixes +from trunk for harfbuzz-2.5.0 changes (svn r51269, 51271). + +diff -Naur a/texk/dvipdfm-x/ChangeLog b/texk/dvipdfm-x/ChangeLog +--- a/texk/dvipdfm-x/ChangeLog 2019-04-07 02:42:55.000000000 +0100 ++++ b/texk/dvipdfm-x/ChangeLog 2019-05-31 22:00:04.006964029 +0100 +@@ -1,3 +1,47 @@ ++2019-05-08 Akira Kakuto <kakuto@w32tex.org> ++ ++ * dpxfile.c: Avoid buffer overflow. ++ ++2019-05-08 Shunsaku Hirata <shunsaku.hirata74@gmail.com> ++ ++ * spc_pdfm.c: Transformation also applies to annotations ++ created by pdf:ann. ++ ++2019-05-07 Shunsaku Hirata <shunsaku.hirata74@gmail.com> ++ ++ * tt_cmap.c: Fix a bug that CFF charset data were not read. ++ * unicode.c: Fix a bug that end-of-buffer calculation was ++ wrong. ++ ++2019-05-05 Shunsaku Hirata <shunsaku.hirata74@gmail.com> ++ ++ * pdfdoc.c: g option affects only annotations created by ++ "pdf:bann/eann" and html "a link" specials. ++ Report from Joseph Wright: ++ https://tug.org/pipermail/tex-live/2019-May/043612.html ++ ++2019-05-03 Shunsaku Hirata <shunsaku.hirata74@gmail.com> ++ ++ * specials.c: transformation applied to current point was not ++ done properly. ++ ++2019-05-03 Akira Kakuto <kakuto@w32tex.org> ++ ++ * dpxfile.c, mfileio.h, pdfximage.c: Support non-ascii file ++ names in default code page of OS irrespective of values of a ++ variable 'command_line_encoding' (Windows only). ++ ++2019-05-03 Shunsaku Hirata <shunsaku.hirata74@gmail.com> ++ ++ * pdfobj.c, pdfobj.h: Add support for ASCIIHex and ASCII85 ++ decode filter. Support for decoding stream data with multiple ++ filters applied. Remove unused function. ++ * tt_cmap.c, tt_gsub.[ch]: Revise ToUnicode CMap creation for ++ OpenType. Use GSUB for mapping unencoded glyphs to Unicode ++ (XeTeX support), lowering priority of CJK compatibility ++ ideographs. ++ * configure.ac: Version 20190503. ++ + 2019-04-07 Karl Berry <karl@freefriends.org> + + * TeX Live 2019. +diff -Naur a/texk/dvipdfm-x/configure b/texk/dvipdfm-x/configure +--- a/texk/dvipdfm-x/configure 2019-02-24 22:07:11.000000000 +0000 ++++ b/texk/dvipdfm-x/configure 2019-05-31 22:00:04.007964030 +0100 +@@ -1,8 +1,8 @@ + #! /bin/sh + # Guess values for system-dependent variables and create Makefiles. +-# Generated by GNU Autoconf 2.69 for dvipdfm-x (TeX Live) 20190225. ++# Generated by GNU Autoconf 2.69 for dvipdfm-x (TeX Live) 20190503. + # +-# Report bugs to <tex-k@tug.org>. ++# Report bugs to <dvipdfmx@tug.org>. + # + # + # Copyright (C) 1992-1996, 1998-2012 Free Software Foundation, Inc. +@@ -274,7 +274,7 @@ + $as_echo "$0: In particular, zsh $ZSH_VERSION has bugs and should" + $as_echo "$0: be upgraded to zsh 4.3.4 or later." + else +- $as_echo "$0: Please tell bug-autoconf@gnu.org and tex-k@tug.org ++ $as_echo "$0: Please tell bug-autoconf@gnu.org and dvipdfmx@tug.org + $0: about your system, including any error possibly output + $0: before this message. Then install a modern shell, or + $0: manually run the script under such a shell if you do +@@ -590,9 +590,9 @@ + # Identity of this package. + PACKAGE_NAME='dvipdfm-x (TeX Live)' + PACKAGE_TARNAME='dvipdfm-x--tex-live-' +-PACKAGE_VERSION='20190225' +-PACKAGE_STRING='dvipdfm-x (TeX Live) 20190225' +-PACKAGE_BUGREPORT='tex-k@tug.org' ++PACKAGE_VERSION='20190503' ++PACKAGE_STRING='dvipdfm-x (TeX Live) 20190503' ++PACKAGE_BUGREPORT='dvipdfmx@tug.org' + PACKAGE_URL='' + + ac_unique_file="agl.c" +@@ -1350,7 +1350,7 @@ + # Omit some internal or obsolete options to make the list less imposing. + # This message is too long to be a string in the A/UX 3.1 sh. + cat <<_ACEOF +-\`configure' configures dvipdfm-x (TeX Live) 20190225 to adapt to many kinds of systems. ++\`configure' configures dvipdfm-x (TeX Live) 20190503 to adapt to many kinds of systems. + + Usage: $0 [OPTION]... [VAR=VALUE]... + +@@ -1421,7 +1421,7 @@ + + if test -n "$ac_init_help"; then + case $ac_init_help in +- short | recursive ) echo "Configuration of dvipdfm-x (TeX Live) 20190225:";; ++ short | recursive ) echo "Configuration of dvipdfm-x (TeX Live) 20190503:";; + esac + cat <<\_ACEOF + +@@ -1488,7 +1488,7 @@ + Use these variables to override the choices made by `configure' or to help + it to find libraries and programs with nonstandard names/locations. + +-Report bugs to <tex-k@tug.org>. ++Report bugs to <dvipdfmx@tug.org>. + _ACEOF + ac_status=$? + fi +@@ -1551,7 +1551,7 @@ + test -n "$ac_init_help" && exit $ac_status + if $ac_init_version; then + cat <<\_ACEOF +-dvipdfm-x (TeX Live) configure 20190225 ++dvipdfm-x (TeX Live) configure 20190503 + generated by GNU Autoconf 2.69 + + Copyright (C) 2012 Free Software Foundation, Inc. +@@ -1896,9 +1896,9 @@ + $as_echo "$as_me: WARNING: $2: section \"Present But Cannot Be Compiled\"" >&2;} + { $as_echo "$as_me:${as_lineno-$LINENO}: WARNING: $2: proceeding with the compiler's result" >&5 + $as_echo "$as_me: WARNING: $2: proceeding with the compiler's result" >&2;} +-( $as_echo "## ---------------------------- ## +-## Report this to tex-k@tug.org ## +-## ---------------------------- ##" ++( $as_echo "## ------------------------------- ## ++## Report this to dvipdfmx@tug.org ## ++## ------------------------------- ##" + ) | sed "s/^/$as_me: WARNING: /" >&2 + ;; + esac +@@ -2390,7 +2390,7 @@ + This file contains any messages produced by compilers while + running configure, to aid debugging if configure makes a mistake. + +-It was created by dvipdfm-x (TeX Live) $as_me 20190225, which was ++It was created by dvipdfm-x (TeX Live) $as_me 20190503, which was + generated by GNU Autoconf 2.69. Invocation command line was + + $ $0 $@ +@@ -8077,7 +8077,7 @@ + + # Define the identity of the package. + PACKAGE='dvipdfm-x--tex-live-' +- VERSION='20190225' ++ VERSION='20190503' + + + cat >>confdefs.h <<_ACEOF +@@ -14746,7 +14746,7 @@ + Report bugs to <bug-libtool@gnu.org>." + + lt_cl_version="\ +-dvipdfm-x (TeX Live) config.lt 20190225 ++dvipdfm-x (TeX Live) config.lt 20190503 + configured by $0, generated by GNU Autoconf 2.69. + + Copyright (C) 2011 Free Software Foundation, Inc. +@@ -16636,7 +16636,7 @@ + # report actual input values of CONFIG_FILES etc. instead of their + # values after options handling. + ac_log=" +-This file was extended by dvipdfm-x (TeX Live) $as_me 20190225, which was ++This file was extended by dvipdfm-x (TeX Live) $as_me 20190503, which was + generated by GNU Autoconf 2.69. Invocation command line was + + CONFIG_FILES = $CONFIG_FILES +@@ -16700,13 +16700,13 @@ + Configuration commands: + $config_commands + +-Report bugs to <tex-k@tug.org>." ++Report bugs to <dvipdfmx@tug.org>." + + _ACEOF + cat >>$CONFIG_STATUS <<_ACEOF || ac_write_fail=1 + ac_cs_config="`$as_echo "$ac_configure_args" | sed 's/^ //; s/[\\""\`\$]/\\\\&/g'`" + ac_cs_version="\\ +-dvipdfm-x (TeX Live) config.status 20190225 ++dvipdfm-x (TeX Live) config.status 20190503 + configured by $0, generated by GNU Autoconf 2.69, + with options \\"\$ac_cs_config\\" + +diff -Naur a/texk/dvipdfm-x/configure.ac b/texk/dvipdfm-x/configure.ac +--- a/texk/dvipdfm-x/configure.ac 2019-02-24 22:07:11.000000000 +0000 ++++ b/texk/dvipdfm-x/configure.ac 2019-05-31 22:00:04.007964030 +0100 +@@ -7,7 +7,7 @@ + dnl gives unlimited permission to copy and/or distribute it, + dnl with or without modifications, as long as this notice is preserved. + dnl +-AC_INIT([dvipdfm-x (TeX Live)], [20190225], [tex-k@tug.org]) ++AC_INIT([dvipdfm-x (TeX Live)], [20190503], [dvipdfmx@tug.org]) + AC_PREREQ([2.65]) + AC_CONFIG_SRCDIR([agl.c]) + AC_CONFIG_AUX_DIR([../../build-aux]) +diff -Naur a/texk/dvipdfm-x/dpxfile.c b/texk/dvipdfm-x/dpxfile.c +--- a/texk/dvipdfm-x/dpxfile.c 2018-10-07 22:27:40.000000000 +0100 ++++ b/texk/dvipdfm-x/dpxfile.c 2019-05-31 22:00:04.007964030 +0100 +@@ -1,5 +1,5 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. +- Copyright (C) 2007-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2007-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -159,11 +159,17 @@ + static char _tmpbuf[PATH_MAX+1]; + #endif /* MIKTEX */ + ++#if defined(WIN32) ++extern int utf8name_failed; ++#endif /* WIN32 */ ++ ++#define CMDBUFSIZ 1024 + static int exec_spawn (char *cmd) + { + char **cmdv, **qv; + char *p, *pp; +- char buf[1024]; ++ char buf[CMDBUFSIZ]; ++ int charcnt; + int i, ret = -1; + #ifdef WIN32 + wchar_t **cmdvw, **qvw; +@@ -182,11 +188,12 @@ + i++; + p++; + } +- cmdv = xcalloc (i + 2, sizeof (char *)); ++ cmdv = xcalloc (i + 4, sizeof (char *)); + p = cmd; + qv = cmdv; + while (*p) { + pp = buf; ++ charcnt = 0; + if (*p == '"') { + p++; + while (*p != '"') { +@@ -194,6 +201,10 @@ + goto done; + } + *pp++ = *p++; ++ charcnt++; ++ if (charcnt > CMDBUFSIZ - 1) { ++ ERROR("Too long a command line."); ++ } + } + p++; + } else if (*p == '\'') { +@@ -203,6 +214,10 @@ + goto done; + } + *pp++ = *p++; ++ charcnt++; ++ if (charcnt > CMDBUFSIZ - 1) { ++ ERROR("Too long a command line."); ++ } + } + p++; + } else { +@@ -214,10 +229,18 @@ + goto done; + } + *pp++ = *p++; ++ charcnt++; ++ if (charcnt > CMDBUFSIZ - 1) { ++ ERROR("Too long a command line."); ++ } + } + p++; + } else { + *pp++ = *p++; ++ charcnt++; ++ if (charcnt > CMDBUFSIZ - 1) { ++ ERROR("Too long a command line."); ++ } + } + } + } +@@ -235,20 +258,39 @@ + p++; + qv++; + } ++ *qv = NULL; ++ + #ifdef WIN32 + #if defined(MIKTEX) + ret = _spawnvp(_P_WAIT, *cmdv, (const char* const*)cmdv); + #else +- cmdvw = xcalloc (i + 2, sizeof (wchar_t *)); +- qv = cmdv; +- qvw = cmdvw; +- while (*qv) { +- *qvw = get_wstring_from_fsyscp(*qv, *qvw=NULL); +- qv++; +- qvw++; ++ cmdvw = xcalloc (i + 4, sizeof (wchar_t *)); ++ if (utf8name_failed == 0) { ++ qv = cmdv; ++ qvw = cmdvw; ++ while (*qv) { ++ *qvw = get_wstring_from_fsyscp(*qv, *qvw=NULL); ++ qv++; ++ qvw++; ++ } ++ *qvw = NULL; ++ ret = _wspawnvp (_P_WAIT, *cmdvw, (const wchar_t* const*) cmdvw); ++ } else { ++ int tmpcp; ++ tmpcp = file_system_codepage; ++ file_system_codepage = win32_codepage; ++ qv = cmdv; ++ qvw = cmdvw; ++ while (*qv) { ++ *qvw = get_wstring_from_fsyscp(*qv, *qvw=NULL); ++ qv++; ++ qvw++; ++ } ++ *qvw = NULL; ++ file_system_codepage = tmpcp; ++ utf8name_failed = 0; ++ ret = _wspawnvp (_P_WAIT, *cmdvw, (const wchar_t* const*) cmdvw); + } +- *qvw = NULL; +- ret = _wspawnvp (_P_WAIT, *cmdvw, (const wchar_t* const*) cmdvw); + if (cmdvw) { + qvw = cmdvw; + while (*qvw) { +@@ -1242,3 +1284,21 @@ + + return r; + } ++ ++#if defined(WIN32) ++FILE *generic_fsyscp_fopen (const char *filename, const char *mode) ++{ ++ FILE *f; ++ ++ f = fsyscp_fopen (filename, mode); ++ ++ if (f == NULL && file_system_codepage != win32_codepage) { ++ int tmpcp = file_system_codepage; ++ file_system_codepage = win32_codepage; ++ f = fsyscp_fopen (filename, mode); ++ file_system_codepage = tmpcp; ++ } ++ ++ return f; ++} ++#endif /* WIN32 */ +diff -Naur a/texk/dvipdfm-x/dvipdfmx.c b/texk/dvipdfm-x/dvipdfmx.c +--- a/texk/dvipdfm-x/dvipdfmx.c 2019-02-11 18:22:31.000000000 +0000 ++++ b/texk/dvipdfm-x/dvipdfmx.c 2019-05-31 22:00:04.007964030 +0100 +@@ -232,7 +232,7 @@ + printf ("Papersize is specified by paper format (e.g., \"a4\")\n"); + printf ("\tor by w<unit>,h<unit> (e.g., \"20cm,30cm\").\n"); + printf ("\n"); +- printf ("Email bug reports to tex-k@tug.org.\n"); ++ printf ("Email bug reports to dvipdfmx@tug.org.\n"); + } + + static void +diff -Naur a/texk/dvipdfm-x/mfileio.h b/texk/dvipdfm-x/mfileio.h +--- a/texk/dvipdfm-x/mfileio.h 2016-01-11 03:57:04.000000000 +0000 ++++ b/texk/dvipdfm-x/mfileio.h 2019-05-31 22:00:04.008964031 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2002-2016 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2002-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -36,7 +36,8 @@ + mfclose((file),__FUNCTION__,__LINE__) + #else + #if defined(WIN32) +-#define MFOPEN(name,mode) fsyscp_fopen((name),(mode)) ++extern FILE *generic_fsyscp_fopen(const char *fname, const char *mode); ++#define MFOPEN(name,mode) generic_fsyscp_fopen((name),(mode)) + #else + #define MFOPEN(name,mode) fopen((name),(mode)) + #endif +diff -Naur a/texk/dvipdfm-x/pdfdoc.c b/texk/dvipdfm-x/pdfdoc.c +--- a/texk/dvipdfm-x/pdfdoc.c 2018-12-21 03:39:51.000000000 +0000 ++++ b/texk/dvipdfm-x/pdfdoc.c 2019-05-31 22:00:04.008964031 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2008-2018 by Jin-Hwan Cho, Matthias Franz, and Shunsaku Hirata, ++ Copyright (C) 2008-2019 by Jin-Hwan Cho, Matthias Franz, and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -1780,7 +1780,6 @@ + pdf_doc *p = &pdoc; + pdf_page *page; + pdf_obj *rect_array; +- double annot_grow = p->opt.annot_grow; + double xpos, ypos; + pdf_rect annbox; + +@@ -1812,10 +1811,10 @@ + } + + rect_array = pdf_new_array(); +- pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.llx - annot_grow, 0.001))); +- pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.lly - annot_grow, 0.001))); +- pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.urx + annot_grow, 0.001))); +- pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.ury + annot_grow, 0.001))); ++ pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.llx, 0.001))); ++ pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.lly, 0.001))); ++ pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.urx, 0.001))); ++ pdf_add_array(rect_array, pdf_new_number(ROUND(annbox.ury, 0.001))); + pdf_add_dict (annot_dict, pdf_new_name("Rect"), rect_array); + + pdf_add_array(page->annots, pdf_ref_obj(annot_dict)); +@@ -2802,13 +2801,22 @@ + void + pdf_doc_break_annot (void) + { ++ pdf_doc *p = &pdoc; ++ double g = p->opt.annot_grow; ++ + if (breaking_state.dirty) { + pdf_obj *annot_dict; ++ pdf_rect rect; + + /* Copy dict */ + annot_dict = pdf_new_dict(); + pdf_merge_dict(annot_dict, breaking_state.annot_dict); +- pdf_doc_add_annot(pdf_doc_current_page_number(), &(breaking_state.rect), ++ rect = breaking_state.rect; ++ rect.llx -= g; ++ rect.lly -= g; ++ rect.urx += g; ++ rect.ury += g; ++ pdf_doc_add_annot(pdf_doc_current_page_number(), &rect, + annot_dict, !breaking_state.broken); + pdf_release_obj(annot_dict); + +diff -Naur a/texk/dvipdfm-x/pdfobj.c b/texk/dvipdfm-x/pdfobj.c +--- a/texk/dvipdfm-x/pdfobj.c 2018-12-26 23:07:57.000000000 +0000 ++++ b/texk/dvipdfm-x/pdfobj.c 2019-05-31 22:00:04.008964031 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2007-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2007-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -2223,48 +2223,9 @@ + + #if HAVE_ZLIB + #define WBUF_SIZE 4096 +-int +-pdf_add_stream_flate (pdf_obj *dst, const void *data, int len) +-{ +- z_stream z; +- Bytef wbuf[WBUF_SIZE]; +- +- z.zalloc = Z_NULL; z.zfree = Z_NULL; z.opaque = Z_NULL; +- +- z.next_in = (z_const Bytef *) data; z.avail_in = len; +- z.next_out = (Bytef *) wbuf; z.avail_out = WBUF_SIZE; +- +- if (inflateInit(&z) != Z_OK) { +- WARN("inflateInit() failed."); +- return -1; +- } +- +- for (;;) { +- int status; +- status = inflate(&z, Z_NO_FLUSH); +- if (status == Z_STREAM_END) +- break; +- else if (status != Z_OK) { +- WARN("inflate() failed. Broken PDF file?"); +- inflateEnd(&z); +- return -1; +- } +- +- if (z.avail_out == 0) { +- pdf_add_stream(dst, wbuf, WBUF_SIZE); +- z.next_out = wbuf; +- z.avail_out = WBUF_SIZE; +- } +- } +- +- if (WBUF_SIZE - z.avail_out > 0) +- pdf_add_stream(dst, wbuf, WBUF_SIZE - z.avail_out); +- +- return (inflateEnd(&z) == Z_OK ? 0 : -1); +-} + + static int +-get_decode_parms (struct decode_parms *parms, pdf_obj *dict) ++filter_get_DecodeParms_FlateDecode (struct decode_parms *parms, pdf_obj *dict) + { + pdf_obj *tmp; + +@@ -2278,18 +2239,25 @@ + parms->columns = 1; + + tmp = pdf_deref_obj(pdf_lookup_dict(dict, "Predictor")); +- if (tmp) ++ if (tmp) { + parms->predictor = pdf_number_value(tmp); ++ pdf_release_obj(tmp); ++ } + tmp = pdf_deref_obj(pdf_lookup_dict(dict, "Colors")); +- if (tmp) ++ if (tmp) { + parms->colors = pdf_number_value(tmp); ++ pdf_release_obj(tmp); ++ } + tmp = pdf_deref_obj(pdf_lookup_dict(dict, "BitsPerComponent")); +- if (tmp) ++ if (tmp) { + parms->bits_per_component = pdf_number_value(tmp); ++ pdf_release_obj(tmp); ++ } + tmp = pdf_deref_obj(pdf_lookup_dict(dict, "Columns")); +- if (tmp) ++ if (tmp) { + parms->columns = pdf_number_value(tmp); +- ++ pdf_release_obj(tmp); ++ } + if (parms->bits_per_component != 1 && + parms->bits_per_component != 2 && + parms->bits_per_component != 4 && +@@ -2354,17 +2322,19 @@ + * Especially, calling pdf_add_stream() for each 4 bytes append is highly + * inefficient. + */ +-static int +-filter_decoded (pdf_obj *dst, const void *src, int srclen, +- struct decode_parms *parms) ++static pdf_obj * ++filter_stream_decode_Predictor (const void *src, size_t srclen, struct decode_parms *parms) + { ++ pdf_obj *dst; + const unsigned char *p = (const unsigned char *) src; + const unsigned char *endptr = p + srclen; +- unsigned char *prev, *buf; +- int bits_per_pixel = parms->colors * parms->bits_per_component; +- int bytes_per_pixel = (bits_per_pixel + 7) / 8; +- int length = (parms->columns * bits_per_pixel + 7) / 8; +- int i, error = 0; ++ unsigned char *prev, *buf; ++ int bits_per_pixel = parms->colors * parms->bits_per_component; ++ int bytes_per_pixel = (bits_per_pixel + 7) / 8; ++ int length = (parms->columns * bits_per_pixel + 7) / 8; ++ int i, error = 0; ++ ++ dst = pdf_new_stream(0); + + prev = NEW(length, unsigned char); + buf = NEW(length, unsigned char); +@@ -2491,16 +2461,21 @@ + RELEASE(prev); + RELEASE(buf); + +- return error; ++ if (error) { ++ pdf_release_obj(dst); ++ dst = NULL; ++ } ++ ++ return dst; + } + +-static int +-pdf_add_stream_flate_filtered (pdf_obj *dst, const void *data, int len, struct decode_parms *parms) ++static pdf_obj * ++filter_stream_decode_FlateDecode (const void *data, size_t len, struct decode_parms *parms) + { +- pdf_obj *tmp; +- z_stream z; +- Bytef wbuf[WBUF_SIZE]; +- int error; ++ pdf_obj *dst; ++ pdf_obj *tmp; ++ z_stream z; ++ Bytef wbuf[WBUF_SIZE]; + + z.zalloc = Z_NULL; z.zfree = Z_NULL; z.opaque = Z_NULL; + +@@ -2509,7 +2484,7 @@ + + if (inflateInit(&z) != Z_OK) { + WARN("inflateInit() failed."); +- return -1; ++ return NULL; + } + + tmp = pdf_new_stream(0); +@@ -2521,7 +2496,8 @@ + else if (status != Z_OK) { + WARN("inflate() failed. Broken PDF file?"); + inflateEnd(&z); +- return -1; ++ pdf_release_obj(tmp); ++ return NULL; + } + + if (z.avail_out == 0) { +@@ -2534,79 +2510,310 @@ + if (WBUF_SIZE - z.avail_out > 0) + pdf_add_stream(tmp, wbuf, WBUF_SIZE - z.avail_out); + +- error = filter_decoded(dst, pdf_stream_dataptr(tmp), pdf_stream_length(tmp), parms); ++ if (inflateEnd(&z) == Z_OK) { ++ if (parms) { ++ dst = filter_stream_decode_Predictor(pdf_stream_dataptr(tmp), pdf_stream_length(tmp), parms); ++ } else { ++ dst = pdf_link_obj(tmp); ++ } ++ } else { ++ dst = NULL; ++ } + pdf_release_obj(tmp); + +- return ((!error && inflateEnd(&z) == Z_OK) ? 0 : -1); ++ return dst; + } + #endif + +-int +-pdf_concat_stream (pdf_obj *dst, pdf_obj *src) ++static pdf_obj * ++filter_stream_decode_ASCIIHexDecode (const void *data, size_t len) ++{ ++ pdf_obj *dst; ++ int eod, error; ++ const char *p = (const char *) data; ++ const char *endptr = p + len; ++ unsigned char *buf, ch; ++ size_t pos, n; ++ ++ buf = NEW((len+1)/2, unsigned char); ++ skip_white(&p, endptr); ++ ch = 0; n = 0; pos = 0; eod = 0; error = 0; ++ while (p < endptr && !error && !eod) { ++ char c1, val; ++ c1 = p[0]; ++ if (c1 >= 'A' && c1 <= 'F') { ++ val = c1 - 'A' + 10; ++ } else if (c1 >= 'a' && c1 <= 'f') { ++ val = c1 - 'a' + 10; ++ } else if (c1 >= '0' && c1 <= '9') { ++ val = c1 - '0'; ++ } else if (c1 == '>') { ++ val = 0; ++ eod = 1; ++ if ((pos % 2) == 0) ++ break; ++ } else { ++ error = -1; ++ break; ++ } ++ if (pos % 2) { ++ buf[n] = ch + val; ++ n++; ++ ch = 0; ++ } else { ++ ch = val << 4; ++ } ++ pos++; p++; ++ skip_white(&p, endptr); ++ } ++ if (error || !eod) { ++ WARN("Invalid ASCIIHex data seen: %s", error ? "Invalid character" : "No EOD marker"); ++ dst = NULL; ++ } else { ++ dst = pdf_new_stream(0); ++ pdf_add_stream(dst, buf, n); ++ } ++ RELEASE(buf); ++ ++ return dst; ++} ++ ++/* Percent sign is not start of comment here. ++ * We need this for reading Ascii85 encoded data. ++ */ ++#define is_space(c) ((c) == ' ' || (c) == '\t' || (c) == '\f' || \ ++ (c) == '\r' || (c) == '\n' || (c) == '\0') ++static void ++skip_white_a85 (const char **p, const char *endptr) ++{ ++ while (*p < endptr && (is_space(**p))) { ++ (*p)++; ++ } ++} ++ ++static pdf_obj * ++filter_stream_decode_ASCII85Decode (const void *data, size_t len) + { ++ pdf_obj *dst; ++ int eod, error; ++ const char *p = (const char *) data; ++ const char *endptr = p + len; ++ unsigned char *buf; ++ size_t n; ++ ++ buf = NEW(((len+4)/5)*4, unsigned char); ++ skip_white_a85(&p, endptr); ++ n = 0; eod = 0; error = 0; ++ while (p < endptr && !error && !eod) { ++ char q[5] = {'u', 'u', 'u', 'u', 'u'}; ++ int m; ++ char ch; ++ ++ ch = p[0]; ++ p++; ++ skip_white_a85(&p, endptr); ++ if (ch == 'z') { ++ memset(buf+n, 0, 4); ++ n += 4; ++ continue; ++ } else if (ch == '~') { ++ if (p < endptr && p[0] == '>') { ++ eod = 1; ++ p++; ++ } else { ++ error = -1; ++ } ++ break; ++ } ++ q[0] = ch; ++ for (m = 1; m < 5 && p < endptr; m++) { ++ ch = p[0]; ++ p++; ++ skip_white_a85(&p, endptr); ++ if (ch == '~') { ++ if (p < endptr && p[0] == '>') { ++ eod = 1; ++ p++; ++ } else { ++ error = -1; ++ } ++ break; ++ } else if (ch < '!' || ch > 'u') { ++ error = -1; ++ break; ++ } else { ++ q[m] = ch; ++ } ++ } ++ if (!error) { ++ uint32_t val = 0; ++ int i; ++ if (m <= 1) { ++ error = -1; ++ break; ++ } ++ val = 85*85*85*(q[0] - '!') + 85*85*(q[1] - '!') ++ + 85*(q[2] - '!') + (q[3] - '!'); ++ /* Check overflow */ ++ if (val > UINT32_MAX / 85) { ++ error = -1; ++ break; ++ } else { ++ val = 85 * val; ++ if (val > UINT32_MAX - (q[4] - '!')) { ++ error = -1; ++ break; ++ } ++ val += (q[4] - '!'); ++ } ++ if (!error) { ++ for (i = 3; i >= 0; i--) { ++ buf[n + i] = val & 0xff; ++ val /= 256; ++ } ++ n += m - 1; ++ } ++ } ++ } ++ ++ if (error) { ++ WARN("Error in reading ASCII85 data."); ++ dst = NULL; ++ } else if (!eod) { ++ WARN("Error in reading ASCII85 data: No EOD"); ++ dst = NULL; ++ } else { ++ dst = pdf_new_stream(0); ++ pdf_add_stream(dst, buf, n); ++ } ++ RELEASE(buf); ++ ++ return dst; ++} ++ ++static pdf_obj * ++filter_stream_decode (const char *filter_name, pdf_obj *src, pdf_obj *parm) ++{ ++ pdf_obj *dec; + const char *stream_data; +- int stream_length; +- pdf_obj *stream_dict; +- pdf_obj *filter; +- int error = 0; ++ size_t stream_length; + +- if (!PDF_OBJ_STREAMTYPE(dst) || !PDF_OBJ_STREAMTYPE(src)) +- ERROR("Invalid type."); ++ if (!filter_name) ++ return pdf_link_obj(src); + + stream_data = pdf_stream_dataptr(src); +- stream_length = pdf_stream_length (src); +- stream_dict = pdf_stream_dict (src); ++ stream_length = pdf_stream_length(src); + +- filter = pdf_lookup_dict(stream_dict, "Filter"); +- if (!filter) +- pdf_add_stream(dst, stream_data, stream_length); ++ if (!strcmp(filter_name, "ASCIIHexDecode")) { ++ dec = filter_stream_decode_ASCIIHexDecode(stream_data, stream_length); ++ } else if (!strcmp(filter_name, "ASCII85Decode")) { ++ dec = filter_stream_decode_ASCII85Decode(stream_data, stream_length); + #if HAVE_ZLIB +- else { +- struct decode_parms parms; +- int have_parms = 0; ++ } else if (!strcmp(filter_name, "FlateDecode")) { ++ struct decode_parms decode_parm; ++ if (parm) ++ filter_get_DecodeParms_FlateDecode(&decode_parm, parm); ++ dec = filter_stream_decode_FlateDecode(stream_data, stream_length, parm ? &decode_parm : NULL); ++#endif /* HAVE_ZLIB */ ++ } else { ++ WARN("DecodeFilter \"%s\" not supported.", filter_name); ++ dec = NULL; ++ } + +- if (pdf_lookup_dict(stream_dict, "DecodeParms")) { +- pdf_obj *tmp; ++ return dec; ++} + +- /* Dictionary or array */ +- tmp = pdf_deref_obj(pdf_lookup_dict(stream_dict, "DecodeParms")); +- if (PDF_OBJ_ARRAYTYPE(tmp)) { +- if (pdf_array_length(tmp) > 1) { +- WARN("Unexpected size for DecodeParms array."); +- return -1; +- } +- tmp = pdf_deref_obj(pdf_get_array(tmp, 0)); +- } +- if (!PDF_OBJ_DICTTYPE(tmp)) { +- WARN("PDF dict expected for DecodeParms..."); +- return -1; +- } +- error = get_decode_parms(&parms, tmp); +- if (error) +- ERROR("Invalid value(s) in DecodeParms dictionary."); +- have_parms = 1; +- } +- if (PDF_OBJ_ARRAYTYPE(filter)) { +- if (pdf_array_length(filter) > 1) { +- WARN("Multiple DecodeFilter not supported."); ++int ++pdf_concat_stream (pdf_obj *dst, pdf_obj *src) ++{ ++ pdf_obj *filtered; ++ pdf_obj *stream_dict; ++ pdf_obj *filter, *parms; ++ int error = 0; ++ ++ if (!PDF_OBJ_STREAMTYPE(dst) || !PDF_OBJ_STREAMTYPE(src)) { ++ WARN("Passed invalid type in pdf_concat_stream()."); ++ return -1; ++ } ++ ++ stream_dict = pdf_stream_dict(src); ++ ++ filter = pdf_lookup_dict(stream_dict, "Filter"); ++ if (!filter) { ++ pdf_add_stream(dst, pdf_stream_dataptr(src), pdf_stream_length(src)); ++ return 0; ++ } ++ if (pdf_lookup_dict(stream_dict, "DecodeParms")) { ++ /* Dictionary or array */ ++ parms = pdf_deref_obj(pdf_lookup_dict(stream_dict, "DecodeParms")); ++ if (!parms) { ++ WARN("Failed to deref DeocdeParms..."); ++ return -1; ++ } else if (!PDF_OBJ_ARRAYTYPE(parms) && !PDF_OBJ_DICTTYPE(parms)) { ++ WARN("PDF dict or array expected for DecodeParms..."); ++ pdf_release_obj(parms); ++ return -1; ++ } ++ } else { ++ parms = NULL; ++ } ++ if (PDF_OBJ_ARRAYTYPE(filter)) { ++ int i, num; ++ pdf_obj *prev = NULL; ++ ++ num = pdf_array_length(filter); ++ if (parms) { ++ if (!PDF_OBJ_ARRAYTYPE(parms) || pdf_array_length(parms) != num) { ++ WARN("Invalid DecodeParam object found."); ++ pdf_release_obj(parms); + return -1; + } +- filter = pdf_get_array(filter, 0); + } +- if (PDF_OBJ_NAMETYPE(filter)) { +- char *filter_name = pdf_name_value(filter); +- if (filter_name && !strcmp(filter_name, "FlateDecode")) { +- if (have_parms) +- error = pdf_add_stream_flate_filtered(dst, stream_data, stream_length, &parms); +- else +- error = pdf_add_stream_flate(dst, stream_data, stream_length); +- } else { +- WARN("DecodeFilter \"%s\" not supported.", filter_name); +- error = -1; ++ if (num == 0) { ++ filtered = pdf_link_obj(src); ++ } else { ++ filtered = NULL; ++ prev = pdf_link_obj(src); ++ for (i = 0; i < num && prev != NULL; i++) { ++ pdf_obj *tmp1, *tmp2; ++ ++ tmp1 = pdf_deref_obj(pdf_get_array(filter, i)); ++ if (parms) { ++ tmp2 = pdf_deref_obj(pdf_get_array(parms, i)); ++ } else { ++ tmp2 = NULL; ++ } ++ if (PDF_OBJ_NAMETYPE(tmp1)) { ++ filtered = filter_stream_decode(pdf_name_value(tmp1), prev, tmp2); ++ } else if (PDF_OBJ_NULLTYPE(tmp1)) { ++ filtered = pdf_link_obj(prev); ++ } else { ++ WARN("Unexpected object found for /Filter..."); ++ filtered = NULL; ++ } ++ if (prev) ++ pdf_release_obj(prev); ++ if (tmp1) ++ pdf_release_obj(tmp1); ++ if (tmp2) ++ pdf_release_obj(tmp2); ++ prev = filtered; + } +- } else +- ERROR("Broken PDF file?"); +-#endif /* HAVE_ZLIB */ ++ } ++ } else if (PDF_OBJ_NAMETYPE(filter)) { ++ filtered = filter_stream_decode(pdf_name_value(filter), src, parms); ++ } else { ++ WARN("Invalid value for /Filter found."); ++ filtered = NULL; ++ } ++ if (parms) ++ pdf_release_obj(parms); ++ if (filtered) { ++ pdf_add_stream(dst, pdf_stream_dataptr(filtered), pdf_stream_length(filtered)); ++ pdf_release_obj(filtered); ++ error = 0; ++ } else { ++ error = -1; + } + + return error; +diff -Naur a/texk/dvipdfm-x/pdfobj.h b/texk/dvipdfm-x/pdfobj.h +--- a/texk/dvipdfm-x/pdfobj.h 2018-09-15 22:18:43.000000000 +0100 ++++ b/texk/dvipdfm-x/pdfobj.h 2019-05-31 22:00:04.008964031 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2007-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2007-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -152,11 +152,6 @@ + extern void pdf_add_stream (pdf_obj *stream, + const void *stream_data_ptr, + int stream_data_len); +-#if HAVE_ZLIB +-extern int pdf_add_stream_flate (pdf_obj *stream, +- const void *stream_data_ptr, +- int stream_data_len); +-#endif + extern int pdf_concat_stream (pdf_obj *dst, pdf_obj *src); + extern pdf_obj *pdf_stream_dict (pdf_obj *stream); + extern int pdf_stream_length (pdf_obj *stream); +diff -Naur a/texk/dvipdfm-x/pdfximage.c b/texk/dvipdfm-x/pdfximage.c +--- a/texk/dvipdfm-x/pdfximage.c 2018-09-14 04:34:50.000000000 +0100 ++++ b/texk/dvipdfm-x/pdfximage.c 2019-05-31 22:00:04.008964031 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2007-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2007-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -363,6 +363,10 @@ + #define dpx_fopen(n,m) (MFOPEN((n),(m))) + #define dpx_fclose(f) (MFCLOSE((f))) + ++#if defined(WIN32) ++int utf8name_failed = 0; ++#endif /* WIN32 */ ++ + int + pdf_ximage_findresource (const char *ident, load_options options) + { +@@ -394,8 +398,23 @@ + strcpy(fullname, f); + } else { + /* try loading image */ ++#if defined(WIN32) ++ utf8name_failed = 0; ++#endif /* WIN32 */ + fullname = dpx_find_file(ident, "_pic_", ""); ++#if defined(WIN32) ++ if (!fullname && file_system_codepage != win32_codepage) { ++ int tmpcp = file_system_codepage; ++ utf8name_failed = 1; ++ file_system_codepage = win32_codepage; ++ fullname = dpx_find_file(ident, "_pic_", ""); ++ file_system_codepage = tmpcp; ++ } ++#endif /* WIN32 */ + if (!fullname) { ++#if defined(WIN32) ++ utf8name_failed = 0; ++#endif /* WIN32 */ + WARN("Error locating image file \"%s\"", ident); + return -1; + } +diff -Naur a/texk/dvipdfm-x/README b/texk/dvipdfm-x/README +--- a/texk/dvipdfm-x/README 2015-07-06 17:13:08.000000000 +0100 ++++ b/texk/dvipdfm-x/README 2019-05-31 22:00:04.006964029 +0100 +@@ -1,9 +1,17 @@ + dvipdfmx and xdvipdfmx for TeX Live + =================================== + ++This package is released under the GNU GPL, version 2, or (at your ++option) any later version. ++ ++dvipdfmx is now maintained as part of TeX Live. ++ ++Mailing list for bug reports and all discussion: ++https://lists.tug.org/dvipdfmx; anyone can join the list, but it is not ++necessary to join to post. Archives are public. ++ + xdvipdfmx + ========= +- + xdvipdfmx is an extended version of dvipdfmx, and is now incorporated in + the same sources. + +@@ -15,8 +23,6 @@ + redistributed under the terms of the GNU General Public License, + version 2 or (at your option) any later version. + +-There is a hope to merge xdvipdfmx into dvipdfmx. +- + Jonathan Kew mentions that in the past, XeTeX used a Mac-specific + program xdv2pdf as the backend instead of xdvipdfmx. xdv2pdf supported + a couple of special effects that are not yet available through +@@ -26,18 +32,8 @@ + if anyone is looking for some nontrivial but not-impossible job and + happens across this file. + +-The dvipdfmx Project +-==================== +- +-Copyright (C) 2002-2014 by Jin-Hwan Cho, Shunsaku Hirata, +-Matthias Franz, and the dvipdfmx project team. This package is released +-under the GNU GPL, version 2, or (at your option) any later version. +- +-dvipdfmx is now maintained as part of TeX Live. +- + Contents + -------- +- + 1. Introduction + + 2. Installation +diff -Naur a/texk/dvipdfm-x/spc_pdfm.c b/texk/dvipdfm-x/spc_pdfm.c +--- a/texk/dvipdfm-x/spc_pdfm.c 2019-03-30 03:42:07.000000000 +0000 ++++ b/texk/dvipdfm-x/spc_pdfm.c 2019-05-31 22:00:04.008964031 +0100 +@@ -597,6 +597,7 @@ + return dict; + } + ++#define SPC_PDFM_SUPPORT_ANNOT_TRANS 1 + static int + spc_handler_pdfm_annot (struct spc_env *spe, struct spc_arg *args) + { +@@ -604,7 +605,6 @@ + pdf_obj *annot_dict; + pdf_rect rect; + char *ident = NULL; +- pdf_coord cp; + transform_info ti; + + skip_white(&args->curptr, args->endptr); +@@ -642,19 +642,96 @@ + return -1; + } + +- cp.x = spe->x_user; cp.y = spe->y_user; +- pdf_dev_transform(&cp, NULL); +- if (ti.flags & INFO_HAS_USER_BBOX) { +- rect.llx = ti.bbox.llx + cp.x; +- rect.lly = ti.bbox.lly + cp.y; +- rect.urx = ti.bbox.urx + cp.x; +- rect.ury = ti.bbox.ury + cp.y; +- } else { +- rect.llx = cp.x; +- rect.lly = cp.y - spe->mag * ti.depth; +- rect.urx = cp.x + spe->mag * ti.width; +- rect.ury = cp.y + spe->mag * ti.height; ++#ifdef SPC_PDFM_SUPPORT_ANNOT_TRANS ++ { ++ pdf_coord cp1, cp2, cp3, cp4; ++ /* QuadPoints not working? */ ++#ifdef USE_QUADPOINTS ++ pdf_obj *qpoints; ++#endif ++ if (ti.flags & INFO_HAS_USER_BBOX) { ++ cp1.x = spe->x_user + ti.bbox.llx; ++ cp1.y = spe->y_user + ti.bbox.lly; ++ cp2.x = spe->x_user + ti.bbox.urx; ++ cp2.y = spe->y_user + ti.bbox.lly; ++ cp3.x = spe->x_user + ti.bbox.urx; ++ cp3.y = spe->y_user + ti.bbox.ury; ++ cp4.x = spe->x_user + ti.bbox.llx; ++ cp4.y = spe->y_user + ti.bbox.ury; ++ } else { ++ cp1.x = spe->x_user; ++ cp1.y = spe->y_user - spe->mag * ti.depth; ++ cp2.x = spe->x_user + spe->mag * ti.width; ++ cp2.y = spe->y_user - spe->mag * ti.depth; ++ cp3.x = spe->x_user + spe->mag * ti.width; ++ cp3.y = spe->y_user + spe->mag * ti.height; ++ cp4.x = spe->x_user; ++ cp4.y = spe->y_user + spe->mag * ti.height; ++ } ++ pdf_dev_transform(&cp1, NULL); ++ pdf_dev_transform(&cp2, NULL); ++ pdf_dev_transform(&cp3, NULL); ++ pdf_dev_transform(&cp4, NULL); ++ rect.llx = cp1.x; ++ if (cp2.x < rect.llx) ++ rect.llx = cp2.x; ++ if (cp3.x < rect.llx) ++ rect.llx = cp3.x; ++ if (cp4.x < rect.llx) ++ rect.llx = cp4.x; ++ rect.urx = cp1.x; ++ if (cp2.x > rect.urx) ++ rect.urx = cp2.x; ++ if (cp3.x > rect.urx) ++ rect.urx = cp3.x; ++ if (cp4.x > rect.urx) ++ rect.urx = cp4.x; ++ rect.lly = cp1.y; ++ if (cp2.y < rect.lly) ++ rect.lly = cp2.y; ++ if (cp3.y < rect.lly) ++ rect.lly = cp3.y; ++ if (cp4.y < rect.lly) ++ rect.lly = cp4.y; ++ rect.ury = cp1.y; ++ if (cp2.y > rect.ury) ++ rect.ury = cp2.y; ++ if (cp3.y > rect.ury) ++ rect.ury = cp3.y; ++ if (cp4.y > rect.ury) ++ rect.ury = cp4.y; ++#ifdef USE_QUADPOINTS ++ qpoints = pdf_new_array(); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp1.x, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp1.y, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp2.x, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp2.y, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp3.x, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp3.y, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp4.x, 0.01))); ++ pdf_add_array(qpoints, pdf_new_number(ROUND(cp4.y, 0.01))); ++ pdf_add_dict(annot_dict, pdf_new_name("QuadPoints"), qpoints); ++#endif + } ++#else ++ { ++ pdf_coord cp; ++ ++ cp.x = spe->x_user; cp.y = spe->y_user; ++ pdf_dev_transform(&cp, NULL); ++ if (ti.flags & INFO_HAS_USER_BBOX) { ++ rect.llx = ti.bbox.llx + cp.x; ++ rect.lly = ti.bbox.lly + cp.y; ++ rect.urx = ti.bbox.urx + cp.x; ++ rect.ury = ti.bbox.ury + cp.y; ++ } else { ++ rect.llx = cp.x; ++ rect.lly = cp.y - spe->mag * ti.depth; ++ rect.urx = cp.x + spe->mag * ti.width; ++ rect.ury = cp.y + spe->mag * ti.height; ++ } ++ } ++#endif + + /* Order is important... */ + if (ident) +diff -Naur a/texk/dvipdfm-x/specials.c b/texk/dvipdfm-x/specials.c +--- a/texk/dvipdfm-x/specials.c 2019-03-29 22:13:05.000000000 +0000 ++++ b/texk/dvipdfm-x/specials.c 2019-05-31 22:00:04.008964031 +0100 +@@ -169,12 +169,12 @@ + switch (k) { + /* xpos and ypos must be position in device space here. */ + case K_OBJ__XPOS: +- cp.x = dvi_dev_xpos(); cp.y = 0.0; ++ cp.x = dvi_dev_xpos(); cp.y = dvi_dev_ypos(); + pdf_dev_transform(&cp, NULL); + value = pdf_new_number(ROUND(cp.x, .01)); + break; + case K_OBJ__YPOS: +- cp.x = 0.0; cp.y = dvi_dev_ypos(); ++ cp.x = dvi_dev_xpos(); cp.y = dvi_dev_ypos(); + pdf_dev_transform(&cp, NULL); + value = pdf_new_number(ROUND(cp.y, .01)); + break; +@@ -233,12 +233,12 @@ + for (k = 0; _rkeys[k] && strcmp(key, _rkeys[k]); k++); + switch (k) { + case K_OBJ__XPOS: +- cp.x = dvi_dev_xpos(); cp.y = 0.0; ++ cp.x = dvi_dev_xpos(); cp.y = dvi_dev_ypos(); + pdf_dev_transform(&cp, NULL); + value = pdf_new_number(ROUND(cp.x, .01)); + break; + case K_OBJ__YPOS: +- cp.x = 0.0; cp.y = dvi_dev_ypos(); ++ cp.x = dvi_dev_xpos(); cp.y = dvi_dev_ypos(); + pdf_dev_transform(&cp, NULL); + value = pdf_new_number(ROUND(cp.y, .01)); + break; +diff -Naur a/texk/dvipdfm-x/tt_cmap.c b/texk/dvipdfm-x/tt_cmap.c +--- a/texk/dvipdfm-x/tt_cmap.c 2019-02-25 10:27:33.000000000 +0000 ++++ b/texk/dvipdfm-x/tt_cmap.c 2019-05-31 22:00:04.009964032 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2007-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2002-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + This program is free software; you can redistribute it and/or modify +@@ -68,11 +68,12 @@ + struct cmap0 *map; + int i; + +- if (len < 256) +- ERROR("invalid cmap subtable"); ++ if (len < 256) { ++ WARN("invalid format 0 TT cmap subtable"); ++ return NULL; ++ } + + map = NEW(1, struct cmap0); +- + for (i = 0; i < 256; i++) + map->glyphIndexArray[i] = sfnt_get_byte(sfont); + +@@ -114,14 +115,14 @@ + struct cmap2 *map; + USHORT i, n; + +- if (len < 512) +- ERROR("invalid cmap subtable"); +- +- map = NEW(1, struct cmap2); ++ if (len < 512) { ++ WARN("invalid fromt2 TT cmap subtable"); ++ return NULL; ++ } + ++ map = NEW(1, struct cmap2); + for (i = 0; i < 256; i++) + map->subHeaderKeys[i] = sfnt_get_ushort(sfont); +- + for (n = 0, i = 0; i < 256; i++) { + map->subHeaderKeys[i] /= 8; + if (n < map->subHeaderKeys[i]) +@@ -129,7 +130,13 @@ + } + n += 1; /* the number of subHeaders is one plus the max of subHeaderKeys */ + +- map->subHeaders = NEW(n, struct SubHeader); ++ if (len < 512 + n * 8 ) { ++ WARN("invalid/truncated format2 TT cmap subtable"); ++ RELEASE(map); ++ return NULL; ++ } ++ ++ map->subHeaders = NEW(n, struct SubHeader); + for (i = 0; i < n; i++) { + map->subHeaders[i].firstCode = sfnt_get_ushort(sfont); + map->subHeaders[i].entryCount = sfnt_get_ushort(sfont); +@@ -222,8 +229,10 @@ + struct cmap4 *map; + USHORT i, n, segCount; + +- if (len < 8) +- ERROR("invalid cmap subtable"); ++ if (len < 8) { ++ WARN("invalid format 4 TT cmap subtable"); ++ return NULL; ++ } + + map = NEW(1, struct cmap4); + +@@ -288,19 +297,19 @@ + * Last segment maps 0xffff to gid 0 (?) + */ + i = segCount = map->segCountX2 / 2; +- while (i-- > 0 && cc <= map->endCount[i]) { ++ while (i-- > 0 && cc <= map->endCount[i]) { + if (cc >= map->startCount[i]) { + if (map->idRangeOffset[i] == 0) { +- gid = (cc + map->idDelta[i]) & 0xffff; ++ gid = (cc + map->idDelta[i]) & 0xffff; + } else if (cc == 0xffff && map->idRangeOffset[i] == 0xffff) { +- /* this is for protection against some old broken fonts... */ +- gid = 0; ++ /* this is for protection against some old broken fonts... */ ++ gid = 0; + } else { +- j = map->idRangeOffset[i] - (segCount - i) * 2; +- j = (cc - map->startCount[i]) + (j / 2); +- gid = map->glyphIndexArray[j]; +- if (gid != 0) +- gid = (gid + map->idDelta[i]) & 0xffff; ++ j = map->idRangeOffset[i] - (segCount - i) * 2; ++ j = (cc - map->startCount[i]) + (j / 2); ++ gid = map->glyphIndexArray[j]; ++ if (gid != 0) ++ gid = (gid + map->idDelta[i]) & 0xffff; + } + break; + } +@@ -323,14 +332,15 @@ + struct cmap6 *map; + USHORT i; + +- if (len < 4) +- ERROR("invalid cmap subtable"); ++ if (len < 4) { ++ WARN("invalid format 6 TT cmap subtable"); ++ return NULL; ++ } + + map = NEW(1, struct cmap6); + map->firstCode = sfnt_get_ushort(sfont); + map->entryCount = sfnt_get_ushort(sfont); +- map->glyphIndexArray = NEW(map->entryCount, USHORT); +- ++ map->glyphIndexArray = NEW(map->entryCount, USHORT); + for (i = 0; i < map->entryCount; i++) + map->glyphIndexArray[i] = sfnt_get_ushort(sfont); + +@@ -390,13 +400,14 @@ + struct cmap12 *map; + ULONG i; + +- if (len < 4) +- ERROR("invalid cmap subtable"); ++ if (len < 4) { ++ WARN("invalid format 12 TT cmap subtable"); ++ return NULL; ++ } + + map = NEW(1, struct cmap12); + map->nGroups = sfnt_get_ulong(sfont); + map->groups = NEW(map->nGroups, struct charGroup); +- + for (i = 0; i < map->nGroups; i++) { + map->groups[i].startCharCode = sfnt_get_ulong(sfont); + map->groups[i].endCharCode = sfnt_get_ulong(sfont); +@@ -427,8 +438,8 @@ + cccc <= map->groups[i].endCharCode) { + if (cccc >= map->groups[i].startCharCode) { + gid = (USHORT) ((cccc - +- map->groups[i].startCharCode + +- map->groups[i].startGlyphID) & 0xffff); ++ map->groups[i].startCharCode + ++ map->groups[i].startGlyphID) & 0xffff); + break; + } + } +@@ -510,6 +521,7 @@ + WARN("Unrecognized OpenType/TrueType cmap format."); + tt_cmap_release(cmap); + return NULL; ++ break; + } + + if (!cmap->map) { +@@ -526,24 +538,25 @@ + + if (cmap) { + if (cmap->map) { +- switch(cmap->format) { ++ switch (cmap->format) { + case 0: +- release_cmap0(cmap->map); +- break; ++ release_cmap0(cmap->map); ++ break; + case 2: +- release_cmap2(cmap->map); +- break; ++ release_cmap2(cmap->map); ++ break; + case 4: +- release_cmap4(cmap->map); +- break; ++ release_cmap4(cmap->map); ++ break; + case 6: +- release_cmap6(cmap->map); +- break; ++ release_cmap6(cmap->map); ++ break; + case 12: +- release_cmap12(cmap->map); +- break; ++ release_cmap12(cmap->map); ++ break; + default: +- ERROR("Unrecognized OpenType/TrueType cmap format."); ++ WARN("Unrecognized OpenType/TrueType cmap format: %d", cmap->format); ++ break; + } + } + RELEASE(cmap); +@@ -582,129 +595,20 @@ + gid = lookup_cmap12(cmap->map, (ULONG) cc); + break; + default: +- ERROR("Unrecognized OpenType/TrueType cmap subtable format"); ++ WARN("Unrecognized OpenType/TrueType cmap subtable format: %d", cmap->format); + break; + } + + return gid; + } + +-/* Sorry for placing this here. +- * We need to rewrite TrueType font support code... +- */ + +-#define WBUF_SIZE 1024 +-static unsigned char wbuf[WBUF_SIZE]; + + static unsigned char srange_min[2] = {0x00, 0x00}; + static unsigned char srange_max[2] = {0xff, 0xff}; + static unsigned char lrange_min[4] = {0x00, 0x00, 0x00, 0x00}; + static unsigned char lrange_max[4] = {0x7f, 0xff, 0xff, 0xff}; + +-static void +-load_cmap4 (struct cmap4 *map, +- unsigned char *GIDToCIDMap, +- otl_gsub *gsub_vert, otl_gsub *gsub_list, +- CMap *cmap, CMap *tounicode_add) +-{ +- USHORT c0, c1, gid, cid; +- USHORT j, d, segCount; +- USHORT ch; +- int i; +- +- segCount = map->segCountX2 / 2; +- for (i = segCount - 1; i >= 0 ; i--) { +- c0 = map->startCount[i]; +- c1 = map->endCount[i]; +- d = map->idRangeOffset[i] / 2 - (segCount - i); +- for (j = 0; j <= c1 - c0; j++) { +- ch = c0 + j; +- if (map->idRangeOffset[i] == 0) { +- gid = (ch + map->idDelta[i]) & 0xffff; +- } else if (c0 == 0xffff && c1 == 0xffff && +- map->idRangeOffset[i] == 0xffff) { +- /* this is for protection against some old broken fonts... */ +- gid = 0; +- } else { +- gid = (map->glyphIndexArray[j+d] + map->idDelta[i]) & 0xffff; +- } +- if (gid != 0 && gid != 0xffff) { +- if (gsub_list) +- otl_gsub_apply_chain(gsub_list, &gid); +- if (gsub_vert) +- otl_gsub_apply(gsub_vert, &gid); +- if (GIDToCIDMap) { +- cid = ((GIDToCIDMap[2*gid] << 8)|GIDToCIDMap[2*gid+1]); +- if (cid == 0) +- WARN("GID %u does not have corresponding CID %u.", gid, cid); +- } else { +- cid = gid; +- } +- wbuf[0] = 0; +- wbuf[1] = 0; +- wbuf[2] = (ch >> 8) & 0xff; +- wbuf[3] = ch & 0xff; +- wbuf[4] = (cid >> 8) & 0xff; +- wbuf[5] = cid & 0xff; +- CMap_add_cidchar(cmap, wbuf, 4, cid); +- if (tounicode_add) { +- unsigned char *p = wbuf + 6; +- size_t uc_len; +- uc_len = UC_UTF16BE_encode_char(ch, &p, wbuf + WBUF_SIZE -1 ); +- CMap_add_bfchar(tounicode_add, wbuf+4, 2, wbuf+6, uc_len); +- } +- } +- } +- } +- +- return; +-} +- +-static void +-load_cmap12 (struct cmap12 *map, +- unsigned char *GIDToCIDMap, +- otl_gsub *gsub_vert, otl_gsub *gsub_list, +- CMap *cmap, CMap *tounicode_add) +-{ +- ULONG i, ch; /* LONG ? */ +- USHORT gid, cid; +- +- for (i = 0; i < map->nGroups; i++) { +- for (ch = map->groups[i].startCharCode; +- ch <= map->groups[i].endCharCode; +- ch++) { +- int d = ch - map->groups[i].startCharCode; +- gid = (USHORT) ((map->groups[i].startGlyphID + d) & 0xffff); +- if (gsub_list) +- otl_gsub_apply_chain(gsub_list, &gid); +- if (gsub_vert) +- otl_gsub_apply(gsub_vert, &gid); +- if (GIDToCIDMap) { +- cid = ((GIDToCIDMap[2*gid] << 8)|GIDToCIDMap[2*gid+1]); +- if (cid == 0) +- WARN("GID %u does not have corresponding CID %u.", gid, cid); +- } else { +- cid = gid; +- } +- wbuf[0] = (ch >> 24) & 0xff; +- wbuf[1] = (ch >> 16) & 0xff; +- wbuf[2] = (ch >> 8) & 0xff; +- wbuf[3] = ch & 0xff; +- wbuf[4] = (cid >> 8) & 0xff; +- wbuf[5] = cid & 0xff; +- CMap_add_cidchar(cmap, wbuf, 4, cid); +- if (tounicode_add) { +- unsigned char *p = wbuf + 6; +- size_t uc_len; +- uc_len = UC_UTF16BE_encode_char(ch, &p, wbuf + WBUF_SIZE -1 ); +- CMap_add_bfchar(tounicode_add, wbuf+4, 2, wbuf+6, uc_len); +- } +- } +- } +- +- return; +-} +- + /* OpenType CIDFont: + * + * We don't use GID for them. OpenType cmap table is for +@@ -717,78 +621,37 @@ + #include "cff_dict.h" + #include "cff.h" + +-static int +-handle_CIDFont (sfnt *sfont, +- unsigned char **GIDToCIDMap, CIDSysInfo *csi) +-{ +- cff_font *cffont; +- int offset, i; +- card16 num_glyphs, gid; +- cff_charsets *charset; +- unsigned char *map; +- struct tt_maxp_table *maxp; +- +- ASSERT(csi); +- +- offset = sfnt_find_table_pos(sfont, "CFF "); +- if (offset == 0) { +- csi->registry = NULL; +- csi->ordering = NULL; +- *GIDToCIDMap = NULL; +- return 0; +- } +- +- maxp = tt_read_maxp_table(sfont); +- num_glyphs = (card16) maxp->numGlyphs; +- RELEASE(maxp); +- if (num_glyphs < 1) +- ERROR("No glyph contained in this font..."); +- +- cffont = cff_open(sfont->stream, offset, 0); +- if (!cffont) +- ERROR("Could not open CFF font..."); +- +- +- if (!(cffont->flag & FONTTYPE_CIDFONT)) { +- cff_close(cffont); +- csi->registry = NULL; +- csi->ordering = NULL; +- *GIDToCIDMap = NULL; +- return 0; +- } ++/* This should be moved to cff.c */ ++static void ++create_GIDToCIDMap (uint16_t *GIDToCIDMap, uint16_t num_glyphs, cff_font *cffont) ++{ ++ cff_charsets *charset; ++ uint16_t gid, i; + +- if (!cff_dict_known(cffont->topdict, "ROS")) { +- ERROR("No CIDSystemInfo???"); +- } else { +- card16 reg, ord; ++ ASSERT(GIDToCIDMap); + +- reg = (card16) cff_dict_get(cffont->topdict, "ROS", 0); +- ord = (card16) cff_dict_get(cffont->topdict, "ROS", 1); ++ if (!cffont || !(cffont->flag & FONTTYPE_CIDFONT)) { ++ for (gid = 0; gid < num_glyphs; gid++) { ++ GIDToCIDMap[gid] = gid; ++ } + +- csi->registry = cff_get_string(cffont, reg); +- csi->ordering = cff_get_string(cffont, ord); +- csi->supplement = (int) cff_dict_get(cffont->topdict, "ROS", 2); ++ return; + } + +- cff_read_charsets(cffont); +- charset = cffont->charsets; +- if (!charset) { +- ERROR("No CFF charset data???"); +- } ++ memset(GIDToCIDMap, 0, num_glyphs*sizeof(uint16_t)); + +- map = NEW(65536 * 2, unsigned char); +- memset(map, 0, 65536 * 2); ++ charset = cffont->charsets; ++ if (!charset) ++ return; + switch (charset->format) { + case 0: + { + s_SID *cids; /* CID... */ +- ++ + cids = charset->data.glyphs; +- for (gid = 1, i = 0; +- i < charset->num_entries; i++) { +- map[2*gid ] = (cids[i] >> 8) & 0xff; +- map[2*gid+1] = cids[i] & 0xff; +- gid++; ++ for (gid = 1, i = 0; i < charset->num_entries; i++) { ++ GIDToCIDMap[gid] = cids[i]; ++ gid++; + } + } + break; +@@ -798,16 +661,14 @@ + card16 cid, count; + + ranges = charset->data.range1; +- for (gid = 1, i = 0; +- i < charset->num_entries; i++) { +- cid = ranges[i].first; +- count = ranges[i].n_left + 1; /* card8 */ +- while (count-- > 0 && +- gid <= num_glyphs) { +- map[2*gid ] = (cid >> 8) & 0xff; +- map[2*gid + 1] = cid & 0xff; +- gid++; cid++; +- } ++ for (gid = 1, i = 0; i < charset->num_entries; i++) { ++ cid = ranges[i].first; ++ count = ranges[i].n_left + 1; /* card8 */ ++ while (count-- > 0 && gid <= num_glyphs) { ++ GIDToCIDMap[gid] = cid; ++ gid++; ++ cid++; ++ } + } + } + break; +@@ -817,55 +678,52 @@ + card16 cid, count; + + ranges = charset->data.range2; +- if (charset->num_entries == 1 && +- ranges[0].first == 1) { +- /* "Complete" CIDFont */ +- RELEASE(map); map = NULL; ++ if (charset->num_entries == 1 && ranges[0].first == 1) { ++ /* "Complete" CIDFont */ ++ for (gid = 0; gid < num_glyphs; gid++) { ++ GIDToCIDMap[gid] = gid; ++ } + } else { +- /* Not trivial mapping */ +- for (gid = 1, i = 0; +- i < charset->num_entries; i++) { +- cid = ranges[i].first; +- count = ranges[i].n_left + 1; +- while (count-- > 0 && +- gid <= num_glyphs) { +- map[2*gid] = (cid >> 8) & 0xff; +- map[2*gid+1] = cid & 0xff; +- gid++; cid++; +- } +- } ++ /* Not trivial mapping */ ++ for (gid = 1, i = 0; i < charset->num_entries; i++) { ++ cid = ranges[i].first; ++ count = ranges[i].n_left + 1; ++ while (count-- > 0 && gid <= num_glyphs) { ++ GIDToCIDMap[gid] = cid; ++ gid++; ++ cid++; ++ } ++ } + } + } + break; + default: +- RELEASE(map); map = NULL; +- ERROR("Unknown CFF charset format...: %d", charset->format); ++ WARN("Unknown CFF charset format...: %d", charset->format); + break; + } +- cff_close(cffont); + +- *GIDToCIDMap = map; +- return 1; ++ return; + } + + static int is_PUA_or_presentation (unsigned int uni) + { + /* Some of CJK Radicals Supplement and Kangxi Radicals + * are commonly double encoded, lower the priority. ++ * CJK Compatibility Ideographs & Supplement added. + */ + return ((uni >= 0x2E80 && uni <= 0x2EF3) || (uni >= 0x2F00 && uni <= 0x2FD5) || + (uni >= 0xE000 && uni <= 0xF8FF) || (uni >= 0xFB00 && uni <= 0xFB4F) || ++ (uni >= 0xF900 && uni <= 0xFAFF) || (uni >= 0x2F800 && uni <= 0x2FA1F) || + (uni >= 0xF0000 && uni <= 0xFFFFD) || (uni >= 0x100000 && uni <= 0x10FFFD)); + } + +-static char* +-sfnt_get_glyphname(struct tt_post_table *post, cff_font *cffont, USHORT gid) ++static char * ++lookup_glyph_name (struct tt_post_table *post, cff_font *cffont, USHORT gid) + { +- char* name = NULL; ++ char *name = NULL; + + if (post) + name = tt_get_glyphname(post, gid); +- + if (!name && cffont) + name = cff_get_glyphname(cffont, gid); + +@@ -881,94 +739,82 @@ + #define is_used_char2(b,c) (((b)[(c)/8]) & (1 << (7-((c)%8)))) + #endif + +-static USHORT +-handle_subst_glyphs (CMap *cmap, +- CMap *cmap_add, +- const char *used_glyphs, +- sfnt *sfont, +- cff_font *cffont) ++static int32_t ++handle_subst_glyphs (CMap *cmap, CMap *cmap_add, char *used_chars) + { +- USHORT count; +- USHORT i; +- struct tt_post_table *post = NULL; +- +- if (!cmap_add) +- post = tt_read_post_table(sfont); +- +- for (count = 0, i = 0; i < 8192; i++) { +- int j; +- int32_t len; +- int inbytesleft, outbytesleft; +- const unsigned char *inbuf; +- unsigned char *outbuf; ++ int32_t count = 0; ++ int32_t cid; + +- if (used_glyphs[i] == 0) ++ for (cid = 0; cid < 65536; cid++) { ++ if (!is_used_char2(used_chars, cid)) + continue; ++ else { ++ unsigned char buf[256]; ++ int inbytesleft = 2, outbytesleft = 254; ++ size_t len; ++ unsigned char *outbuf = buf + 2; ++ const unsigned char *inbuf = buf; ++ ++ buf[0] = (cid >> 8) & 0xff; ++ buf[1] = cid & 0xff; ++ CMap_decode(cmap_add, &inbuf, &inbytesleft, &outbuf, &outbytesleft); ++ if (inbytesleft == 0) { ++ len = 254 - outbytesleft; ++ CMap_add_bfchar(cmap, buf, 2, buf + 2, len); ++ used_chars[cid / 8] &= ~(1 << (7 - (cid % 8))); ++ count++; ++ } ++ } ++ } + +- for (j = 0; j < 8; j++) { +- USHORT gid = 8 * i + j; ++ return count; ++} + +- if (!is_used_char2(used_glyphs, gid)) +- continue; ++static int32_t ++add_ToUnicode_via_glyph_name (CMap *cmap, char *used_chars, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, ++ sfnt *sfont, cff_font *cffont) ++{ ++ int32_t count = 0; ++ USHORT gid; ++ struct tt_post_table *post = NULL; + +- if (!cmap_add) { +-#define MAX_UNICODES 16 +- /* try to look up Unicode values from the glyph name... */ +- char* name; +- int32_t unicodes[MAX_UNICODES]; +- int unicode_count = -1; +- name = sfnt_get_glyphname(post, cffont, gid); +- if (name) { +- unicode_count = agl_get_unicodes(name, unicodes, MAX_UNICODES); +- } ++ post = tt_read_post_table(sfont); ++ if (!post && !cffont) ++ return count; ++ ++ for (gid = 0; gid < num_glyphs; gid++) { ++ uint16_t cid = GIDToCIDMap[gid]; ++ if (is_used_char2(used_chars, cid)) { ++#define MAX_UNICODES 32 ++ char *name; ++ int32_t unicodes[MAX_UNICODES]; ++ int unicode_count = -1; ++ ++ name = lookup_glyph_name(post, cffont, gid); ++ if (name) { ++ unicode_count = agl_get_unicodes(name, unicodes, MAX_UNICODES); + #undef MAX_UNICODES +- if (unicode_count == -1) { +- if(dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { +- if (name) +- MESG("No Unicode mapping available: GID=%u, name=%s\n", gid, name); +- else +- MESG("No Unicode mapping available: GID=%u\n", gid); +- } +- } else { +- /* the Unicode characters go into wbuf[2] and following, in UTF16BE */ +- /* we rely on WBUF_SIZE being more than adequate for MAX_UNICODES */ +- unsigned char* p = wbuf + 2; +- int k; +- len = 0; ++ RELEASE(name); ++ if (unicode_count > 0) { ++ unsigned char *buf; ++ unsigned char *p, *endptr; ++ int k; ++ size_t len = 0; ++ ++ buf = NEW(unicode_count*4+2, unsigned char); ++ p = buf + 2; ++ endptr = buf + (unicode_count * 4 + 2); + for (k = 0; k < unicode_count; ++k) { +- len += UC_UTF16BE_encode_char(unicodes[k], &p, wbuf+WBUF_SIZE); ++ len += UC_UTF16BE_encode_char(unicodes[k], &p, endptr); + } +- wbuf[0] = (gid >> 8) & 0xff; +- wbuf[1] = gid & 0xff; +- CMap_add_bfchar(cmap, wbuf, 2, wbuf + 2, len); +- } +- RELEASE(name); +- } else { +- wbuf[0] = (gid >> 8) & 0xff; +- wbuf[1] = gid & 0xff; +- +- inbuf = wbuf; +- inbytesleft = 2; +- outbuf = wbuf + 2; +- outbytesleft = WBUF_SIZE - 2; +- CMap_decode(cmap_add, &inbuf, &inbytesleft, &outbuf, &outbytesleft); +- +- if (inbytesleft != 0) { +- WARN("CMap conversion failed..."); +- } else { +- len = WBUF_SIZE - 2 - outbytesleft; +- CMap_add_bfchar(cmap, wbuf, 2, wbuf + 2, len); ++ buf[0] = (cid >> 8) & 0xff; ++ buf[1] = cid & 0xff; ++ CMap_add_bfchar(cmap, buf, 2, buf + 2, len); ++ used_chars[cid / 8] &= ~(1 << (7 - (cid % 8))); + count++; + +- if (dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { +- int _i; +- +- MESG("otf_cmap>> Additional ToUnicode mapping: <%04X> <", gid); +- for (_i = 0; _i < len; _i++) { +- MESG("%02X", wbuf[2 + _i]); +- } +- MESG(">\n"); +- } ++ RELEASE(buf); + } + } + } +@@ -980,70 +826,11 @@ + return count; + } + +-static cff_font * +-prepare_CIDFont_from_sfnt(sfnt* sfont) +-{ +- cff_font *cffont; +- unsigned offset = 0; +- +- if (sfont->type != SFNT_TYPE_POSTSCRIPT || +- sfnt_read_table_directory(sfont, 0) < 0 || +- (offset = sfnt_find_table_pos(sfont, "CFF ")) == 0) { +- return NULL; +- } +- +- cffont = cff_open(sfont->stream, offset, 0); +- if (!cffont) +- return NULL; +- +- cff_read_charsets(cffont); +- return cffont; +-} +- +-static USHORT +-add_to_cmap_if_used (CMap *cmap, +- cff_font *cffont, +- char *used_chars, +- USHORT gid, +- ULONG ch) +-{ +- USHORT count = 0; +- USHORT cid = cffont ? cff_charsets_lookup_inverse(cffont, gid) : gid; +- if (is_used_char2(used_chars, cid)) { +- int len; +- unsigned char *p = wbuf + 2; +- +- count++; +- +- wbuf[0] = (cid >> 8) & 0xff; +- wbuf[1] = (cid & 0xff); +- len = UC_UTF16BE_encode_char((int32_t) ch, &p, wbuf + WBUF_SIZE); +- CMap_add_bfchar(cmap, wbuf, 2, wbuf + 2, len); +- +- /* Skip PUA characters and alphabetic presentation forms, allowing +- * handle_subst_glyphs() as it might find better mapping. Fixes the +- * mapping of ligatures encoded in PUA in fonts like Linux Libertine +- * and old Adobe fonts. +- */ +- if (!is_PUA_or_presentation(ch)) { +- /* Avoid duplicate entry +- * There are problem when two Unicode code is mapped to +- * single glyph... +- */ +- used_chars[cid / 8] &= ~(1 << (7 - (cid % 8))); +- } +- } +- +- return count; +-} +- +-static USHORT +-create_ToUnicode_cmap4 (CMap *cmap, +- struct cmap4 *map, +- char *used_chars, +- cff_font *cffont) ++static void ++create_inverse_cmap4 (int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ struct cmap4 *map) + { +- USHORT count = 0, segCount = map->segCountX2 / 2; ++ USHORT segCount = map->segCountX2 / 2; + USHORT i, j; + + for (i = 0; i < segCount; i++) { +@@ -1062,32 +849,33 @@ + } else { + gid = (map->glyphIndexArray[j + d] + map->idDelta[i]) & 0xffff; + } +- +- count += add_to_cmap_if_used(cmap, cffont, used_chars, gid, ch); ++ if (is_PUA_or_presentation(ch)) { ++ map_sub[gid] = ch; ++ } else { ++ map_base[gid] = ch; ++ } + } + } +- +- return count; + } + +-static USHORT +-create_ToUnicode_cmap12 (CMap *cmap, +- struct cmap12 *map, +- char *used_chars, +- cff_font *cffont) ++static void ++create_inverse_cmap12 (int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ struct cmap12 *map) + { +- ULONG i, ch, count = 0; ++ ULONG i, ch; + + for (i = 0; i < map->nGroups; i++) { + for (ch = map->groups[i].startCharCode; + ch <= map->groups[i].endCharCode; ch++) { + int d = ch - map->groups[i].startCharCode; + USHORT gid = (USHORT) ((map->groups[i].startGlyphID + d) & 0xffff); +- count += add_to_cmap_if_used(cmap, cffont, used_chars, gid, ch); ++ if (is_PUA_or_presentation(ch)) { ++ map_sub[gid] = ch; ++ } else { ++ map_base[gid] = ch; ++ } + } + } +- +- return count; + } + + /* NOTE: Reverse mapping code which had been placed here is removed since: +@@ -1096,60 +884,163 @@ + * Especially, the second one causes problems. + */ + static pdf_obj * +-create_ToUnicode_cmap (tt_cmap *ttcmap, ++create_ToUnicode_cmap (tt_cmap *ttcmap, + const char *cmap_name, +- CMap *cmap_add, ++ CMap *cmap_add, + const char *used_chars, +- sfnt *sfont) ++ sfnt *sfont) + { +- pdf_obj *stream = NULL; +- CMap *cmap; +- USHORT count = 0; +- cff_font *cffont = prepare_CIDFont_from_sfnt(sfont); +- char is_cidfont = cffont && (cffont->flag & FONTTYPE_CIDFONT); +- +- cmap = CMap_new(); +- CMap_set_name (cmap, cmap_name); +- CMap_set_wmode(cmap, 0); +- CMap_set_type (cmap, CMAP_TYPE_TO_UNICODE); +- CMap_set_CIDSysInfo(cmap, &CSI_UNICODE); +- CMap_add_codespacerange(cmap, srange_min, srange_max, 2); ++ pdf_obj *stream = NULL; ++ int32_t *map_base = NULL, *map_sub = NULL; ++ USHORT gid, num_glyphs = 0; + +- /* cmap_add here stores information about all unencoded glyphs which can be +- * accessed only through OT Layout GSUB table. +- */ +- { +- char used_chars_copy[8192]; +- memcpy(used_chars_copy, used_chars, 8192); ++ ASSERT(ttcmap); + +- /* For create_ToUnicode_cmap{4,12}(), cffont is for GID -> CID lookup, +- * so it is only needed for CID fonts. */ +- switch (ttcmap->format) { +- case 4: +- count = create_ToUnicode_cmap4(cmap, ttcmap->map, used_chars_copy, +- is_cidfont ? cffont : NULL); +- break; +- case 12: +- count = create_ToUnicode_cmap12(cmap, ttcmap->map, used_chars_copy, +- is_cidfont ? cffont : NULL); +- break; ++ /* Get num_glyphs from maxp talbe */ ++ { ++ struct tt_maxp_table *maxp; ++ ++ maxp = tt_read_maxp_table(sfont); ++ if (maxp) { ++ num_glyphs = maxp->numGlyphs; ++ RELEASE(maxp); + } ++ } + +- /* For handle_subst_glyphs(), cffont is for GID -> glyph name lookup, so +- * it is only needed for non-CID fonts. */ +- count += handle_subst_glyphs(cmap, cmap_add, used_chars_copy, sfont, +- is_cidfont ? NULL : cffont); ++ /* Initialize GID to Unicode mapping table */ ++ map_base = NEW(num_glyphs, int32_t); ++ map_sub = NEW(num_glyphs, int32_t); ++ for (gid = 0; gid < num_glyphs; gid++) { ++ map_base[gid] = -1; ++ map_sub [gid] = -1; + } + +- if (count < 1) +- stream = NULL; +- else { +- stream = CMap_create_stream(cmap); ++ /* Create "base" mapping from inverse mapping of OpenType cmap */ ++ switch (ttcmap->format) { ++ case 4: ++ create_inverse_cmap4(map_base, map_sub, num_glyphs, ttcmap->map); ++ break; ++ case 12: ++ create_inverse_cmap12(map_base, map_sub, num_glyphs, ttcmap->map); ++ break; + } +- CMap_release(cmap); + +- if (cffont) +- cff_close(cffont); ++ /* Now create ToUnicode CMap stream */ ++ { ++ CMap *cmap; ++ int32_t count; ++ cff_font *cffont = NULL; ++ char is_cidfont = 0; ++ uint16_t *GIDToCIDMap = NULL; ++ char *used_chars_copy = NULL; ++ ++ if (sfont->type == SFNT_TYPE_POSTSCRIPT) { ++ ULONG offset; ++ offset = sfnt_find_table_pos(sfont, "CFF "); ++ cffont = cff_open(sfont->stream, offset, 0); ++ cff_read_charsets(cffont); ++ } ++ is_cidfont = cffont && (cffont->flag & FONTTYPE_CIDFONT); ++ ++ /* GIT to CID mapping info. */ ++ GIDToCIDMap = NEW(num_glyphs, uint16_t); ++ if (is_cidfont) { ++ create_GIDToCIDMap(GIDToCIDMap, num_glyphs, cffont); ++ } else { ++ for (gid = 0; gid < num_glyphs; gid++) { ++ GIDToCIDMap[gid] = gid; ++ } ++ } ++ cmap = CMap_new(); ++ CMap_set_name (cmap, cmap_name); ++ CMap_set_wmode(cmap, 0); ++ CMap_set_type (cmap, CMAP_TYPE_TO_UNICODE); ++ CMap_set_CIDSysInfo(cmap, &CSI_UNICODE); ++ CMap_add_codespacerange(cmap, srange_min, srange_max, 2); ++ ++ count = 0; ++ used_chars_copy = NEW(8192, char); ++ memcpy(used_chars_copy, used_chars, 8192); ++ for (gid = 0; gid < num_glyphs; gid++) { ++ uint16_t cid = GIDToCIDMap[gid]; ++ if (is_used_char2(used_chars_copy, cid)) { ++ int32_t ch; ++ unsigned char src[2], dst[4]; ++ unsigned char *p = dst, *endptr = dst + 4; ++ size_t len; ++ ++ ch = map_base[gid]; ++ if (UC_is_valid(ch)) { ++ src[0] = (cid >> 8) & 0xff; ++ src[1] = cid & 0xff; ++ len = UC_UTF16BE_encode_char(ch, &p, endptr); ++ CMap_add_bfchar(cmap, src, 2, dst, len); ++ used_chars_copy[cid / 8] &= ~(1 << (7 - (cid % 8))); ++ count++; ++ } ++ } ++ } ++ ++ /* cmap_add here stores information about all unencoded glyphs which can be ++ * accessed only through OT Layout GSUB table. ++ * This is only availabel when encoding is "unicode". ++ */ ++ if (cmap_add) { ++ count += handle_subst_glyphs(cmap, cmap_add, used_chars_copy); ++ } else { ++ /* Else, try gathering information from GSUB tables */ ++ count += otl_gsub_add_ToUnicode(cmap, used_chars_copy, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, sfont); ++ } ++ /* Find Unicode mapping via PostScript glyph names... */ ++ count += add_ToUnicode_via_glyph_name(cmap, used_chars_copy, num_glyphs, ++ GIDToCIDMap, sfont, is_cidfont ? NULL : cffont); ++ if (cffont) ++ cff_close(cffont); ++ ++ /* Finaly, PUA and presentation forms... */ ++ for (gid = 0; gid < num_glyphs; gid++) { ++ uint16_t cid = GIDToCIDMap[gid]; ++ if (is_used_char2(used_chars_copy, cid)) { ++ int32_t ch; ++ unsigned char src[2], dst[4]; ++ unsigned char *p = dst, *endptr = dst + 4; ++ size_t len; ++ ++ ch = map_sub[gid]; ++ if (UC_is_valid(ch)) { ++ src[0] = (cid >> 8) & 0xff; ++ src[1] = cid & 0xff; ++ len = UC_UTF16BE_encode_char(ch, &p, endptr); ++ CMap_add_bfchar(cmap, src, 2, dst, len); ++ used_chars_copy[cid / 8] &= ~(1 << (7 - (cid % 8))); ++ count++; ++ } ++ } ++ } ++ ++ /* Check for missing mapping */ ++ if (dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { ++ for (gid = 0; gid < num_glyphs; gid++) { ++ uint16_t cid = GIDToCIDMap[gid]; ++ if (is_used_char2(used_chars_copy, cid)) { ++ WARN("Unable to find ToUnicode mapping for glyph CID=%u (GID=%u)", cid, gid); ++ } ++ } ++ } ++ RELEASE(GIDToCIDMap); ++ RELEASE(used_chars_copy); ++ ++ if (count < 1) ++ stream = NULL; ++ else { ++ stream = CMap_create_stream(cmap); ++ } ++ CMap_release(cmap); ++ } ++ RELEASE(map_base); ++ RELEASE(map_sub); + + return stream; + } +@@ -1169,29 +1060,27 @@ + + pdf_obj * + otf_create_ToUnicode_stream (const char *font_name, +- int ttc_index, /* 0 for non-TTC */ ++ int ttc_index, /* 0 for non-TTC */ + const char *basefont, + const char *used_chars) + { +- pdf_obj *cmap_ref = NULL; +- int res_id; +- pdf_obj *cmap_obj = NULL; +- CMap *cmap_add; +- int cmap_add_id; +- tt_cmap *ttcmap; +- char *cmap_name, *cmap_add_name; +- FILE *fp = NULL; +- sfnt *sfont; +- ULONG offset = 0; +- int i; ++ pdf_obj *cmap_ref = NULL; /* returned value */ ++ CMap *cmap_add = NULL; ++ char *cmap_name; ++ FILE *fp = NULL; ++ sfnt *sfont; ++ ULONG offset = 0; ++ tt_cmap *ttcmap; ++ int cmap_id, cmap_add_id; ++ int i; + + cmap_name = NEW(strlen(basefont)+strlen("-UTF16")+1, char); + sprintf(cmap_name, "%s-UTF16", basefont); + +- res_id = pdf_findresource("CMap", cmap_name); +- if (res_id >= 0) { ++ cmap_id = pdf_findresource("CMap", cmap_name); ++ if (cmap_id >= 0) { + RELEASE(cmap_name); +- cmap_ref = pdf_get_resource_reference(res_id); ++ cmap_ref = pdf_get_resource_reference(cmap_id); + return cmap_ref; + } + +@@ -1212,7 +1101,10 @@ + } + + if (!sfont) { +- ERROR("Could not open OpenType/TrueType font file \"%s\"", font_name); ++ WARN("Could not open OpenType/TrueType font file \"%s\"", font_name); ++ RELEASE(cmap_name); ++ DPXFCLOSE(fp); ++ return NULL; + } + + switch (sfont->type) { +@@ -1222,7 +1114,11 @@ + case SFNT_TYPE_TTC: + offset = ttc_read_offset(sfont, ttc_index); + if (offset == 0) { +- ERROR("Invalid TTC index"); ++ WARN("Invalid TTC index for font: %s", font_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ RELEASE(cmap_name); ++ return NULL; + } + break; + default: +@@ -1231,111 +1127,180 @@ + } + + if (sfnt_read_table_directory(sfont, offset) < 0) { +- ERROR("Could not read OpenType/TrueType table directory."); ++ WARN("Could not read OpenType/TrueType table directory: %s", font_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ RELEASE(cmap_name); ++ return NULL; + } + +- cmap_add_name = NEW(strlen(font_name)+strlen(",000-UCS32-Add")+1, char); +- sprintf(cmap_add_name, "%s,%03d-UCS32-Add", font_name, ttc_index); +- cmap_add_id = CMap_cache_find(cmap_add_name); +- RELEASE(cmap_add_name); +- if (cmap_add_id < 0) { +- cmap_add = NULL; +- } else { +- cmap_add = CMap_cache_get(cmap_add_id); ++ /* cmap_add is used for storing information on ToUnicode mapping for ++ * unencoded glyphs which can be reached only through GSUB substitution. ++ * This is available only when "unicode" is specified in the encoding ++ * field of fontmap. We remember the inverse mapping via cmap_add in this ++ * case. ++ */ ++ { ++ char *cmap_add_name; ++ ++ cmap_add_name = NEW(strlen(font_name)+strlen(",000-UCS32-Add")+1, char); ++ sprintf(cmap_add_name, "%s,%03d-UCS32-Add", font_name, ttc_index); ++ cmap_add_id = CMap_cache_find(cmap_add_name); ++ RELEASE(cmap_add_name); ++ if (cmap_add_id < 0) { ++ cmap_add = NULL; ++ } else { ++ cmap_add = CMap_cache_get(cmap_add_id); ++ } + } + +- CMap_set_silent(1); /* many warnings without this... */ ++ ttcmap = NULL; + for (i = 0; i < sizeof(cmap_plat_encs) / sizeof(cmap_plat_enc_rec); ++i) { + ttcmap = tt_cmap_read(sfont, cmap_plat_encs[i].platform, cmap_plat_encs[i].encoding); + if (!ttcmap) + continue; + + if (ttcmap->format == 4 || ttcmap->format == 12) { +- cmap_obj = create_ToUnicode_cmap(ttcmap, cmap_name, cmap_add, used_chars, sfont); + break; ++ } else { ++ tt_cmap_release(ttcmap); ++ ttcmap = NULL; + } + } +-#if defined(LIBDPX) +- if (cmap_obj == NULL && dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) +-#else +- if (cmap_obj == NULL) +-#endif /* LIBDPX */ +- WARN("Unable to read OpenType/TrueType Unicode cmap table."); +- tt_cmap_release(ttcmap); +- CMap_set_silent(0); +- +- if (cmap_obj) { +- res_id = pdf_defineresource("CMap", cmap_name, +- cmap_obj, PDF_RES_FLUSH_IMMEDIATE); +- cmap_ref = pdf_get_resource_reference(res_id); +- } else { +- cmap_ref = NULL; ++ if (ttcmap) { ++ pdf_obj *cmap_obj; ++ ++ CMap_set_silent(1); /* many warnings without this... */ ++ cmap_obj = create_ToUnicode_cmap(ttcmap, cmap_name, cmap_add, used_chars, sfont); ++ CMap_set_silent(0); ++ if (cmap_obj) { ++ cmap_id = pdf_defineresource("CMap", cmap_name, ++ cmap_obj, PDF_RES_FLUSH_IMMEDIATE); ++ cmap_ref = pdf_get_resource_reference(cmap_id); ++ } ++ tt_cmap_release(ttcmap); + } +- RELEASE(cmap_name); + ++ /* Cleanup */ ++ RELEASE(cmap_name); + sfnt_close(sfont); +- if (fp) +- DPXFCLOSE(fp); ++ DPXFCLOSE(fp); ++ ++#ifndef LIBDPX ++ if (!cmap_ref) { ++ WARN("Creating ToUnicode CMap failed for \"%s\"", font_name); ++ } ++#endif + + return cmap_ref; + } + +-static int +-load_base_CMap (const char *cmap_name, CMap *tounicode_add, int wmode, +- CIDSysInfo *csi, unsigned char *GIDToCIDMap, +- otl_gsub *gsub_vert, otl_gsub *gsub_list, +- tt_cmap *ttcmap) +-{ +- int cmap_id; + +- cmap_id = CMap_cache_find(cmap_name); +- if (cmap_id < 0) { +- CMap *cmap; ++/* Creating input CMaps from OT cmap table */ + +- cmap = CMap_new(); +- CMap_set_name (cmap, cmap_name); +- CMap_set_type (cmap, CMAP_TYPE_CODE_TO_CID); +- CMap_set_wmode(cmap, wmode); +- CMap_add_codespacerange(cmap, lrange_min, lrange_max, 4); ++static void ++load_cmap4 (struct cmap4 *map, uint16_t *GIDToCIDMap, USHORT num_glyphs, ++ otl_gsub *gsub_vert, otl_gsub *gsub_list, ++ CMap *cmap, int32_t *map_base, int32_t *map_sub) ++{ ++ USHORT c0, c1, gid, cid; ++ USHORT j, d, segCount; ++ USHORT ch; ++ int i; ++ unsigned char buf[4]; + +- if (csi) { /* CID */ +- CMap_set_CIDSysInfo(cmap, csi); +- } else { +- CMap_set_CIDSysInfo(cmap, &CSI_IDENTITY); ++ segCount = map->segCountX2 / 2; ++ for (i = segCount - 1; i >= 0 ; i--) { ++ c0 = map->startCount[i]; ++ c1 = map->endCount[i]; ++ d = map->idRangeOffset[i] / 2 - (segCount - i); ++ for (j = 0; j <= c1 - c0; j++) { ++ ch = c0 + j; ++ if (map->idRangeOffset[i] == 0) { ++ gid = (ch + map->idDelta[i]) & 0xffff; ++ } else if (c0 == 0xffff && c1 == 0xffff && map->idRangeOffset[i] == 0xffff) { ++ /* this is for protection against some old broken fonts... */ ++ gid = 0; ++ } else { ++ gid = (map->glyphIndexArray[j+d] + map->idDelta[i]) & 0xffff; ++ } ++ if (gid != 0 && gid != 0xffff) { ++ /* Apply GSUB features */ ++ if (gsub_list) ++ otl_gsub_apply_chain(gsub_list, &gid); ++ if (gsub_vert) ++ otl_gsub_apply(gsub_vert, &gid); ++ cid = (gid < num_glyphs) ? GIDToCIDMap[gid] : 0; ++ buf[0] = 0; ++ buf[1] = 0; ++ buf[2] = (ch >> 8) & 0xff; ++ buf[3] = ch & 0xff; ++ CMap_add_cidchar(cmap, buf, 4, cid); ++ /* For ToUnicode creation */ ++ if (map_base && map_sub) { ++ if (is_PUA_or_presentation(ch)) { ++ map_sub[gid] = ch; ++ } else { ++ map_base[gid] = ch; ++ } ++ } ++ } + } ++ } + +- if (ttcmap->format == 12) { +- load_cmap12(ttcmap->map, GIDToCIDMap, gsub_vert, gsub_list, +- cmap, tounicode_add); +- } else if (ttcmap->format == 4) { +- load_cmap4(ttcmap->map, GIDToCIDMap, gsub_vert, gsub_list, +- cmap, tounicode_add); +- } ++ return; ++} + +- cmap_id = CMap_cache_add(cmap); ++static void ++load_cmap12 (struct cmap12 *map, uint16_t *GIDToCIDMap, USHORT num_glyphs, ++ otl_gsub *gsub_vert, otl_gsub *gsub_list, ++ CMap *cmap, int32_t *map_base, int32_t *map_sub) ++{ ++ ULONG i, ch; ++ USHORT gid, cid; ++ unsigned char buf[4]; ++ ++ for (i = 0; i < map->nGroups; i++) { ++ for (ch = map->groups[i].startCharCode; ++ ch <= map->groups[i].endCharCode; ch++) { ++ int d = ch - map->groups[i].startCharCode; ++ gid = (USHORT) ((map->groups[i].startGlyphID + d) & 0xffff); ++ if (gsub_list) ++ otl_gsub_apply_chain(gsub_list, &gid); ++ if (gsub_vert) ++ otl_gsub_apply(gsub_vert, &gid); ++ cid = (gid < num_glyphs) ? GIDToCIDMap[gid] : 0; ++ buf[0] = (ch >> 24) & 0xff; ++ buf[1] = (ch >> 16) & 0xff; ++ buf[2] = (ch >> 8) & 0xff; ++ buf[3] = ch & 0xff; ++ CMap_add_cidchar(cmap, buf, 4, cid); ++ if (map_base && map_sub) { ++ if (is_PUA_or_presentation(ch)) { ++ map_sub[gid] = ch; ++ } else { ++ map_base[gid] = ch; ++ } ++ } ++ } + } + +- return cmap_id; ++ return; + } + + int + otf_load_Unicode_CMap (const char *map_name, int ttc_index, /* 0 for non-TTC font */ +- const char *otl_tags, int wmode) ++ const char *otl_tags, int wmode) + { +- int cmap_id = -1; +- /* Additional ToUncidoe mappings required by OTL GSUB substitusion */ +- int tounicode_add_id = -1; +- CMap *tounicode_add = NULL; +- char *tounicode_add_name = NULL; +- int is_cidfont = 0; +- sfnt *sfont; +- ULONG offset = 0; +- char *cmap_name = NULL; +- FILE *fp = NULL; +- otl_gsub *gsub_vert = NULL, *gsub_list = NULL; +- tt_cmap *ttcmap; +- CIDSysInfo csi = {NULL, NULL, 0}; +- unsigned char *GIDToCIDMap = NULL; ++ int cmap_id = -1; ++ char *cmap_name = NULL; ++ sfnt *sfont = NULL; ++ ULONG offset = 0; ++ uint16_t num_glyphs = 0; ++ FILE *fp = NULL; ++ tt_cmap *ttcmap = NULL; ++ CIDSysInfo csi = {NULL, NULL, 0}; ++ uint16_t *GIDToCIDMap = NULL; + + if (!map_name) + return -1; +@@ -1359,11 +1324,6 @@ + sprintf(cmap_name, "%s,%03d-UCS4-H", map_name, ttc_index); + } + } +- if (dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { +- MESG("\n"); +- MESG("otf_cmap>> Unicode charmap for font=\"%s\" layout=\"%s\"\n", +- map_name, (otl_tags ? otl_tags : "none")); +- } + cmap_id = CMap_cache_find(cmap_name); + if (cmap_id >= 0) { + RELEASE(cmap_name); +@@ -1374,6 +1334,12 @@ + } + + /* CMap not found */ ++ if (dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { ++ MESG("\n"); ++ MESG("otf_cmap>> Creating Unicode charmap for font=\"%s\" layout=\"%s\"\n", ++ map_name, (otl_tags ? otl_tags : "none")); ++ } ++ + fp = DPXFOPEN(map_name, DPX_RES_TYPE_TTFONT); + if (!fp) { + fp = DPXFOPEN(map_name, DPX_RES_TYPE_OTFONT); +@@ -1390,13 +1356,20 @@ + } + + if (!sfont) { +- ERROR("Could not open OpenType/TrueType/dfont font file \"%s\"", map_name); ++ WARN("Could not open OpenType/TrueType/dfont font file \"%s\"", map_name); ++ RELEASE(cmap_name); ++ DPXFCLOSE(fp); ++ return -1; + } + switch (sfont->type) { + case SFNT_TYPE_TTC: + offset = ttc_read_offset(sfont, ttc_index); + if (offset == 0) { +- ERROR("Invalid TTC index"); ++ WARN("Offset=0 returned for font=%s, TTC_index=%d", map_name, ttc_index); ++ RELEASE(cmap_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ return -1; + } + break; + case SFNT_TYPE_TRUETYPE: +@@ -1407,41 +1380,79 @@ + offset = sfont->offset; + break; + default: +- ERROR("Not a OpenType/TrueType/TTC font?: %s", map_name); ++ WARN("Not a OpenType/TrueType/TTC font?: %s", map_name); ++ RELEASE(cmap_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ return -1; + break; + } + +- if (sfnt_read_table_directory(sfont, offset) < 0) +- ERROR("Could not read OpenType/TrueType table directory."); ++ if (sfnt_read_table_directory(sfont, offset) < 0) { ++ WARN("Could not read OpenType/TrueType table directory: %s", map_name); ++ RELEASE(cmap_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ return -1; ++ } + ++ { ++ struct tt_maxp_table *maxp; + +- if (otl_tags) { +- /* tounicode_add here is later refered by otf_create_ToUnicode_stream() +- * for finding additional CID to Unicode mapping entries required by +- * OTL gsub substitution. +- */ +- tounicode_add_name = NEW(strlen(map_name)+strlen(",000-UCS32-Add")+1, char); +- sprintf(tounicode_add_name, "%s,%03d-UCS32-Add", map_name, ttc_index); +- tounicode_add_id = CMap_cache_find(tounicode_add_name); +- if (tounicode_add_id >= 0) +- tounicode_add = CMap_cache_get(tounicode_add_id); +- else { +- tounicode_add = CMap_new(); +- CMap_set_name (tounicode_add, tounicode_add_name); +- CMap_set_type (tounicode_add, CMAP_TYPE_TO_UNICODE); +- CMap_set_wmode(tounicode_add, 0); +- CMap_add_codespacerange(tounicode_add, srange_min, srange_max, 2); +- CMap_set_CIDSysInfo(tounicode_add, &CSI_UNICODE); +- CMap_add_bfchar(tounicode_add, srange_min, 2, srange_max, 2); +- tounicode_add_id = CMap_cache_add(tounicode_add); +- } +- RELEASE(tounicode_add_name); ++ maxp = tt_read_maxp_table(sfont); ++ num_glyphs = (card16) maxp->numGlyphs; ++ RELEASE(maxp); + } + ++ GIDToCIDMap = NEW(num_glyphs, uint16_t); ++ memset(GIDToCIDMap, 0, num_glyphs*sizeof(uint16_t)); + if (sfont->type == SFNT_TYPE_POSTSCRIPT) { +- is_cidfont = handle_CIDFont(sfont, &GIDToCIDMap, &csi); ++ cff_font *cffont; ++ card16 gid; ++ ++ offset = sfnt_find_table_pos(sfont, "CFF "); ++ cffont = cff_open(sfont->stream, offset, 0); ++ if (!cffont) { ++ RELEASE(cmap_name); ++ RELEASE(GIDToCIDMap); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ return -1; ++ } ++ if (!(cffont->flag & FONTTYPE_CIDFONT)) { ++ csi.registry = strdup("Adobe"); ++ csi.ordering = strdup("Identity"); ++ csi.supplement = 0; ++ for (gid = 0; gid < num_glyphs; gid++) { ++ GIDToCIDMap[gid] = gid; ++ } ++ } else { ++ if (!cff_dict_known(cffont->topdict, "ROS")) { ++ csi.registry = strdup("Adobe"); ++ csi.ordering = strdup("Identity"); ++ csi.supplement = 0; ++ } else { ++ card16 reg, ord; ++ ++ reg = (card16) cff_dict_get(cffont->topdict, "ROS", 0); ++ ord = (card16) cff_dict_get(cffont->topdict, "ROS", 1); ++ csi.registry = cff_get_string(cffont, reg); ++ csi.ordering = cff_get_string(cffont, ord); ++ csi.supplement = (int) cff_dict_get(cffont->topdict, "ROS", 2); ++ } ++ cff_read_charsets(cffont); ++ create_GIDToCIDMap(GIDToCIDMap, num_glyphs, cffont); ++ } ++ cff_close(cffont); + } else { +- is_cidfont = 0; ++ uint16_t gid; ++ ++ csi.registry = strdup("Adobe"); ++ csi.ordering = strdup("Identity"); ++ csi.supplement = 0; ++ for (gid = 0; gid < num_glyphs; gid++) { ++ GIDToCIDMap[gid] = gid; ++ } + } + + ttcmap = tt_cmap_read(sfont, 3, 10); /* Microsoft UCS4 */ +@@ -1449,63 +1460,122 @@ + ttcmap = tt_cmap_read(sfont, 3, 1); /* Microsoft UCS2 */ + if (!ttcmap) { + ttcmap = tt_cmap_read(sfont, 0, 3); /* Unicode 2.0 or later */ +-#if defined(LIBDPX) +- if (!ttcmap && dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { +-#else +- if (!ttcmap) { +-#endif /* LIBDPX */ +- ERROR("Unable to read OpenType/TrueType Unicode cmap table."); +- } + } + } +- if (wmode == 1) { +- gsub_vert = otl_gsub_new(); +- if (otl_gsub_add_feat(gsub_vert, "*", "*", "vrt2", sfont) < 0) { +- if (otl_gsub_add_feat(gsub_vert, "*", "*", "vert", sfont) < 0) { +- WARN("GSUB feature vrt2/vert not found."); +- otl_gsub_release(gsub_vert); +- gsub_vert = NULL; ++ ++ if (ttcmap) { ++ CMap *cmap = NULL; ++ int32_t *map_base, *map_sub; ++ otl_gsub *gsub_vert = NULL; ++ otl_gsub *gsub_list = NULL; ++ uint32_t gid; ++ ++ if (wmode == 1) { ++ gsub_vert = otl_gsub_new(); ++ if (otl_gsub_add_feat(gsub_vert, "*", "*", "vrt2", sfont) < 0) { ++ if (otl_gsub_add_feat(gsub_vert, "*", "*", "vert", sfont) < 0) { ++ WARN("GSUB feature vrt2/vert not found."); ++ otl_gsub_release(gsub_vert); ++ gsub_vert = NULL; ++ } else { ++ otl_gsub_select(gsub_vert, "*", "*", "vert"); ++ } + } else { +- otl_gsub_select(gsub_vert, "*", "*", "vert"); ++ otl_gsub_select(gsub_vert, "*", "*", "vrt2"); + } + } else { +- otl_gsub_select(gsub_vert, "*", "*", "vrt2"); ++ gsub_vert = NULL; + } +- } else { +- gsub_vert = NULL; +- } +- if (otl_tags) { +- gsub_list = otl_gsub_new(); +- if (otl_gsub_add_feat_list(gsub_list, otl_tags, sfont) < 0) { +- WARN("Readin GSUB feature table(s) failed for \"%s\"", otl_tags); ++ if (otl_tags) { ++ gsub_list = otl_gsub_new(); ++ if (otl_gsub_add_feat_list(gsub_list, otl_tags, sfont) < 0) { ++ WARN("Reading GSUB feature table(s) failed for \"%s\"", otl_tags); ++ } else { ++ otl_gsub_set_chain(gsub_list, otl_tags); ++ } + } else { +- otl_gsub_set_chain(gsub_list, otl_tags); ++ gsub_list = NULL; + } +- } else { +- gsub_list = NULL; ++ cmap = CMap_new(); ++ CMap_set_name(cmap, cmap_name); ++ CMap_set_type(cmap, CMAP_TYPE_CODE_TO_CID); ++ CMap_set_wmode(cmap, wmode); ++ CMap_add_codespacerange(cmap, lrange_min, lrange_max, 4); ++ CMap_set_CIDSysInfo(cmap, &csi); ++ map_base = NEW(num_glyphs, int32_t); ++ map_sub = NEW(num_glyphs, int32_t); ++ for (gid = 0; gid < num_glyphs; gid++) { ++ map_base[gid] = -1; ++ map_sub[gid] = -1; ++ } ++ switch (ttcmap->format) { ++ case 12: ++ load_cmap12(ttcmap->map, GIDToCIDMap, num_glyphs, ++ gsub_vert, gsub_list, ++ cmap, map_base, map_sub); ++ break; ++ case 4: ++ load_cmap4(ttcmap->map, GIDToCIDMap, num_glyphs, ++ gsub_vert, gsub_list, ++ cmap, map_base, map_sub); ++ break; ++ } ++ if (gsub_vert) ++ otl_gsub_release(gsub_vert); ++ if (gsub_list) ++ otl_gsub_release(gsub_list); ++ tt_cmap_release(ttcmap); ++ ++ if (otl_tags) { ++ CMap *tounicode = NULL; ++ char *tounicode_name; ++ int tounicode_id; ++ ++ tounicode_name = NEW(strlen(map_name)+strlen(",000-UCS32-Add")+1, char); ++ sprintf(tounicode_name, "%s,%03d-UCS32-Add", map_name, ttc_index); ++ tounicode_id = CMap_cache_find(tounicode_name); ++ if (tounicode_id >= 0) ++ tounicode = CMap_cache_get(tounicode_id); ++ else { ++ tounicode = CMap_new(); ++ CMap_set_name (tounicode, tounicode_name); ++ CMap_set_type (tounicode, CMAP_TYPE_TO_UNICODE); ++ CMap_set_wmode(tounicode, 0); ++ CMap_add_codespacerange(tounicode, srange_min, srange_max, 2); ++ CMap_set_CIDSysInfo(tounicode, &CSI_UNICODE); ++ CMap_add_bfchar(tounicode, srange_min, 2, srange_max, 2); ++ tounicode_id = CMap_cache_add(tounicode); ++ } ++ RELEASE(tounicode_name); ++ ++ for (gid = 0; gid < num_glyphs; gid++) { ++ uint16_t cid = GIDToCIDMap[gid]; ++ unsigned char src[2], dst[4]; ++ if (cid > 0) { ++ int32_t ch = UC_is_valid(map_base[gid]) ? map_base[gid] : map_sub[gid]; ++ if (UC_is_valid(ch)) { ++ unsigned char *p = dst; ++ unsigned char *endptr = dst + 4; ++ size_t len; ++ src[0] = (cid >> 8) & 0xff; ++ src[1] = cid & 0xff; ++ len = UC_UTF16BE_encode_char(ch, &p, endptr); ++ if (len > 0) { ++ CMap_add_bfchar(tounicode, src, 2, dst, len); ++ } ++ } ++ } ++ } ++ } ++ cmap_id = CMap_cache_add(cmap); + } +- cmap_id = load_base_CMap(cmap_name, tounicode_add, wmode, +- (is_cidfont ? &csi : NULL), GIDToCIDMap, +- gsub_vert, gsub_list, ttcmap); +- if (cmap_id < 0) +- ERROR("Failed to read OpenType/TrueType cmap table."); +- if (gsub_vert) +- otl_gsub_release(gsub_vert); +- gsub_vert = NULL; +- if (gsub_list) +- otl_gsub_release(gsub_list); +- gsub_list = NULL; + + RELEASE(cmap_name); +- if (GIDToCIDMap) +- RELEASE(GIDToCIDMap); +- if (is_cidfont) { +- if (csi.registry) +- RELEASE(csi.registry); +- if (csi.ordering) +- RELEASE(csi.ordering); +- } +- tt_cmap_release(ttcmap); ++ RELEASE(GIDToCIDMap); ++ if (csi.registry) ++ RELEASE(csi.registry); ++ if (csi.ordering) ++ RELEASE(csi.ordering); + sfnt_close(sfont); + DPXFCLOSE(fp); + +@@ -1515,14 +1585,11 @@ + int + otf_try_load_GID_to_CID_map (const char *map_name, int ttc_index, int wmode) + { +- int cmap_id = -1; +- sfnt *sfont; +- ULONG offset = 0; +- char *cmap_name = NULL; +- FILE *fp = NULL; +- CIDSysInfo csi = {NULL, NULL, 0}; +- int is_cidfont = 0; +- unsigned char *GIDToCIDMap = NULL; ++ int cmap_id = -1; ++ sfnt *sfont = NULL; ++ ULONG offset = 0; ++ char *cmap_name = NULL; ++ FILE *fp = NULL; + + if (!map_name) + return -1; +@@ -1559,13 +1626,20 @@ + } + + if (!sfont) { +- ERROR("Could not open OpenType/TrueType/dfont font file \"%s\"", map_name); ++ WARN("Could not open OpenType/TrueType/dfont font file \"%s\"", map_name); ++ RELEASE(cmap_name); ++ DPXFCLOSE(fp); ++ return -1; + } + switch (sfont->type) { + case SFNT_TYPE_TTC: + offset = ttc_read_offset(sfont, ttc_index); + if (offset == 0) { +- ERROR("Invalid TTC index"); ++ WARN("Invalid TTC index for font \"%s\": %d", map_name, ttc_index); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ RELEASE(cmap_name); ++ return -1; + } + break; + case SFNT_TYPE_TRUETYPE: +@@ -1576,12 +1650,20 @@ + offset = sfont->offset; + break; + default: +- ERROR("Not a OpenType/TrueType/TTC font?: %s", map_name); +- break; ++ WARN("Not a OpenType/TrueType/TTC font?: %s", map_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ RELEASE(cmap_name); ++ return -1; + } + +- if (sfnt_read_table_directory(sfont, offset) < 0) +- ERROR("Could not read OpenType/TrueType table directory."); ++ if (sfnt_read_table_directory(sfont, offset) < 0) { ++ WARN("Could not read OpenType/TrueType table directory: %s", map_name); ++ sfnt_close(sfont); ++ DPXFCLOSE(fp); ++ RELEASE(cmap_name); ++ return -1; ++ } + if (sfont->type != SFNT_TYPE_POSTSCRIPT) { + RELEASE(cmap_name); + sfnt_close(sfont); +@@ -1590,41 +1672,71 @@ + } + + /* Read GID-to-CID mapping if CFF OpenType is found. */ +- is_cidfont = handle_CIDFont(sfont, &GIDToCIDMap, &csi); +- if (is_cidfont) { +- if (GIDToCIDMap) { +- CMap *cmap; +- int32_t gid; +- const unsigned char csrange[4] = {0x00, 0x00, 0xff, 0xff}; ++ if (sfont->type == SFNT_TYPE_POSTSCRIPT) { ++ cff_font *cffont; ++ struct tt_maxp_table *maxp; ++ const unsigned char csrange[4] = {0x00, 0x00, 0xff, 0xff}; ++ uint16_t num_glyphs = 0; ++ ++ maxp = tt_read_maxp_table(sfont); ++ num_glyphs = (card16) maxp->numGlyphs; ++ RELEASE(maxp); ++ ++ offset = sfnt_find_table_pos(sfont, "CFF "); ++ cffont = cff_open(sfont->stream, offset, 0); ++ if (cffont && cffont->flag & FONTTYPE_CIDFONT) { ++ CMap *cmap; ++ uint16_t gid; ++ uint16_t *GIDToCIDMap = NULL; ++ CIDSysInfo csi = {NULL, NULL, 0}; ++ ++ if (!cff_dict_known(cffont->topdict, "ROS")) { ++ csi.registry = strdup("Adobe"); ++ csi.ordering = strdup("Identity"); ++ csi.supplement = 0; ++ } else { ++ card16 reg, ord; + ++ reg = (card16) cff_dict_get(cffont->topdict, "ROS", 0); ++ ord = (card16) cff_dict_get(cffont->topdict, "ROS", 1); ++ csi.registry = cff_get_string(cffont, reg); ++ csi.ordering = cff_get_string(cffont, ord); ++ csi.supplement = (int) cff_dict_get(cffont->topdict, "ROS", 2); ++ } ++ cff_read_charsets(cffont); ++ GIDToCIDMap = NEW(num_glyphs, uint16_t); ++ memset(GIDToCIDMap, 0, num_glyphs*sizeof(uint16_t)); ++ create_GIDToCIDMap(GIDToCIDMap, num_glyphs, cffont); + cmap = CMap_new(); + CMap_set_name (cmap, cmap_name); + CMap_set_type (cmap, CMAP_TYPE_CODE_TO_CID); + CMap_set_wmode(cmap, wmode); + CMap_add_codespacerange(cmap, &csrange[0], &csrange[2], 2); + CMap_set_CIDSysInfo(cmap, &csi); +- +- for (gid = 0; gid < 65536; gid++) { +- unsigned char src[2]; ++ for (gid = 0; gid < num_glyphs; gid++) { ++ unsigned char src[2], dst[2]; + src[0] = (gid >> 8) & 0xff; + src[1] = gid & 0xff; +- CMap_add_bfchar(cmap, src, 2, &GIDToCIDMap[gid*2], 2); ++ dst[0] = (GIDToCIDMap[gid] >> 8) & 0xff; ++ dst[1] = GIDToCIDMap[gid] & 0xff; ++ CMap_add_bfchar(cmap, src, 2, dst, 2); + } + cmap_id = CMap_cache_add(cmap); + if (dpx_conf.verbose_level > VERBOSE_LEVEL_MIN) { + MESG("\n"); + MESG("otf_cmap>> Creating GID-to-CID mapping for font=\"%s\"\n", map_name); + } ++ RELEASE(GIDToCIDMap); ++ if (csi.registry) ++ RELEASE(csi.registry); ++ if (csi.ordering) ++ RELEASE(csi.ordering); + } +- /* Identity mapping for null GIDToCIDMap */ ++ if (cffont) ++ cff_close(cffont); + } ++ + RELEASE(cmap_name); +- if (GIDToCIDMap) +- RELEASE(GIDToCIDMap); +- if (csi.registry) +- RELEASE(csi.registry); +- if (csi.ordering) +- RELEASE(csi.ordering); + sfnt_close(sfont); + DPXFCLOSE(fp); + +diff -Naur a/texk/dvipdfm-x/tt_gsub.c b/texk/dvipdfm-x/tt_gsub.c +--- a/texk/dvipdfm-x/tt_gsub.c 2018-12-21 03:39:51.000000000 +0000 ++++ b/texk/dvipdfm-x/tt_gsub.c 2019-05-31 22:00:04.009964032 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2002-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2002-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + This program is free software; you can redistribute it and/or modify +@@ -977,10 +977,11 @@ + + sfnt_seek_set(sfont, offset); + clt_read_feature_table(&feature_table, sfont); ++#if 0 + if (feature_table.FeatureParams != 0) { + ERROR("unrecognized FeatureParams"); + } +- ++#endif + /* Lookup table */ + for (i = 0; i < feature_table.LookupListIndex.count; i++) { + struct clt_lookup_table lookup_table; +@@ -1680,98 +1681,303 @@ + return retval; + } + +-#if 0 ++#if 1 ++#include "unicode.h" ++ ++#ifndef is_used_char2 ++#define is_used_char2(b,c) (((b)[(c)/8]) & (1 << (7-((c)%8)))) ++#endif ++ ++static int ++add_glyph_if_valid (CMap *cmap, char *used_chars, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, USHORT gid, USHORT gid_sub) ++{ ++ int count = 0; ++ unsigned char src[2], dst[4]; ++ unsigned char *p = dst, *endptr = dst + 4; ++ size_t len; ++ uint16_t cid_sub; ++ ++ if (gid_sub >= num_glyphs || gid >= num_glyphs) ++ return 0; ++ ++ cid_sub = GIDToCIDMap[gid_sub]; ++ if (is_used_char2(used_chars, cid_sub)) { ++ int32_t ch = map_base[gid]; ++ if (UC_is_valid(ch)) { ++ src[0] = (cid_sub >> 8) & 0xff; ++ src[1] = cid_sub & 0xff; ++ len = UC_UTF16BE_encode_char(ch, &p, endptr); ++ CMap_add_bfchar(cmap, src, 2, dst, len); ++ used_chars[cid_sub / 8] &= ~(1 << (7 - (cid_sub % 8))); ++ count = 1; ++ } else { ++ ch = map_sub[gid]; ++ if (UC_is_valid(ch)) { ++ src[0] = (cid_sub >> 8) & 0xff; ++ src[1] = cid_sub & 0xff; ++ len = UC_UTF16BE_encode_char(ch, &p, endptr); ++ CMap_add_bfchar(cmap, src, 2, dst, len); ++ used_chars[cid_sub / 8] &= ~(1 << (7 - (cid_sub % 8))); ++ count = 1; ++ } ++ } ++ } ++ return count; ++} ++ + static int +-otl_gsub_dump_single (struct otl_gsub_subtab *subtab) ++add_ToUnicode_single (CMap *cmap, char *used_chars, ++ struct otl_gsub_subtab *subtab, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap) + { +- int gid, idx; ++ int count = 0; ++ USHORT i, idx, gid; ++ USHORT gid_sub; + + ASSERT(subtab); + + if (subtab->SubstFormat == 1) { + struct otl_gsub_single1 *data; ++ struct clt_coverage *cov; + + data = (subtab->table).single1; +- for (gid = 0; gid < 0x10000; gid++) { +- idx = clt_lookup_coverage(&data->coverage, gid); +- if (idx >= 0) { +- fprintf(stdout, "substitute \\%u by \\%u;\n", +- (USHORT) gid, (USHORT) (gid + data->DeltaGlyphID)); ++ cov = &data->coverage; ++ switch (cov->format) { ++ case 1: /* list */ ++ for (idx = 0; idx < cov->count; idx++) { ++ gid = cov->list[idx]; ++ gid_sub = gid + data->DeltaGlyphID; ++ count += add_glyph_if_valid(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, gid_sub); + } ++ break; ++ case 2: /* range */ ++ for (i = 0; i < cov->count; i++) { ++ for (gid = cov->range[i].Start; ++ gid <= cov->range[i].End && gid < num_glyphs; gid++) { ++ idx = cov->range[i].StartCoverageIndex + gid - cov->range[i].Start; ++ gid_sub = gid + data->DeltaGlyphID; ++ count += add_glyph_if_valid(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, gid_sub); ++ } ++ } ++ break; + } + } else if (subtab->SubstFormat == 2) { + struct otl_gsub_single2 *data; ++ struct clt_coverage *cov; + + data = (subtab->table).single2; +- for (gid = 0; gid < 0x10000; gid++) { +- idx = clt_lookup_coverage(&data->coverage, gid); +- if (idx >= 0 && +- idx < data->GlyphCount) { +- fprintf(stdout, "substitute \\%u by \\%u;\n", +- (USHORT) gid, (data->Substitute)[idx]); ++ cov = &data->coverage; ++ switch (cov->format) { ++ case 1: /* list */ ++ for (idx = 0; idx < cov->count; idx++) { ++ gid = cov->list[idx]; ++ if (idx >= 0 && idx < data->GlyphCount) { ++ gid_sub = (data->Substitute)[idx]; ++ count += add_glyph_if_valid(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, gid_sub); ++ } + } ++ break; ++ case 2: /* range */ ++ for (i = 0; i < cov->count; i++) { ++ for (gid = cov->range[i].Start; ++ gid <= cov->range[i].End && gid < num_glyphs; gid++) { ++ idx = cov->range[i].StartCoverageIndex + gid - cov->range[i].Start; ++ if (idx >= 0 && idx < data->GlyphCount) { ++ gid_sub = (data->Substitute)[idx]; ++ count += add_glyph_if_valid(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, gid_sub); ++ } ++ } ++ } ++ break; + } + } + +- return 0; ++ return count; + } + +-static int +-otl_gsub_dump_alternate (struct otl_gsub_subtab *subtab) ++static int32_t ++add_alternate1_inverse_map (CMap *cmap, char *used_chars, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, USHORT gid, int idx, ++ struct otl_gsub_alternate1 *data) + { +- int gid, idx; ++ int32_t count = 0; ++ ++ if (idx >= 0 && idx < data->AlternateSetCount) { ++ struct otl_gsub_altset *altset; ++ USHORT i; ++ ++ altset = &(data->AlternateSet[idx]); ++ if (altset->GlyphCount == 0) ++ return count; ++ for (i = 0; i < altset->GlyphCount; i++) { ++ USHORT gid_alt = altset->Alternate[i]; ++ count += add_glyph_if_valid(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, gid_alt); ++ } ++ } ++ return count; ++} ++ ++static int32_t ++add_ToUnicode_alternate (CMap *cmap, char *used_chars, ++ struct otl_gsub_subtab *subtab, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap) ++{ ++ int32_t count = 0; ++ USHORT i, gid, idx; + + ASSERT(subtab); + + if (subtab->SubstFormat == 1) { + struct otl_gsub_alternate1 *data; +- ++ struct clt_coverage *cov; + data = subtab->table.alternate1; +- for (gid = 0; gid < 0x10000; gid++) { +- idx = clt_lookup_coverage(&data->coverage, gid); +- if (idx >= 0 && idx < data->AlternateSetCount) { +- struct otl_gsub_altset *altset; +- USHORT i; +- altset = &(data->AlternateSet[idx]); +- if (altset->GlyphCount == 0) +- continue; +- fprintf(stdout, "substitute \\%u from [", (USHORT) gid); +- for (i = 0; i < altset->GlyphCount; i++) { +- fprintf(stdout, " \\%u", altset->Alternate[i]); ++ cov = &data->coverage; ++ switch (cov->format) { ++ case 1: /* list */ ++ for (idx = 0; idx < cov->count; idx++) { ++ gid = cov->list[idx]; ++ if (gid < num_glyphs) { ++ count += add_alternate1_inverse_map(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, idx, data); ++ } ++ } ++ break; ++ case 2: /* range */ ++ for (i = 0; i < cov->count; i++) { ++ for (gid = cov->range[i].Start; ++ gid <= cov->range[i].End && gid < num_glyphs; gid++) { ++ idx = cov->range[i].StartCoverageIndex + gid - cov->range[i].Start; ++ count += add_alternate1_inverse_map(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, idx, data); + } +- fprintf(stdout, " ];\n"); + } ++ break; + } + } ++ return count; ++} + +- return 0; ++static int32_t ++add_ligature1_inverse_map (CMap *cmap, char *used_chars, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, USHORT gid_1, int idx, ++ struct otl_gsub_ligature1 *data) ++{ ++ int32_t count = 0; ++ ++ if (idx >= 0 && idx < data->LigSetCount) { ++ struct otl_gsub_ligset *ligset; ++ USHORT i, j; ++ ++ ligset = &(data->LigatureSet[idx]); ++ for (j = 0; j < ligset->LigatureCount; j++) { ++ USHORT gid_sub = ligset->Ligature[j].LigGlyph; ++ if (gid_sub < num_glyphs) { ++ uint16_t cid = GIDToCIDMap[gid_sub]; ++ if (is_used_char2(used_chars, cid)) { ++ int32_t ch, *ucv; ++ USHORT comp_count = ligset->Ligature[j].CompCount; ++ int fail_count = 0; ++ ++ ucv = NEW(comp_count, int32_t); ++ ch = UC_is_valid(map_base[gid_1]) ? map_base[gid_1] : map_sub[gid_1]; ++ ucv[0] = ch; ++ fail_count += UC_is_valid(ch) ? 0 : 1; ++ for (i = 0; i < ligset->Ligature[j].CompCount - 1; i++) { ++ USHORT gid = ligset->Ligature[j].Component[i]; ++ if (gid < num_glyphs) { ++ ch = UC_is_valid(map_base[gid]) ? map_base[gid] : map_sub[gid]; ++ ucv[i+1] = ch; ++ fail_count += UC_is_valid(ch) ? 0 : 1; ++ } else { ++ fail_count += 1; ++ } ++ } ++ if (fail_count == 0) { ++ unsigned char src[2], *dst; ++ unsigned char *p, *endptr; ++ size_t len = 0; ++ ++ src[0] = (cid >> 8) & 0xff; ++ src[1] = cid & 0xff; ++ dst = NEW(comp_count*4, unsigned char); ++ p = dst; ++ endptr = dst + comp_count * 4; ++ for (i = 0; i < comp_count; i++) { ++ len += UC_UTF16BE_encode_char(ucv[i], &p, endptr); ++ } ++ CMap_add_bfchar(cmap, src, 2, dst, len); ++ used_chars[cid / 8] &= ~(1 << (7 - (cid % 8))); ++ count++; ++ RELEASE(dst); ++ } ++ RELEASE(ucv); ++ } ++ } ++ } ++ } ++ ++ return count; + } + +-static int +-otl_gsub_dump_ligature (struct otl_gsub_subtab *subtab) ++static int32_t ++add_ToUnicode_ligature (CMap *cmap, char *used_chars, ++ struct otl_gsub_subtab *subtab, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap) + { +- int gid, idx; ++ int32_t count = 0; ++ USHORT i, idx, gid; + + ASSERT(subtab); + + if (subtab->SubstFormat == 1) { + struct otl_gsub_ligature1 *data; ++ struct clt_coverage *cov; + + data = subtab->table.ligature1; +- for (gid = 0; gid < 0x10000; gid++) { +- idx = clt_lookup_coverage(&data->coverage, gid); +- if (idx >= 0 && idx < data->LigSetCount) { +- struct otl_gsub_ligset *ligset; +- USHORT i, j; +- ligset = &(data->LigatureSet[idx]); +- for (j = 0; j < ligset->LigatureCount; j++) { +- fprintf(stdout, "substitute \\%u", (USHORT) gid); +- for (i = 0; i < ligset->Ligature[j].CompCount - 1; i++) { +- fprintf(stdout, " \\%u", ligset->Ligature[j].Component[i]); ++ cov = &data->coverage; ++ switch (cov->format) { ++ case 1: /* list */ ++ for (idx = 0; idx < cov->count; idx++) { ++ gid = cov->list[idx]; ++ if (gid < num_glyphs) { ++ count += add_ligature1_inverse_map(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, idx, data); ++ } ++ } ++ break; ++ case 2: /* range */ ++ for (i = 0; i < cov->count; i++) { ++ for (gid = cov->range[i].Start; ++ gid <= cov->range[i].End && gid < num_glyphs; gid++) { ++ idx = cov->range[i].StartCoverageIndex + gid - cov->range[i].Start; ++ if (gid < num_glyphs) { ++ count += add_ligature1_inverse_map(cmap, used_chars, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap, gid, idx, data); + } +- fprintf(stdout, " by \\%u;\n", ligset->Ligature[j].LigGlyph); + } + } ++ break; + } + } + +@@ -1779,48 +1985,44 @@ + } + + int +-otl_gsub_dump (otl_gsub *gsub_list, +- const char *script, const char *language, const char *feature) ++otl_gsub_add_ToUnicode (CMap *cmap, char *used_chars, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, sfnt *sfont) + { +- int error = -1; ++ int count = 0; ++ otl_gsub *gsub_list; + struct otl_gsub_tab *gsub; + struct otl_gsub_subtab *subtab; +- int sel, i, j; +- +- if (!gsub_list) +- return -1; ++ int i, j; + +- sel = gsub_list->select; +- error = otl_gsub_select(gsub_list, script, language, feature); +- if (error < 0) { +- ERROR("GSUB feature %s.%s.%s not found.", script, language, feature); +- } +- +- i = gsub_list->select; +- if (i < 0 || i >= gsub_list->num_gsubs) { +- ERROR("GSUB not selected..."); +- return -1; +- } +- gsub = &(gsub_list->gsubs[i]); ++ gsub_list = otl_gsub_new(); ++ otl_gsub_add_feat(gsub_list, "*", "*", "*", sfont); + +- for (j = 0; +- !error && +- j < gsub->num_subtables; j++) { +- subtab = &(gsub->subtables[j]); +- switch ((int) subtab->LookupType){ +- case OTL_GSUB_TYPE_SINGLE: +- error = otl_gsub_dump_single(subtab); +- break; +- case OTL_GSUB_TYPE_ALTERNATE: +- error = otl_gsub_dump_alternate(subtab); +- break; +- case OTL_GSUB_TYPE_LIGATURE: +- error = otl_gsub_dump_ligature(subtab); +- break; ++ for (i = 0; i < gsub_list->num_gsubs; i++) { ++ gsub = &(gsub_list->gsubs[i]); ++ for (j = 0; j < gsub->num_subtables; j++) { ++ subtab = &(gsub->subtables[j]); ++ switch ((int) subtab->LookupType){ ++ case OTL_GSUB_TYPE_SINGLE: ++ count += add_ToUnicode_single(cmap, used_chars, subtab, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap); ++ break; ++ case OTL_GSUB_TYPE_ALTERNATE: ++ count += add_ToUnicode_alternate(cmap, used_chars, subtab, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap); ++ break; ++ case OTL_GSUB_TYPE_LIGATURE: ++ count += add_ToUnicode_ligature(cmap, used_chars, subtab, ++ map_base, map_sub, num_glyphs, ++ GIDToCIDMap); ++ break; ++ } + } + } +- gsub_list->select = sel; ++ otl_gsub_release(gsub_list); + +- return error; ++ return count; + } + #endif +diff -Naur a/texk/dvipdfm-x/tt_gsub.h b/texk/dvipdfm-x/tt_gsub.h +--- a/texk/dvipdfm-x/tt_gsub.h 2018-09-14 04:34:50.000000000 +0100 ++++ b/texk/dvipdfm-x/tt_gsub.h 2019-05-31 22:00:04.009964032 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2002-2018 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2002-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + This program is free software; you can redistribute it and/or modify +@@ -23,6 +23,7 @@ + + #include "sfnt.h" + #include "otl_opt.h" ++#include "cmap.h" + + typedef struct otl_gsub otl_gsub; + +@@ -59,11 +60,7 @@ + extern int otl_gsub_set_chain (otl_gsub *gsub_list, const char *otl_tags); + extern int otl_gsub_apply_chain (otl_gsub *gsub_list, USHORT *gid); + +-#if 0 +-extern int otl_gsub_dump (otl_gsub *gsub_list, +- const char *script, +- const char *language, +- const char *feature); +-#endif +- ++extern int otl_gsub_add_ToUnicode (CMap *cmap, char *used_chars, ++ int32_t *map_base, int32_t *map_sub, USHORT num_glyphs, ++ uint16_t *GIDToCIDMap, sfnt *sfont); + #endif /* _TT_GSUB_H_ */ +diff -Naur a/texk/dvipdfm-x/unicode.c b/texk/dvipdfm-x/unicode.c +--- a/texk/dvipdfm-x/unicode.c 2016-01-06 10:13:28.000000000 +0000 ++++ b/texk/dvipdfm-x/unicode.c 2019-05-31 22:00:04.009964032 +0100 +@@ -1,6 +1,6 @@ + /* This is dvipdfmx, an eXtended version of dvipdfm by Mark A. Wicks. + +- Copyright (C) 2002-2016 by Jin-Hwan Cho and Shunsaku Hirata, ++ Copyright (C) 2002-2019 by Jin-Hwan Cho and Shunsaku Hirata, + the dvipdfmx project team. + + Copyright (C) 1998, 1999 by Mark A. Wicks <mwicks@kettering.edu> +@@ -123,7 +123,7 @@ + unsigned char *p = *pp; + + if (ucv >= 0 && ucv <= 0xFFFF) { +- if (p + 2 >= endptr) ++ if (p + 2 > endptr) + return 0; + p[0] = (ucv >> 8) & 0xff; + p[1] = ucv & 0xff; +@@ -131,7 +131,7 @@ + } else if (ucv >= 0x010000 && ucv <= 0x10FFFF) { + unsigned short high, low; + +- if (p + 4 >= endptr) ++ if (p + 4 > endptr) + return 0; + ucv -= 0x00010000; + high = (ucv >> UC_SUR_SHIFT) + UC_SUR_HIGH_START; +@@ -142,7 +142,7 @@ + p[3] = (low & 0xff); + count = 4; + } else { +- if (p + 2 >= endptr) ++ if (p + 2 > endptr) + return 0; + p[0] = (UC_REPLACEMENT_CHAR >> 8) & 0xff; + p[1] = (UC_REPLACEMENT_CHAR & 0xff); +@@ -207,25 +207,25 @@ + return 0; + + if (ucv < 0x7f) { +- if (p >= endptr - 1) ++ if (p + 1 > endptr) + return 0; + p[0] = (unsigned char) ucv; + count = 1; + } else if (ucv <= 0x7ff) { +- if (p >= endptr -2) ++ if (p + 2 > endptr) + return 0; + p[0] = (unsigned char) (0xc0 | (ucv >> 6)); + p[1] = (unsigned char) (0x80 | (ucv & 0x3f)); + count = 2; + } else if (ucv <= 0xffff) { +- if (p >= endptr - 3) ++ if (p + 3 > endptr) + return 0; + p[0] = (unsigned char) (0xe0 | (ucv >> 12)); + p[1] = (unsigned char) (0x80 | ((ucv >> 6) & 0x3f)); + p[2] = (unsigned char) (0x80 | (ucv & 0x3f)); + count = 3; + } else if (ucv <= 0x1fffff) { +- if (p >= endptr - 4) ++ if (p + 4 > endptr) + return 0; + p[0] = (unsigned char) (0xf0 | (ucv >> 18)); + p[1] = (unsigned char) (0x80 | ((ucv >> 12) & 0x3f)); +@@ -233,7 +233,7 @@ + p[3] = (unsigned char) (0x80 | (ucv & 0x3f)); + count = 4; + } else if (ucv <= 0x3ffffff) { +- if (p >= endptr - 5) ++ if (p + 5 > endptr) + return 0; + p[0] = (unsigned char) (0xf8 | (ucv >> 24)); + p[1] = (unsigned char) (0x80 | ((ucv >> 18) & 0x3f)); +@@ -242,7 +242,7 @@ + p[4] = (unsigned char) (0x80 | (ucv & 0x3f)); + count = 5; + } else if (ucv <= 0x7fffffff) { +- if (p >= endptr - 6) ++ if (p + 6 > endptr) + return 0; + p[0] = (unsigned char) (0xfc | (ucv >> 30)); + p[1] = (unsigned char) (0x80 | ((ucv >> 24) & 0x3f)); +diff -Naur a/texk/dvipsk/ChangeLog b/texk/dvipsk/ChangeLog +--- a/texk/dvipsk/ChangeLog 2019-04-07 02:42:55.000000000 +0100 ++++ b/texk/dvipsk/ChangeLog 2019-05-31 22:00:04.009964032 +0100 +@@ -1,3 +1,9 @@ ++2019-04-30 Karl Berry <karl@tug.org> ++ ++ * dosection.c (dosection): close PostScript string constant ++ for long filenames. tex-k mail from Arnaud Blouin, ++ 24 Apr 2019 13:54:10. ++ + 2019-04-07 Karl Berry <karl@freefriends.org> + + * TeX Live 2019. +diff -Naur a/texk/dvipsk/dosection.c b/texk/dvipsk/dosection.c +--- a/texk/dvipsk/dosection.c 2019-03-30 01:50:10.000000000 +0000 ++++ b/texk/dvipsk/dosection.c 2019-05-31 22:00:04.009964032 +0100 +@@ -23,7 +23,7 @@ + int np; + int k; + integer thispage = 0; +- char buf[104]; ++ char buf[300]; /* really 253 */ + + dopsfont(s); + #ifdef HPS +@@ -40,7 +40,9 @@ + doubleout(mag); + numout((integer)DPI); + numout((integer)VDPI); +- snprintf(buf, sizeof(buf), "(%.500s)", fulliname); ++ /* possibly lines in eps files are supposed to be <= 255; ++ not worth testing the limits merely to output a long file name. */ ++ snprintf(buf, sizeof(buf), "(%.250s)", fulliname); + cmdout(buf); + newline(); + cmdout("@start"); +diff -Naur a/texk/web2c/ptexdir/ChangeLog b/texk/web2c/ptexdir/ChangeLog +--- a/texk/web2c/ptexdir/ChangeLog 2019-02-06 11:01:31.000000000 +0000 ++++ b/texk/web2c/ptexdir/ChangeLog 2019-05-31 22:00:04.010964033 +0100 +@@ -1,3 +1,11 @@ ++2019-05-06 Hironori Kitagawa <h_kitagawa2001@yahoo.co.jp> ++ ++ * ptex-base.ch: ++ Make appropriate comparison of U+0100 by \if in upTeX. ++ https://github.com/texjporg/tex-jp-build/issues/68 ++ Re-eval kcatcode of Japanese character token in \if and \ifcat. ++ https://github.com/texjporg/ptex-manual/issues/4 ++ + 2019-02-03 Hironori Kitagawa <h_kitagawa2001@yahoo.co.jp> + + * ptex-base.ch: Ignore newline char after Japanese control +diff -Naur a/texk/web2c/ptexdir/ptex-base.ch b/texk/web2c/ptexdir/ptex-base.ch +--- a/texk/web2c/ptexdir/ptex-base.ch 2019-02-06 11:00:54.000000000 +0000 ++++ b/texk/web2c/ptexdir/ptex-base.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -59,6 +59,7 @@ + % (2017-09-07) HK pTeX p3.7.2 More restrictions on direction change commands. + % (2018-01-21) HK Added \ptexversion primitive and co. pTeX p3.8. + % (2018-04-14) HK pTeX p3.8.1 Bug fix for discontinuous KINSOKU table. ++% (2019-02-03) HK pTeX p3.8.2 Change \inhibitglue, add \disinhibitglue. + % + + @x +@@ -324,6 +325,13 @@ + wterm(')'); + @z + ++@x ++@d max_halfword==@"FFFFFFF {largest allowable value in a |halfword|} ++@y ++@d max_halfword==@"FFFFFFF {largest allowable value in a |halfword|} ++@d max_cjk_val=@"10000 ++@z ++ + @x [8.111] l.2436 - pTeX: check hi/ho + (mem_top+sup_main_memory>=max_halfword) then bad:=14; + @y +@@ -2533,19 +2541,19 @@ + end; + @y + if (cur_cmd=kanji)or(cur_cmd=kana)or(cur_cmd=other_kchar) then +- begin m:=cur_cmd; n:=cur_chr; ++ begin n:=cur_chr; m:=kcat_code(kcatcodekey(n)); + end + else if (cur_cmd>active_char)or(cur_chr>255) then +- begin m:=relax; n:=256; ++ begin m:=relax; n:=max_cjk_val; + end + else begin m:=cur_cmd; n:=cur_chr; + end; + get_x_token_or_active_char; + if (cur_cmd=kanji)or(cur_cmd=kana)or(cur_cmd=other_kchar) then +- begin cur_cmd:=cur_cmd; +- end {dummy} ++ begin cur_cmd:=kcat_code(kcatcodekey(cur_chr)); ++ end + else if (cur_cmd>active_char)or(cur_chr>255) then +- begin cur_cmd:=relax; cur_chr:=256; ++ begin cur_cmd:=relax; cur_chr:=max_cjk_val; + end; + @z + +diff -Naur a/texk/web2c/uptexdir/ChangeLog b/texk/web2c/uptexdir/ChangeLog +--- a/texk/web2c/uptexdir/ChangeLog 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/ChangeLog 2019-05-31 22:00:04.010964033 +0100 +@@ -1,3 +1,28 @@ ++2019-05-25 TANAKA Takuji <ttk@t-lab.opal.ne.jp> ++ ++ * uptex-m.ch: ++ Correct upTeX_revision ".25", upTeX_version_string "-u1.25". ++ ++2019-05-06 TANAKA Takuji <ttk@t-lab.opal.ne.jp> ++ ++ * uptex-m.ch, upbibtex.ch, updvitype.ch, uppltotf.ch, uptftopl.ch, ++ uptex_version.h: upTeX version u1.25. ++ * kanji.c, kanji.h: ++ Fix bug of kcatcode at Fullwidth ASCII variants and ++ Halfwidth Katakana variants from Yusuke Terada san: ++ https://github.com/texjporg/tex-jp-build/pull/79 ++ Set default internal encoding EUC/SJIS if a command name is ++ with prefix of "p" or "ep", intending to be compatible with ++ pTeX family (ptex, eptex, pbibtex, pdvitype, ppltotf, ptftopl) ++ (experimental). ++ ++2019-05-06 Hironori Kitagawa <h_kitagawa2001@yahoo.co.jp> ++ ++ * uptex-m.ch: ++ Make appropreate comparison of U+0100 by \if. ++ https://github.com/texjporg/tex-jp-build/issues/68 ++ * tests/test_if.tex: Test case. ++ + 2019-02-23 TANAKA Takuji <ttk@t-lab.opal.ne.jp> + + * uptex-m.ch, upbibtex.ch, updvitype.ch, uppltotf.ch, uptftopl.ch, +@@ -24,7 +49,7 @@ + 2018-09-16 TANAKA Takuji <ttk@t-lab.opal.ne.jp> + + * upbibtex.ch: Fix bug of substring$ +- from Takashi Sakai: ++ from Takashi Sakai san: + https://github.com/texjporg/tex-jp-build/issues/64 + https://github.com/texjporg/tex-jp-build/pull/66 + +diff -Naur a/texk/web2c/uptexdir/kanji.c b/texk/web2c/uptexdir/kanji.c +--- a/texk/web2c/uptexdir/kanji.c 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/kanji.c 2019-05-31 22:00:04.010964033 +0100 +@@ -444,7 +444,7 @@ + || (LATIN_SMALL_LETTER_O_WITH_STROKE <=c && c<=LATIN_SMALL_LETTER_Y_WITH_DIAERESIS ) ) + return 0x1FD; + } +- if (block==0xa0) { ++ if (block==0xa1) { + /* Fullwidth ASCII variants except for U+FF01..FF0F, U+FF1A..FF20, U+FF3B..FF40, U+FF5B..FF5E */ + if ( (FULLWIDTH_DIGIT_0 <=c && c<=FULLWIDTH_DIGIT_9 ) + || (FULLWIDTH_CAPITAL_A<=c && c<=FULLWIDTH_CAPITAL_Z) +@@ -485,8 +485,6 @@ + { + char *p; + +- enable_UPTEX (true); /* enable */ +- + init_kanji (file_str, internal_str); + + p = getenv ("PTEX_KANJI_ENC"); +@@ -504,3 +502,33 @@ + } + #endif + } ++ ++void init_default_kanji_select(void) ++{ ++ char *base; ++ ++ base = kpse_program_basename (argv[0]); ++ ++ if (FILESTRNCASEEQ(base, "p", 1) || FILESTRNCASEEQ(base, "ep", 2)) { ++ ++ enable_UPTEX (false); /* disable */ ++#if defined(WIN32) ++/* pBibTeX is EUC only */ ++ if (FILESTRNCASEEQ(base, "pbibtex", 7)) { ++ init_default_kanji(NULL, "euc"); ++ } else { ++/* for pTeX, e-pTeX, pDVItype, pPLtoTF, and pTFtoPL */ ++ init_default_kanji(NULL, "sjis"); ++ } ++#else ++ init_default_kanji(NULL, "euc"); ++#endif ++ ++ } else { ++ ++/* for upTeX, e-upTeX, upBibTeX, upDVItype, upPLtoTF, and upTFtoPL */ ++ enable_UPTEX (true); /* enable */ ++ init_default_kanji ("utf8", "uptex"); ++ ++ } ++} +diff -Naur a/texk/web2c/uptexdir/kanji.h b/texk/web2c/uptexdir/kanji.h +--- a/texk/web2c/uptexdir/kanji.h 2019-02-06 11:01:31.000000000 +0000 ++++ b/texk/web2c/uptexdir/kanji.h 2019-05-31 22:00:04.010964033 +0100 +@@ -38,8 +38,9 @@ + extern integer multilenbuffchar (integer c); + + extern void init_default_kanji (const_string file_str, const_string internal_str); ++extern void init_default_kanji_select (void); + /* for upTeX, e-upTeX, upBibTeX, upDVItype, upPLtoTF, and upTFtoPL */ +-#define initkanji() init_default_kanji("utf8", "uptex") ++#define initkanji() init_default_kanji_select() + /* for upDVItype */ + #define setpriorfileenc() set_prior_file_enc() + +diff -Naur a/texk/web2c/uptexdir/tests/test_if.tex b/texk/web2c/uptexdir/tests/test_if.tex +--- a/texk/web2c/uptexdir/tests/test_if.tex 1970-01-01 01:00:00.000000000 +0100 ++++ b/texk/web2c/uptexdir/tests/test_if.tex 2019-05-31 22:00:04.010964033 +0100 +@@ -0,0 +1,29 @@ ++\kcatcode`あ=18 ++\def\xA{あ}\let\yA=あ ++\kcatcode`あ=17 ++\def\xB{あ}\let\yB=あ ++\kcatcode`あ=16 ++ ++\message{\ifcat あ\xA Y\else N\fi} ++\message{\ifcat あ\yA Y\else N\fi} ++\message{\ifcat あ\xB Y\else N\fi} ++\message{\ifcat あ\yB Y\else N\fi} ++ ++\message{\if あ\xA Y\else N\fi} ++\message{\if あ\yA Y\else N\fi} ++\message{\if い\xA Y\else N\fi} ++\message{\if い\yA Y\else N\fi} ++ ++\ifx\ucs\undefined\else ++ \kcatcode"100=16 ++ \message{upTeX} ++ \def\xA{Ā}% U+0100 ++ \def\xB{ā}% U+0101 ++ \message{\if \xA\relax Y\else N\fi} ++ \message{\if \xB\relax Y\else N\fi} ++ \message{\ifcat\xA\relax Y\else N\fi} ++ \message{\ifcat\xB\relax Y\else N\fi} ++\fi ++\end ++ ++ +diff -Naur a/texk/web2c/uptexdir/upbibtex.ch b/texk/web2c/uptexdir/upbibtex.ch +--- a/texk/web2c/uptexdir/upbibtex.ch 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/upbibtex.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -3,7 +3,7 @@ + @d banner=='This is pBibTeX, Version 0.99d-j0.33' + @y + @d my_name=='upbibtex' +-@d banner=='This is upBibTeX, Version 0.99d-j0.33-u1.24' ++@d banner=='This is upBibTeX, Version 0.99d-j0.33-u1.25' + @z + + @x +diff -Naur a/texk/web2c/uptexdir/updvitype.ch b/texk/web2c/uptexdir/updvitype.ch +--- a/texk/web2c/uptexdir/updvitype.ch 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/updvitype.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -3,7 +3,7 @@ + @d banner=='This is pDVItype, Version 3.6-p0.4' + @y + @d my_name=='updvitype' +-@d banner=='This is upDVItype, Version 3.6-p0.4-u1.24' ++@d banner=='This is upDVItype, Version 3.6-p0.4-u1.25' + @z + + @x procedure initialize +diff -Naur a/texk/web2c/uptexdir/uppltotf.ch b/texk/web2c/uptexdir/uppltotf.ch +--- a/texk/web2c/uptexdir/uppltotf.ch 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/uppltotf.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -3,7 +3,7 @@ + @d banner=='This is pPLtoTF, Version 3.6-p2.0' + @y + @d my_name=='uppltotf' +-@d banner=='This is upPLtoTF, Version 3.6-p2.0-u1.24' ++@d banner=='This is upPLtoTF, Version 3.6-p2.0-u1.25' + @z + + @x +diff -Naur a/texk/web2c/uptexdir/uptex-m.ch b/texk/web2c/uptexdir/uptex-m.ch +--- a/texk/web2c/uptexdir/uptex-m.ch 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/uptex-m.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -1,4 +1,4 @@ +-% This is a change file for upTeX u1.24 ++% This is a change file for upTeX u1.25 + % By Takuji Tanaka. + % + % (02/26/2007) TTK upTeX u0.01 +@@ -39,6 +39,8 @@ + % (2018-01-21) HK Added \uptexversion primitive and co. + % (2018-02-24) TTK upTeX u1.23 + % (2019-02-23) TTK upTeX u1.24 ++% (2019-05-06) HK Hironori Kitagawa fixed a bug in \if. ++% (2019-05-06) TTK upTeX u1.25 + + @x upTeX: banner + {printed when \pTeX\ starts} +@@ -46,8 +48,8 @@ + {printed when \pTeX\ starts} + @# + @d upTeX_version=1 +-@d upTeX_revision==".24" +-@d upTeX_version_string=='-u1.24' {current u\pTeX\ version} ++@d upTeX_revision==".25" ++@d upTeX_version_string=='-u1.25' {current u\pTeX\ version} + @# + @d upTeX_banner=='This is upTeX, Version 3.14159265',pTeX_version_string,upTeX_version_string + @d upTeX_banner_k==upTeX_banner +@@ -142,6 +144,7 @@ + @d max_quarterword=255 {largest allowable value in a |quarterword|} + @d min_halfword==-@"FFFFFFF {smallest allowable value in a |halfword|} + @d max_halfword==@"FFFFFFF {largest allowable value in a |halfword|} ++@d max_cjk_val=@"10000 + @y + @d min_quarterword=0 {smallest allowable value in a |quarterword|} + @d max_quarterword=@"FFFF {largest allowable value in a |quarterword|} +@@ -699,16 +702,24 @@ + + @x + if (cur_cmd=kanji)or(cur_cmd=kana)or(cur_cmd=other_kchar) then ++ begin n:=cur_chr; m:=kcat_code(kcatcodekey(n)); ++ end + @y + if (cur_cmd>=kanji)and(cur_cmd<=hangul) then ++ begin m:=cur_cmd; n:=cur_chr; ++ end + @z + + @x + get_x_token_or_active_char; + if (cur_cmd=kanji)or(cur_cmd=kana)or(cur_cmd=other_kchar) then ++ begin cur_cmd:=kcat_code(kcatcodekey(cur_chr)); ++ end + @y + get_x_token_or_active_char; + if (cur_cmd>=kanji)and(cur_cmd<=hangul) then ++ begin cur_cmd:=cur_cmd; ++ end {dummy} + @z + + @x +diff -Naur a/texk/web2c/uptexdir/uptex_version.h b/texk/web2c/uptexdir/uptex_version.h +--- a/texk/web2c/uptexdir/uptex_version.h 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/uptex_version.h 2019-05-31 22:00:04.010964033 +0100 +@@ -1 +1 @@ +-#define UPTEX_VERSION "u1.24" ++#define UPTEX_VERSION "u1.25" +diff -Naur a/texk/web2c/uptexdir/uptftopl.ch b/texk/web2c/uptexdir/uptftopl.ch +--- a/texk/web2c/uptexdir/uptftopl.ch 2019-02-23 01:59:36.000000000 +0000 ++++ b/texk/web2c/uptexdir/uptftopl.ch 2019-05-31 22:00:04.010964033 +0100 +@@ -3,7 +3,7 @@ + @d banner=='This is pTFtoPL, Version 3.3-p2.0' + @y + @d my_name=='uptftopl' +-@d banner=='This is upTFtoPL, Version 3.3-p2.0-u1.24' ++@d banner=='This is upTFtoPL, Version 3.3-p2.0-u1.25' + @z + + @x +diff -Naur a/texk/web2c/xetexdir/ChangeLog b/texk/web2c/xetexdir/ChangeLog +--- a/texk/web2c/xetexdir/ChangeLog 2019-01-02 22:41:45.000000000 +0000 ++++ b/texk/web2c/xetexdir/ChangeLog 2019-05-31 22:02:30.345042172 +0100 +@@ -1,3 +1,8 @@ ++2019-05-30 Khaled Hosny <dr.khaled.hosny@gmail.com> ++ ++ * XeTeXLayoutInterface.cpp: Do not use hb-icu if HarfBuzz ++ version is 2.5.0 or newer. ++ + 2019-01-03 Akira Kakuto <kakuto@fuk.kindai.ac.jp> + + * NEWS, xetex_version.h, xetex.web: Sync with the upstream. +diff -Naur a/texk/web2c/xetexdir/XeTeXLayoutInterface.cpp b/texk/web2c/xetexdir/XeTeXLayoutInterface.cpp +--- a/texk/web2c/xetexdir/XeTeXLayoutInterface.cpp 2017-03-12 08:47:36.000000000 +0000 ++++ b/texk/web2c/xetexdir/XeTeXLayoutInterface.cpp 2019-05-31 22:05:06.636170781 +0100 +@@ -2,7 +2,7 @@ + Part of the XeTeX typesetting system + Copyright (c) 1994-2008 by SIL International + Copyright (c) 2009-2012 by Jonathan Kew +- Copyright (c) 2012-2015 by Khaled Hosny ++ Copyright (c) 2012-2019 by Khaled Hosny + + SIL Author(s): Jonathan Kew + +@@ -39,8 +39,11 @@ + + #include <graphite2/Font.h> + #include <graphite2/Segment.h> ++#include <hb.h> + #include <hb-graphite2.h> ++#if !HB_VERSION_ATLEAST(2,5,0) + #include <hb-icu.h> ++#endif + #include <hb-ot.h> + + #include "XeTeX_web.h" +@@ -661,6 +664,7 @@ + free(engine->shaper); + } + ++#if !HB_VERSION_ATLEAST(2,5,0) + static unsigned int + _decompose_compat(hb_unicode_funcs_t* ufuncs, + hb_codepoint_t u, +@@ -677,8 +681,7 @@ + hb_unicode_funcs_set_decompose_compatibility_func(ufuncs, _decompose_compat, NULL, NULL); + return ufuncs; + } +- +-static hb_unicode_funcs_t* hbUnicodeFuncs = NULL; ++#endif + + int + layoutChars(XeTeXLayoutEngine engine, uint16_t chars[], int32_t offset, int32_t count, int32_t max, +@@ -699,11 +702,15 @@ + + script = hb_ot_tag_to_script (engine->script); + ++ hb_buffer_reset(engine->hbBuffer); ++ ++#if !HB_VERSION_ATLEAST(2,5,0) ++ static hb_unicode_funcs_t* hbUnicodeFuncs = NULL; + if (hbUnicodeFuncs == NULL) + hbUnicodeFuncs = _get_unicode_funcs(); +- +- hb_buffer_reset(engine->hbBuffer); + hb_buffer_set_unicode_funcs(engine->hbBuffer, hbUnicodeFuncs); ++#endif ++ + hb_buffer_add_utf16(engine->hbBuffer, chars, max, offset, count); + hb_buffer_set_direction(engine->hbBuffer, direction); + hb_buffer_set_script(engine->hbBuffer, script); |