matplotlib
diff --git a/‎lib/matplotlib/backends/backend_pdf.py
Lines changed: 1 addition & 1 deletion b/‎lib/matplotlib/backends/backend_pdf.py
Lines changed: 1 addition & 1 deletion
diff --git a/‎lib/matplotlib/dviread.py
Lines changed: 196 additions & 63 deletions b/‎lib/matplotlib/dviread.py
Lines changed: 196 additions & 63 deletions
@@ -991,7 +991,7 @@ def _embedTeXFont(self, fontinfo):
 
         # Widths
         widthsObject = self.reserveObject('font widths')
-        tfm = fontinfo.dvifont._tfm
+        tfm = fontinfo.dvifont._metrics
         # convert from TeX's 12.20 representation to 1/1000 text space units.
         widths = [(1000 * tfm.width.get(char, 0)) >> 20
                   for char in range(max(tfm.width, default=-1) + 1)]
 
@@ -30,7 +30,8 @@
 
 import numpy as np
 
-from matplotlib import _api, cbook
+from matplotlib import _api, cbook, textpath
+from matplotlib.ft2font import FT2Font, LoadFlags
 
 _log = logging.getLogger(__name__)
 
@@ -106,18 +107,27 @@ def font_effects(self):
     @property
     def glyph_name_or_index(self):
         """
-        Either the glyph name or the native charmap glyph index.
-
-        If :file:`pdftex.map` specifies an encoding for this glyph's font, that
-        is a mapping of glyph indices to Adobe glyph names; use it to convert
-        dvi indices to glyph names.  Callers can then convert glyph names to
-        glyph indices (with FT_Get_Name_Index/get_name_index), and load the
-        glyph using FT_Load_Glyph/load_glyph.
-
-        If :file:`pdftex.map` specifies no encoding, the indices directly map
-        to the font's "native" charmap; glyphs should directly load using
-        FT_Load_Char/load_char after selecting the native charmap.
+        The glyph name, the native charmap glyph index, or the raw glyph index.
+
+        If the font is a TrueType file (which can currently only happen for
+        DVI files generated by xetex or luatex), then this number is the raw
+        index of the glyph, which can be passed to FT_Load_Glyph/load_glyph.
+
+        Otherwise, the font is a PostScript font.  For such fonts, if
+        :file:`pdftex.map` specifies an encoding for this glyph's font,
+        that is a mapping of glyph indices to Adobe glyph names, which
+        is used by this property to convert dvi numbers to glyph names.
+        Callers can then convert glyph names to glyph indices (with
+        FT_Get_Name_Index/get_name_index), and load the glyph using
+        FT_Load_Glyph/load_glyph.
+
+        If :file:`pdftex.map` specifies no encoding for a PostScript font,
+        this number is an index to the font's "native" charmap; glyphs should
+        directly load using FT_Load_Char/load_char after selecting the native
+        charmap.
         """
+        # TODO: The last section is only true on luatex since luaotfload 3.15;
+        # add a version check in the tex file generated by texmanager.
         entry = self._get_pdftexmap_entry()
         return (_parse_enc(entry.encoding)[self.glyph]
                 if entry.encoding is not None else self.glyph)
@@ -399,7 +409,7 @@ def _put_char_real(self, char):
             scale = font._scale
             for x, y, f, g, w in font._vf[char].text:
                 newf = DviFont(scale=_mul1220(scale, f._scale),
-                               tfm=f._tfm, texname=f.texname, vf=f._vf)
+                               metrics=f._metrics, texname=f.texname, vf=f._vf)
                 self.text.append(Text(self.h + _mul1220(x, scale),
                                       self.v + _mul1220(y, scale),
                                       newf, g, newf._width_of(g)))
@@ -495,7 +505,27 @@ def _fnt_def(self, k, c, s, d, a, l):
 
     def _fnt_def_real(self, k, c, s, d, a, l):
         n = self.file.read(a + l)
-        fontname = n[-l:].decode('ascii')
+        fontname = n[-l:].decode("ascii")
+        # Note that checksum seems wrong?
+        if fontname.startswith("["):  # "[path]" or "[path]:key=value;..." form
+            path, sep, rest = fontname[1:].rpartition("]")
+            if not sep or rest[:1] not in ["", ":"]:
+                raise ValueError(f"Invalid modern font name: {fontname}")
+            flags = {}  # TODO: Actually record these flags.
+            if rest[1:]:
+                for kv in rest[1:].split(";"):
+                    key, _, value = kv.partition("=")  # must not rebind k (fonts key)
+                    if key == "index":
+                        if int(value) != 0:  # value is a str; compare numerically
+                            raise NotImplementedError(
+                                "Indexing TTC fonts is not supported yet")
+                    elif key in ["embolden", "slant", "extend"]:
+                        flags[key] = int(value) / 65536
+                    else:
+                        _log.warning("Ignoring invalid key-value pair: %r", kv)
+            metrics = TtfMetrics(path)
+            self.fonts[k] = DviFont(scale=s, metrics=metrics, texname=n, vf=None)
+            return
         try:
             tfm = _tfmfile(fontname)
         except FileNotFoundError as exc:
@@ -512,12 +542,12 @@ def _fnt_def_real(self, k, c, s, d, a, l):
             vf = _vffile(fontname)
         except FileNotFoundError:
             vf = None
-        self.fonts[k] = DviFont(scale=s, tfm=tfm, texname=n, vf=vf)
+        self.fonts[k] = DviFont(scale=s, metrics=tfm, texname=n, vf=vf)
 
     @_dispatch(247, state=_dvistate.pre, args=('u1', 'u4', 'u4', 'u4', 'u1'))
     def _pre(self, i, num, den, mag, k):
         self.file.read(k)  # comment in the dvi file
-        if i != 2:
+        if i not in [2, 7]:  # 2: pdftex, luatex; 7: xetex
             raise ValueError(f"Unknown dvi format {i}")
         if num != 25400000 or den != 7227 * 2**16:
             raise ValueError("Nonstandard units in dvi file")
@@ -538,13 +568,70 @@ def _post(self, _):
         # TODO: actually read the postamble and finale?
         # currently post_post just triggers closing the file
 
-    @_dispatch(249)
-    def _post_post(self, _):
+    @_dispatch(249, args=())
+    def _post_post(self):
+        raise NotImplementedError
+
+    @_dispatch(250, args=())
+    def _begin_reflect(self):
         raise NotImplementedError
 
-    @_dispatch(min=250, max=255)
-    def _malformed(self, offset):
-        raise ValueError(f"unknown command: byte {250 + offset}")
+    @_dispatch(251, args=())
+    def _end_reflect(self):
+        raise NotImplementedError
+
+    @_dispatch(252, args=())
+    def _define_native_font(self):
+        # Fields are read in file order; optional ones are gated by flag bits.
+        fontnum = self._read_arg(4, signed=False)
+        scale = self._read_arg(4, signed=False)
+        flags = self._read_arg(2, signed=False)
+        namelen = self._read_arg(1, signed=False)
+        name = self.file.read(namelen)
+        ttc_index = self._read_arg(4, signed=False)
+        # TODO: Actually record these flags.
+        if flags & 0x0200:
+            rgba = [self._read_arg(1, signed=False) for _ in range(4)]
+        if flags & 0x1000:
+            extend = self._read_arg(4, signed=True) / 65536
+        if flags & 0x2000:
+            slant = self._read_arg(4, signed=True) / 65536
+        if flags & 0x4000:
+            embolden = self._read_arg(4, signed=True) / 65536
+        if ttc_index != 0:
+            raise NotImplementedError("Indexing TTC fonts is not supported yet")
+        self.fonts[fontnum] = DviFont(scale=scale, metrics=TtfMetrics(name),
+                                      texname=b"[" + name + b"]", vf=None)
+
+    @_dispatch(253, args=())
+    def _set_glyphs(self):
+        advance = self._read_arg(4, signed=False)
+        count = self._read_arg(2, signed=False)
+        offsets = [self._read_arg(4, signed=True) for _ in range(2 * count)]
+        glyphs = [self._read_arg(2, signed=False) for _ in range(count)]
+        font = self.fonts[self.f]
+        for dx, dy, glyph in zip(offsets[::2], offsets[1::2], glyphs):  # x, y pairs
+            self.text.append(Text(self.h + dx, self.v + dy,
+                                  font, glyph, font._width_of(glyph)))
+        self.h += advance
+
+    @_dispatch(254, args=())
+    def _set_text_and_glyphs(self):
+        nchars = self._read_arg(2, signed=False)
+        self.file.read(2 * nchars)  # utf16 text; read past, only glyphs are used
+        advance = self._read_arg(4, signed=False)
+        count = self._read_arg(2, signed=False)
+        offsets = [self._read_arg(4, signed=True) for _ in range(2 * count)]
+        glyphs = [self._read_arg(2, signed=False) for _ in range(count)]
+        font = self.fonts[self.f]
+        for dx, dy, glyph in zip(offsets[::2], offsets[1::2], glyphs):  # x, y pairs
+            self.text.append(Text(self.h + dx, self.v + dy,
+                                  font, glyph, font._width_of(glyph)))
+        self.h += advance
+
+    @_dispatch(255)
+    def _malformed(self, raw):
+        raise ValueError("unknown command: byte 255")
 
 
 class DviFont:
@@ -562,7 +649,7 @@ class DviFont:
     ----------
     scale : float
         Factor by which the font is scaled from its natural size.
-    tfm : Tfm
+    metrics : Tfm | TtfMetrics
         TeX font metrics for this font
     texname : bytes
        Name of the font as used internally by TeX and friends, as an ASCII
@@ -578,12 +665,12 @@ class DviFont:
        Size of the font in Adobe points, converted from the slightly
        smaller TeX points.
     """
-    __slots__ = ('texname', 'size', '_scale', '_vf', '_tfm')
+    __slots__ = ('texname', 'size', '_scale', '_vf', '_metrics')
 
-    def __init__(self, scale, tfm, texname, vf):
+    def __init__(self, scale, metrics, texname, vf):
         _api.check_isinstance(bytes, texname=texname)
         self._scale = scale
-        self._tfm = tfm
+        self._metrics = metrics
         self.texname = texname
         self._vf = vf
         self.size = scale * (72.0 / (72.27 * 2**16))
@@ -604,32 +691,30 @@ def __repr__(self):
 
     def _width_of(self, char):
         """Width of char in dvi units."""
-        width = self._tfm.width.get(char, None)
-        if width is not None:
-            return _mul1220(width, self._scale)
-        _log.debug('No width for char %d in font %s.', char, self.texname)
-        return 0
+        whd = self._metrics.get_metrics(char)
+        if whd is not None:
+            return _mul1220(whd.width, self._scale)
+        _log.debug('No width for char %d in font %s.', char, self.texname)
+        return 0
 
     def _height_depth_of(self, char):
         """Height and depth of char in dvi units."""
-        result = []
-        for metric, name in ((self._tfm.height, "height"),
-                             (self._tfm.depth, "depth")):
-            value = metric.get(char, None)
-            if value is None:
-                _log.debug('No %s for char %d in font %s',
-                           name, char, self.texname)
-                result.append(0)
-            else:
-                result.append(_mul1220(value, self._scale))
+        whd = self._metrics.get_metrics(char)
+        if whd is None:
+            _log.debug('No metrics for char %d in font %s', char, self.texname)
+            return [0, 0]
+        # A list rather than a tuple, because the depth entry may be
+        # overwritten below.
+        height_depth = [_mul1220(value, self._scale)
+                        for value in (whd.height, whd.depth)]
         # cmsyXX (symbols font) glyph 0 ("minus") has a nonzero descent
         # so that TeX aligns equations properly
         # (https://tex.stackexchange.com/q/526103/)
         # but we actually care about the rasterization depth to align
         # the dvipng-generated images.
         if re.match(br'^cmsy\d+$', self.texname) and char == 0:
-            result[-1] = 0
-        return result
+            height_depth[-1] = 0
+        return height_depth
 
 
 class Vf(Dvi):
@@ -761,6 +846,9 @@ def _mul1220(num1, num2):
     return (num1*num2) >> 20
 
 
+WHD = namedtuple('WHD', 'width height depth')
+
+
 class Tfm:
     """
     A TeX Font Metric file.
@@ -783,7 +871,7 @@ class Tfm:
        specified in the dvi file. These are dicts because indexing may
        not start from 0.
     """
-    __slots__ = ('checksum', 'design_size', 'width', 'height', 'depth')
+    __slots__ = ('checksum', 'design_size', '_whds', 'widths')
 
     def __init__(self, filename):
         _log.debug('opening tfm file %s', filename)
@@ -799,15 +887,42 @@ def __init__(self, filename):
             widths = struct.unpack(f'!{nw}i', file.read(4*nw))
             heights = struct.unpack(f'!{nh}i', file.read(4*nh))
             depths = struct.unpack(f'!{nd}i', file.read(4*nd))
-        self.width = {}
-        self.height = {}
-        self.depth = {}
+        self._whds = {}
         for idx, char in enumerate(range(bc, ec+1)):
             byte0 = char_info[4*idx]
             byte1 = char_info[4*idx+1]
-            self.width[char] = widths[byte0]
-            self.height[char] = heights[byte1 >> 4]
-            self.depth[char] = depths[byte1 & 0xf]
+            self._whds[char] = WHD(
+                widths[byte0], heights[byte1 >> 4], depths[byte1 & 0xf])
+        self.widths = [(1000 * self._whds[c].width if c in self._whds else 0) >> 20
+                       for c in range(max(self._whds, default=-1) + 1)]  # inclusive
+
+    def get_metrics(self, char):
+        return self._whds.get(char)  # None, not KeyError: DviFont checks `is None`
+
+    width = _api.deprecated("3.11")(  # deprecated dict views built from _whds
+        property(lambda self: {c: m.width for c, m in self._whds.items()}))
+    height = _api.deprecated("3.11")(
+        property(lambda self: {c: m.height for c, m in self._whds.items()}))
+    depth = _api.deprecated("3.11")(
+        property(lambda self: {c: m.depth for c, m in self._whds.items()}))
+
+
+class TtfMetrics:
+    """Glyph metrics read from a font file through FT2Font."""
+
+    def __init__(self, filename):
+        self._face = FT2Font(filename, hinting_factor=1)  # Manage closing?
+
+    def get_metrics(self, char):
+        """Return the WHD of glyph *char*, in units of em / 2**20 (truncated)."""
+        # int() truncates, like the truncating bitshift in _mul1220.  When upem
+        # is 2048 the conversion is exact; when it is 1000 (e.g.
+        # lmroman10-regular.otf) it is not, and the proper truncation rule is
+        # still to be figured out.
+        em = self._face.units_per_EM  # Usually 2048 or 1000.
+        glyph = self._face.load_glyph(char, LoadFlags.NO_SCALE)
+        return WHD(*(int(units / em * 2**20) for units in (
+            glyph.horiAdvance, glyph.height, glyph.height - glyph.horiBearingY)))
 
 
 PsFont = namedtuple('PsFont', 'texname psname effects encoding filename')
@@ -1002,8 +1117,7 @@ def _parse_enc(path):
     Returns
     -------
     list
-        The nth entry of the list is the PostScript glyph name of the nth
-        glyph.
+        The nth list item is the PostScript glyph name of the nth glyph.
     """
     no_comments = re.sub("%.*", "", Path(path).read_text(encoding="ascii"))
     array = re.search(r"(?s)\[(.*)\]", no_comments).group(1)
@@ -1108,26 +1222,45 @@ def _fontfile(cls, suffix, texname):
     from argparse import ArgumentParser
     import itertools
 
+    import fontTools.agl
+
     parser = ArgumentParser()
     parser.add_argument("filename")
     parser.add_argument("dpi", nargs="?", type=float, default=None)
     args = parser.parse_args()
     with Dvi(args.filename, args.dpi) as dvi:
         fontmap = PsfontsMap(find_tex_file('pdftex.map'))
         for page in dvi:
-            print(f"=== new page === "
+            print(f"=== NEW PAGE === "
                   f"(w: {page.width}, h: {page.height}, d: {page.descent})")
-            for font, group in itertools.groupby(
-                    page.text, lambda text: text.font):
-                print(f"font: {font.texname.decode('latin-1')!r}\t"
-                      f"scale: {font._scale / 2 ** 20}")
-                print("x", "y", "glyph", "chr", "w", "(glyphs)", sep="\t")
+            print("--- GLYPHS ---")
+            for font, group in itertools.groupby(page.text, lambda text: text.font):
+                font_name = font.texname.decode("latin-1")
+                filename = (font_name[1:-1] if font_name.startswith("[")
+                            else fontmap[font.texname].filename)
+                if font_name.startswith("["):
+                    print(f"font: {font_name}")
+                else:
+                    print(f"font: {font_name} at {filename}")
+                print(f"scale: {font._scale / 2 ** 20}")
+                print(" ".join(map("{:>11}".format, ["x", "y", "glyph", "chr", "w"])))
+                face = FT2Font(filename)
                 for text in group:
-                    print(text.x, text.y, text.glyph,
-                          chr(text.glyph) if chr(text.glyph).isprintable()
-                          else ".",
-                          text.width, sep="\t")
+                    if font_name.startswith("["):
+                        glyph_name = face.get_glyph_name(text.glyph)
+                    else:
+                        if isinstance(text.glyph_name_or_index, str):
+                            glyph_name = text.glyph_name_or_index
+                        else:
+                            textpath.TextToPath._select_native_charmap(face)
+                            glyph_name = face.get_glyph_name(
+                                face.get_char_index(text.glyph))
+                    glyph_str = fontTools.agl.toUnicode(glyph_name)
+                    print(" ".join(map("{:>11}".format, [
+                        text.x, text.y, text.glyph, glyph_str, text.width])))
             if page.boxes:
-                print("x", "y", "h", "w", "", "(boxes)", sep="\t")
+                print("--- BOXES ---")
+                print(" ".join(map("{:>11}".format, ["x", "y", "h", "w"])))
                 for box in page.boxes:
-                    print(box.x, box.y, box.height, box.width, sep="\t")
+                    print(" ".join(map("{:>11}".format, [
+                        box.x, box.y, box.height, box.width])))