fonttools/Lib/fontTools/ttLib/tables/O_S_2f_2.py

from fontTools.misc import sstruct
from fontTools.misc.roundTools import otRound
from fontTools.misc.textTools import safeEval, num2binary, binary2num
from fontTools.ttLib.tables import DefaultTable
import bisect
import logging


# Module-level logger, used below for non-fatal warnings about 'OS/2' data.
log = logging.getLogger(__name__)

# panose classification
#
# sstruct format describing the contents of the OS/2 'panose' field: ten
# fields, each with the type code "B". The Panose class below takes its
# attribute names from this format, and the OS/2 table uses it to unpack
# (decompile) and pack (compile) the 'panose' field.

panoseFormat = """
	bFamilyType:        B
	bSerifStyle:        B
	bWeight:            B
	bProportion:        B
	bContrast:          B
	bStrokeVariation:   B
	bArmStyle:          B
	bLetterForm:        B
	bMidline:           B
	bXHeight:           B
"""


class Panose(object):
    """Container for the PANOSE classification values of an OS/2 table.

    Instances carry one attribute per field named in ``panoseFormat``.
    """

    def __init__(self, **kwargs):
        """Initialize every panose field from *kwargs*, defaulting to 0.

        Raises TypeError if a keyword does not name a panose field.
        """
        fieldNames = sstruct.getformat(panoseFormat)[1]
        for fieldName in fieldNames:
            setattr(self, fieldName, kwargs.pop(fieldName, 0))
        # Anything still left in kwargs was not a known field name.
        if kwargs:
            k = next(iter(kwargs))
            raise TypeError(f"Panose() got an unexpected keyword argument {k!r}")

    def toXML(self, writer, ttFont):
        """Write one simple tag per panose field, in format order."""
        fieldNames = sstruct.getformat(panoseFormat)[1]
        for fieldName in fieldNames:
            fieldValue = getattr(self, fieldName)
            writer.simpletag(fieldName, value=fieldValue)
            writer.newline()

    def fromXML(self, name, attrs, content, ttFont):
        """Set attribute *name* to the evaluated 'value' XML attribute."""
        parsed = safeEval(attrs["value"])
        setattr(self, name, parsed)


# 'sfnt' OS/2 and Windows Metrics table - 'OS/2'

# Fields present in every version of the table. Version 0 consists of
# exactly these fields; later versions append the "addition" fields below.
OS2_format_0 = """
	>   # big endian
	version:                H       # version
	xAvgCharWidth:          h       # average character width
	usWeightClass:          H       # degree of thickness of strokes
	usWidthClass:           H       # aspect ratio
	fsType:                 H       # type flags
	ySubscriptXSize:        h       # subscript horizontal font size
	ySubscriptYSize:        h       # subscript vertical font size
	ySubscriptXOffset:      h       # subscript x offset
	ySubscriptYOffset:      h       # subscript y offset
	ySuperscriptXSize:      h       # superscript horizontal font size
	ySuperscriptYSize:      h       # superscript vertical font size
	ySuperscriptXOffset:    h       # superscript x offset
	ySuperscriptYOffset:    h       # superscript y offset
	yStrikeoutSize:         h       # strikeout size
	yStrikeoutPosition:     h       # strikeout position
	sFamilyClass:           h       # font family class and subclass
	panose:                 10s     # panose classification number
	ulUnicodeRange1:        L       # character range
	ulUnicodeRange2:        L       # character range
	ulUnicodeRange3:        L       # character range
	ulUnicodeRange4:        L       # character range
	achVendID:              4s      # font vendor identification
	fsSelection:            H       # font selection flags
	usFirstCharIndex:       H       # first unicode character index
	usLastCharIndex:        H       # last unicode character index
	sTypoAscender:          h       # typographic ascender
	sTypoDescender:         h       # typographic descender
	sTypoLineGap:           h       # typographic line gap
	usWinAscent:            H       # Windows ascender
	usWinDescent:           H       # Windows descender
"""

# Fields that follow the version 0 fields in a version 1 table.
OS2_format_1_addition = """
	ulCodePageRange1:   L
	ulCodePageRange2:   L
"""

# Fields that follow the version 0 fields in version 2, 3 and 4 tables
# (the version 1 fields plus five more).
OS2_format_2_addition = (
    OS2_format_1_addition
    + """
	sxHeight:           h
	sCapHeight:         h
	usDefaultChar:      H
	usBreakChar:        H
	usMaxContext:       H
"""
)

# Fields that follow the version 0 fields in a version 5 table
# (the version 2 fields plus the optical point size range).
OS2_format_5_addition = (
    OS2_format_2_addition
    + """
	usLowerOpticalPointSize:    H
	usUpperOpticalPointSize:    H
"""
)

# Byte-order marker line, prepended to the "addition" formats below.
bigendian = "	>	# big endian\n"

# Complete formats (version 0 fields + additions), used when packing a whole
# table and when listing field names. These are built first, from the
# additions that do not yet carry their own byte-order marker.
OS2_format_1 = OS2_format_0 + OS2_format_1_addition
OS2_format_2 = OS2_format_0 + OS2_format_2_addition
OS2_format_5 = OS2_format_0 + OS2_format_5_addition
# The "addition" names are then rebound with the big-endian marker in front,
# so that decompile() can unpack them on their own from the data remaining
# after the version 0 fields.
OS2_format_1_addition = bigendian + OS2_format_1_addition
OS2_format_2_addition = bigendian + OS2_format_2_addition
OS2_format_5_addition = bigendian + OS2_format_5_addition


class table_O_S_2f_2(DefaultTable.DefaultTable):

    """the OS/2 table"""

    dependencies = ["head"]

    def decompile(self, data, ttFont):
        """Populate this table's attributes from binary 'OS/2' table *data*.

        The version 0 fields are unpacked first, followed by the extra fields
        that belong to ``self.version``. The 'panose' field is finally
        converted into a ``Panose`` object.

        Raises ``ttLib.TTLibError`` for a version other than 0-5. Left-over
        bytes only trigger a logged warning.
        """
        _, remaining = sstruct.unpack2(OS2_format_0, data, self)

        version = self.version
        if version == 5:
            _, remaining = sstruct.unpack2(OS2_format_5_addition, remaining, self)
            # Raw values are divided by 20 here; compile() multiplies them by
            # 20 again (per the OpenType spec these are stored in TWIPs).
            self.usLowerOpticalPointSize /= 20
            self.usUpperOpticalPointSize /= 20
        elif version in (2, 3, 4):
            _, remaining = sstruct.unpack2(OS2_format_2_addition, remaining, self)
        elif version == 1:
            _, remaining = sstruct.unpack2(OS2_format_1_addition, remaining, self)
        elif version != 0:
            from fontTools import ttLib

            raise ttLib.TTLibError(
                "unknown format for OS/2 table: version %s" % version
            )

        if len(remaining) > 0:
            log.warning("too much 'OS/2' table data")

        # Replace the raw panose bytes with a structured Panose object.
        rawPanose = self.panose
        self.panose = sstruct.unpack(panoseFormat, rawPanose, Panose())

    def compile(self, ttFont):
        """Return the binary 'OS/2' table data for this table.

        Before packing, 'usFirstCharIndex' and 'usLastCharIndex' are refreshed
        from the font's cmap, and a warning is logged for each suspicious
        'fsSelection' setting that is detected (the table is compiled anyway).

        Raises ``ttLib.TTLibError`` if ``self.version`` is not one of 0-5.
        ``self.panose`` is always left as the original Panose object, also
        when packing fails.
        """
        self.updateFirstAndLastCharIndex(ttFont)
        panose = self.panose
        head = ttFont["head"]
        # NOTE: the two checks against 'head' only fire when the bit is set in
        # fsSelection but clear in macStyle, not the other way around.
        if (self.fsSelection & 1) and not (head.macStyle & 1 << 1):
            log.warning(
                "fsSelection bit 0 (italic) and "
                "head table macStyle bit 1 (italic) should match"
            )
        if (self.fsSelection & 1 << 5) and not (head.macStyle & 1):
            log.warning(
                "fsSelection bit 5 (bold) and "
                "head table macStyle bit 0 (bold) should match"
            )
        # '1 + (1 << 5)' is the mask for bits 0 and 5 ('+' binds tighter than '&')
        if (self.fsSelection & 1 << 6) and (self.fsSelection & 1 + (1 << 5)):
            log.warning(
                "fsSelection bit 6 (regular) is set, "
                "bits 0 (italic) and 5 (bold) must be clear"
            )
        if self.version < 4 and self.fsSelection & 0b1110000000:
            log.warning(
                "fsSelection bits 7, 8 and 9 are only defined in "
                "OS/2 table version 4 and up: version %s",
                self.version,
            )
        # The table formats declare 'panose' as a 10-byte string, so the
        # Panose object is temporarily replaced by its packed form.
        self.panose = sstruct.pack(panoseFormat, self.panose)
        try:
            if self.version == 0:
                data = sstruct.pack(OS2_format_0, self)
            elif self.version == 1:
                data = sstruct.pack(OS2_format_1, self)
            elif self.version in (2, 3, 4):
                data = sstruct.pack(OS2_format_2, self)
            elif self.version == 5:
                # Pack from a copy so the attributes keep the values that
                # decompile() exposes (raw value / 20).
                d = self.__dict__.copy()
                d["usLowerOpticalPointSize"] = round(self.usLowerOpticalPointSize * 20)
                d["usUpperOpticalPointSize"] = round(self.usUpperOpticalPointSize * 20)
                data = sstruct.pack(OS2_format_5, d)
            else:
                from fontTools import ttLib

                raise ttLib.TTLibError(
                    "unknown format for OS/2 table: version %s" % self.version
                )
        finally:
            # Restore the Panose object even if packing raised; otherwise the
            # table would be left holding raw bytes in 'panose'.
            self.panose = panose
        return data

    def toXML(self, writer, ttFont):
        """Write every field of this table to *writer*, one element per field.

        The set of fields is chosen by ``self.version``; any version other
        than 1-5 is written with the version 0 field list. 'panose' becomes
        a nested element, range and flag fields are written through
        ``num2binary``, and 'achVendID' is written as its repr without the
        surrounding quotes.
        """
        writer.comment(
            "The fields 'usFirstCharIndex' and 'usLastCharIndex'\n"
            "will be recalculated by the compiler"
        )
        writer.newline()

        formatsByVersion = {
            1: OS2_format_1,
            2: OS2_format_2,
            3: OS2_format_2,
            4: OS2_format_2,
            5: OS2_format_5,
        }
        tableFormat = formatsByVersion.get(self.version, OS2_format_0)
        fieldNames = sstruct.getformat(tableFormat)[1]

        rangeFields = (
            "ulUnicodeRange1",
            "ulUnicodeRange2",
            "ulUnicodeRange3",
            "ulUnicodeRange4",
            "ulCodePageRange1",
            "ulCodePageRange2",
        )
        flagFields = ("fsType", "fsSelection")

        for fieldName in fieldNames:
            fieldValue = getattr(self, fieldName)
            if fieldName == "panose":
                # The Panose object writes its own child elements.
                writer.begintag("panose")
                writer.newline()
                fieldValue.toXML(writer, ttFont)
                writer.endtag("panose")
            elif fieldName in rangeFields:
                writer.simpletag(fieldName, value=num2binary(fieldValue))
            elif fieldName in flagFields:
                writer.simpletag(fieldName, value=num2binary(fieldValue, 16))
            elif fieldName == "achVendID":
                # Strip the first and last character of the repr.
                writer.simpletag(fieldName, value=repr(fieldValue)[1:-1])
            else:
                writer.simpletag(fieldName, value=fieldValue)
            writer.newline()

    def fromXML(self, name, attrs, content, ttFont):
        """Set the field called *name* from one parsed XML element.

        'panose' elements are rebuilt into a fresh ``Panose`` object from
        their child elements. Range and flag fields are read with
        ``binary2num``, 'achVendID' is evaluated as a triple-quoted string,
        and everything else goes through ``safeEval``.
        """
        if name == "panose":
            panose = Panose()
            self.panose = panose
            # Only tuple items are child elements; other content is skipped.
            children = (item for item in content if isinstance(item, tuple))
            for childName, childAttrs, childContent in children:
                panose.fromXML(childName, childAttrs, childContent, ttFont)
            return

        binaryFields = (
            "ulUnicodeRange1",
            "ulUnicodeRange2",
            "ulUnicodeRange3",
            "ulUnicodeRange4",
            "ulCodePageRange1",
            "ulCodePageRange2",
            "fsType",
            "fsSelection",
        )
        rawValue = attrs["value"]
        if name in binaryFields:
            parsed = binary2num(rawValue)
        elif name == "achVendID":
            parsed = safeEval("'''" + rawValue + "'''")
        else:
            parsed = safeEval(rawValue)
        setattr(self, name, parsed)

    def updateFirstAndLastCharIndex(self, ttFont):
        if "cmap" not in ttFont:
            return
        codes = set()
        for table in getattr(ttFont["cmap"], "tables", []):
            if table.isUnicode():
                codes.update(table.cmap.keys())
        if codes:
            minCode = min(codes)
            maxCode = max(codes)
            # USHORT cannot hold codepoints greater than 0xFFFF
            self.usFirstCharIndex = min(0xFFFF, minCode)
            self.usLastCharIndex = min(0xFFFF, maxCode)

    # misspelled attributes kept for legacy reasons
    #
    # Each property below simply reads from / writes to the correctly
    # spelled attribute, so both spellings always hold the same value.

    @property
    def usMaxContex(self):
        """Legacy misspelled alias of 'usMaxContext'."""
        return self.usMaxContext

    @usMaxContex.setter
    def usMaxContex(self, value):
        self.usMaxContext = value

    @property
    def fsFirstCharIndex(self):
        """Legacy alias of 'usFirstCharIndex'."""
        return self.usFirstCharIndex

    @fsFirstCharIndex.setter
    def fsFirstCharIndex(self, value):
        self.usFirstCharIndex = value

    @property
    def fsLastCharIndex(self):
        """Legacy alias of 'usLastCharIndex'."""
        return self.usLastCharIndex

    @fsLastCharIndex.setter
    def fsLastCharIndex(self, value):
        self.usLastCharIndex = value

    def getUnicodeRanges(self):
        """Return the set of 'ulUnicodeRange*' bits currently enabled."""
        bits = set()
        ul1, ul2 = self.ulUnicodeRange1, self.ulUnicodeRange2
        ul3, ul4 = self.ulUnicodeRange3, self.ulUnicodeRange4
        for i in range(32):
            if ul1 & (1 << i):
                bits.add(i)
            if ul2 & (1 << i):
                bits.add(i + 32)
            if ul3 & (1 << i):
                bits.add(i + 64)
            if ul4 & (1 << i):
                bits.add(i + 96)
        return bits

    def setUnicodeRanges(self, bits):
        """Set the 'ulUnicodeRange*' fields to the specified 'bits'."""
        ul1, ul2, ul3, ul4 = 0, 0, 0, 0
        for bit in bits:
            if 0 <= bit < 32:
                ul1 |= 1 << bit
            elif 32 <= bit < 64:
                ul2 |= 1 << (bit - 32)
            elif 64 <= bit < 96:
                ul3 |= 1 << (bit - 64)
            elif 96 <= bit < 123:
                ul4 |= 1 << (bit - 96)
            else:
                raise ValueError("expected 0 <= int <= 122, found: %r" % bit)
        self.ulUnicodeRange1, self.ulUnicodeRange2 = ul1, ul2
        self.ulUnicodeRange3, self.ulUnicodeRange4 = ul3, ul4

    def recalcUnicodeRanges(self, ttFont, pruneOnly=False):
        """Recalculate the 'ulUnicodeRange*' bits from the font's cmap.

        The codepoints of all Unicode cmap subtables are intersected with the
        Unicode block ranges defined in the OpenType specification (v1.7). By
        default a bit is set whenever at least ONE codepoint falls in its
        ranges. If 'pruneOnly' is True, no bit is newly set: the bits that
        are currently enabled are kept unless they have NO intersection.

        The resulting set of bits is stored and returned.
        """
        codepoints = {
            code
            for subtable in ttFont["cmap"].tables
            if subtable.isUnicode()
            for code in subtable.cmap.keys()
        }
        if not pruneOnly:
            bits = intersectUnicodeRanges(codepoints)
        else:
            unused = intersectUnicodeRanges(codepoints, inverse=True)
            bits = self.getUnicodeRanges() - unused
        self.setUnicodeRanges(bits)
        return bits

    def getCodePageRanges(self):
        """Return the set of 'ulCodePageRange*' bits currently enabled."""
        bits = set()
        ul1, ul2 = self.ulCodePageRange1, self.ulCodePageRange2
        for i in range(32):
            if ul1 & (1 << i):
                bits.add(i)
            if ul2 & (1 << i):
                bits.add(i + 32)
        return bits

    def setCodePageRanges(self, bits):
        """Set the 'ulCodePageRange*' fields to the specified 'bits'."""
        ul1, ul2 = 0, 0
        for bit in bits:
            if 0 <= bit < 32:
                ul1 |= 1 << bit
            elif 32 <= bit < 64:
                ul2 |= 1 << (bit - 32)
            else:
                raise ValueError(f"expected 0 <= int <= 63, found: {bit:r}")
        self.ulCodePageRange1, self.ulCodePageRange2 = ul1, ul2

    def recalcCodePageRanges(self, ttFont, pruneOnly=False):
        """Recalculate the 'ulCodePageRange*' bits from the font's cmap.

        The bits are computed by ``calcCodePageRanges`` from the codepoints
        of all Unicode cmap subtables. If 'pruneOnly' is True, only bits that
        are also currently enabled are kept. The resulting set of bits is
        stored and returned.
        """
        codepoints = {
            code
            for subtable in ttFont["cmap"].tables
            if subtable.isUnicode()
            for code in subtable.cmap.keys()
        }
        bits = calcCodePageRanges(codepoints)
        if pruneOnly:
            bits.intersection_update(self.getCodePageRanges())
        # when no codepage ranges can be enabled, fall back to enabling bit 0
        # (Latin 1) so that the font works in MS Word:
        # https://github.com/googlei18n/fontmake/issues/468
        bits = bits or {0}
        self.setCodePageRanges(bits)
        return bits

    def recalcAvgCharWidth(self, ttFont):
        """Recalculate xAvgCharWidth using metrics from ttFont's 'hmtx' table.

        Set it to 0 if the unlikely event 'hmtx' table is not found.
        """
        avg_width = 0
        hmtx = ttFont.get("hmtx")
        if hmtx is not None:
            widths = [width for width, _ in hmtx.metrics.values() if width > 0]
            if widths:
                avg_width = otRound(sum(widths) / len(widths))
        self.xAvgCharWidth = avg_width
        return avg_width


# Unicode ranges data from the OpenType OS/2 table specification v1.7
#
# The position of an entry in the outer tuple is its 'ulUnicodeRange' bit
# number (0-122). Each entry is a tuple of one or more Unicode blocks, each
# given as (block name, (first codepoint, last codepoint)), where both
# codepoints are inclusive.

OS2_UNICODE_RANGES = (
    (("Basic Latin", (0x0000, 0x007F)),),
    (("Latin-1 Supplement", (0x0080, 0x00FF)),),
    (("Latin Extended-A", (0x0100, 0x017F)),),
    (("Latin Extended-B", (0x0180, 0x024F)),),
    (
        ("IPA Extensions", (0x0250, 0x02AF)),
        ("Phonetic Extensions", (0x1D00, 0x1D7F)),
        ("Phonetic Extensions Supplement", (0x1D80, 0x1DBF)),
    ),
    (
        ("Spacing Modifier Letters", (0x02B0, 0x02FF)),
        ("Modifier Tone Letters", (0xA700, 0xA71F)),
    ),
    (
        ("Combining Diacritical Marks", (0x0300, 0x036F)),
        ("Combining Diacritical Marks Supplement", (0x1DC0, 0x1DFF)),
    ),
    (("Greek and Coptic", (0x0370, 0x03FF)),),
    (("Coptic", (0x2C80, 0x2CFF)),),
    (
        ("Cyrillic", (0x0400, 0x04FF)),
        ("Cyrillic Supplement", (0x0500, 0x052F)),
        ("Cyrillic Extended-A", (0x2DE0, 0x2DFF)),
        ("Cyrillic Extended-B", (0xA640, 0xA69F)),
    ),
    (("Armenian", (0x0530, 0x058F)),),
    (("Hebrew", (0x0590, 0x05FF)),),
    (("Vai", (0xA500, 0xA63F)),),
    (("Arabic", (0x0600, 0x06FF)), ("Arabic Supplement", (0x0750, 0x077F))),
    (("NKo", (0x07C0, 0x07FF)),),
    (("Devanagari", (0x0900, 0x097F)),),
    (("Bengali", (0x0980, 0x09FF)),),
    (("Gurmukhi", (0x0A00, 0x0A7F)),),
    (("Gujarati", (0x0A80, 0x0AFF)),),
    (("Oriya", (0x0B00, 0x0B7F)),),
    (("Tamil", (0x0B80, 0x0BFF)),),
    (("Telugu", (0x0C00, 0x0C7F)),),
    (("Kannada", (0x0C80, 0x0CFF)),),
    (("Malayalam", (0x0D00, 0x0D7F)),),
    (("Thai", (0x0E00, 0x0E7F)),),
    (("Lao", (0x0E80, 0x0EFF)),),
    (("Georgian", (0x10A0, 0x10FF)), ("Georgian Supplement", (0x2D00, 0x2D2F))),
    (("Balinese", (0x1B00, 0x1B7F)),),
    (("Hangul Jamo", (0x1100, 0x11FF)),),
    (
        ("Latin Extended Additional", (0x1E00, 0x1EFF)),
        ("Latin Extended-C", (0x2C60, 0x2C7F)),
        ("Latin Extended-D", (0xA720, 0xA7FF)),
    ),
    (("Greek Extended", (0x1F00, 0x1FFF)),),
    (
        ("General Punctuation", (0x2000, 0x206F)),
        ("Supplemental Punctuation", (0x2E00, 0x2E7F)),
    ),
    (("Superscripts And Subscripts", (0x2070, 0x209F)),),
    (("Currency Symbols", (0x20A0, 0x20CF)),),
    (("Combining Diacritical Marks For Symbols", (0x20D0, 0x20FF)),),
    (("Letterlike Symbols", (0x2100, 0x214F)),),
    (("Number Forms", (0x2150, 0x218F)),),
    (
        ("Arrows", (0x2190, 0x21FF)),
        ("Supplemental Arrows-A", (0x27F0, 0x27FF)),
        ("Supplemental Arrows-B", (0x2900, 0x297F)),
        ("Miscellaneous Symbols and Arrows", (0x2B00, 0x2BFF)),
    ),
    (
        ("Mathematical Operators", (0x2200, 0x22FF)),
        ("Supplemental Mathematical Operators", (0x2A00, 0x2AFF)),
        ("Miscellaneous Mathematical Symbols-A", (0x27C0, 0x27EF)),
        ("Miscellaneous Mathematical Symbols-B", (0x2980, 0x29FF)),
    ),
    (("Miscellaneous Technical", (0x2300, 0x23FF)),),
    (("Control Pictures", (0x2400, 0x243F)),),
    (("Optical Character Recognition", (0x2440, 0x245F)),),
    (("Enclosed Alphanumerics", (0x2460, 0x24FF)),),
    (("Box Drawing", (0x2500, 0x257F)),),
    (("Block Elements", (0x2580, 0x259F)),),
    (("Geometric Shapes", (0x25A0, 0x25FF)),),
    (("Miscellaneous Symbols", (0x2600, 0x26FF)),),
    (("Dingbats", (0x2700, 0x27BF)),),
    (("CJK Symbols And Punctuation", (0x3000, 0x303F)),),
    (("Hiragana", (0x3040, 0x309F)),),
    (
        ("Katakana", (0x30A0, 0x30FF)),
        ("Katakana Phonetic Extensions", (0x31F0, 0x31FF)),
    ),
    (("Bopomofo", (0x3100, 0x312F)), ("Bopomofo Extended", (0x31A0, 0x31BF))),
    (("Hangul Compatibility Jamo", (0x3130, 0x318F)),),
    (("Phags-pa", (0xA840, 0xA87F)),),
    (("Enclosed CJK Letters And Months", (0x3200, 0x32FF)),),
    (("CJK Compatibility", (0x3300, 0x33FF)),),
    (("Hangul Syllables", (0xAC00, 0xD7AF)),),
    (("Non-Plane 0 *", (0xD800, 0xDFFF)),),
    (("Phoenician", (0x10900, 0x1091F)),),
    (
        ("CJK Unified Ideographs", (0x4E00, 0x9FFF)),
        ("CJK Radicals Supplement", (0x2E80, 0x2EFF)),
        ("Kangxi Radicals", (0x2F00, 0x2FDF)),
        ("Ideographic Description Characters", (0x2FF0, 0x2FFF)),
        ("CJK Unified Ideographs Extension A", (0x3400, 0x4DBF)),
        ("CJK Unified Ideographs Extension B", (0x20000, 0x2A6DF)),
        ("Kanbun", (0x3190, 0x319F)),
    ),
    (("Private Use Area (plane 0)", (0xE000, 0xF8FF)),),
    (
        ("CJK Strokes", (0x31C0, 0x31EF)),
        ("CJK Compatibility Ideographs", (0xF900, 0xFAFF)),
        ("CJK Compatibility Ideographs Supplement", (0x2F800, 0x2FA1F)),
    ),
    (("Alphabetic Presentation Forms", (0xFB00, 0xFB4F)),),
    (("Arabic Presentation Forms-A", (0xFB50, 0xFDFF)),),
    (("Combining Half Marks", (0xFE20, 0xFE2F)),),
    (
        ("Vertical Forms", (0xFE10, 0xFE1F)),
        ("CJK Compatibility Forms", (0xFE30, 0xFE4F)),
    ),
    (("Small Form Variants", (0xFE50, 0xFE6F)),),
    (("Arabic Presentation Forms-B", (0xFE70, 0xFEFF)),),
    (("Halfwidth And Fullwidth Forms", (0xFF00, 0xFFEF)),),
    (("Specials", (0xFFF0, 0xFFFF)),),
    (("Tibetan", (0x0F00, 0x0FFF)),),
    (("Syriac", (0x0700, 0x074F)),),
    (("Thaana", (0x0780, 0x07BF)),),
    (("Sinhala", (0x0D80, 0x0DFF)),),
    (("Myanmar", (0x1000, 0x109F)),),
    (
        ("Ethiopic", (0x1200, 0x137F)),
        ("Ethiopic Supplement", (0x1380, 0x139F)),
        ("Ethiopic Extended", (0x2D80, 0x2DDF)),
    ),
    (("Cherokee", (0x13A0, 0x13FF)),),
    (("Unified Canadian Aboriginal Syllabics", (0x1400, 0x167F)),),
    (("Ogham", (0x1680, 0x169F)),),
    (("Runic", (0x16A0, 0x16FF)),),
    (("Khmer", (0x1780, 0x17FF)), ("Khmer Symbols", (0x19E0, 0x19FF))),
    (("Mongolian", (0x1800, 0x18AF)),),
    (("Braille Patterns", (0x2800, 0x28FF)),),
    (("Yi Syllables", (0xA000, 0xA48F)), ("Yi Radicals", (0xA490, 0xA4CF))),
    (
        ("Tagalog", (0x1700, 0x171F)),
        ("Hanunoo", (0x1720, 0x173F)),
        ("Buhid", (0x1740, 0x175F)),
        ("Tagbanwa", (0x1760, 0x177F)),
    ),
    (("Old Italic", (0x10300, 0x1032F)),),
    (("Gothic", (0x10330, 0x1034F)),),
    (("Deseret", (0x10400, 0x1044F)),),
    (
        ("Byzantine Musical Symbols", (0x1D000, 0x1D0FF)),
        ("Musical Symbols", (0x1D100, 0x1D1FF)),
        ("Ancient Greek Musical Notation", (0x1D200, 0x1D24F)),
    ),
    (("Mathematical Alphanumeric Symbols", (0x1D400, 0x1D7FF)),),
    (
        ("Private Use (plane 15)", (0xF0000, 0xFFFFD)),
        ("Private Use (plane 16)", (0x100000, 0x10FFFD)),
    ),
    (
        ("Variation Selectors", (0xFE00, 0xFE0F)),
        ("Variation Selectors Supplement", (0xE0100, 0xE01EF)),
    ),
    (("Tags", (0xE0000, 0xE007F)),),
    (("Limbu", (0x1900, 0x194F)),),
    (("Tai Le", (0x1950, 0x197F)),),
    (("New Tai Lue", (0x1980, 0x19DF)),),
    (("Buginese", (0x1A00, 0x1A1F)),),
    (("Glagolitic", (0x2C00, 0x2C5F)),),
    (("Tifinagh", (0x2D30, 0x2D7F)),),
    (("Yijing Hexagram Symbols", (0x4DC0, 0x4DFF)),),
    (("Syloti Nagri", (0xA800, 0xA82F)),),
    (
        ("Linear B Syllabary", (0x10000, 0x1007F)),
        ("Linear B Ideograms", (0x10080, 0x100FF)),
        ("Aegean Numbers", (0x10100, 0x1013F)),
    ),
    (("Ancient Greek Numbers", (0x10140, 0x1018F)),),
    (("Ugaritic", (0x10380, 0x1039F)),),
    (("Old Persian", (0x103A0, 0x103DF)),),
    (("Shavian", (0x10450, 0x1047F)),),
    (("Osmanya", (0x10480, 0x104AF)),),
    (("Cypriot Syllabary", (0x10800, 0x1083F)),),
    (("Kharoshthi", (0x10A00, 0x10A5F)),),
    (("Tai Xuan Jing Symbols", (0x1D300, 0x1D35F)),),
    (
        ("Cuneiform", (0x12000, 0x123FF)),
        ("Cuneiform Numbers and Punctuation", (0x12400, 0x1247F)),
    ),
    (("Counting Rod Numerals", (0x1D360, 0x1D37F)),),
    (("Sundanese", (0x1B80, 0x1BBF)),),
    (("Lepcha", (0x1C00, 0x1C4F)),),
    (("Ol Chiki", (0x1C50, 0x1C7F)),),
    (("Saurashtra", (0xA880, 0xA8DF)),),
    (("Kayah Li", (0xA900, 0xA92F)),),
    (("Rejang", (0xA930, 0xA95F)),),
    (("Cham", (0xAA00, 0xAA5F)),),
    (("Ancient Symbols", (0x10190, 0x101CF)),),
    (("Phaistos Disc", (0x101D0, 0x101FF)),),
    (
        ("Carian", (0x102A0, 0x102DF)),
        ("Lycian", (0x10280, 0x1029F)),
        ("Lydian", (0x10920, 0x1093F)),
    ),
    (("Domino Tiles", (0x1F030, 0x1F09F)), ("Mahjong Tiles", (0x1F000, 0x1F02F))),
)


# Lazily filled lookup tables shared by all callers of _getUnicodeRanges().
# _unicodeStarts holds the sorted first codepoints of all blocks.
# _unicodeValues holds the matching (last codepoint, bit) pairs, shifted by
# one position by the leading None so that it can be indexed directly with
# the result of bisect.bisect(_unicodeStarts, code).
_unicodeStarts = []
_unicodeValues = [None]


def _getUnicodeRanges():
    """Return the (starts, values) lookup tables, building them on first use.

    The tables are derived from OS2_UNICODE_RANGES, ordered by the first
    codepoint of each block, and cached in the module-level lists.
    """
    if _unicodeStarts:
        return _unicodeStarts, _unicodeValues

    entries = []
    for bit, blocks in enumerate(OS2_UNICODE_RANGES):
        for _name, (start, stop) in blocks:
            entries.append((start, (stop, bit)))
    entries.sort()

    _unicodeStarts.extend(start for start, _ in entries)
    _unicodeValues.extend(value for _, value in entries)
    return _unicodeStarts, _unicodeValues


def intersectUnicodeRanges(unicodes, inverse=False):
    """Intersect a sequence of (int) Unicode codepoints with the Unicode block
    ranges defined in the OpenType specification v1.7, and return the set of
    'ulUnicodeRanges' bits for which there is at least ONE intersection.
    If 'inverse' is True, return the bits for which there is NO intersection.

    >>> intersectUnicodeRanges([0x0410]) == {9}
    True
    >>> intersectUnicodeRanges([0x0410, 0x1F000]) == {9, 57, 122}
    True
    >>> intersectUnicodeRanges([0x0410, 0x1F000], inverse=True) == (
    ...     set(range(len(OS2_UNICODE_RANGES))) - {9, 57, 122})
    True
    """
    codepoints = set(unicodes)
    starts, values = _getUnicodeRanges()
    matched = set()
    hasNonBMP = False
    for codepoint in codepoints:
        # Candidate block: the one with the greatest start <= codepoint.
        index = bisect.bisect(starts, codepoint)
        stop, bit = values[index]
        if codepoint <= stop:
            matched.add(bit)
        if 0x10000 <= codepoint < 0x110000:
            hasNonBMP = True
    # The spec says that bit 57 ("Non Plane 0") implies that there's
    # at least one codepoint beyond the BMP; so I also include all
    # the non-BMP codepoints here
    if hasNonBMP:
        matched.add(57)
    if inverse:
        return set(range(len(OS2_UNICODE_RANGES))) - matched
    return matched


def calcCodePageRanges(unicodes):
    """Given a set of Unicode codepoints (integers), calculate the
    corresponding OS/2 CodePage range bits.
    This is a direct translation of FontForge implementation:
    https://github.com/fontforge/fontforge/blob/7b2c074/fontforge/tottf.c#L3158

    Each code page is detected by the presence of a single marker character,
    in some cases combined with further conditions (the ASCII check, the
    line-drawing marker, or additional characters).

    Returns a new set of bit numbers; it is empty when nothing is detected.
    """
    bits = set()
    # True when every codepoint in range(0x20, 0x7E), i.e. U+0020..U+007D,
    # is present.
    hasAscii = set(range(0x20, 0x7E)).issubset(unicodes)
    # A single box-drawing character is used as the marker for line art.
    hasLineart = ord("┤") in unicodes

    # The branches form one elif chain, so at most one of them runs for
    # each codepoint.
    for uni in unicodes:
        if uni == ord("Þ") and hasAscii:
            bits.add(0)  # Latin 1
        elif uni == ord("Ľ") and hasAscii:
            bits.add(1)  # Latin 2: Eastern Europe
            if hasLineart:
                bits.add(58)  # Latin 2
        elif uni == ord("Б"):
            bits.add(2)  # Cyrillic
            if ord("Ѕ") in unicodes and hasLineart:
                bits.add(57)  # IBM Cyrillic
            if ord("╜") in unicodes and hasLineart:
                bits.add(49)  # MS-DOS Russian
        elif uni == ord("Ά"):
            bits.add(3)  # Greek
            if hasLineart and ord("½") in unicodes:
                bits.add(48)  # IBM Greek
            if hasLineart and ord("√") in unicodes:
                bits.add(60)  # Greek, former 437 G
        elif uni == ord("İ") and hasAscii:
            bits.add(4)  # Turkish
            if hasLineart:
                bits.add(56)  # IBM turkish
        elif uni == ord("א"):
            bits.add(5)  # Hebrew
            if hasLineart and ord("√") in unicodes:
                bits.add(53)  # Hebrew
        elif uni == ord("ر"):
            bits.add(6)  # Arabic
            if ord("√") in unicodes:
                bits.add(51)  # Arabic
            if hasLineart:
                bits.add(61)  # Arabic; ASMO 708
        elif uni == ord("ŗ") and hasAscii:
            bits.add(7)  # Windows Baltic
            if hasLineart:
                bits.add(59)  # MS-DOS Baltic
        elif uni == ord("₫") and hasAscii:
            bits.add(8)  # Vietnamese
        elif uni == ord("ๅ"):
            bits.add(16)  # Thai
        elif uni == ord("エ"):
            bits.add(17)  # JIS/Japan
        elif uni == ord("ㄅ"):
            bits.add(18)  # Chinese: Simplified
        elif uni == ord("ㄱ"):
            bits.add(19)  # Korean wansung
        elif uni == ord("央"):
            bits.add(20)  # Chinese: Traditional
        elif uni == ord("곴"):
            bits.add(21)  # Korean Johab
        elif uni == ord("♥") and hasAscii:
            bits.add(30)  # OEM Character Set
        # TODO: Symbol bit has a special meaning (check the spec), we need
        # to confirm if this is wanted by default.
        # elif chr(0xF000) <= char <= chr(0xF0FF):
        #    codepageRanges.add(31)          # Symbol Character Set
        elif uni == ord("þ") and hasAscii and hasLineart:
            bits.add(54)  # MS-DOS Icelandic
        elif uni == ord("╚") and hasAscii:
            bits.add(62)  # WE/Latin 1
            bits.add(63)  # US
        # The remaining MS-DOS code pages all require ASCII, line art and
        # the square root sign in addition to their own marker character.
        elif hasAscii and hasLineart and ord("√") in unicodes:
            if uni == ord("Å"):
                bits.add(50)  # MS-DOS Nordic
            elif uni == ord("é"):
                bits.add(52)  # MS-DOS Canadian French
            elif uni == ord("õ"):
                bits.add(55)  # MS-DOS Portuguese

    # Checked once, outside the loop: it depends on two characters being
    # present rather than on a single marker.
    if hasAscii and ord("‰") in unicodes and ord("∑") in unicodes:
        bits.add(29)  # Macintosh Character Set (US Roman)

    return bits


if __name__ == "__main__":
    # When run as a script, execute this module's doctests and use the
    # number of failed examples as the process exit status.
    import doctest, sys

    sys.exit(doctest.testmod().failed)
-												Move sstruct under fontTools.misc

Our footprint in the Python module namespace is all under
fontTools now.  User code importing sstruct should be updated
to say "from fontTools.misc import sstruct".

											
										
										
											2013-09-17 16:59:39 -04:00
+								from fontTools.misc import sstruct
-												[OS/2] define recalcXAvgCharWidth method

copied from current subsetter code (matches ufo2ft's outlineCompiler)

											
										
										
											2022-04-21 18:44:44 +01:00
+								from fontTools.misc.roundTools import otRound
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								from fontTools.misc.textTools import safeEval, num2binary, binary2num
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								from fontTools.ttLib.tables import DefaultTable
-												Don’t calculate whole sets of unicode codepoints

_getUnicodeRangeSets used to calculate sets containing lots of numbers, only to
get intersections between a set and ranges. Creating and manipulating a lot of
big sets requires a lot of memory.

The function has been replaced by _getUnicodeRanges, returning a list of range
starts boundaries and a list of range stops + corresponding bits.

Tests on intersectUnicodeRanges save about 130 MB (!) of RAM, with no
significant speed penalty.

											
										
										
											2020-06-04 00:33:26 +02:00
+								import bisect
-												[O_S_2f_2] replace print with logger

											
										
										
											2016-01-24 14:33:40 +00:00
+								import logging
-												a few cosmetic/style changes


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@206 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2002-05-10 19:03:34 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
-												[O_S_2f_2] replace print with logger

											
										
										
											2016-01-24 14:33:40 +00:00
+								log = logging.getLogger(__name__)
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								# panose classification
 								panoseFormat = """
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									bFamilyType:        B
 									bSerifStyle:        B
 									bWeight:            B
 									bProportion:        B
 									bContrast:          B
 									bStrokeVariation:   B
 									bArmStyle:          B
 									bLetterForm:        B
 									bMidline:           B
 									bXHeight:           B
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								"""
-												More whitespace

											
										
										
											2015-04-26 02:01:01 -04:00
-												py23 Use new-style classes

Such that we get the same semantics in both Python 2 and 3.

											
										
										
											2013-11-28 14:26:58 -05:00
+								class Panose(object):
-												Update Lib/fontTools/ttLib/tables/O_S_2f_2.py

Co-authored-by: Cosimo Lupo <cosimo@anthrotype.com>
											
										
										
											2023-07-07 23:12:44 +08:00
+								    def __init__(self, **kwargs):
 								        _, names, _ = sstruct.getformat(panoseFormat)
-												Use Panose class

											
										
										
											2023-07-07 22:09:58 +08:00
+								        for name in names:
-												Update Lib/fontTools/ttLib/tables/O_S_2f_2.py

Co-authored-by: Cosimo Lupo <cosimo@anthrotype.com>
											
										
										
											2023-07-07 23:12:44 +08:00
+								            setattr(self, name, kwargs.pop(name, 0))
 								        for k in kwargs:
 								            raise TypeError(f"Panose() got an unexpected keyword argument {k!r}")
-												Use Panose class

											
										
										
											2023-07-07 22:09:58 +08:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								    def toXML(self, writer, ttFont):
 								        formatstring, names, fixes = sstruct.getformat(panoseFormat)
 								        for name in names:
 								            writer.simpletag(name, value=getattr(self, name))
 								            writer.newline()
-												More whitespace

											
										
										
											2015-04-26 02:01:01 -04:00
-to3 equivalent to --fix=tuple_params

I hope I got this all right...

											
										
										
											2013-11-27 03:19:32 -05:00
+								    def fromXML(self, name, attrs, content, ttFont):
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        setattr(self, name, safeEval(attrs["value"]))
 								# 'sfnt' OS/2 and Windows Metrics table - 'OS/2'
 								OS2_format_0 = """
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									>   # big endian
 									version:                H       # version
 									xAvgCharWidth:          h       # average character width
 									usWeightClass:          H       # degree of thickness of strokes
 									usWidthClass:           H       # aspect ratio
-												fix sign of fsType

											
										
										
											2019-05-23 17:40:01 +02:00
+									fsType:                 H       # type flags
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									ySubscriptXSize:        h       # subscript horizontal font size
 									ySubscriptYSize:        h       # subscript vertical font size
 									ySubscriptXOffset:      h       # subscript x offset
 									ySubscriptYOffset:      h       # subscript y offset
 									ySuperscriptXSize:      h       # superscript horizontal font size
 									ySuperscriptYSize:      h       # superscript vertical font size
 									ySuperscriptXOffset:    h       # superscript x offset
 									ySuperscriptYOffset:    h       # superscript y offset
 									yStrikeoutSize:         h       # strikeout size
 									yStrikeoutPosition:     h       # strikeout position
 									sFamilyClass:           h       # font family class and subclass
 									panose:                 10s     # panose classification number
-												Unsigned long data field must be packed with "L" instead of "l" (sometimes an OverflowError can occur)


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@501 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2006-01-12 14:04:40 +00:00
+									ulUnicodeRange1:        L       # character range
 									ulUnicodeRange2:        L       # character range
 									ulUnicodeRange3:        L       # character range
 									ulUnicodeRange4:        L       # character range
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									achVendID:              4s      # font vendor identification
 									fsSelection:            H       # font selection flags
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+									usFirstCharIndex:       H       # first unicode character index
 									usLastCharIndex:        H       # last unicode character index
-												spec changed: three fields are now unsigned instead of signed,
and due to the the wonderful <snort> hungarian notation the field
names changed as well... (So this change is not b/w compatible)


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@167 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2001-08-15 07:01:44 +00:00
+									sTypoAscender:          h       # typographic ascender
 									sTypoDescender:         h       # typographic descender
 									sTypoLineGap:           h       # typographic line gap
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									usWinAscent:            H       # Windows ascender
 									usWinDescent:           H       # Windows descender
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								"""
 								OS2_format_1_addition = """
-												Unsigned long data field must be packed with "L" instead of "l" (sometimes an OverflowError can occur)


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@501 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2006-01-12 14:04:40 +00:00
+									ulCodePageRange1:   L
 									ulCodePageRange2:   L
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								"""
 								OS2_format_2_addition = (
 								    OS2_format_1_addition
 								    + """
-												formatting


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@111 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2000-06-08 18:38:43 +00:00
+									sxHeight:           h
 									sCapHeight:         h
 									usDefaultChar:      H
 									usBreakChar:        H
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+									usMaxContext:       H
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								"""
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								)
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								OS2_format_5_addition = (
 								    OS2_format_2_addition
 								    + """
 									usLowerOpticalPointSize:    H
 									usUpperOpticalPointSize:    H
 								"""
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								)
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								bigendian = "	>	# big endian\n"
 								OS2_format_1 = OS2_format_0 + OS2_format_1_addition
 								OS2_format_2 = OS2_format_0 + OS2_format_2_addition
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								OS2_format_5 = OS2_format_0 + OS2_format_5_addition
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								OS2_format_1_addition = bigendian + OS2_format_1_addition
 								OS2_format_2_addition = bigendian + OS2_format_2_addition
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								OS2_format_5_addition = bigendian + OS2_format_5_addition
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
 								class table_O_S_2f_2(DefaultTable.DefaultTable):
-												More whitespace

											
										
										
											2015-04-26 02:01:01 -04:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								    """the OS/2 table"""
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												OS/2: fsSelection bits 0 and 5 should match head.macStyle bits 1 and 0

											
										
										
											2016-10-22 11:13:49 +01:00
+								    dependencies = ["head"]
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								    def decompile(self, data, ttFont):
 								        dummy, data = sstruct.unpack2(OS2_format_0, data, self)
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        if self.version == 1:
-												Remove workaround for buggy OS/2 tables

Those fonts should all be gone by now...

											
										
										
											2013-11-25 07:27:43 -05:00
+								            dummy, data = sstruct.unpack2(OS2_format_1_addition, data, self)
-												added 'support' for OS/2 version 4: can anyone verify this is correct? I can't seem to find an OS/2 v4 spec...


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@513 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2007-10-22 09:31:02 +00:00
+								        elif self.version in (2, 3, 4):
-												Remove workaround for buggy OS/2 tables

Those fonts should all be gone by now...

											
										
										
											2013-11-25 07:27:43 -05:00
+								            dummy, data = sstruct.unpack2(OS2_format_2_addition, data, self)
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								        elif self.version == 5:
-												Remove workaround for buggy OS/2 tables

Those fonts should all be gone by now...

											
										
										
											2013-11-25 07:27:43 -05:00
+								            dummy, data = sstruct.unpack2(OS2_format_5_addition, data, self)
-												py23 from __future__ import division and adjust divisions

											
										
										
											2013-11-27 17:46:17 -05:00
+								            self.usLowerOpticalPointSize /= 20
 								            self.usUpperOpticalPointSize /= 20
-to3 --fix=ne

											
										
										
											2013-11-27 02:40:30 -05:00
+								        elif self.version != 0:
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								            from fontTools import ttLib
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-to3 --fix=raise

											
										
										
											2013-11-27 02:42:28 -05:00
+								            raise ttLib.TTLibError(
 								                "unknown format for OS/2 table: version %s" % self.version
 								            )
-												Remove workaround for buggy OS/2 tables

Those fonts should all be gone by now...

											
										
										
											2013-11-25 07:27:43 -05:00
+								        if len(data):
-												[O_S_2f_2] replace print with logger

											
										
										
											2016-01-24 14:33:40 +00:00
+								            log.warning("too much 'OS/2' table data")
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        self.panose = sstruct.unpack(panoseFormat, self.panose, Panose())
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								    def compile(self, ttFont):
-												[OS/2] update fsFirstCharIndex and fsLastCharIndex upon compile;
add comment to XML output;
use all unicode cmap subtables, but set 0xFFFF as max value for USHORT

											
										
										
											2015-05-03 16:46:58 +01:00
+								        self.updateFirstAndLastCharIndex(ttFont)
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        panose = self.panose
-												OS/2: fsSelection bits 0 and 5 should match head.macStyle bits 1 and 0

											
										
										
											2016-10-22 11:13:49 +01:00
+								        head = ttFont["head"]
-												OS2/2: fix checking fsSelection bits matching head.macStyle bits

											
										
										
											2016-11-03 11:31:03 +00:00
+								        if (self.fsSelection & 1) and not (head.macStyle & 1 << 1):
-												OS/2: fsSelection bits 0 and 5 should match head.macStyle bits 1 and 0

											
										
										
											2016-10-22 11:13:49 +01:00
+								            log.warning(
 								                "fsSelection bit 0 (italic) and "
 								                "head table macStyle bit 1 (italic) should match"
 								            )
-												OS2/2: fix checking fsSelection bits matching head.macStyle bits

											
										
										
											2016-11-03 11:31:03 +00:00
+								        if (self.fsSelection & 1 << 5) and not (head.macStyle & 1):
-												OS/2: fsSelection bits 0 and 5 should match head.macStyle bits 1 and 0

											
										
										
											2016-10-22 11:13:49 +01:00
+								            log.warning(
 								                "fsSelection bit 5 (bold) and "
 								                "head table macStyle bit 0 (bold) should match"
 								            )
-												OS/2: if fsSelection bit 6 is on bits then 0 and 5 must be clear

											
										
										
											2016-10-22 11:09:46 +01:00
+								        if (self.fsSelection & 1 << 6) and (self.fsSelection & 1 + (1 << 5)):
 								            log.warning(
 								                "fsSelection bit 6 (regular) is set, "
 								                "bits 0 (italic) and 5 (bold) must be clear"
 								            )
-												OS/2: warn when fsSelection bits defined in version 4 are on but version < 4

											
										
										
											2015-05-12 11:11:21 +01:00
+								        if self.version < 4 and self.fsSelection & 0b1110000000:
 								            log.warning(
 								                "fsSelection bits 7, 8 and 9 are only defined in "
 								                "OS/2 table version 4 and up: version %s",
 								                self.version,
 								            )
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        self.panose = sstruct.pack(panoseFormat, self.panose)
 								        if self.version == 0:
 								            data = sstruct.pack(OS2_format_0, self)
 								        elif self.version == 1:
 								            data = sstruct.pack(OS2_format_1, self)
-												added 'support' for OS/2 version 4: can anyone verify this is correct? I can't seem to find an OS/2 v4 spec...


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@513 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2007-10-22 09:31:02 +00:00
+								        elif self.version in (2, 3, 4):
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								            data = sstruct.pack(OS2_format_2, self)
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								        elif self.version == 5:
-												Improve OS/2 format 5 compile

											
										
										
											2013-11-26 19:33:49 -05:00
+								            d = self.__dict__.copy()
-												replace int(round(...)) with round(...)

We don't need to cast to int when using the round function from py23,
as this is a backport of python3's built-in round and thus it returns
an int when called with a single argument.

											
										
										
											2017-10-22 12:03:52 +01:00
+								            d["usLowerOpticalPointSize"] = round(self.usLowerOpticalPointSize * 20)
 								            d["usUpperOpticalPointSize"] = round(self.usUpperOpticalPointSize * 20)
-												Improve OS/2 format 5 compile

											
										
										
											2013-11-26 19:33:49 -05:00
+								            data = sstruct.pack(OS2_format_5, d)
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        else:
 								            from fontTools import ttLib
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-to3 --fix=raise

											
										
										
											2013-11-27 02:42:28 -05:00
+								            raise ttLib.TTLibError(
 								                "unknown format for OS/2 table: version %s" % self.version
 								            )
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        self.panose = panose
 								        return data
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								    def toXML(self, writer, ttFont):
-												[OS/2] update fsFirstCharIndex and fsLastCharIndex upon compile;
add comment to XML output;
use all unicode cmap subtables, but set 0xFFFF as max value for USHORT

											
										
										
											2015-05-03 16:46:58 +01:00
+								        writer.comment(
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								            "The fields 'usFirstCharIndex' and 'usLastCharIndex'\n"
-												[OS/2] update fsFirstCharIndex and fsLastCharIndex upon compile;
add comment to XML output;
use all unicode cmap subtables, but set 0xFFFF as max value for USHORT

											
										
										
											2015-05-03 16:46:58 +01:00
+								            "will be recalculated by the compiler"
 								        )
 								        writer.newline()
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        if self.version == 1:
 								            format = OS2_format_1
-												added 'support' for OS/2 version 4: can anyone verify this is correct? I can't seem to find an OS/2 v4 spec...


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@513 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											2007-10-22 09:31:02 +00:00
+								        elif self.version in (2, 3, 4):
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								            format = OS2_format_2
-												Support for OS/2 table version 5 as proposed by Microsoft
https://github.com/fontforge/fontforge/issues/956

											
										
										
											2013-11-18 21:53:25 +01:00
+								        elif self.version == 5:
 								            format = OS2_format_5
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        else:
 								            format = OS2_format_0
 								        formatstring, names, fixes = sstruct.getformat(format)
 								        for name in names:
 								            value = getattr(self, name)
 								            if name == "panose":
 								                writer.begintag("panose")
 								                writer.newline()
 								                value.toXML(writer, ttFont)
 								                writer.endtag("panose")
-												More whitespace

											
										
										
											2015-04-26 02:01:01 -04:00
+								            elif name in (
 								                "ulUnicodeRange1",
 								                "ulUnicodeRange2",
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								                "ulUnicodeRange3",
 								                "ulUnicodeRange4",
 								                "ulCodePageRange1",
 								                "ulCodePageRange2",
 								            ):
 								                writer.simpletag(name, value=num2binary(value))
 								            elif name in ("fsType", "fsSelection"):
 								                writer.simpletag(name, value=num2binary(value, 16))
 								            elif name == "achVendID":
 								                writer.simpletag(name, value=repr(value)[1:-1])
 								            else:
 								                writer.simpletag(name, value=value)
 								            writer.newline()
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-to3 equivalent to --fix=tuple_params

I hope I got this all right...

											
										
										
											2013-11-27 03:19:32 -05:00
+								    def fromXML(self, name, attrs, content, ttFont):
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								        if name == "panose":
 								            self.panose = panose = Panose()
 								            for element in content:
-to3 --fix=types manual additions

Don't know why the tool didn't catch these.

											
										
										
											2013-11-27 05:17:37 -05:00
+								                if isinstance(element, tuple):
-to3 equivalent to --fix=tuple_params

I hope I got this all right...

											
										
										
											2013-11-27 03:19:32 -05:00
+								                    name, attrs, content = element
 								                    panose.fromXML(name, attrs, content, ttFont)
-												More whitespace

											
										
										
											2015-04-26 02:01:01 -04:00
+								        elif name in (
 								            "ulUnicodeRange1",
 								            "ulUnicodeRange2",
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								            "ulUnicodeRange3",
 								            "ulUnicodeRange4",
 								            "ulCodePageRange1",
 								            "ulCodePageRange2",
 								            "fsType",
 								            "fsSelection",
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								        ):
-												Created a new library directory called "FreeLib". All OpenSource RFMKII components will reside there, fontTools being the flagship.


git-svn-id: svn://svn.code.sf.net/p/fonttools/code/trunk@2 4cde692c-a291-49d1-8350-778aa11640f8

											
										
										
											1999-12-16 21:34:53 +00:00
+								            setattr(self, name, binary2num(attrs["value"]))
 								        elif name == "achVendID":
 								            setattr(self, name, safeEval("'''" + attrs["value"] + "'''"))
-												[OS/2] update fsFirstCharIndex and fsLastCharIndex upon compile;
add comment to XML output;
use all unicode cmap subtables, but set 0xFFFF as max value for USHORT

											
										
										
											2015-05-03 16:46:58 +01:00
+								        else:
 								            setattr(self, name, safeEval(attrs["value"]))
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												Simplify fix for https://github.com/behdad/fonttools/pull/498

											
										
										
											2016-02-02 11:52:24 +08:00
+								    def updateFirstAndLastCharIndex(self, ttFont):
 								        if "cmap" not in ttFont:
 								            return
-												[OS/2] update fsFirstCharIndex and fsLastCharIndex upon compile;
add comment to XML output;
use all unicode cmap subtables, but set 0xFFFF as max value for USHORT

											
										
										
											2015-05-03 16:46:58 +01:00
+								        codes = set()
 								        for table in getattr(ttFont["cmap"], "tables", []):
 								            if table.isUnicode():
 								                codes.update(table.cmap.keys())
 								        if codes:
 								            minCode = min(codes)
 								            maxCode = max(codes)
 								            # USHORT cannot hold codepoints greater than 0xFFFF
-												Simplify fix for https://github.com/behdad/fonttools/pull/498

											
										
										
											2016-02-02 11:52:24 +08:00
+								            self.usFirstCharIndex = min(0xFFFF, minCode)
 								            self.usLastCharIndex = min(0xFFFF, maxCode)
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    # misspelled attributes kept for legacy reasons
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @property
 								    def usMaxContex(self):
 								        return self.usMaxContext
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @usMaxContex.setter
 								    def usMaxContex(self, value):
 								        self.usMaxContext = value
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @property
 								    def fsFirstCharIndex(self):
 								        return self.usFirstCharIndex
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @fsFirstCharIndex.setter
 								    def fsFirstCharIndex(self, value):
 								        self.usFirstCharIndex = value
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @property
 								    def fsLastCharIndex(self):
 								        return self.usLastCharIndex
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] fix misspelled attributes, and keep them using property decorators

											
										
										
											2015-05-23 19:10:12 +01:00
+								    @fsLastCharIndex.setter
 								    def fsLastCharIndex(self, value):
 								        self.usLastCharIndex = value
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    def getUnicodeRanges(self):
 								        """Return the set of 'ulUnicodeRange*' bits currently enabled."""
 								        bits = set()
 								        ul1, ul2 = self.ulUnicodeRange1, self.ulUnicodeRange2
 								        ul3, ul4 = self.ulUnicodeRange3, self.ulUnicodeRange4
 								        for i in range(32):
 								            if ul1 & (1 << i):
 								                bits.add(i)
 								            if ul2 & (1 << i):
 								                bits.add(i + 32)
 								            if ul3 & (1 << i):
 								                bits.add(i + 64)
 								            if ul4 & (1 << i):
 								                bits.add(i + 96)
 								        return bits
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    def setUnicodeRanges(self, bits):
 								        """Set the 'ulUnicodeRange*' fields to the specified 'bits'."""
 								        ul1, ul2, ul3, ul4 = 0, 0, 0, 0
 								        for bit in bits:
 								            if 0 <= bit < 32:
 								                ul1 |= 1 << bit
 								            elif 32 <= bit < 64:
 								                ul2 |= 1 << (bit - 32)
 								            elif 64 <= bit < 96:
 								                ul3 |= 1 << (bit - 64)
 								            elif 96 <= bit < 123:
 								                ul4 |= 1 << (bit - 96)
 								            else:
 								                raise ValueError("expected 0 <= int <= 122, found: %r" % bit)
 								        self.ulUnicodeRange1, self.ulUnicodeRange2 = ul1, ul2
 								        self.ulUnicodeRange3, self.ulUnicodeRange4 = ul3, ul4
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    def recalcUnicodeRanges(self, ttFont, pruneOnly=False):
 								        """Intersect the codepoints in the font's Unicode cmap subtables with
 								        the Unicode block ranges defined in the OpenType specification (v1.7),
 								        and set the respective 'ulUnicodeRange*' bits if there is at least ONE
 								        intersection.
 								        If 'pruneOnly' is True, only clear unused bits with NO intersection.
 								        """
 								        unicodes = set()
 								        for table in ttFont["cmap"].tables:
 								            if table.isUnicode():
 								                unicodes.update(table.cmap.keys())
 								        if pruneOnly:
 								            empty = intersectUnicodeRanges(unicodes, inverse=True)
 								            bits = self.getUnicodeRanges() - empty
 								        else:
 								            bits = intersectUnicodeRanges(unicodes)
 								        self.setUnicodeRanges(bits)
 								        return bits
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] Add recalcCodePageRanges

Ported from the ufo2ft code (which is a port of the FontForge code), with
some additional functions for parity with recalcUnicodeRanges.

											
										
										
											2023-11-11 01:22:18 +02:00
+								    def getCodePageRanges(self):
 								        """Return the set of 'ulCodePageRange*' bits currently enabled."""
 								        bits = set()
 								        ul1, ul2 = self.ulCodePageRange1, self.ulCodePageRange2
 								        for i in range(32):
 								            if ul1 & (1 << i):
 								                bits.add(i)
 								            if ul2 & (1 << i):
 								                bits.add(i + 32)
 								        return bits
 								    def setCodePageRanges(self, bits):
 								        """Set the 'ulCodePageRange*' fields to the specified 'bits'.

 								        'bits' is an iterable of integers in the range 0..63. Both fields are
 								        rebuilt from scratch, so bits not listed end up cleared.

 								        Raises ValueError for a bit outside 0..63; in that case neither field
 								        is modified.
 								        """
 								        ul1, ul2 = 0, 0
 								        for bit in bits:
 								            if 0 <= bit < 32:
 								                ul1 |= 1 << bit
 								            elif 32 <= bit < 64:
 								                ul2 |= 1 << (bit - 32)
 								            else:
 								                # '!r' is the repr conversion; ':r' would be an invalid format
 								                # spec and mask the intended message with a formatting error
 								                raise ValueError(f"expected 0 <= int <= 63, found: {bit!r}")
 								        self.ulCodePageRange1, self.ulCodePageRange2 = ul1, ul2
 								    def recalcCodePageRanges(self, ttFont, pruneOnly=False):
 								        """Recompute the 'ulCodePageRange*' fields from the font's Unicode cmaps.

 								        The codepoints of all Unicode cmap subtables are handed to
 								        calcCodePageRanges(). With 'pruneOnly' set, the result is restricted
 								        to bits that are already enabled. The resulting set of bits is stored
 								        and returned.
 								        """
 								        unicodes = {
 								            codepoint
 								            for subtable in ttFont["cmap"].tables
 								            if subtable.isUnicode()
 								            for codepoint in subtable.cmap.keys()
 								        }
 								        bits = calcCodePageRanges(unicodes)
 								        if pruneOnly:
 								            bits &= self.getCodePageRanges()
 								        if not bits:
 								            # when no codepage ranges can be enabled, fall back to enabling
 								            # bit 0 (Latin 1) so that the font works in MS Word:
 								            # https://github.com/googlei18n/fontmake/issues/468
 								            bits = {0}
 								        self.setCodePageRanges(bits)
 								        return bits
-												drop the 'X' from recalcAvgCharWidth method name

											
										
										
											2022-04-21 19:02:15 +01:00
+								    def recalcAvgCharWidth(self, ttFont):
-												[OS/2] define recalcXAvgCharWidth method

copied from current subsetter code (matches ufo2ft's outlineCompiler)

											
										
										
											2022-04-21 18:44:44 +01:00
+								        """Recalculate xAvgCharWidth using metrics from ttFont's 'hmtx' table.
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] define recalcXAvgCharWidth method

copied from current subsetter code (matches ufo2ft's outlineCompiler)

											
										
										
											2022-04-21 18:44:44 +01:00
+								        Set it to 0 if the unlikely event 'hmtx' table is not found.
 								        """
 								        avg_width = 0
 								        hmtx = ttFont.get("hmtx")
-												Guard against a ZeroDivisonError

The code was copied from ufo2ft.

											
										
										
											2023-03-01 19:52:43 +00:00
+								        if hmtx is not None:
 								            widths = [width for width, _ in hmtx.metrics.values() if width > 0]
 								            if widths:
 								                avg_width = otRound(sum(widths) / len(widths))
-												[OS/2] define recalcXAvgCharWidth method

copied from current subsetter code (matches ufo2ft's outlineCompiler)

											
										
										
											2022-04-21 18:44:44 +01:00
+								        self.xAvgCharWidth = avg_width
 								        return avg_width
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
 								# Unicode ranges data from the OpenType OS/2 table specification v1.7
 								OS2_UNICODE_RANGES = (
 								    (("Basic Latin", (0x0000, 0x007F)),),
 								    (("Latin-1 Supplement", (0x0080, 0x00FF)),),
 								    (("Latin Extended-A", (0x0100, 0x017F)),),
 								    (("Latin Extended-B", (0x0180, 0x024F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("IPA Extensions", (0x0250, 0x02AF)),
 								        ("Phonetic Extensions", (0x1D00, 0x1D7F)),
 								        ("Phonetic Extensions Supplement", (0x1D80, 0x1DBF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
 								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Spacing Modifier Letters", (0x02B0, 0x02FF)),
 								        ("Modifier Tone Letters", (0xA700, 0xA71F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
 								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Combining Diacritical Marks", (0x0300, 0x036F)),
 								        ("Combining Diacritical Marks Supplement", (0x1DC0, 0x1DFF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Greek and Coptic", (0x0370, 0x03FF)),),
 								    (("Coptic", (0x2C80, 0x2CFF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Cyrillic", (0x0400, 0x04FF)),
 								        ("Cyrillic Supplement", (0x0500, 0x052F)),
 								        ("Cyrillic Extended-A", (0x2DE0, 0x2DFF)),
 								        ("Cyrillic Extended-B", (0xA640, 0xA69F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Armenian", (0x0530, 0x058F)),),
 								    (("Hebrew", (0x0590, 0x05FF)),),
 								    (("Vai", (0xA500, 0xA63F)),),
 								    (("Arabic", (0x0600, 0x06FF)), ("Arabic Supplement", (0x0750, 0x077F))),
 								    (("NKo", (0x07C0, 0x07FF)),),
 								    (("Devanagari", (0x0900, 0x097F)),),
 								    (("Bengali", (0x0980, 0x09FF)),),
 								    (("Gurmukhi", (0x0A00, 0x0A7F)),),
 								    (("Gujarati", (0x0A80, 0x0AFF)),),
 								    (("Oriya", (0x0B00, 0x0B7F)),),
 								    (("Tamil", (0x0B80, 0x0BFF)),),
 								    (("Telugu", (0x0C00, 0x0C7F)),),
 								    (("Kannada", (0x0C80, 0x0CFF)),),
 								    (("Malayalam", (0x0D00, 0x0D7F)),),
 								    (("Thai", (0x0E00, 0x0E7F)),),
 								    (("Lao", (0x0E80, 0x0EFF)),),
 								    (("Georgian", (0x10A0, 0x10FF)), ("Georgian Supplement", (0x2D00, 0x2D2F))),
 								    (("Balinese", (0x1B00, 0x1B7F)),),
 								    (("Hangul Jamo", (0x1100, 0x11FF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Latin Extended Additional", (0x1E00, 0x1EFF)),
 								        ("Latin Extended-C", (0x2C60, 0x2C7F)),
 								        ("Latin Extended-D", (0xA720, 0xA7FF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Greek Extended", (0x1F00, 0x1FFF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("General Punctuation", (0x2000, 0x206F)),
 								        ("Supplemental Punctuation", (0x2E00, 0x2E7F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Superscripts And Subscripts", (0x2070, 0x209F)),),
 								    (("Currency Symbols", (0x20A0, 0x20CF)),),
 								    (("Combining Diacritical Marks For Symbols", (0x20D0, 0x20FF)),),
 								    (("Letterlike Symbols", (0x2100, 0x214F)),),
 								    (("Number Forms", (0x2150, 0x218F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Arrows", (0x2190, 0x21FF)),
 								        ("Supplemental Arrows-A", (0x27F0, 0x27FF)),
 								        ("Supplemental Arrows-B", (0x2900, 0x297F)),
 								        ("Miscellaneous Symbols and Arrows", (0x2B00, 0x2BFF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
 								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Mathematical Operators", (0x2200, 0x22FF)),
 								        ("Supplemental Mathematical Operators", (0x2A00, 0x2AFF)),
 								        ("Miscellaneous Mathematical Symbols-A", (0x27C0, 0x27EF)),
 								        ("Miscellaneous Mathematical Symbols-B", (0x2980, 0x29FF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Miscellaneous Technical", (0x2300, 0x23FF)),),
 								    (("Control Pictures", (0x2400, 0x243F)),),
 								    (("Optical Character Recognition", (0x2440, 0x245F)),),
 								    (("Enclosed Alphanumerics", (0x2460, 0x24FF)),),
 								    (("Box Drawing", (0x2500, 0x257F)),),
 								    (("Block Elements", (0x2580, 0x259F)),),
 								    (("Geometric Shapes", (0x25A0, 0x25FF)),),
 								    (("Miscellaneous Symbols", (0x2600, 0x26FF)),),
 								    (("Dingbats", (0x2700, 0x27BF)),),
 								    (("CJK Symbols And Punctuation", (0x3000, 0x303F)),),
 								    (("Hiragana", (0x3040, 0x309F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Katakana", (0x30A0, 0x30FF)),
 								        ("Katakana Phonetic Extensions", (0x31F0, 0x31FF)),
 								    ),
 								    (("Bopomofo", (0x3100, 0x312F)), ("Bopomofo Extended", (0x31A0, 0x31BF))),
 								    (("Hangul Compatibility Jamo", (0x3130, 0x318F)),),
 								    (("Phags-pa", (0xA840, 0xA87F)),),
 								    (("Enclosed CJK Letters And Months", (0x3200, 0x32FF)),),
 								    (("CJK Compatibility", (0x3300, 0x33FF)),),
 								    (("Hangul Syllables", (0xAC00, 0xD7AF)),),
 								    (("Non-Plane 0 *", (0xD800, 0xDFFF)),),
 								    (("Phoenician", (0x10900, 0x1091F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("CJK Unified Ideographs", (0x4E00, 0x9FFF)),
 								        ("CJK Radicals Supplement", (0x2E80, 0x2EFF)),
 								        ("Kangxi Radicals", (0x2F00, 0x2FDF)),
 								        ("Ideographic Description Characters", (0x2FF0, 0x2FFF)),
 								        ("CJK Unified Ideographs Extension A", (0x3400, 0x4DBF)),
 								        ("CJK Unified Ideographs Extension B", (0x20000, 0x2A6DF)),
 								        ("Kanbun", (0x3190, 0x319F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Private Use Area (plane 0)", (0xE000, 0xF8FF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("CJK Strokes", (0x31C0, 0x31EF)),
 								        ("CJK Compatibility Ideographs", (0xF900, 0xFAFF)),
 								        ("CJK Compatibility Ideographs Supplement", (0x2F800, 0x2FA1F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Alphabetic Presentation Forms", (0xFB00, 0xFB4F)),),
 								    (("Arabic Presentation Forms-A", (0xFB50, 0xFDFF)),),
 								    (("Combining Half Marks", (0xFE20, 0xFE2F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Vertical Forms", (0xFE10, 0xFE1F)),
 								        ("CJK Compatibility Forms", (0xFE30, 0xFE4F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Small Form Variants", (0xFE50, 0xFE6F)),),
 								    (("Arabic Presentation Forms-B", (0xFE70, 0xFEFF)),),
 								    (("Halfwidth And Fullwidth Forms", (0xFF00, 0xFFEF)),),
 								    (("Specials", (0xFFF0, 0xFFFF)),),
 								    (("Tibetan", (0x0F00, 0x0FFF)),),
 								    (("Syriac", (0x0700, 0x074F)),),
 								    (("Thaana", (0x0780, 0x07BF)),),
 								    (("Sinhala", (0x0D80, 0x0DFF)),),
 								    (("Myanmar", (0x1000, 0x109F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Ethiopic", (0x1200, 0x137F)),
 								        ("Ethiopic Supplement", (0x1380, 0x139F)),
 								        ("Ethiopic Extended", (0x2D80, 0x2DDF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Cherokee", (0x13A0, 0x13FF)),),
 								    (("Unified Canadian Aboriginal Syllabics", (0x1400, 0x167F)),),
 								    (("Ogham", (0x1680, 0x169F)),),
 								    (("Runic", (0x16A0, 0x16FF)),),
 								    (("Khmer", (0x1780, 0x17FF)), ("Khmer Symbols", (0x19E0, 0x19FF))),
 								    (("Mongolian", (0x1800, 0x18AF)),),
 								    (("Braille Patterns", (0x2800, 0x28FF)),),
 								    (("Yi Syllables", (0xA000, 0xA48F)), ("Yi Radicals", (0xA490, 0xA4CF))),
 								    (
 								        ("Tagalog", (0x1700, 0x171F)),
 								        ("Hanunoo", (0x1720, 0x173F)),
 								        ("Buhid", (0x1740, 0x175F)),
 								        ("Tagbanwa", (0x1760, 0x177F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Old Italic", (0x10300, 0x1032F)),),
 								    (("Gothic", (0x10330, 0x1034F)),),
 								    (("Deseret", (0x10400, 0x1044F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Byzantine Musical Symbols", (0x1D000, 0x1D0FF)),
 								        ("Musical Symbols", (0x1D100, 0x1D1FF)),
 								        ("Ancient Greek Musical Notation", (0x1D200, 0x1D24F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Mathematical Alphanumeric Symbols", (0x1D400, 0x1D7FF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												Fix "Private Use (plane 15)" range

https://twitter.com/ken_lunde/status/796564061206913024
https://www.microsoft.com/typography/otspec/errata.htm
											
										
										
											2016-11-21 11:26:57 +09:00
+								        ("Private Use (plane 15)", (0xF0000, 0xFFFFD)),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Private Use (plane 16)", (0x100000, 0x10FFFD)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
 								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Variation Selectors", (0xFE00, 0xFE0F)),
 								        ("Variation Selectors Supplement", (0xE0100, 0xE01EF)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Tags", (0xE0000, 0xE007F)),),
 								    (("Limbu", (0x1900, 0x194F)),),
 								    (("Tai Le", (0x1950, 0x197F)),),
 								    (("New Tai Lue", (0x1980, 0x19DF)),),
 								    (("Buginese", (0x1A00, 0x1A1F)),),
 								    (("Glagolitic", (0x2C00, 0x2C5F)),),
 								    (("Tifinagh", (0x2D30, 0x2D7F)),),
 								    (("Yijing Hexagram Symbols", (0x4DC0, 0x4DFF)),),
 								    (("Syloti Nagri", (0xA800, 0xA82F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Linear B Syllabary", (0x10000, 0x1007F)),
 								        ("Linear B Ideograms", (0x10080, 0x100FF)),
 								        ("Aegean Numbers", (0x10100, 0x1013F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Ancient Greek Numbers", (0x10140, 0x1018F)),),
 								    (("Ugaritic", (0x10380, 0x1039F)),),
 								    (("Old Persian", (0x103A0, 0x103DF)),),
 								    (("Shavian", (0x10450, 0x1047F)),),
 								    (("Osmanya", (0x10480, 0x104AF)),),
 								    (("Cypriot Syllabary", (0x10800, 0x1083F)),),
 								    (("Kharoshthi", (0x10A00, 0x10A5F)),),
 								    (("Tai Xuan Jing Symbols", (0x1D300, 0x1D35F)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Cuneiform", (0x12000, 0x123FF)),
 								        ("Cuneiform Numbers and Punctuation", (0x12400, 0x1247F)),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    ),
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    (("Counting Rod Numerals", (0x1D360, 0x1D37F)),),
 								    (("Sundanese", (0x1B80, 0x1BBF)),),
 								    (("Lepcha", (0x1C00, 0x1C4F)),),
 								    (("Ol Chiki", (0x1C50, 0x1C7F)),),
 								    (("Saurashtra", (0xA880, 0xA8DF)),),
 								    (("Kayah Li", (0xA900, 0xA92F)),),
 								    (("Rejang", (0xA930, 0xA95F)),),
 								    (("Cham", (0xAA00, 0xAA5F)),),
 								    (("Ancient Symbols", (0x10190, 0x101CF)),),
 								    (("Phaistos Disc", (0x101D0, 0x101FF)),),
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
+								    (
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								        ("Carian", (0x102A0, 0x102DF)),
 								        ("Lycian", (0x10280, 0x1029F)),
 								        ("Lydian", (0x10920, 0x1093F)),
 								    ),
 								    (("Domino Tiles", (0x1F030, 0x1F09F)), ("Mahjong Tiles", (0x1F000, 0x1F02F))),
 								)
-												Don’t calculate whole sets of unicode codepoints

_getUnicodeRangeSets used to calculate sets containing lots of numbers, only to
get intersections between a set and ranges. Creating and manipulating a lot of
big sets requires a lot of memory.

The function has been replaced by _getUnicodeRanges, returning a list of range
starts boundaries and a list of range stops + corresponding bits.

Tests on intersectUnicodeRanges save about 130 MB (!) of RAM, with no
significant speed penalty.

											
										
										
											2020-06-04 00:33:26 +02:00
# Module-level cache filled on the first call to _getUnicodeRanges().
# _unicodeStarts: sorted start codepoints of every Unicode block.
# _unicodeValues: (stop, bit) pairs in the same order, preceded by a None
# placeholder so that _unicodeValues[i + 1] belongs to _unicodeStarts[i];
# this lets the result of bisect.bisect(_unicodeStarts, code) be used
# directly as an index into _unicodeValues.
_unicodeStarts = []
_unicodeValues = [None]


def _getUnicodeRanges():
    """Return the cached (starts, values) lookup lists for OS2_UNICODE_RANGES.

    The lists are built once, on first use, from every (start, stop) block of
    every bit in OS2_UNICODE_RANGES, ordered by start codepoint. Later calls
    return the same module-level list objects.
    """
    # Already populated by an earlier call: hand back the cached lists.
    if _unicodeStarts:
        return _unicodeStarts, _unicodeValues

    entries = []
    for bit, blocks in enumerate(OS2_UNICODE_RANGES):
        for _name, (start, stop) in blocks:
            entries.append((start, (stop, bit)))
    entries.sort()

    for start, stopAndBit in entries:
        _unicodeStarts.append(start)
        _unicodeValues.append(stopAndBit)
    return _unicodeStarts, _unicodeValues
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
 								def intersectUnicodeRanges(unicodes, inverse=False):
 								    """Intersect a sequence of (int) Unicode codepoints with the Unicode block
 								    ranges defined in the OpenType specification v1.7, and return the set of
 								    'ulUnicodeRanges' bits for which there is at least ONE intersection.
 								    If 'inverse' is True, return the the bits for which there is NO intersection.
-												Blacken code

											
										
										
											2022-12-13 11:26:36 +00:00
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    >>> intersectUnicodeRanges([0x0410]) == {9}
 								    True
 								    >>> intersectUnicodeRanges([0x0410, 0x1F000]) == {9, 57, 122}
 								    True
 								    >>> intersectUnicodeRanges([0x0410, 0x1F000], inverse=True) == (
-												Don’t calculate whole sets of unicode codepoints

_getUnicodeRangeSets used to calculate sets containing lots of numbers, only to
get intersections between a set and ranges. Creating and manipulating a lot of
big sets requires a lot of memory.

The function has been replaced by _getUnicodeRanges, returning a list of range
starts boundaries and a list of range stops + corresponding bits.

Tests on intersectUnicodeRanges save about 130 MB (!) of RAM, with no
significant speed penalty.

											
										
										
											2020-06-04 00:33:26 +02:00
+								    ...     set(range(len(OS2_UNICODE_RANGES))) - {9, 57, 122})
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
+								    True
 								    """
 								    unicodes = set(unicodes)
-												Don’t calculate whole sets of unicode codepoints

_getUnicodeRangeSets used to calculate sets containing lots of numbers, only to
get intersections between a set and ranges. Creating and manipulating a lot of
big sets requires a lot of memory.

The function has been replaced by _getUnicodeRanges, returning a list of range
starts boundaries and a list of range stops + corresponding bits.

Tests on intersectUnicodeRanges save about 130 MB (!) of RAM, with no
significant speed penalty.

											
										
										
											2020-06-04 00:33:26 +02:00
+								    unicodestarts, unicodevalues = _getUnicodeRanges()
 								    bits = set()
 								    for code in unicodes:
 								        stop, bit = unicodevalues[bisect.bisect(unicodestarts, code)]
 								        if code <= stop:
 								            bits.add(bit)
 								    # The spec says that bit 57 ("Non Plane 0") implies that there's
 								    # at least one codepoint beyond the BMP; so I also include all
 								    # the non-BMP codepoints here
 								    if any(0x10000 <= code < 0x110000 for code in unicodes):
 								        bits.add(57)
 								    return set(range(len(OS2_UNICODE_RANGES))) - bits if inverse else bits
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
-												[OS/2] Add recalcCodePageRanges

Ported from the ufo2ft code (which is port from FontForge code), with
some additional functions for parity with recalcUnicodeRanges.

											
										
										
											2023-11-11 01:22:18 +02:00
def calcCodePageRanges(unicodes):
    """Given Unicode codepoints (integers), calculate the corresponding
    OS/2 CodePage range bits.

    'unicodes' may be any iterable of integers (set, list, generator, ...);
    it is converted to a set once before being inspected.

    Returns the set of (int) code page bit numbers that were detected. Each
    bit is keyed on the presence of one marker character, in some cases
    combined with full ASCII coverage and/or line-drawing characters.

    This is a direct translation of FontForge implementation:
    https://github.com/fontforge/fontforge/blob/7b2c074/fontforge/tottf.c#L3158
    """
    # The input is probed many times below (subset test, membership tests and
    # a full iteration). Materializing it as a set keeps those probes O(1) and
    # makes one-shot iterators work instead of being exhausted by the first
    # probe; it also matches what intersectUnicodeRanges does.
    unicodes = set(unicodes)
    bits = set()
    hasAscii = set(range(0x20, 0x7E)).issubset(unicodes)
    hasLineart = ord("┤") in unicodes
    for uni in unicodes:
        if uni == ord("Þ") and hasAscii:
            bits.add(0)  # Latin 1
        elif uni == ord("Ľ") and hasAscii:
            bits.add(1)  # Latin 2: Eastern Europe
            if hasLineart:
                bits.add(58)  # Latin 2
        elif uni == ord("Б"):
            bits.add(2)  # Cyrillic
            if ord("Ѕ") in unicodes and hasLineart:
                bits.add(57)  # IBM Cyrillic
            if ord("╜") in unicodes and hasLineart:
                bits.add(49)  # MS-DOS Russian
        elif uni == ord("Ά"):
            bits.add(3)  # Greek
            if hasLineart and ord("½") in unicodes:
                bits.add(48)  # IBM Greek
            if hasLineart and ord("√") in unicodes:
                bits.add(60)  # Greek, former 437 G
        elif uni == ord("İ") and hasAscii:
            bits.add(4)  # Turkish
            if hasLineart:
                bits.add(56)  # IBM turkish
        elif uni == ord("א"):
            bits.add(5)  # Hebrew
            if hasLineart and ord("√") in unicodes:
                bits.add(53)  # Hebrew
        elif uni == ord("ر"):
            bits.add(6)  # Arabic
            if ord("√") in unicodes:
                bits.add(51)  # Arabic
            if hasLineart:
                bits.add(61)  # Arabic; ASMO 708
        elif uni == ord("ŗ") and hasAscii:
            bits.add(7)  # Windows Baltic
            if hasLineart:
                bits.add(59)  # MS-DOS Baltic
        elif uni == ord("₫") and hasAscii:
            bits.add(8)  # Vietnamese
        elif uni == ord("ๅ"):
            bits.add(16)  # Thai
        elif uni == ord("エ"):
            bits.add(17)  # JIS/Japan
        elif uni == ord("ㄅ"):
            bits.add(18)  # Chinese: Simplified
        elif uni == ord("ㄱ"):
            bits.add(19)  # Korean wansung
        elif uni == ord("央"):
            bits.add(20)  # Chinese: Traditional
        elif uni == ord("곴"):
            bits.add(21)  # Korean Johab
        elif uni == ord("♥") and hasAscii:
            bits.add(30)  # OEM Character Set
        # TODO: Symbol bit has a special meaning (check the spec), we need
        # to confirm if this is wanted by default.
        # elif 0xF000 <= uni <= 0xF0FF:
        #    bits.add(31)  # Symbol Character Set
        elif uni == ord("þ") and hasAscii and hasLineart:
            bits.add(54)  # MS-DOS Icelandic
        elif uni == ord("╚") and hasAscii:
            bits.add(62)  # WE/Latin 1
            bits.add(63)  # US
        elif hasAscii and hasLineart and ord("√") in unicodes:
            if uni == ord("Å"):
                bits.add(50)  # MS-DOS Nordic
            elif uni == ord("é"):
                bits.add(52)  # MS-DOS Canadian French
            elif uni == ord("õ"):
                bits.add(55)  # MS-DOS Portuguese
    # Checked once, outside the loop: this bit depends on a combination of
    # characters rather than on a single marker codepoint.
    if hasAscii and ord("‰") in unicodes and ord("∑") in unicodes:
        bits.add(29)  # Macintosh Character Set (US Roman)
    return bits
-												[OS/2] add Unicode ranges data from OT spec, plus methods to get/set bits manually, or recalc/prune automatically

											
										
										
											2016-01-27 16:27:02 +00:00
if __name__ == "__main__":
    # Run this module's doctests when executed as a script; the process exit
    # status is the number of failed examples (0 means all passed).
    import doctest
    import sys

    failedCount = doctest.testmod().failed
    sys.exit(failedCount)