feat: Support for kerning and ligatures (#873)

## Summary

**What is the goal of this PR?**
Improved typesetting, including
[kerning](https://en.wikipedia.org/wiki/Kerning) and
[ligatures](https://en.wikipedia.org/wiki/Ligature_(writing)#Latin_alphabet).

**What changes are included?**
- The script to convert built-in fonts now adds kerning and ligature
information to the generated font headers.
- The EPUB page layout now applies proper kerning offsets and makes
ligature substitutions according to the selected font.


![3U1B1808](https://github.com/user-attachments/assets/1accb16f-2f1a-41e5-adca-89f1f1348494)

![3U1B1810](https://github.com/user-attachments/assets/2f6bd007-490e-420f-b774-3380b4add7ea)

![3U1B1815](https://github.com/user-attachments/assets/1986bb77-2db0-46e2-a5d6-8315dae9eb19)

## Additional Context

- I am not a typography expert. 
- The implementation has been reworked from the earlier version, so it
is no longer necessary to omit Open Dyslexic, and kerning data now
covers all fonts, styles, and codepoints for which we include bitmap
data.
- Claude Opus 4.6 helped with a lot of this.
- There's an included test epub document with lots of kerning and
ligature examples, shown in the photos.

**_After some time to mature, I think this change is in decent shape to
merge and get people testing._**

After opening this PR I came across #660, which overlaps in adding
ligature support.

---

### AI Usage

While CrossPoint doesn't restrict the use of AI tools in contributions,
please be transparent about their usage, as this
helps set the right context for reviewers.

Did you use AI tools to help write this code? _**YES, Claude Opus 4.6**_

---------

Co-authored-by: Cursor <cursoragent@cursor.com>
This commit is contained in:
Zach Nelson
2026-02-24 02:31:43 -06:00
committed by GitHub
parent 13592db50f
commit 0eb8a9346b
67 changed files with 80729 additions and 36388 deletions

View File

@@ -6,6 +6,7 @@ import re
import math
import argparse
from collections import namedtuple
from fontTools.ttLib import TTFont
# Originally from https://github.com/vroland/epdiy
@@ -106,6 +107,9 @@ intervals = [
# (0xFE30, 0xFE4F),
# # CJK Compatibility Ideographs
# (0xF900, 0xFAFF),
### Alphabetic Presentation Forms (Latin ligatures) ###
# ff, fi, fl, ffi, ffl, long-st, st
(0xFB00, 0xFB06),
### Specials
# Replacement Character
(0xFFFD, 0xFFFD),
@@ -134,7 +138,6 @@ def load_glyph(code_point):
face.load_glyph(glyph_index, load_flags)
return face
face_index += 1
print(f"code point {code_point} ({hex(code_point)}) not found in font stack!", file=sys.stderr)
return None
unmerged_intervals = sorted(intervals + add_ints)
@@ -275,6 +278,375 @@ for index, glyph in enumerate(all_glyphs):
glyph_data.extend([b for b in packed])
glyph_props.append(props)
# --- Kerning pair extraction ---
# Modern fonts store kerning in the OpenType GPOS table, which FreeType's
# get_kerning() does not read. We use fonttools to parse both the legacy
# kern table and the GPOS 'kern' feature (PairPos lookups, including
# Extension wrappers).
# Combining diacritical marks are excluded from kerning below --
# presumably because marks overlay the base glyph rather than advance
# the pen (TODO confirm against the layout code).
COMBINING_MARKS_START = 0x0300
COMBINING_MARKS_END = 0x036F

all_codepoints = [g.code_point for g in glyph_props]
kernable_codepoints = {
    cp for cp in all_codepoints
    if not (COMBINING_MARKS_START <= cp <= COMBINING_MARKS_END)
}

# Resolve each kernable codepoint to the first font in the stack that
# can render it (same priority order load_glyph uses).
cp_to_face_idx = {}
for cp in kernable_codepoints:
    for face_idx, face in enumerate(font_stack):
        if face.get_char_index(cp) > 0:
            cp_to_face_idx[cp] = face_idx
            break

# Invert the mapping: face index -> set of codepoints it serves.
face_idx_cps = {}
for cp, face_idx in cp_to_face_idx.items():
    face_idx_cps.setdefault(face_idx, set()).add(cp)
def _extract_pairpos_subtable(subtable, glyph_to_cp, raw_kern):
"""Extract kerning from a PairPos subtable (Format 1 or 2)."""
if subtable.Format == 1:
# Individual pairs
for i, coverage_glyph in enumerate(subtable.Coverage.glyphs):
if coverage_glyph not in glyph_to_cp:
continue
pair_set = subtable.PairSet[i]
for pvr in pair_set.PairValueRecord:
if pvr.SecondGlyph not in glyph_to_cp:
continue
xa = 0
if hasattr(pvr, 'Value1') and pvr.Value1:
xa = getattr(pvr.Value1, 'XAdvance', 0) or 0
if xa != 0:
key = (coverage_glyph, pvr.SecondGlyph)
raw_kern[key] = raw_kern.get(key, 0) + xa
elif subtable.Format == 2:
# Class-based pairs
class_def1 = subtable.ClassDef1.classDefs if subtable.ClassDef1 else {}
class_def2 = subtable.ClassDef2.classDefs if subtable.ClassDef2 else {}
coverage_set = set(subtable.Coverage.glyphs)
for left_glyph in glyph_to_cp:
if left_glyph not in coverage_set:
continue
c1 = class_def1.get(left_glyph, 0)
if c1 >= len(subtable.Class1Record):
continue
class1_rec = subtable.Class1Record[c1]
for right_glyph in glyph_to_cp:
c2 = class_def2.get(right_glyph, 0)
if c2 >= len(class1_rec.Class2Record):
continue
c2_rec = class1_rec.Class2Record[c2]
xa = 0
if hasattr(c2_rec, 'Value1') and c2_rec.Value1:
xa = getattr(c2_rec.Value1, 'XAdvance', 0) or 0
if xa != 0:
key = (left_glyph, right_glyph)
raw_kern[key] = raw_kern.get(key, 0) + xa
def extract_kerning_fonttools(font_path, codepoints, ppem):
    """Extract kerning pairs for *codepoints* from the font at *font_path*.

    Reads both the legacy 'kern' table and the GPOS 'kern' feature
    (PairPos lookups, including Extension wrappers), which FreeType's
    get_kerning() does not expose.

    Returns {(leftCp, rightCp): adjust} where adjust is an integer pixel
    offset at *ppem*, clamped to the int8_t range [-128, 127]; pairs that
    round to zero are omitted.
    """
    font = TTFont(font_path)
    # Fix: close the font even if table parsing raises, so the file
    # handle is not leaked on malformed input.
    try:
        units_per_em = font['head'].unitsPerEm
        cmap = font.getBestCmap() or {}
        # glyph name -> codepoint, restricted to the requested codepoints.
        glyph_to_cp = {}
        for cp in codepoints:
            gname = cmap.get(cp)
            if gname:
                glyph_to_cp[gname] = cp
        # (left_glyph_name, right_glyph_name) -> value in font design units
        raw_kern = {}
        # 1. Legacy 'kern' table (older TrueType fonts).
        if 'kern' in font:
            for subtable in font['kern'].kernTables:
                if hasattr(subtable, 'kernTable'):
                    for (lg, rg), val in subtable.kernTable.items():
                        if lg in glyph_to_cp and rg in glyph_to_cp:
                            raw_kern[(lg, rg)] = raw_kern.get((lg, rg), 0) + val
        # 2. GPOS 'kern' feature (modern OpenType fonts).
        if 'GPOS' in font:
            gpos = font['GPOS'].table
            kern_lookup_indices = set()
            if gpos.FeatureList:
                for fr in gpos.FeatureList.FeatureRecord:
                    if fr.FeatureTag == 'kern':
                        kern_lookup_indices.update(fr.Feature.LookupListIndex)
            for li in kern_lookup_indices:
                lookup = gpos.LookupList.Lookup[li]
                for st in lookup.SubTable:
                    actual = st
                    # Unwrap Extension (lookup type 9) wrappers.
                    if lookup.LookupType == 9 and hasattr(st, 'ExtSubTable'):
                        actual = st.ExtSubTable
                    if hasattr(actual, 'Format'):
                        _extract_pairpos_subtable(actual, glyph_to_cp, raw_kern)
    finally:
        font.close()
    # Scale design-unit values to integer pixels at the target ppem.
    scale = ppem / units_per_em
    result = {}  # (leftCp, rightCp) -> pixel adjust
    for (lg, rg), du in raw_kern.items():
        adjust = int(math.floor(du * scale))
        if adjust != 0:
            # Clamp to int8_t so each matrix cell fits in one byte.
            adjust = max(-128, min(127, adjust))
            result[(glyph_to_cp[lg], glyph_to_cp[rg])] = adjust
    return result
# The existing glyph rasterization calls
#   face.set_char_size(size << 6, size << 6, 150, 150)
# i.e. `size` points at 150 DPI, giving ppem = size * 150 / 72.
ppem = size * 150.0 / 72.0

# Merge kerning pairs from each font in the stack, for the codepoints
# that font serves.
kern_map = {}  # (leftCp, rightCp) -> adjust
for face_idx, cps in face_idx_cps.items():
    kern_map.update(
        extract_kerning_fonttools(args.fontstack[face_idx], cps, ppem))
print(f"kerning: {len(kern_map)} pairs extracted", file=sys.stderr)
# --- Derive class-based kerning from pairs ---
# Collapse the sparse (left, right) pair map into class-based form (the
# same idea as GPOS PairPos Format 2): left codepoints with identical
# adjustment rows share one class, right codepoints with identical
# columns share one class, and a small classCount x classCount matrix
# holds the adjustments.  Class ids start at 1.
# NOTE(review): leading indentation was lost when this chunk was
# extracted; everything from `all_left_cps` onward presumably nests
# under `if kern_map:` -- confirm against the original file.
kern_left_classes = [] # list of (codepoint, classId)
kern_right_classes = [] # list of (codepoint, classId)
kern_matrix = [] # flat list of int8_t values
kern_left_class_count = 0
kern_right_class_count = 0
if kern_map:
all_left_cps = {lcp for lcp, _ in kern_map}
all_right_cps = {rcp for _, rcp in kern_map}
sorted_right_cps = sorted(all_right_cps)
sorted_left_cps = sorted(all_left_cps)
# Group left codepoints by identical adjustment row
left_profile_to_class = {}
left_class_map = {}
left_class_id = 1
for lcp in sorted(all_left_cps):
# Row profile: this codepoint's adjustment against every right
# codepoint (0 where no pair exists).
row = tuple(kern_map.get((lcp, rcp), 0) for rcp in sorted_right_cps)
if row not in left_profile_to_class:
left_profile_to_class[row] = left_class_id
left_class_id += 1
left_class_map[lcp] = left_profile_to_class[row]
# Group right codepoints by identical adjustment column
right_profile_to_class = {}
right_class_map = {}
right_class_id = 1
for rcp in sorted(all_right_cps):
col = tuple(kern_map.get((lcp, rcp), 0) for lcp in sorted_left_cps)
if col not in right_profile_to_class:
right_profile_to_class[col] = right_class_id
right_class_id += 1
right_class_map[rcp] = right_profile_to_class[col]
kern_left_class_count = left_class_id - 1
kern_right_class_count = right_class_id - 1
# Class ids are stored as uint8_t in the generated header; warn (but
# still emit) if a font ever exceeds that.
if kern_left_class_count > 255 or kern_right_class_count > 255:
print(f"WARNING: kerning class count exceeds uint8_t range "
f"(left={kern_left_class_count}, right={kern_right_class_count})",
file=sys.stderr)
# Build the class x class matrix (row-major: left class, then right)
kern_matrix = [0] * (kern_left_class_count * kern_right_class_count)
for (lcp, rcp), adjust in kern_map.items():
lc = left_class_map[lcp] - 1
rc = right_class_map[rcp] - 1
kern_matrix[lc * kern_right_class_count + rc] = adjust
# Build sorted class entry lists for the generated header
kern_left_classes = sorted(left_class_map.items())
kern_right_classes = sorted(right_class_map.items())
matrix_size = kern_left_class_count * kern_right_class_count
# presumably 3 bytes per class entry in the C layout -- TODO confirm
entries_size = (len(kern_left_classes) + len(kern_right_classes)) * 3
print(f"kerning: {kern_left_class_count} left classes, {kern_right_class_count} right classes, "
f"{matrix_size + entries_size} bytes", file=sys.stderr)
# --- Ligature pair extraction ---
# Parse the OpenType GSUB table for LigatureSubst (type 4) lookups.
# Multi-character ligatures (3+ codepoints) are decomposed into chained
# pairs when an intermediate ligature exists (e.g., ffi = ff + i where ff
# is itself a ligature). Only pairs where both input codepoints and the
# output codepoint are in the generated glyph set are included.
# Set form of the emitted codepoints, for O(1) membership tests below.
all_codepoints_set = set(all_codepoints)
# Standard Unicode ligature codepoints for known input sequences.
# Used as a fallback when the GSUB substitute glyph has no cmap entry.
# Keys are input codepoint sequences; values are codepoints from the
# U+FB00 Alphabetic Presentation Forms block.
STANDARD_LIGATURE_MAP = {
(0x66, 0x66): 0xFB00, # ff
(0x66, 0x69): 0xFB01, # fi
(0x66, 0x6C): 0xFB02, # fl
(0x66, 0x66, 0x69): 0xFB03, # ffi
(0x66, 0x66, 0x6C): 0xFB04, # ffl
(0x17F, 0x74): 0xFB05, # long-s + t
(0x73, 0x74): 0xFB06, # st
}
def extract_ligatures_fonttools(font_path, codepoints):
"""Extract ligature substitution pairs from a font file using fonttools.
Returns a list of (packed_pair, ligature_codepoint) for the given
codepoints, where packed_pair is (firstCp << 16) | secondCp.
Multi-character ligatures are decomposed into chained pairs.
"""
# NOTE(review): leading indentation was lost when this chunk was
# extracted; the nesting below must be confirmed against the original
# file before editing.
font = TTFont(font_path)
cmap = font.getBestCmap() or {}
# Build glyph_name -> codepoint and codepoint -> glyph_name maps
glyph_to_cp = {}
cp_to_glyph = {}
for cp, gname in cmap.items():
glyph_to_cp[gname] = cp
# NOTE(review): cp_to_glyph is built but never read in this function.
cp_to_glyph[cp] = gname
# Collect raw ligature rules: (sequence_of_codepoints) -> ligature_codepoint
raw_ligatures = {} # tuple of codepoints -> ligature codepoint
if 'GSUB' in font:
gsub = font['GSUB'].table
# Find lookup indices for ligature features.
# Currently extracts 'liga' (standard) and 'rlig' (required) only.
# To also extract discretionary or historical ligatures, add:
# 'dlig' - Discretionary Ligatures (e.g., ft, st in Bookerly)
# 'hlig' - Historical Ligatures (e.g., long-s+t in OpenDyslexic)
# These are off by default in standard text renderers.
LIGATURE_FEATURES = ('liga', 'rlig')
liga_lookup_indices = set()
if gsub.FeatureList:
for fr in gsub.FeatureList.FeatureRecord:
if fr.FeatureTag in LIGATURE_FEATURES:
liga_lookup_indices.update(fr.Feature.LookupListIndex)
for li in liga_lookup_indices:
lookup = gsub.LookupList.Lookup[li]
for st in lookup.SubTable:
actual = st
# Unwrap Extension (lookup type 7) wrappers
if lookup.LookupType == 7 and hasattr(st, 'ExtSubTable'):
actual = st.ExtSubTable
# LigatureSubst is lookup type 4; detected duck-typed via the
# `ligatures` attribute rather than the lookup type number.
if not hasattr(actual, 'ligatures'):
continue
for first_glyph, ligature_list in actual.ligatures.items():
if first_glyph not in glyph_to_cp:
continue
first_cp = glyph_to_cp[first_glyph]
for lig in ligature_list:
# lig.Component is a list of subsequent glyph names
# lig.LigGlyph is the substitute glyph name
component_cps = []
valid = True
for comp_glyph in lig.Component:
if comp_glyph not in glyph_to_cp:
valid = False
break
component_cps.append(glyph_to_cp[comp_glyph])
if not valid:
continue
seq = tuple([first_cp] + component_cps)
# Prefer the substitute glyph's own codepoint; fall back to
# the standard U+FBxx codepoint for known sequences.
if lig.LigGlyph in glyph_to_cp:
lig_cp = glyph_to_cp[lig.LigGlyph]
elif seq in STANDARD_LIGATURE_MAP:
lig_cp = STANDARD_LIGATURE_MAP[seq]
else:
seq_str = ', '.join(f'U+{cp:04X}' for cp in seq)
print(f"ligatures: WARNING: dropping ligature ({seq_str}) -> "
f"glyph '{lig.LigGlyph}': output glyph has no cmap entry "
f"and input sequence is not in STANDARD_LIGATURE_MAP",
file=sys.stderr)
continue
raw_ligatures[seq] = lig_cp
# NOTE(review): close() is not reached if parsing above raises --
# consider try/finally, matching extract_kerning_fonttools.
font.close()
# Filter: only keep ligatures where all input and output codepoints are
# in our generated glyph set
filtered = {}
for seq, lig_cp in raw_ligatures.items():
if lig_cp not in codepoints and lig_cp not in all_codepoints_set:
continue
if all(cp in codepoints for cp in seq):
filtered[seq] = lig_cp
# Decompose into chained pairs
# For 2-codepoint sequences: direct pair (a, b) -> lig
# For 3+ codepoint sequences: chain through intermediates
# e.g., (f, f, i) -> ffi requires (f, f) -> ff to exist,
# then we add (ff, i) -> ffi
pairs = []
# First pass: collect all 2-codepoint ligatures
two_char = {seq: lig_cp for seq, lig_cp in filtered.items() if len(seq) == 2}
for seq, lig_cp in two_char.items():
# Pack both 16-bit codepoints into one 32-bit lookup key.
packed = (seq[0] << 16) | seq[1]
pairs.append((packed, lig_cp))
# Second pass: decompose 3+ codepoint ligatures into chained pairs
for seq, lig_cp in filtered.items():
if len(seq) < 3:
continue
# Try to find an intermediate: check if the first N-1 codepoints
# form a known ligature, then chain (intermediate, last) -> lig
prefix = seq[:-1]
last_cp = seq[-1]
if prefix in filtered:
intermediate_cp = filtered[prefix]
packed = (intermediate_cp << 16) | last_cp
pairs.append((packed, lig_cp))
else:
print(f"ligatures: skipping {len(seq)}-char ligature "
f"({', '.join(f'U+{cp:04X}' for cp in seq)}) -> U+{lig_cp:04X}: "
f"no intermediate ligature for prefix", file=sys.stderr)
return pairs
# Ligature inputs: every emitted codepoint except combining marks
# (same filter used for kerning above).
ligature_codepoints = {
    cp for cp in all_codepoints
    if not (COMBINING_MARKS_START <= cp <= COMBINING_MARKS_END)
}

# Resolve each codepoint to the first font in the stack that covers it,
# then bucket codepoints per font file.
lig_cp_to_face_idx = {}
for cp in ligature_codepoints:
    for face_idx, face in enumerate(font_stack):
        if face.get_char_index(cp) > 0:
            lig_cp_to_face_idx[cp] = face_idx
            break

lig_face_idx_cps = {}
for cp, face_idx in lig_cp_to_face_idx.items():
    lig_face_idx_cps.setdefault(face_idx, set()).add(cp)

# Pull ligature substitution rules from each font for its codepoints.
ligature_pairs = []
for face_idx, cps in lig_face_idx_cps.items():
    ligature_pairs.extend(
        extract_ligatures_fonttools(args.fontstack[face_idx], cps))

# Deduplicate on the packed input pair, keeping the first occurrence,
# then sort by the packed key.
first_seen = {}
for packed, lig_cp in ligature_pairs:
    first_seen.setdefault(packed, lig_cp)
ligature_pairs = sorted(first_seen.items())
print(f"ligatures: {len(ligature_pairs)} pairs extracted", file=sys.stderr)
compress = args.compress
# Build groups for compression
@@ -294,6 +666,7 @@ if compress:
(0x20A0, 0x20CF), # Currency Symbols
(0x2190, 0x21FF), # Arrows
(0x2200, 0x22FF), # Math Operators
(0xFB00, 0xFB06), # Alphabetic Presentation Forms (ligatures)
(0xFFFD, 0xFFFD), # Replacement Character
]
@@ -385,9 +758,14 @@ else:
print (" " + " ".join(f"0x{b:02X}," for b in c))
print ("};\n");
def cp_label(cp):
    """Return a short human-readable label for *cp* in generated C comments."""
    if cp == 0x5C:
        # Spelled out -- presumably to keep a raw backslash out of the
        # emitted C comment text (TODO confirm the original motivation).
        return '<backslash>'
    if 0x20 < cp < 0x7F:
        return chr(cp)
    return f'U+{cp:04X}'
# Emit the glyph property table.
# Fix: the rendered diff retained both the pre-change print (using a raw
# chr()/backslash check) and the post-change print (using cp_label);
# keeping both would emit every glyph row twice.  Only the cp_label
# version is intended.
print(f"static const EpdGlyph {font_name}Glyphs[] = {{")
for g in glyph_props:
    # g[:-1] drops the final field from the struct body (presumably the
    # codepoint, which appears only in the trailing comment -- confirm).
    print(" { " + ", ".join([f"{a}" for a in list(g[:-1])]), "},",
          f"// {cp_label(g.code_point)}")
print("};\n")
print(f"static const EpdUnicodeInterval {font_name}Intervals[] = {{")
@@ -405,6 +783,30 @@ if compress:
compressed_offset += len(compressed)
print("};\n")
# Emit the kerning class tables and matrix, and the ligature pair table,
# only when data was extracted; the EpdFontData fields fall back to
# nullptr/0 otherwise.
# NOTE(review): leading indentation was lost in extraction; the print
# calls presumably nest under their respective `if`/`for` -- confirm.
if kern_map:
print(f"static const EpdKernClassEntry {font_name}KernLeftClasses[] = {{")
for cp, cls in kern_left_classes:
print(f" {{ 0x{cp:04X}, {cls} }}, // {cp_label(cp)}")
print("};\n")
print(f"static const EpdKernClassEntry {font_name}KernRightClasses[] = {{")
for cp, cls in kern_right_classes:
print(f" {{ 0x{cp:04X}, {cls} }}, // {cp_label(cp)}")
print("};\n")
# Matrix is emitted row-major: one line per left class, columns are
# right classes (matches the lc * kern_right_class_count + rc fill).
print(f"static const int8_t {font_name}KernMatrix[] = {{")
for row in range(kern_left_class_count):
row_start = row * kern_right_class_count
row_vals = kern_matrix[row_start:row_start + kern_right_class_count]
print(" " + ", ".join(f"{v:4d}" for v in row_vals) + ",")
print("};\n")
if ligature_pairs:
print(f"static const EpdLigaturePair {font_name}LigaturePairs[] = {{")
for packed_pair, lig_cp in ligature_pairs:
# packed_pair holds (firstCp << 16) | secondCp.
print(f" {{ 0x{packed_pair:08X}, 0x{lig_cp:04X} }}, // {cp_label(packed_pair >> 16)} {cp_label(packed_pair & 0xFFFF)} -> {cp_label(lig_cp)}")
print("};\n")
print(f"static const EpdFontData {font_name} = {{")
print(f" {font_name}Bitmaps,")
print(f" {font_name}Glyphs,")
@@ -420,4 +822,26 @@ if compress:
else:
print(f" nullptr,")
print(f" 0,")
# Kerning fields of the EpdFontData initializer: the two class-entry
# arrays, the matrix, both entry counts, and both class counts -- or
# seven nullptr/0 placeholders when no kerning was extracted.
# NOTE(review): leading indentation was lost in extraction; each print
# presumably nests under its if/else branch -- confirm.
if kern_map:
print(f" {font_name}KernLeftClasses,")
print(f" {font_name}KernRightClasses,")
print(f" {font_name}KernMatrix,")
print(f" {len(kern_left_classes)},")
print(f" {len(kern_right_classes)},")
print(f" {kern_left_class_count},")
print(f" {kern_right_class_count},")
else:
print(f" nullptr,")
print(f" nullptr,")
print(f" nullptr,")
print(f" 0,")
print(f" 0,")
print(f" 0,")
print(f" 0,")
# Ligature fields: pair table pointer and pair count.
if ligature_pairs:
print(f" {font_name}LigaturePairs,")
print(f" {len(ligature_pairs)},")
else:
print(f" nullptr,")
print(f" 0,")
print("};")