From 02eb6606d7dfb8ad1d4dbdcad3badebc37a8dc49 Mon Sep 17 00:00:00 2001 From: Behdad Esfahbod Date: Fri, 10 Jun 2022 17:10:42 -0600 Subject: [PATCH] [indic-generator] Remove redundant PLACEHOLDER characters overrides https://github.com/harfbuzz/harfbuzz/pull/3648#discussion_r894631922 --- src/gen-indic-table.py | 58 ++++++++++++++++++++---------------------- 1 file changed, 28 insertions(+), 30 deletions(-) diff --git a/src/gen-indic-table.py b/src/gen-indic-table.py index 3edcb758a..d9c0d6c69 100755 --- a/src/gen-indic-table.py +++ b/src/gen-indic-table.py @@ -146,6 +146,34 @@ position_map = { category_overrides = { + # These are the variation-selectors. They only appear in the Myanmar grammar + # but are not Myanmar-specific + 0xFE00: 'VS', + 0xFE01: 'VS', + 0xFE02: 'VS', + 0xFE03: 'VS', + 0xFE04: 'VS', + 0xFE05: 'VS', + 0xFE06: 'VS', + 0xFE07: 'VS', + 0xFE08: 'VS', + 0xFE09: 'VS', + 0xFE0A: 'VS', + 0xFE0B: 'VS', + 0xFE0C: 'VS', + 0xFE0D: 'VS', + 0xFE0E: 'VS', + 0xFE0F: 'VS', + + # These appear in the OT Myanmar spec, but are not Myanmar-specific + 0x2015: 'PLACEHOLDER', + 0x2022: 'PLACEHOLDER', + 0x25FB: 'PLACEHOLDER', + 0x25FC: 'PLACEHOLDER', + 0x25FD: 'PLACEHOLDER', + 0x25FE: 'PLACEHOLDER', + + # Indic 0x0930: 'Ra', # Devanagari @@ -247,38 +275,8 @@ category_overrides = { # https://docs.microsoft.com/en-us/typography/script-development/myanmar#analyze - 0xFE00: 'VS', - 0xFE01: 'VS', - 0xFE02: 'VS', - 0xFE03: 'VS', - 0xFE04: 'VS', - 0xFE05: 'VS', - 0xFE06: 'VS', - 0xFE07: 'VS', - 0xFE08: 'VS', - 0xFE09: 'VS', - 0xFE0A: 'VS', - 0xFE0B: 'VS', - 0xFE0C: 'VS', - 0xFE0D: 'VS', - 0xFE0E: 'VS', - 0xFE0F: 'VS', - 0x104E: 'C', # The spec says C, IndicSyllableCategory says Consonant_Placeholder - 0x002D: 'PLACEHOLDER', - 0x00A0: 'PLACEHOLDER', - 0x00D7: 'PLACEHOLDER', - 0x2012: 'PLACEHOLDER', - 0x2013: 'PLACEHOLDER', - 0x2014: 'PLACEHOLDER', - 0x2015: 'PLACEHOLDER', - 0x2022: 'PLACEHOLDER', - 0x25FB: 'PLACEHOLDER', - 0x25FC: 'PLACEHOLDER', - 0x25FD: 'PLACEHOLDER', - 
0x25FE: 'PLACEHOLDER', - 0x1004: 'Ra', 0x101B: 'Ra', 0x105A: 'Ra',