[USE] Add CGJ to table

This commit is contained in:
Behdad Esfahbod 2015-07-21 11:57:23 +01:00
parent 4febed61ed
commit ba72801325
2 changed files with 11 additions and 3 deletions

View File

@ -39,8 +39,12 @@ for i, f in enumerate (files):
data[i][u] = t data[i][u] = t
values[i][t] = values[i].get (t, 0) + end - start + 1 values[i][t] = values[i].get (t, 0) + end - start + 1
# Merge data into one dict:
defaults = ('Other', 'Not_Applicable', 'Cn', 'No_Block') defaults = ('Other', 'Not_Applicable', 'Cn', 'No_Block')
# TODO CGJ is not in Unicode Indic files, but used in USE
data[0][0x034F] = defaults[0]
# Merge data into one dict:
for i,v in enumerate (defaults): for i,v in enumerate (defaults):
values[i][v] = values[i].get (v, 0) + 1 values[i][v] = values[i].get (v, 0) + 1
combined = {} combined = {}
@ -180,7 +184,10 @@ def is_Word_Joiner(U, UISC, UGC):
return U == 0x2060 return U == 0x2060
def is_OTHER(U, UISC, UGC): def is_OTHER(U, UISC, UGC):
#SPEC-OUTDATED return UGC == Zs # or any other SCRIPT_COMMON characters #SPEC-OUTDATED return UGC == Zs # or any other SCRIPT_COMMON characters
return UISC == Other and not is_SYM_MOD(U, UISC, UGC) return (UISC == Other
and not is_SYM_MOD(U, UISC, UGC)
and not is_CGJ(U, UISC, UGC)
)
def is_Reserved(U, UISC, UGC): def is_Reserved(U, UISC, UGC):
return UGC == 'Cn' return UGC == 'Cn'
def is_REPHA(U, UISC, UGC): def is_REPHA(U, UISC, UGC):
@ -325,7 +332,7 @@ data = map_to_use(data)
# Remove the outliers # Remove the outliers
singles = {} singles = {}
for u in [0x25CC, 0x1107F]: for u in [0x034F, 0x25CC, 0x1107F]:
singles[u] = data[u] singles[u] = data[u]
del data[u] del data[u]

View File

@ -640,6 +640,7 @@ hb_use_get_categories (hb_codepoint_t u)
if (hb_in_range (u, 0x0028u, 0x003Fu)) return use_table[u - 0x0028u + use_offset_0x0028u]; if (hb_in_range (u, 0x0028u, 0x003Fu)) return use_table[u - 0x0028u + use_offset_0x0028u];
if (hb_in_range (u, 0x00A0u, 0x00D7u)) return use_table[u - 0x00A0u + use_offset_0x00a0u]; if (hb_in_range (u, 0x00A0u, 0x00D7u)) return use_table[u - 0x00A0u + use_offset_0x00a0u];
if (hb_in_range (u, 0x0900u, 0x0DF7u)) return use_table[u - 0x0900u + use_offset_0x0900u]; if (hb_in_range (u, 0x0900u, 0x0DF7u)) return use_table[u - 0x0900u + use_offset_0x0900u];
if (unlikely (u == 0x034Fu)) return USE_CGJ;
break; break;
case 0x1u: case 0x1u: