Blame - tools/fonts/fontchain_linter.py - android_frameworks_base

2016-03-09 23:08:45 -0800

[diff] [blame]

1

#!/usr/bin/env python

2

3

import collections

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

4

import copy

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

5

import glob

6

from os import path

Seigo Nonaka

2021-04-16 00:11:43 -0700

[diff] [blame]

7

import re

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

8

import sys

9

from xml.etree import ElementTree

10

11

from fontTools import ttLib

12

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

13

EMOJI_VS = 0xFE0F

14

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

15

LANG_TO_SCRIPT = {

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

16

'af': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

17

'as': 'Beng',

Calvin Pan

2021-12-06 21:42:12 +0800

[diff] [blame]

18

'am': 'Latn',

Roozbeh Pournader

7e04dd1

2017-10-13 17:41:31 -0700

[diff] [blame]

19

'be': 'Cyrl',

Roozbeh Pournader

033b222

2017-02-22 18:53:39 -0800

[diff] [blame]

20

'bg': 'Cyrl',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

21

'bn': 'Beng',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

22

'cs': 'Latn',

Roozbeh Pournader

033b222

2017-02-22 18:53:39 -0800

[diff] [blame]

23

'cu': 'Cyrl',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

24

'cy': 'Latn',

25

'da': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

26

'de': 'Latn',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

27

'el': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

28

'en': 'Latn',

29

'es': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

30

'et': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

31

'eu': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

32

'fr': 'Latn',

33

'ga': 'Latn',

Calvin Pan

2021-12-06 21:42:12 +0800

[diff] [blame]

34

'gl': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

35

'gu': 'Gujr',

36

'hi': 'Deva',

37

'hr': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

38

'hu': 'Latn',

39

'hy': 'Armn',

Calvin Pan

2021-12-06 21:42:12 +0800

[diff] [blame]

40

'it': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

41

'ja': 'Jpan',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

42

'ka': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

43

'kn': 'Knda',

44

'ko': 'Kore',

Roozbeh Pournader

7e04dd1

2017-10-13 17:41:31 -0700

[diff] [blame]

45

'la': 'Latn',

Calvin Pan

2021-12-06 21:42:12 +0800

[diff] [blame]

46

'lt': 'Latn',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

47

'lv': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

48

'ml': 'Mlym',

49

'mn': 'Cyrl',

50

'mr': 'Deva',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

51

'nb': 'Latn',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

52

'nl': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

53

'nn': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

54

'or': 'Orya',

55

'pa': 'Guru',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

56

'pt': 'Latn',

Calvin Pan

13c70d6

2022-01-21 16:42:18 +0800

[diff] [blame]

57

'ru': 'Latn',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

58

'sk': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

59

'sl': 'Latn',

Calvin Pan

2021-12-14 18:50:31 +0800

[diff] [blame]

60

'sq': 'Latn',

Calvin Pan

1e966a3

2022-01-12 16:12:38 +0800

[diff] [blame]

61

'sv': 'Latn',

Jungshik Shin

2016-03-19 09:32:34 -0700

[diff] [blame]

62

'ta': 'Taml',

63

'te': 'Telu',

64

'tk': 'Latn',

Calvin Pan

2021-12-06 21:42:12 +0800

[diff] [blame]

65

'uk': 'Latn',

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

66

}

67

68

def lang_to_script(lang_code):
    """Return the script code for a hyphen-separated language tag.

    The lower-cased tag is looked up in LANG_TO_SCRIPT. On a miss the last
    hyphen-separated subtag is inspected: a four-letter alphabetic subtag is
    taken to be the script itself and is returned title-cased; any other
    subtag is dropped and the shorter tag is looked up again.

    Fails an assertion when the tag is unknown and has no subtag left to drop.
    """
    tag = lang_code.lower()
    while True:
        if tag in LANG_TO_SCRIPT:
            return LANG_TO_SCRIPT[tag]
        cut = tag.rfind('-')
        assert cut != -1, (
            'We do not know what script the "%s" language is written in.'
            % lang_code)
        last_subtag = tag[cut+1:]
        if last_subtag.isalpha() and len(last_subtag) == 4:
            # This is actually the script
            return last_subtag.title()
        tag = tag[:cut]

81

82

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

83

def printable(inp):
    """Format a code point, a sequence, or a set of them for error messages.

    A set is rendered as '{a, b}', a tuple (character sequence) as '<a, b>',
    and anything else as a single 'U+XXXX' code point.
    """
    kind = type(inp)
    if kind is set:  # set of character sequences
        members = [printable(seq) for seq in inp]
        return '{%s}' % ', '.join(members)
    if kind is tuple:  # character sequence
        members = [printable(ch) for ch in inp]
        return '<%s>' % ', '.join(members)
    # single character
    return 'U+%04X' % inp

90

91

92

def open_font(font):
    """Open a font with fontTools.

    Args:
        font: a (file name, index) pair. The file name is resolved against
            the module-level _fonts_dir; a non-None index is passed to
            ttLib.TTFont as fontNumber.

    Returns:
        The opened ttLib.TTFont.
    """
    file_name, face_index = font
    full_path = path.join(_fonts_dir, file_name)
    if face_index is None:
        return ttLib.TTFont(full_path)
    return ttLib.TTFont(full_path, fontNumber=face_index)

99

100

101

def get_best_cmap(font):
    """Return the code point -> glyph name mapping of the font's best cmap.

    The UCS-4 subtable (format 12, platform 3, encoding 10) is preferred;
    the BMP subtable (format 4, platform 3, encoding 1) is the fallback.

    Args:
        font: a (file name, index) pair as accepted by open_font.

    Fails an assertion if either kind of subtable appears more than once, or
    if the font has neither of them.
    """
    ttfont = open_font(font)
    all_unicode_cmap = None
    bmp_cmap = None
    for cmap in ttfont['cmap'].tables:
        specifier = (cmap.format, cmap.platformID, cmap.platEncID)
        if specifier == (4, 3, 1):
            assert bmp_cmap is None, 'More than one BMP cmap in %s' % (font, )
            bmp_cmap = cmap
        elif specifier == (12, 3, 10):
            assert all_unicode_cmap is None, (
                'More than one UCS-4 cmap in %s' % (font, ))
            all_unicode_cmap = cmap

    best = all_unicode_cmap if all_unicode_cmap else bmp_cmap
    # Without this check a font lacking both subtables would surface as an
    # unexplained AttributeError on None.
    assert best is not None, (
        'Neither a UCS-4 nor a BMP cmap was found in %s' % (font, ))
    return best.cmap

116

117

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

118

def get_variation_sequences_cmap(font):
    """Return the font's variation-sequence cmap subtable, or None.

    The subtable looked for is format 14, platform 0, encoding 5. Fails an
    assertion if the font carries more than one of them.
    """
    found = None
    for subtable in open_font(font)['cmap'].tables:
        key = (subtable.format, subtable.platformID, subtable.platEncID)
        if key != (14, 0, 5):
            continue
        assert found is None, 'More than one VS cmap in %s' % (font, )
        found = subtable
    return found

def get_emoji_map(font):
    """Build a mapping from characters and sequences to glyph names.

    Keys are single code points (from the best cmap), (base, variation
    selector) pairs (from the variation-sequence cmap, when present) and
    tuples of code points (from GSUB ligature lookups). Values are glyph
    names.

    Args:
        font: a (file name, index) pair as accepted by open_font.
    """
    # Add normal characters
    emoji_map = copy.copy(get_best_cmap(font))
    # Glyph name -> code point, ignoring PUA code points, used to turn the
    # glyph sequences of ligature rules back into character sequences.
    reverse_cmap = {}
    for code, glyph_name in emoji_map.items():
        if not contains_pua(code):
            reverse_cmap[glyph_name] = code

    # Add variation sequences
    vs_cmap = get_variation_sequences_cmap(font)
    if vs_cmap:
        for selector, entries in vs_cmap.uvsDict.items():
            for base, glyph_name in entries:
                # A None glyph means the sequence uses the base character's
                # own glyph.
                emoji_map[(base, selector)] = (
                    emoji_map[base] if glyph_name is None else glyph_name)

    # Add GSUB rules
    gsub_lookups = open_font(font)['GSUB'].table.LookupList.Lookup
    for lookup in gsub_lookups:
        if lookup.LookupType != 4:
            # Other lookups are used in the emoji font for fallback.
            # We ignore them for now.
            continue
        for subtable in lookup.SubTable:
            for first_glyph, ligature_list in subtable.ligatures.items():
                for ligature in ligature_list:
                    glyph_names = [first_glyph] + ligature.Component
                    sequence = tuple(reverse_cmap[g] for g in glyph_names)
                    # Make sure no starting subsequence of 'sequence' has been
                    # seen before.
                    for prefix_len in range(2, len(sequence)+1):
                        assert sequence[:prefix_len] not in emoji_map
                    emoji_map[sequence] = ligature.LigGlyph

    return emoji_map

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

168

def assert_font_supports_any_of_chars(font, chars):
    """Exit the program unless the font's best cmap has one of the chars."""
    cmap = get_best_cmap(font)
    if any(char in cmap for char in chars):
        return
    sys.exit('None of characters in %s were found in %s' % (chars, font))

174

175

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

176

def assert_font_supports_all_of_chars(font, chars):
    """Assert that every code point in chars is in the font's best cmap."""
    cmap = get_best_cmap(font)
    for codepoint in chars:
        is_covered = codepoint in cmap
        assert is_covered, (
            'U+%04X was not found in %s' % (codepoint, font))

181

182

Seigo Nonaka

2017-07-05 16:06:23 -0700

[diff] [blame]

183

def assert_font_supports_none_of_chars(font, chars, fallbackName):
    """Assert that no code point in chars is in the font's best cmap.

    Args:
        font: a (file name, index) pair as accepted by open_font.
        chars: iterable of code points that must be absent.
        fallbackName: name of the fallback chain being checked; when given
            it is included in the failure message.
    """
    best_cmap = get_best_cmap(font)
    for char in chars:
        # The fallback name is only worth reporting when there is one; the
        # two messages used to be attached to the opposite branches.
        if fallbackName:
            assert char not in best_cmap, (
                'U+%04X was found in %s in fallback %s' % (char, font, fallbackName))
        else:
            assert char not in best_cmap, 'U+%04X was found in %s' % (char, font)

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

191

192

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

193

def assert_font_supports_all_sequences(font, sequences):
    """Assert that the font lists every (base, variation selector) pair.

    A pair counts as supported when the variation-sequence cmap has an entry
    (base, None) under the selector.

    Args:
        font: a (file name, index) pair as accepted by open_font.
        sequences: iterable of (base, variation selector) pairs.
    """
    vs_cmap = get_variation_sequences_cmap(font)
    # get_variation_sequences_cmap returns None when the font has no such
    # subtable; report that instead of failing on None.uvsDict.
    assert vs_cmap is not None, (
        'No variation sequences cmap was found in %s' % (font, ))
    vs_dict = vs_cmap.uvsDict
    for base, vs in sorted(sequences):
        assert vs in vs_dict and (base, None) in vs_dict[vs], (
            '<U+%04X, U+%04X> was not found in %s' % (base, vs, font))

198

199

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

200

def check_hyphens(hyphens_dir):
    """Check that fonts for every hyphenated script contain a hyphen.

    The scripts are derived from the language codes in the names of the
    'hyph-*.hyb' files found in hyphens_dir. Every font registered for such
    a script in _script_to_font_map must support U+002D or U+2010.
    """
    # Find all the scripts that need automatic hyphenation
    scripts = set()
    pattern = path.join(hyphens_dir, '*.hyb')
    for hyb_path in glob.iglob(pattern):
        file_name = path.basename(hyb_path)
        assert file_name.startswith('hyph-'), (
            'Unknown hyphenation file %s' % file_name)
        # The language code sits between the first hyphen and the first dot.
        code_start = file_name.index('-') + 1
        code_end = file_name.index('.')
        scripts.add(lang_to_script(file_name[code_start:code_end]))

    HYPHENS = {0x002D, 0x2010}
    for script in scripts:
        fonts = _script_to_font_map[script]
        assert fonts, 'No fonts found for the "%s" script' % script
        for font in fonts:
            assert_font_supports_any_of_chars(font, HYPHENS)

216

217

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

218

class FontRecord(object):
    """Plain record describing one font entry of the font configuration."""

    def __init__(self, name, psName, scripts, variant, weight, style, fallback_for, font):
        # The font itself, as a (file name, index) pair.
        self.font = font
        self.psName = psName

        # Family-level attributes.
        self.name = name
        self.variant = variant
        self.scripts = scripts

        # Font-level attributes.
        self.weight = weight
        self.style = style
        self.fallback_for = fallback_for

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

230

def parse_fonts_xml(fonts_xml_path):
    """Parse the fonts XML file and (re)build the module-level font tables.

    Populates three globals:
      _script_to_font_map: script code -> set of (font file, index) pairs.
      _fallback_chains: family name -> ordered list of FontRecord.
      _all_fonts: list of every FontRecord, in document order.

    The families are walked twice: the first pass validates family
    attributes and registers every named family as a fallback chain, so that
    the second pass can resolve 'fallbackFor' references regardless of
    document order. Families marked ignore="true"/"1" and fonts whose file
    is not present under _fonts_dir are skipped in the second pass.

    Malformed input fails an assertion.
    """
    global _script_to_font_map, _fallback_chains, _all_fonts
    _script_to_font_map = collections.defaultdict(set)
    _fallback_chains = {}
    _all_fonts = []
    tree = ElementTree.parse(fonts_xml_path)
    families = tree.findall('family')
    # Minikin supports up to 254 but users can place their own font at the first
    # place. Thus, 253 is the maximum allowed number of font families in the
    # default collection.
    assert len(families) < 254, (
        'System font collection can contains up to 253 font families.')
    for family in families:
        name = family.get('name')
        variant = family.get('variant')
        langs = family.get('lang')

        if name:
            assert variant is None, (
                'No variant expected for LGC font %s.' % name)
            assert langs is None, (
                'No language expected for LGC fonts %s.' % name)
            assert name not in _fallback_chains, 'Duplicated name entry %s' % name
            _fallback_chains[name] = []
        else:
            assert variant in {None, 'elegant', 'compact'}, (
                'Unexpected value for variant: %s' % variant)

    trim_re = re.compile(r"^[ \n\r\t]*(.+)[ \n\r\t]*$")
    for family in families:
        name = family.get('name')
        variant = family.get('variant')
        langs = family.get('lang')
        ignoreAttr = family.get('ignore')
        ignore = ignoreAttr == 'true' or ignoreAttr == '1'

        if ignore:
            continue

        if langs:
            langs = langs.split()
            scripts = {lang_to_script(lang) for lang in langs}
        else:
            scripts = set()

        for child in family:
            assert child.tag == 'font', (
                'Unknown tag <%s>' % child.tag)

            # The element text is the font file name surrounded by optional
            # whitespace. An element without text would otherwise fail with
            # an unexplained AttributeError.
            m = trim_re.match((child.text or '').rstrip())
            assert m is not None, (
                'Missing font file name in <%s> element' % child.tag)
            font_file = m.group(1)

            weight_attr = child.get('weight')
            assert weight_attr is not None, (
                'Missing weight for font %s' % font_file)
            weight = int(weight_attr)
            assert weight % 100 == 0, (
                'Font weight "%d" is not a multiple of 100.' % weight)

            style = child.get('style')
            assert style in {'normal', 'italic'}, (
                'Unknown style "%s"' % style)

            fallback_for = child.get('fallbackFor')

            assert not name or not fallback_for, (
                'name and fallbackFor cannot be present at the same time')
            assert not fallback_for or fallback_for in _fallback_chains, (
                'Unknown fallback name: %s' % fallback_for)

            index = child.get('index')
            if index:
                index = int(index)

            if not path.exists(path.join(_fonts_dir, font_file)):
                continue # Missing font is a valid case. Just ignore the missing font files.

            record = FontRecord(
                name,
                child.get('postScriptName'),
                frozenset(scripts),
                variant,
                weight,
                style,
                fallback_for,
                (font_file, index))

            _all_fonts.append(record)

            if not fallback_for:
                if not name or name == 'sans-serif':
                    # Unnamed families and 'sans-serif' join every chain.
                    for fallback in _fallback_chains.values():
                        fallback.append(record)
                else:
                    _fallback_chains[name].append(record)
            else:
                _fallback_chains[fallback_for].append(record)

            if name: # non-empty names are used for default LGC fonts
                map_scripts = {'Latn', 'Grek', 'Cyrl'}
            else:
                map_scripts = scripts
            for script in map_scripts:
                _script_to_font_map[script].add((font_file, index))

333

334

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

335

def check_emoji_coverage(all_emoji, equivalent_emoji):
    """Run the emoji coverage check against the configured emoji fonts."""
    check_emoji_font_coverage(get_emoji_fonts(), all_emoji, equivalent_emoji)

Doug Felt

2016-07-08 17:42:15 -0700

[diff] [blame]

338

339

Seigo Nonaka

2021-06-14 17:38:22 -0700

[diff] [blame]

340

def get_emoji_fonts():
    """Return the (file, index) pairs of all fonts tagged with script 'Zsye'."""
    emoji_fonts = []
    for record in _all_fonts:
        if 'Zsye' in record.scripts:
            emoji_fonts.append(record.font)
    return emoji_fonts

Doug Felt

2016-07-08 17:42:15 -0700

[diff] [blame]

342

Rod S

2022-03-26 16:16:41 -0700

[diff] [blame^]

343

def seq_any(sequence, pred):
    """Return whether pred holds for any element of a character sequence.

    A tuple is treated as a sequence of code points and tested element by
    element, stopping at the first match; any other value is treated as a
    single code point and passed to pred directly.
    """
    if type(sequence) is tuple:
        # A generator lets any() stop at the first hit instead of evaluating
        # pred for every element up front.
        return any(pred(x) for x in sequence)
    return pred(sequence)

348

349

def seq_all(sequence, pred):
    """Return whether pred holds for every element of a character sequence.

    A tuple is treated as a sequence of code points and tested element by
    element, stopping at the first failure; any other value is treated as a
    single code point and passed to pred directly.
    """
    if type(sequence) is tuple:
        # A generator lets all() stop at the first miss instead of evaluating
        # pred for every element up front.
        return all(pred(x) for x in sequence)
    return pred(sequence)

354

355

def is_regional_indicator(x):
    """Return whether code point x is a regional indicator symbol (A..Z)."""
    first, last = 0x1F1E6, 0x1F1FF
    return first <= x and x <= last

def is_tag(x):
    """Return whether code point x lies in the tag block (U+E0000..U+E007F)."""
    block_start, block_end = 0xE0000, 0xE007F
    return block_start <= x and x <= block_end

362

Seigo Nonaka

2021-05-04 17:12:35 -0700

[diff] [blame]

363

def is_pua(x):
    """Return whether code point x falls in one of the private use ranges."""
    pua_ranges = (
        (0xE000, 0xF8FF),
        (0xF0000, 0xFFFFD),
        (0x100000, 0x10FFFD),
    )
    return any(low <= x <= high for low, high in pua_ranges)

365

366

def contains_pua(sequence):
    """Return whether a code point, or any member of a tuple of them, is PUA."""
    return seq_any(sequence, pred=is_pua)

368

369

def contains_regional_indicator(sequence):
    """Return whether a code point, or any member of a tuple of them, is a
    regional indicator symbol."""
    return seq_any(sequence, pred=is_regional_indicator)

371

372

def only_tags(sequence):
    """Return whether a code point, or every member of a tuple of them, is a
    tag character."""
    return seq_all(sequence, pred=is_tag)

Seigo Nonaka

2021-05-04 17:12:35 -0700

[diff] [blame]

374

Seigo Nonaka

2021-06-14 17:38:22 -0700

[diff] [blame]

375

def get_psname(ttf):
    """Return the PostScript name stored in an opened font.

    The name is the string form of the first 'name' table record with
    platform 3, encoding 1 and name ID 6.

    Raises:
        AssertionError: if the font has no such record (previously this
            leaked a bare StopIteration with no indication of the cause).
    """
    for record in ttf['name'].names:
        if (record.platformID, record.platEncID, record.nameID) == (3, 1, 6):
            return str(record)
    raise AssertionError(
        'No PostScript name (platform 3, encoding 1, nameID 6) found in font')

Seigo Nonaka

2021-05-04 17:12:35 -0700

[diff] [blame]

378

Rod S

2022-03-26 16:16:41 -0700

[diff] [blame^]

379

def hex_strs(sequence):
    """Render code points in hexadecimal for log messages.

    A tuple yields a tuple of upper-case hex strings without prefix; any
    other value is rendered with the built-in hex().
    """
    if type(sequence) is not tuple:
        return hex(sequence)
    return tuple(format(codepoint, 'X') for codepoint in sequence)

383

384

def check_plausible_compat_pua(coverage, all_emoji, equivalent_emoji):
    """Check that a compat emoji font has a PUA entry for every emoji.

    For each non-PUA entry of all_emoji (tag-only sequences and a few
    special values excluded), the emoji and its equivalent from
    equivalent_emoji must map to one glyph in coverage, and some PUA key of
    coverage must map to that same glyph. Sequences with regional indicators
    must not be covered at all.

    Args:
        coverage: mapping of code point / sequence -> glyph, as returned by
            get_emoji_map.
        all_emoji: iterable of code points and sequences to check.
        equivalent_emoji: mapping of a sequence to its equivalent sequence.

    All problems are collected and reported in one assertion failure.
    """
    # A PUA should point to every RGI emoji and that PUA should be unique to the
    # set of equivalent sequences for the emoji.
    problems = []

    # Both sets are loop-invariant, so they are built once rather than once
    # per emoji.
    non_rgi = {ZWJ, COMBINING_KEYCAP, EMPTY_FLAG_SEQUENCE}
    glyphs_with_pua = {g for s, g in coverage.items() if contains_pua(s)}

    for seq in all_emoji:
        # We're looking to match not-PUA with PUA so filter out existing PUA
        if contains_pua(seq):
            continue

        # Filter out non-RGI things that end up in all_emoji
        if only_tags(seq) or seq in non_rgi:
            continue

        equivalents = [seq]
        if seq in equivalent_emoji:
            equivalents.append(equivalent_emoji[seq])

        # If there are problems the hex code is much more useful
        log_equivalents = [hex_strs(s) for s in equivalents]

        # The system compat font should NOT include regional indicators as these have been split out
        if contains_regional_indicator(seq):
            assert not any(s in coverage for s in equivalents), f"Regional indicators not expected in compat font, found {log_equivalents}"
            continue

        glyph = {coverage[e] for e in equivalents}
        if len(glyph) != 1:
            problems.append(f"{log_equivalents} should all point to the same glyph")
            continue
        glyph = next(iter(glyph))

        if glyph not in glyphs_with_pua:
            problems.append(f"Expected PUA for {log_equivalents} but none exist")

    assert not problems, "\n".join(sorted(problems)) + f"\n{len(problems)} PUA problems"

421

422

def check_emoji_compat(all_emoji, equivalent_emoji):
    """Validate the PUA mappings of every compat emoji font.

    An emoji font counts as a compat font when it has a 'meta' table whose
    data contains 'Emji'. Each such font is checked with
    check_plausible_compat_pua, and 'NotoColorEmoji' must be among them.
    """
    compat_psnames = set()
    for emoji_font in get_emoji_fonts():
        ttf = open_font(emoji_font)
        psname = get_psname(ttf)

        if "meta" not in ttf or 'Emji' not in ttf["meta"].data:
            continue
        compat_psnames.add(psname)

        # If the font has compat metadata it should have PUAs for emoji sequences
        check_plausible_compat_pua(
            get_emoji_map(emoji_font), all_emoji, equivalent_emoji)

    # NotoColorEmoji must be a Compat font.
    assert 'NotoColorEmoji' in compat_psnames, 'NotoColorEmoji MUST be a compat font'

440

Seigo Nonaka

2021-06-14 17:38:22 -0700

[diff] [blame]

441

442

def check_emoji_font_coverage(emoji_fonts, all_emoji, equivalent_emoji):
    """Check the emoji fonts against the expected emoji set.

    Four kinds of problems are collected:
      * an expected emoji that no font covers;
      * a non-PUA entry in a font that is not an expected emoji (U+0000,
        U+000D and U+0020 are tolerated);
      * two equivalent emoji that map to different glyphs in a font;
      * distinct, non-equivalent emoji that share a glyph in a font.

    Args:
        emoji_fonts: iterable of (file name, index) pairs.
        all_emoji: collection of expected code points and sequences.
        equivalent_emoji: mapping of a sequence to its equivalent sequence.

    All problems are reported together in one assertion failure.
    """
    coverages = [get_emoji_map(emoji_font) for emoji_font in emoji_fonts]

    errors = []

    for sequence in all_emoji:
        if not any(sequence in coverage for coverage in coverages):
            errors.append('%s is not supported in the emoji font.' % printable(sequence))

    # The font needs to support a few extra characters, which is OK
    allowed_extras = {0x0000, 0x000D, 0x0020}
    for coverage in coverages:
        for sequence in coverage:
            if sequence in allowed_extras:
                continue

            if contains_pua(sequence):
                # The font needs to have some PUA for EmojiCompat library.
                continue

            if sequence not in all_emoji:
                errors.append('%s support unexpected in the emoji font.' % printable(sequence))

    for first, second in equivalent_emoji.items():
        for coverage in coverages:
            if first not in coverage or second not in coverage:
                continue  # sequence will be reported missing
            if coverage[first] != coverage[second]:
                errors.append('%s and %s should map to the same glyph.' % (
                    printable(first),
                    printable(second)))

    for coverage in coverages:
        # Group the non-PUA sequences by glyph in a single pass instead of
        # rescanning the whole coverage map once per glyph.
        seqs_by_glyph = collections.defaultdict(list)
        for seq, glyph in coverage.items():
            if not contains_pua(seq):
                seqs_by_glyph[glyph].append(seq)

        for glyph, maps_to_glyph in seqs_by_glyph.items():
            if len(maps_to_glyph) > 1:
                # There are more than one sequences mapping to the same glyph. We
                # need to make sure they were expected to be equivalent.
                equivalent_seqs = set()
                for seq in maps_to_glyph:
                    equivalent_seq = seq
                    while equivalent_seq in equivalent_emoji:
                        equivalent_seq = equivalent_emoji[equivalent_seq]
                    equivalent_seqs.add(equivalent_seq)
                if len(equivalent_seqs) != 1:
                    errors.append('The sequences %s should not result in the same glyph %s' % (
                        printable(equivalent_seqs),
                        glyph))

    assert not errors, '%d emoji font errors:\n%s\n%d emoji font coverage errors' % (len(errors), '\n'.join(errors), len(errors))

494

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

495

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

496

def check_emoji_defaults(default_emoji):
    """Check where default-emoji and default-text characters are covered.

    For every fallback chain, no checked font other than the emoji font
    ('Zsye') may contain a character of default_emoji, and the remaining
    'Emoji' characters must be found in some font placed before the emoji
    font.
    """
    missing_text_chars = _emoji_properties['Emoji'] - default_emoji
    for name, fallback_chain in _fallback_chains.items():
        emoji_font_seen = False
        for record in fallback_chain:
            record_scripts = record.scripts
            if 'Zsye' in record_scripts:
                # No need to check the emoji font
                emoji_font_seen = True
                continue

            # For later fonts, we only check them if they have a script
            # defined, since the defined script may get them to a higher
            # score even if they appear after the emoji font. However,
            # we should skip checking the text symbols font, since
            # symbol fonts should be able to override the emoji display
            # style when 'Zsym' is explicitly specified by the user.
            if emoji_font_seen:
                if not record_scripts or 'Zsym' in record_scripts:
                    continue

            # Check default emoji-style characters
            assert_font_supports_none_of_chars(record.font, default_emoji, name)

            # Mark default text-style characters appearing in fonts above the emoji
            # font as seen
            if not emoji_font_seen:
                missing_text_chars -= set(get_best_cmap(record.font))

        # NOTE(review): the two statements below are placed inside the
        # per-chain loop; the flattened source does not show their nesting,
        # so confirm against the original file.
        # Noto does not have monochrome glyphs for Unicode 7.0 wingdings and
        # webdings yet.
        missing_text_chars -= _chars_by_age['7.0']
        assert missing_text_chars == set(), (
            'Text style version of some emoji characters are missing: ' +
                repr(missing_text_chars))

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

528

529

Roozbeh Pournader

2016-03-16 18:55:32 -0700

[diff] [blame]

530

# Setting reverse to true returns a dictionary that maps the values to sets of

531

# characters, useful for some binary properties. Otherwise, we get a

532

# dictionary that maps characters to the property values, assuming there's only

533

# one property in the file.

534

def parse_unicode_datafile(file_path, reverse=False):
    """Parse a semicolon-separated Unicode data file.

    Everything after '#' on a line is ignored, as are blank lines. The first
    field of a line is a single code point, a 'start..end' range or a
    space-separated sequence of code points (all hexadecimal); the second
    field is the property value.

    Args:
        file_path: path of the data file.
        reverse: when true, return property value -> set of characters;
            otherwise return character -> property value.

    Returns:
        A dict (a defaultdict(set) when reverse is true). Sequences are
        stored as tuples of ints, single characters as ints.

    Fails an assertion if, in the non-reverse form, a character is listed
    more than once.
    """
    if reverse:
        output_dict = collections.defaultdict(set)
    else:
        output_dict = {}
    # Unicode data files are UTF-8 and carry non-ASCII text in comments, so
    # do not depend on the locale's default encoding.
    with open(file_path, encoding='utf-8') as datafile:
        for line in datafile:
            line = line.partition('#')[0].strip()
            if not line:
                continue

            chars, prop = line.split(';')[:2]
            chars = chars.strip()
            prop = prop.strip()

            if ' ' in chars:  # character sequence
                sequence = [int(ch, 16) for ch in chars.split(' ')]
                additions = [tuple(sequence)]
            elif '..' in chars:  # character range
                char_start, char_end = chars.split('..')
                char_start = int(char_start, 16)
                char_end = int(char_end, 16)
                additions = range(char_start, char_end+1)
            else:  # single character
                additions = [int(chars, 16)]
            if reverse:
                output_dict[prop].update(additions)
            else:
                for addition in additions:
                    assert addition not in output_dict
                    output_dict[addition] = prop
    return output_dict

Roozbeh Pournader

2017-04-10 13:52:20 -0700

[diff] [blame]

570

def parse_emoji_variants(file_path):
    """Parse a variation-sequences data file.

    Each data line has exactly three semicolon-separated fields: a
    'base selector' pair of hexadecimal code points, a description, and a
    third field that is ignored. Everything after '#' is ignored, as are
    blank lines.

    Returns:
        (text_set, emoji_set): the sets of (base, variation selector) pairs
        whose description is 'text style' and 'emoji style' respectively.
    """
    emoji_set = set()
    text_set = set()
    # Unicode data files are UTF-8 and carry non-ASCII text in comments, so
    # do not depend on the locale's default encoding.
    with open(file_path, encoding='utf-8') as datafile:
        for line in datafile:
            line = line.partition('#')[0].strip()
            if not line:
                continue
            sequence, description, _ = line.split(';')
            sequence = sequence.strip().split(' ')
            base = int(sequence[0], 16)
            vs = int(sequence[1], 16)
            description = description.strip()
            if description == 'text style':
                text_set.add((base, vs))
            elif description == 'emoji style':
                emoji_set.add((base, vs))
    return text_set, emoji_set

590

591

Roozbeh Pournader

2016-03-16 18:55:32 -0700

[diff] [blame]

592

def parse_ucd(ucd_path):
    """Load the Unicode data files under ucd_path into module-level tables.

    Sets _emoji_properties, _chars_by_age, _text_variation_sequences,
    _emoji_variation_sequences, _emoji_sequences and _emoji_zwj_sequences.
    Files in the 'additions' subdirectory extend the standard files, and the
    entries of 'additions/emoji-exclusions.txt' are removed from the
    sequence tables.
    """
    global _emoji_properties, _chars_by_age
    global _text_variation_sequences, _emoji_variation_sequences
    global _emoji_sequences, _emoji_zwj_sequences

    def ucd_file(*parts):
        # Path of a data file below ucd_path.
        return path.join(ucd_path, *parts)

    _emoji_properties = parse_unicode_datafile(
        ucd_file('emoji-data.txt'), reverse=True)
    emoji_properties_additions = parse_unicode_datafile(
        ucd_file('additions', 'emoji-data.txt'), reverse=True)
    for prop, extra_chars in emoji_properties_additions.items():
        _emoji_properties[prop].update(extra_chars)

    _chars_by_age = parse_unicode_datafile(
        ucd_file('DerivedAge.txt'), reverse=True)

    _text_variation_sequences, _emoji_variation_sequences = (
        parse_emoji_variants(ucd_file('emoji-variation-sequences.txt')))

    _emoji_sequences = parse_unicode_datafile(ucd_file('emoji-sequences.txt'))
    _emoji_sequences.update(parse_unicode_datafile(
        ucd_file('additions', 'emoji-sequences.txt')))

    _emoji_zwj_sequences = parse_unicode_datafile(
        ucd_file('emoji-zwj-sequences.txt'))
    _emoji_zwj_sequences.update(parse_unicode_datafile(
        ucd_file('additions', 'emoji-zwj-sequences.txt')))

    exclusions = parse_unicode_datafile(
        ucd_file('additions', 'emoji-exclusions.txt'))
    _emoji_sequences = remove_emoji_exclude(_emoji_sequences, exclusions)
    _emoji_zwj_sequences = remove_emoji_exclude(_emoji_zwj_sequences, exclusions)
    _emoji_variation_sequences = remove_emoji_variation_exclude(
        _emoji_variation_sequences, exclusions)

    # Unicode 12.0 adds Basic_Emoji in emoji-sequences.txt. We ignore them here since we are already
    # checking the emoji presentations with emoji-variation-sequences.txt.
    # Please refer to http://unicode.org/reports/tr51/#def_basic_emoji_set .
    _emoji_sequences = {
        seq: kind for seq, kind in _emoji_sequences.items()
        if kind != 'Basic_Emoji'}

Qingqing Deng

5e98771

2019-03-25 16:53:34 -0700

[diff] [blame]

625

Siyamed Sinir

d97df5a

2018-04-12 13:11:42 -0700

[diff] [blame]

626

627

def remove_emoji_variation_exclude(source, items):
    """Return the members of ``source`` that are not keys of ``items``.

    Args:
        source: set of entries to filter.
        items: mapping whose keys are the entries to leave out.

    Returns:
        A new set; ``source`` itself is not modified.
    """
    # Iterating a mapping yields its keys, so no explicit .keys() is needed.
    return source.difference(items)

629

630

def remove_emoji_exclude(source, items):
    """Return a copy of ``source`` without the entries whose key is in ``items``.

    Args:
        source: mapping to filter.
        items: container of keys to leave out (tested with ``in``).

    Returns:
        A new dict; ``source`` itself is not modified.
    """
    return {k: v for k, v in source.items() if k not in items}

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

632

633

def flag_sequence(territory_code):
    """Return the flag code point sequence for an upper-case territory code.

    Every character is mapped to the code point that is as far from 0x1F1E6
    as the character is from 'A', so 'A' becomes 0x1F1E6 and 'Z' becomes
    0x1F1FF.

    Args:
        territory_code: string of upper-case ASCII letters, e.g. 'US'.

    Returns:
        A tuple with one code point per character of ``territory_code``.
    """
    return tuple(0x1F1E6 + ord(ch) - ord('A') for ch in territory_code)

635

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

636

# Flag sequences (keys) that compute_expected_emoji() records as equivalent to
# another territory's flag sequence (values).
EQUIVALENT_FLAGS = {
    flag_sequence('BV'): flag_sequence('NO'),
    flag_sequence('CP'): flag_sequence('FR'),
    flag_sequence('HM'): flag_sequence('AU'),
    flag_sequence('SJ'): flag_sequence('NO'),
    flag_sequence('UM'): flag_sequence('US'),
}

643

644

# Code point that follows '#' or a digit in the keycap entries of
# LEGACY_ANDROID_EMOJI.
COMBINING_KEYCAP = 0x20E3

645

646

# Single code points (keys) mapped to the flag or keycap sequence (values) they
# are recorded as equivalent to. compute_expected_emoji() also adds the keys
# themselves to the expected emoji sets.
LEGACY_ANDROID_EMOJI = {
    0xFE4E5: flag_sequence('JP'),
    0xFE4E6: flag_sequence('US'),
    0xFE4E7: flag_sequence('FR'),
    0xFE4E8: flag_sequence('DE'),
    0xFE4E9: flag_sequence('IT'),
    0xFE4EA: flag_sequence('GB'),
    0xFE4EB: flag_sequence('ES'),
    0xFE4EC: flag_sequence('RU'),
    0xFE4ED: flag_sequence('CN'),
    0xFE4EE: flag_sequence('KR'),
    0xFE82C: (ord('#'), COMBINING_KEYCAP),
    0xFE82E: (ord('1'), COMBINING_KEYCAP),
    0xFE82F: (ord('2'), COMBINING_KEYCAP),
    0xFE830: (ord('3'), COMBINING_KEYCAP),
    0xFE831: (ord('4'), COMBINING_KEYCAP),
    0xFE832: (ord('5'), COMBINING_KEYCAP),
    0xFE833: (ord('6'), COMBINING_KEYCAP),
    0xFE834: (ord('7'), COMBINING_KEYCAP),
    0xFE835: (ord('8'), COMBINING_KEYCAP),
    0xFE836: (ord('9'), COMBINING_KEYCAP),
    0xFE837: (ord('0'), COMBINING_KEYCAP),
}

669

Siyamed Sinir

77a1b14

2018-07-12 12:02:18 -0700

[diff] [blame]

670

# Defines the emoji sequences that should have the same glyph as another emoji.
# For example, we previously had the gender based Kiss (0x1F48F), which had the
# same glyph as
# Kiss: Woman, Man (0x1F469, 0x200D, 0x2764, 0x200D, 0x1F48B, 0x200D, 0x1F468).
# In that case a valid row would be:
# (0x1F469, 0x200D, 0x2764, 0x200D, 0x1F48B, 0x200D, 0x1F468): 0x1F48F,
ZWJ_IDENTICALS = {
}

677

Seigo Nonaka

c180863

2018-05-14 13:39:40 -0700

[diff] [blame]

678

# Pairs of flag sequences (first, second); compute_expected_emoji() records
# each `first` as equivalent to `second`. The two-letter codes in the comments
# are the letters the regional indicator code points spell out.
SAME_FLAG_MAPPINGS = [
    # British Indian Ocean Territory (IO) and Diego Garcia (DG)
    ((0x1F1EE, 0x1F1F4), (0x1F1E9, 0x1F1EC)),
    # St. Martin (MF) and France (FR)
    ((0x1F1F2, 0x1F1EB), (0x1F1EB, 0x1F1F7)),
    # Spain (ES) and Ceuta & Melilla (EA)
    ((0x1F1EA, 0x1F1F8), (0x1F1EA, 0x1F1E6)),
]

686

Roozbeh Pournader

2017-04-10 13:52:20 -0700

[diff] [blame]

687

# U+200D ZERO WIDTH JOINER, the code point that joins the parts of the ZWJ
# sequences shown in the ZWJ_IDENTICALS example comment.
ZWJ = 0x200D

Doug Felt

2016-07-08 17:42:15 -0700

[diff] [blame]

688

Rod S

2022-03-26 16:16:41 -0700

[diff] [blame^]

689

# Flag tag sequence without any tag characters between its two code points.
# compute_expected_emoji() registers it as an 'Emoji_Tag_Sequence' that is
# supported as a fallback.
EMPTY_FLAG_SEQUENCE = (0x1F3F4, 0xE007F)

690

Doug Felt

2016-07-08 17:42:15 -0700

[diff] [blame]

691

def is_fitzpatrick_modifier(cp):
    """Return True if code point ``cp`` lies in 0x1F3FB..0x1F3FF inclusive."""
    return 0x1F3FB <= cp <= 0x1F3FF


def reverse_emoji(seq):
    """Return ``seq`` reversed, with Fitzpatrick modifiers kept after their base.

    A plain reversal would put every modifier in front of the emoji it
    modifies, so each modifier is swapped back behind the element that
    followed it in the reversed order.

    Args:
        seq: iterable of code points that supports ``reversed()``.

    Returns:
        A tuple of code points.
    """
    rev = list(reversed(seq))
    i = 1
    while i < len(rev):
        if is_fitzpatrick_modifier(rev[i - 1]):
            rev[i - 1], rev[i] = rev[i], rev[i - 1]
            # The modifier now sits at index i. Step over it: looking at it
            # again would push it one slot further on every iteration until
            # it reached the end of the sequence, detaching it from its base.
            i += 2
        else:
            i += 1
    return tuple(rev)

Doug Felt

2016-07-08 17:42:15 -0700

[diff] [blame]

703

704

Roozbeh Pournader

2016-03-31 13:54:56 -0700

[diff] [blame]

705

def compute_expected_emoji():
    """Build the expected emoji sets and the table of equivalent emoji.

    Reads the module-level tables _emoji_properties, _emoji_sequences,
    _emoji_zwj_sequences and _emoji_variation_sequences, so it must run after
    they have been populated (main() calls parse_ucd() first).

    Side effect: EMPTY_FLAG_SEQUENCE is inserted into the module-level
    _emoji_sequences table.

    Returns:
        A tuple (all_emoji, default_emoji, equivalent_emoji) where
        all_emoji is the 'Emoji' property set plus every known sequence,
        every code point used in a sequence, the flag tag characters and the
        legacy Android code points; default_emoji is the 'Emoji_Presentation'
        property set plus every known sequence and the legacy Android code
        points; equivalent_emoji maps a code point or sequence to the code
        point or sequence it is equivalent to.
    """
    equivalent_emoji = {}
    sequence_pieces = set()
    all_sequences = set()
    all_sequences.update(_emoji_variation_sequences)

    # Add empty flag tag sequence that is supported as fallback
    _emoji_sequences[EMPTY_FLAG_SEQUENCE] = 'Emoji_Tag_Sequence'

    # Sequences are recorded without the emoji variation selector.
    for table in (_emoji_sequences, _emoji_zwj_sequences):
        for sequence in table:
            sequence = tuple(ch for ch in sequence if ch != EMOJI_VS)
            all_sequences.add(sequence)
            sequence_pieces.update(sequence)

    for first, second in SAME_FLAG_MAPPINGS:
        equivalent_emoji[first] = second

    # Add all tag characters used in flags
    sequence_pieces.update(range(0xE0030, 0xE0039 + 1))
    sequence_pieces.update(range(0xE0061, 0xE007A + 1))

    legacy_code_points = set(LEGACY_ANDROID_EMOJI)
    all_emoji = (
        _emoji_properties['Emoji'] |
        all_sequences |
        sequence_pieces |
        legacy_code_points)
    default_emoji = (
        _emoji_properties['Emoji_Presentation'] |
        all_sequences |
        legacy_code_points)

    # Later updates win on duplicate keys, so the order below is significant.
    equivalent_emoji.update(EQUIVALENT_FLAGS)
    equivalent_emoji.update(LEGACY_ANDROID_EMOJI)
    equivalent_emoji.update(ZWJ_IDENTICALS)

    # A variation sequence is equivalent to its first code point.
    for seq in _emoji_variation_sequences:
        equivalent_emoji[seq] = seq[0]

    return all_emoji, default_emoji, equivalent_emoji

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

753

754

Seigo Nonaka

2017-07-05 16:06:23 -0700

[diff] [blame]

755

def check_compact_only_fallback():
    """Assert that every 'compact' fallback font has an 'elegant' counterpart.

    For each record with variant 'compact' in a chain of _fallback_chains, the
    same chain must contain at least one record with equal scripts and variant
    'elegant'.

    Raises:
        AssertionError: if a 'compact' record has no such counterpart.
    """
    for fallback_chain in _fallback_chains.values():
        for record in fallback_chain:
            if record.variant != 'compact':
                continue
            same_script_elegants = [
                x for x in fallback_chain
                if x.scripts == record.scripts and x.variant == 'elegant']
            # The message is a plain string; a trailing comma here would turn
            # it into a one-element tuple and garble the reported error.
            assert same_script_elegants, (
                '%s must be in elegant of %s as fallback of "%s" too' % (
                    record.font, record.scripts, record.fallback_for))

764

765

Roozbeh Pournader

2016-07-27 13:08:37 -0700

[diff] [blame]

766

def check_vertical_metrics():
    """Assert the expected vertical metrics of the default font families.

    Records named 'sans-serif' or 'sans-serif-condensed' must have head.yMax
    2163 and head.yMin -555. Those records, together with 'serif' and
    'monospace', must have hhea.ascent 1900 and hhea.descent -500.

    Raises:
        AssertionError: if a checked font deviates from these values.
    """
    head_checked = ('sans-serif', 'sans-serif-condensed')
    hhea_checked = head_checked + ('serif', 'monospace')

    for record in _all_fonts:
        if record.name not in hhea_checked:
            continue

        # Every family checked for 'head' is also checked for 'hhea', so the
        # font only needs to be opened once per record.
        font = open_font(record.font)

        if record.name in head_checked:
            head = font['head']
            assert head.yMax == 2163 and head.yMin == -555, (
                'yMax and yMin of %s do not match expected values.' % (
                    record.font,))

        hhea = font['hhea']
        assert hhea.ascent == 1900 and hhea.descent == -500, (
            'ascent and descent of %s do not match expected '
            'values.' % (record.font,))

781

782

783

def check_cjk_punctuation():
    """Check the fonts that precede the first CJK font in each fallback chain.

    Each chain of _fallback_chains is walked in order. Every record seen
    before the first record whose scripts include 'Hans', 'Hant', 'Jpan' or
    'Kore' is passed to assert_font_supports_none_of_chars() together with
    the code points 0x3000..0x301F and the chain name.
    """
    cjk_scripts = {'Hans', 'Hant', 'Jpan', 'Kore'}
    cjk_punctuation = range(0x3000, 0x301F + 1)
    for name, fallback_chain in _fallback_chains.items():
        for record in fallback_chain:
            if record.scripts.intersection(cjk_scripts):
                # CJK font seen. Stop checking the rest of the fonts.
                break
            assert_font_supports_none_of_chars(record.font, cjk_punctuation, name)

Roozbeh Pournader

2016-07-27 13:08:37 -0700

[diff] [blame]

792

Seigo Nonaka

2021-04-16 00:11:43 -0700

[diff] [blame]

793

def getPostScriptName(font):
    """Return the PostScript name stored in a font file's 'name' table.

    Args:
        font: a (font_file, index) pair. font_file is resolved relative to
            _fonts_dir; a non-None index marks the file as a font collection.

    Returns:
        The string form of the first name record with nameID 6, platformID 3,
        platEncID 1 and langID 0x0409, or None if there is no such record.
    """
    font_file, index = font
    font_path = path.join(_fonts_dir, font_file)
    if index is not None:
        # Use the first font file in the collection for resolving post script name.
        ttf = ttLib.TTFont(font_path, fontNumber=0)
    else:
        ttf = ttLib.TTFont(font_path)

    try:
        for name in ttf['name'].names:
            if (name.nameID == 6 and name.platformID == 3 and name.platEncID == 1
                    and name.langID == 0x0409):
                return str(name)
        return None
    finally:
        # TTFont keeps the underlying file open; release it once the name
        # has been read instead of leaking one handle per checked font.
        ttf.close()

807

808

def check_canonical_name():
    """Assert that each font's PostScript name matches its declaration.

    For every record in _all_fonts the PostScript name read from the font
    file must equal record.psName when that is set, and otherwise the font's
    file name without its extension.

    Raises:
        AssertionError: if the names do not match.
    """
    for record in _all_fonts:
        file_name, _ = record.font

        psName = getPostScriptName(record.font)
        if record.psName:
            # If fonts element has postScriptName attribute, it should match with the PostScript
            # name in the name table.
            assert psName == record.psName, ('postScriptName attribute %s should match with %s' % (
                record.psName, psName))
        else:
            # If fonts element doesn't have postScriptName attribute, the file name should match
            # with the PostScript name in the name table. splitext() strips the extension
            # whatever its length, unlike a fixed four-character slice.
            assert psName == path.splitext(file_name)[0], ('file name %s should match with %s' % (
                file_name, psName))

823

Roozbeh Pournader

2016-07-27 13:08:37 -0700

[diff] [blame]

824

Roozbeh Pournader

2016-03-09 23:08:45 -0800

[diff] [blame]

825

def main():
    """Run the font chain checks against a build output directory.

    Command line arguments:
        sys.argv[1]: target output directory; fonts are read from its 'fonts'
            subdirectory, the font configuration from 'etc/fonts.xml' and the
            hyphenation data from 'usr/hyphen-data'.
        sys.argv[2]: the emoji checks run only when this is 'true'.
        sys.argv[3]: UCD data directory, read only when emoji checks run.

    Side effect: sets the module-level _fonts_dir.
    """
    global _fonts_dir
    target_out = sys.argv[1]
    _fonts_dir = path.join(target_out, 'fonts')

    fonts_xml_path = path.join(target_out, 'etc', 'fonts.xml')

    parse_fonts_xml(fonts_xml_path)

    check_compact_only_fallback()

    check_vertical_metrics()

    hyphens_dir = path.join(target_out, 'usr', 'hyphen-data')
    check_hyphens(hyphens_dir)

    check_cjk_punctuation()

    check_canonical_name()

    # The remaining arguments are read only after the checks above have run.
    check_emoji = sys.argv[2]
    if check_emoji == 'true':
        ucd_path = sys.argv[3]
        parse_ucd(ucd_path)
        all_emoji, default_emoji, equivalent_emoji = compute_expected_emoji()
        check_emoji_compat(all_emoji, equivalent_emoji)
        check_emoji_coverage(all_emoji, equivalent_emoji)
        check_emoji_defaults(default_emoji)

Roozbeh Pournader

2016-03-16 13:53:47 -0700

[diff] [blame]

853

Roozbeh Pournader