scripts/color_emoji_image_diff.py - platform/external/noto-fonts - Git at Google

 #!/usr/bin/env python

 # Copyright (C) 2018 The Android Open Source Project
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #      http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.

 import contextlib
 import itertools
 import io
 import os
 import sys

 from fontTools import ttLib
 from PIL import Image

 def to_hex_str(value):
     """Converts given int value to hex without the 0x prefix"""
     return format(value, 'X')

 def codepoint_to_string(codepoints):
     """Converts a list of codepoints into a string separated with space."""
     return '_'.join([to_hex_str(x) for x in codepoints])

 def read_cmap12(ttf, glyph_to_codepoint_map, codepoint_map):
     cmap = ttf['cmap']
     for table in cmap.tables:
         if table.format == 12 and table.platformID == 3 and table.platEncID == 10:
             for codepoint, glyph_name in table.cmap.iteritems():
                 glyph_to_codepoint_map[glyph_name] = codepoint
                 codepoint_map[codepoint_to_string([codepoint])] = glyph_name
                 # self.update_emoji_data([codepoint], glyph_name)
             return table
     raise ValueError("Font doesn't contain cmap with format:12, platformID:3 and platEncID:10")

 def read_gsub(ttf, glyph_to_codepoint_map, codepoint_map):
     gsub = ttf['GSUB']
     ligature_subtables = []
     context_subtables = []
     # this code is font dependent, implementing all gsub rules is out of scope of EmojiCompat
     # and would be expensive with little value
     for lookup in gsub.table.LookupList.Lookup:
         for subtable in lookup.SubTable:
             if subtable.LookupType == 5:
                 context_subtables.append(subtable)
             elif subtable.LookupType == 4:
                 ligature_subtables.append(subtable)

     for subtable in context_subtables:
         add_gsub_context_subtable(subtable, gsub.table.LookupList, glyph_to_codepoint_map, codepoint_map)

     for subtable in ligature_subtables:
         add_gsub_ligature_subtable(subtable, glyph_to_codepoint_map, codepoint_map)

 def add_gsub_context_subtable(subtable, lookup_list, glyph_to_codepoint_map, codepoint_map):
     for sub_class_set in subtable.SubClassSet:
         if sub_class_set:
             for sub_class_rule in sub_class_set.SubClassRule:
                 subs_list = len(sub_class_rule.SubstLookupRecord) * [None]
                 for record in sub_class_rule.SubstLookupRecord:
                     subs_list[record.SequenceIndex] = get_substitutions(lookup_list,
                                                                         record.LookupListIndex)
                 combinations = list(itertools.product(*subs_list))
                 for seq in combinations:
                     glyph_names = [x["input"] for x in seq]
                     codepoints = [glyph_to_codepoint_map[x] for x in glyph_names]
                     outputs = [x["output"] for x in seq if x["output"]]
                     nonempty_outputs = filter(lambda x: x.strip() , outputs)
                     if len(nonempty_outputs) == 0:
                         print("Warning: no output glyph is set for " + str(glyph_names))
                         continue
                     elif len(nonempty_outputs) > 1:
                         print(
                             "Warning: multiple glyph is set for "
                                 + str(glyph_names) + ", will use the first one")

                     glyph = nonempty_outputs[0]
                     codepoint_map[codepoint_to_string(codepoints)] = glyph

 def get_substitutions(lookup_list, index):
     result = []
     for x in lookup_list.Lookup[index].SubTable:
         for input, output in x.mapping.iteritems():
             result.append({"input": input, "output": output})
     return result

 def add_gsub_ligature_subtable(subtable, glyph_to_codepoint_map, codepoint_map):
     for name, ligatures in subtable.ligatures.iteritems():
         for ligature in ligatures:
             glyph_names = [name] + ligature.Component
             codepoints = [glyph_to_codepoint_map[x] for x in glyph_names]
             codepoint_map[codepoint_to_string(codepoints)] = ligature.LigGlyph

 def read_cbdt(ttf):
   cbdt = ttf['CBDT']
   glyph_to_image = {}
   for strike_data in cbdt.strikeData:
     for key, data in strike_data.iteritems():
       data.decompile
       glyph_to_image[key] = Image.open(io.BytesIO(data.imageData))
   return glyph_to_image


 rgba_map = {}

 def similar_img(img1, img2):
     # return if images are the same with accepting some changes
     if img1 is None and img2 is None: return True
     if img1 is None or img2 is None: return False
     if not img1.size == img2.size: return False

     pixels1 = rgba_map.get(img1, img1.convert('L').getdata())
     pixels2 = rgba_map.get(img2, img2.convert('L').getdata())
     pixels = itertools.izip(pixels1, pixels2)
     diff = 0
     for px1, px2 in pixels:
         diff = diff + abs(px1-px2)
     pixel_count = 1.0 * img1.size[0] * img1.size[1]
     normalized_diff = diff / pixel_count / 255.0 * 100.0
     if normalized_diff <= 0.5: return True
     return False

 def main(argv):
   codepoint_map_1 = {}
   codepoint_map_2 = {}
   glyph_to_codepoint_map_1 = {}
   glyph_to_codepoint_map_2 = {}

   with contextlib.closing(ttLib.TTFont(argv[1])) as ttf:
     font1_cbdt = read_cbdt(ttf)
     read_cmap12(ttf, glyph_to_codepoint_map_1, codepoint_map_1)
     read_gsub(ttf, glyph_to_codepoint_map_1, codepoint_map_1)
   with contextlib.closing(ttLib.TTFont(argv[2])) as ttf:
     font2_cbdt = read_cbdt(ttf)
     read_cmap12(ttf, glyph_to_codepoint_map_2, codepoint_map_2)
     read_gsub(ttf, glyph_to_codepoint_map_2, codepoint_map_2)

   glyphs1 = set(font1_cbdt.keys())
   glyphs2 = set(font2_cbdt.keys())

   codepoints_set1 = set(codepoint_map_1.keys())
   codepoints_set2 = set(codepoint_map_2.keys())

   if codepoints_set1 != codepoints_set2:
     print "Codepoints set has changed: : %s" % (codepoints_set1 ^ codepoints_set2)

   all_codepoints = set(codepoint_map_1.keys()).union(codepoint_map_2.keys())

   for key in all_codepoints:
     glyph1 = codepoint_map_1[key] if key in codepoint_map_1 else None
     glyph2 = codepoint_map_2[key] if key in codepoint_map_2 else None

     image1 = font1_cbdt[glyph1] if glyph1 and glyph1 in font1_cbdt else None
     image2 = font2_cbdt[glyph2] if glyph2 and glyph2 in font2_cbdt else None

     if not similar_img(image1, image2):
       print 'Glyph %s has different image' % key
       if image1:
         with open(os.path.join(argv[3], '%s_old.png' % key), 'w') as f:
             image1.save(f)
       if image2:
         with open(os.path.join(argv[3], '%s_new.png' % key), 'w') as f:
             image2.save(f)


 def print_usage():
     """Prints how to use the script."""
     print("usage: old_font new_font output_dir")

 if __name__ == '__main__':
    if len(sys.argv) < 3:
        print_usage()
        sys.exit(1)
    main(sys.argv)
	#!/usr/bin/env python

	# Copyright (C) 2018 The Android Open Source Project
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.

	import contextlib
	import itertools
	import io
	import os
	import sys

	from fontTools import ttLib
	from PIL import Image

	def to_hex_str(value):
	"""Converts given int value to hex without the 0x prefix"""
	return format(value, 'X')

	def codepoint_to_string(codepoints):
	"""Converts a list of codepoints into a string separated with space."""
	return '_'.join([to_hex_str(x) for x in codepoints])

	def read_cmap12(ttf, glyph_to_codepoint_map, codepoint_map):
	cmap = ttf['cmap']
	for table in cmap.tables:
	if table.format == 12 and table.platformID == 3 and table.platEncID == 10:
	for codepoint, glyph_name in table.cmap.iteritems():
	glyph_to_codepoint_map[glyph_name] = codepoint
	codepoint_map[codepoint_to_string([codepoint])] = glyph_name
	# self.update_emoji_data([codepoint], glyph_name)
	return table
	raise ValueError("Font doesn't contain cmap with format:12, platformID:3 and platEncID:10")

	def read_gsub(ttf, glyph_to_codepoint_map, codepoint_map):
	gsub = ttf['GSUB']
	ligature_subtables = []
	context_subtables = []
	# this code is font dependent, implementing all gsub rules is out of scope of EmojiCompat
	# and would be expensive with little value
	for lookup in gsub.table.LookupList.Lookup:
	for subtable in lookup.SubTable:
	if subtable.LookupType == 5:
	context_subtables.append(subtable)
	elif subtable.LookupType == 4:
	ligature_subtables.append(subtable)

	for subtable in context_subtables:
	add_gsub_context_subtable(subtable, gsub.table.LookupList, glyph_to_codepoint_map, codepoint_map)

	for subtable in ligature_subtables:
	add_gsub_ligature_subtable(subtable, glyph_to_codepoint_map, codepoint_map)

	def add_gsub_context_subtable(subtable, lookup_list, glyph_to_codepoint_map, codepoint_map):
	for sub_class_set in subtable.SubClassSet:
	if sub_class_set:
	for sub_class_rule in sub_class_set.SubClassRule:
	subs_list = len(sub_class_rule.SubstLookupRecord) * [None]
	for record in sub_class_rule.SubstLookupRecord:
	subs_list[record.SequenceIndex] = get_substitutions(lookup_list,
	record.LookupListIndex)
	combinations = list(itertools.product(*subs_list))
	for seq in combinations:
	glyph_names = [x["input"] for x in seq]
	codepoints = [glyph_to_codepoint_map[x] for x in glyph_names]
	outputs = [x["output"] for x in seq if x["output"]]
	nonempty_outputs = filter(lambda x: x.strip() , outputs)
	if len(nonempty_outputs) == 0:
	print("Warning: no output glyph is set for " + str(glyph_names))
	continue
	elif len(nonempty_outputs) > 1:
	print(
	"Warning: multiple glyph is set for "
	+ str(glyph_names) + ", will use the first one")

	glyph = nonempty_outputs[0]
	codepoint_map[codepoint_to_string(codepoints)] = glyph

	def get_substitutions(lookup_list, index):
	result = []
	for x in lookup_list.Lookup[index].SubTable:
	for input, output in x.mapping.iteritems():
	result.append({"input": input, "output": output})
	return result

	def add_gsub_ligature_subtable(subtable, glyph_to_codepoint_map, codepoint_map):
	for name, ligatures in subtable.ligatures.iteritems():
	for ligature in ligatures:
	glyph_names = [name] + ligature.Component
	codepoints = [glyph_to_codepoint_map[x] for x in glyph_names]
	codepoint_map[codepoint_to_string(codepoints)] = ligature.LigGlyph

	def read_cbdt(ttf):
	cbdt = ttf['CBDT']
	glyph_to_image = {}
	for strike_data in cbdt.strikeData:
	for key, data in strike_data.iteritems():
	data.decompile
	glyph_to_image[key] = Image.open(io.BytesIO(data.imageData))
	return glyph_to_image


	rgba_map = {}

	def similar_img(img1, img2):
	# return if images are the same with accepting some changes
	if img1 is None and img2 is None: return True
	if img1 is None or img2 is None: return False
	if not img1.size == img2.size: return False

	pixels1 = rgba_map.get(img1, img1.convert('L').getdata())
	pixels2 = rgba_map.get(img2, img2.convert('L').getdata())
	pixels = itertools.izip(pixels1, pixels2)
	diff = 0
	for px1, px2 in pixels:
	diff = diff + abs(px1-px2)
	pixel_count = 1.0 * img1.size[0] * img1.size[1]
	normalized_diff = diff / pixel_count / 255.0 * 100.0
	if normalized_diff <= 0.5: return True
	return False

	def main(argv):
	codepoint_map_1 = {}
	codepoint_map_2 = {}
	glyph_to_codepoint_map_1 = {}
	glyph_to_codepoint_map_2 = {}

	with contextlib.closing(ttLib.TTFont(argv[1])) as ttf:
	font1_cbdt = read_cbdt(ttf)
	read_cmap12(ttf, glyph_to_codepoint_map_1, codepoint_map_1)
	read_gsub(ttf, glyph_to_codepoint_map_1, codepoint_map_1)
	with contextlib.closing(ttLib.TTFont(argv[2])) as ttf:
	font2_cbdt = read_cbdt(ttf)
	read_cmap12(ttf, glyph_to_codepoint_map_2, codepoint_map_2)
	read_gsub(ttf, glyph_to_codepoint_map_2, codepoint_map_2)

	glyphs1 = set(font1_cbdt.keys())
	glyphs2 = set(font2_cbdt.keys())

	codepoints_set1 = set(codepoint_map_1.keys())
	codepoints_set2 = set(codepoint_map_2.keys())

	if codepoints_set1 != codepoints_set2:
	print "Codepoints set has changed: : %s" % (codepoints_set1 ^ codepoints_set2)

	all_codepoints = set(codepoint_map_1.keys()).union(codepoint_map_2.keys())

	for key in all_codepoints:
	glyph1 = codepoint_map_1[key] if key in codepoint_map_1 else None
	glyph2 = codepoint_map_2[key] if key in codepoint_map_2 else None

	image1 = font1_cbdt[glyph1] if glyph1 and glyph1 in font1_cbdt else None
	image2 = font2_cbdt[glyph2] if glyph2 and glyph2 in font2_cbdt else None

	if not similar_img(image1, image2):
	print 'Glyph %s has different image' % key
	if image1:
	with open(os.path.join(argv[3], '%s_old.png' % key), 'w') as f:
	image1.save(f)
	if image2:
	with open(os.path.join(argv[3], '%s_new.png' % key), 'w') as f:
	image2.save(f)


	def print_usage():
	"""Prints how to use the script."""
	print("usage: old_font new_font output_dir")

	if __name__ == '__main__':
	if len(sys.argv) < 3:
	print_usage()
	sys.exit(1)
	main(sys.argv)