import sys from unicode_parse_common import * # http://www.unicode.org/Public/5.1.0/ucd/extracted/DerivedCombiningClass.txt class IdentityMap(object): def __getitem__(_, key): return key def main(infile, outfile): ranges = unicode_file_parse(infile, IdentityMap(), '0') ranges = sort_and_merge(ranges) print >>outfile, '// Generated from Unicode tables\n' print >>outfile, '#ifndef COMBINING_PROPERTIES_H_' print >>outfile, '#define COMBINING_PROPERTIES_H_\n' print >>outfile, '#include <stdint.h>' print >>outfile, 'struct combining_property {' print >>outfile, ' uint32_t range_start;' print >>outfile, ' uint32_t range_end;' print >>outfile, ' uint8_t klass;' print >>outfile, '};\n' print >>outfile, 'static const struct combining_property combining_properties[] = {' for (start, end, value) in ranges: print >>outfile, ' {0x%x, 0x%x, %s},' % (start, end, value) print >>outfile, '};\n' print >>outfile, 'static const unsigned combining_properties_count = %d;\n' % len(ranges) print >>outfile, '#endif // COMBINING_PROPERTIES_H_' if __name__ == '__main__': if len(sys.argv) != 3: print 'Usage: %s <input .txt> <output .h>' % sys.argv[0] else: main(file(sys.argv[1], 'r'), file(sys.argv[2], 'w+'))