#!/usr/bin/perl use warnings; use strict; # Convert Unicode mapping tables to C structures # Input files may be found at http://unicode.org/Public/MAPPINGS # # Usage: conv.pl <input_file> die "Usage: conv.pl <input_file>\n" if (scalar(@ARGV) != 1); my @table; open MAP, "<$ARGV[0]" or die "Failed opening $ARGV[0]: $!\n"; while (<MAP>) { next if (/^#/); my @parts = split(/\s+/); # Ignore ASCII part next if (hex($parts[0]) < 0x80); # Convert undefined entries to U+FFFF if ($parts[1] =~ /^#/) { push(@table, "0xFFFF"); } else { push(@table, $parts[1]); } } close MAP; # You'll have to go through and fix up the structure name print "static uint32_t ${ARGV[0]}[128] = {\n\t"; my $count = 0; foreach my $item (@table) { print "$item, "; $count++; if ($count % 8 == 0 && $count != 128) { print "\n\t"; } } print "\n};\n\n";