From 0f01495d34c2cefeb3a78e0646edbde076f8558c Mon Sep 17 00:00:00 2001 From: John Mark Bell Date: Thu, 4 Sep 2008 17:01:17 +0000 Subject: Perl script to convert Unicode mapping tables to C structures svn path=/trunk/libparserutils/; revision=5234 --- build/conv.pl | 49 +++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 49 insertions(+) create mode 100755 build/conv.pl (limited to 'build/conv.pl') diff --git a/build/conv.pl b/build/conv.pl new file mode 100755 index 0000000..314b73f --- /dev/null +++ b/build/conv.pl @@ -0,0 +1,49 @@ +#!/usr/bin/perl + +use warnings; +use strict; + +# Convert Unicode mapping tables to C structures +# Input files may be found at http://unicode.org/Public/MAPPINGS +# +# Usage: conv.pl + +die "Usage: conv.pl \n" if (scalar(@ARGV) != 1); + +my @table; + +open MAP, "<$ARGV[0]" or die "Failed opening $ARGV[0]: $!\n"; + +while () { + next if (/^#/); + + my @parts = split(/\s+/); + + # Ignore ASCII part + next if (hex($parts[0]) < 0x80); + + # Convert undefined entries to U+FFFF + if ($parts[1] =~ /^#/) { + push(@table, "0xFFFF"); + } else { + push(@table, $parts[1]); + } +} + +close MAP; + +# You'll have to go through and fix up the structure name +print "static uint32_t ${ARGV[0]}[128] = {\n\t"; + +my $count = 0; +foreach my $item (@table) { + print "$item, "; + $count++; + + if ($count % 8 == 0 && $count != 128) { + print "\n\t"; + } +} + +print "\n};\n\n"; + -- cgit v1.2.3