From: Martin Mares Date: Sat, 11 Oct 2003 08:55:38 +0000 (+0000) Subject: Renamed charset import scripts. X-Git-Tag: holmes-import~1200 X-Git-Url: http://mj.ucw.cz/gitweb/?a=commitdiff_plain;h=c79a2911da7be63aaf4abec6b3ffad36dd5bcfb1;p=libucw.git Renamed charset import scripts. --- diff --git a/charset/misc/import-recode b/charset/misc/import-recode new file mode 100755 index 00000000..07b5a854 --- /dev/null +++ b/charset/misc/import-recode @@ -0,0 +1,33 @@ +#!/usr/bin/perl +# +# Use `recode` to create a translation table +# (c) 2003, Robert Spalek +# + +use open IN => ":utf8"; + +foreach $charset (@ARGV) +{ + print "Charset: $charset\n"; + open(fi, "recode -s -f $charset/..utf-8/ tmp/$charset") || die; + + while (<fi>) + { + chop; + (($number, $char) = /^([0-9A-F]{2})\t(.?)$/) || die "Cannot parse $_"; + $recode[hex $number] = $char ne "" ? ord $char : -1; + } + $#recode >= 0 || die "Empty recoding table"; + $recode[10] = 10; + $recode[13] = 13; + + for ($i=0; $i<=$#recode; $i++) + { + printf fo "%02X\t%04X\n", $i, $recode[$i] + if $recode[$i] >= 0; + } + + close(fo); + close(fi); +} diff --git a/charset/misc/import-unicode_org b/charset/misc/import-unicode_org new file mode 100755 index 00000000..6c610343 --- /dev/null +++ b/charset/misc/import-unicode_org @@ -0,0 +1,28 @@ +#!/usr/bin/perl +# Import charset tables from ftp.unicode.org +# (c) 2003, Robert Spalek + +foreach $file (@ARGV) +{ + print "Converting $file\n"; + ($prefix, $filename) = $file =~ m|^(.*/)([^/]*)$|; + + open(fi, "<$file") || die; + open(fo, ">$file-tr") || die; + print fo "# $filename charset file +# Imported from ftp://ftp.unicode.org/Public/MAPPINGS/$file +# (c) 2003, Robert Spalek + +"; + while (<fi>) + { + next if /^#/; + chop; + if (($code, $unicode, $comment) = /^0x(..)\t0x(....)\t#\t?(.*)$/) + { + print fo "$code\t$unicode\t$comment\n"; + } + } + close(fo); + close(fi); +} diff --git a/charset/misc/mkcharset b/charset/misc/mkcharset deleted file mode 100755 index 07b5a854..00000000 --- 
a/charset/misc/mkcharset +++ /dev/null @@ -1,33 +0,0 @@ -#!/usr/bin/perl -# -# Use `recode` to create a translation table -# (c) 2003, Robert Spalek -# - -use open IN => ":utf8"; - -foreach $charset (@ARGV) -{ - print "Charset: $charset\n"; - open(fi, "recode -s -f $charset/..utf-8/ tmp/$charset") || die; - - while (<fi>) - { - chop; - (($number, $char) = /^([0-9A-F]{2})\t(.?)$/) || die "Cannot parse $_"; - $recode[hex $number] = $char ne "" ? ord $char : -1; - } - $#recode >= 0 || die "Empty recoding table"; - $recode[10] = 10; - $recode[13] = 13; - - for ($i=0; $i<=$#recode; $i++) - { - printf fo "%02X\t%04X\n", $i, $recode[$i] - if $recode[$i] >= 0; - } - - close(fo); - close(fi); -} diff --git a/charset/misc/trunicode b/charset/misc/trunicode deleted file mode 100755 index 6c610343..00000000 --- a/charset/misc/trunicode +++ /dev/null @@ -1,28 +0,0 @@ -#!/usr/bin/perl -# Import charset tables from ftp.unicode.org -# (c) 2003, Robert Spalek - -foreach $file (@ARGV) -{ - print "Converting $file\n"; - ($prefix, $filename) = $file =~ m|^(.*/)([^/]*)$|; - - open(fi, "<$file") || die; - open(fo, ">$file-tr") || die; - print fo "# $filename charset file -# Imported from ftp://ftp.unicode.org/Public/MAPPINGS/$file -# (c) 2003, Robert Spalek - -"; - while (<fi>) - { - next if /^#/; - chop; - if (($code, $unicode, $comment) = /^0x(..)\t0x(....)\t#\t?(.*)$/) - { - print fo "$code\t$unicode\t$comment\n"; - } - } - close(fo); - close(fi); -}