初版
This commit is contained in:
@@ -0,0 +1,60 @@
|
||||
#!/usr/bin/perl
|
||||
|
||||
#################################################################################
|
||||
# Author: Serge Kozlov #
|
||||
# Date: 09/21/2005 #
|
||||
# Purpose: The script produces a text file ../data/charset_utf8.txt #
|
||||
# in UTF8 format. Each line contains one UTF8 character #
|
||||
# between 20 and 07FF #
|
||||
#################################################################################
|
||||
|
||||
genfile("../data/charset_utf8.txt", 33, 2047, "utf8");
|
||||
genfile(">../data/charset_utf8.txt", 19968, 20479,"utf8");
|
||||
|
||||
|
||||
#genfile("../data/charset_utf8.txt", 33, 2047, "utf8");
|
||||
|
||||
sub genfile ($$$$)
|
||||
{
|
||||
my $fn = shift;
|
||||
my $i_from = shift;
|
||||
my $i_to = shift;
|
||||
my $typ = shift;
|
||||
open F, ">$fn";
|
||||
for ($i = $i_from; $i <= $i_to; $i++)
|
||||
{
|
||||
if (($i > 32) && ($i < 65533) && ($i != 65279))
|
||||
{
|
||||
if ($typ eq "utf8")
|
||||
{
|
||||
if ($i < 128)
|
||||
{
|
||||
print F pack("C", $i), "\n";
|
||||
}
|
||||
elsif (($i > 127) && ($i < 2048))
|
||||
{
|
||||
$b1 = (($i & 1984) >> 6) + 192;
|
||||
$b2 = ($i & 63) + 128;
|
||||
print F pack("C", $b1);
|
||||
print F pack("C", $b2), "\n";
|
||||
}
|
||||
else
|
||||
{
|
||||
$b1 = (($i & 61440) >> 12) + 224;
|
||||
$b2 = (($i & 4032) >> 6) + 128;
|
||||
$b3 = ($i & 63) + 128;
|
||||
print F pack("C", $b1);
|
||||
print F pack("C", $b2);
|
||||
print F pack("C", $b3), "\n";
|
||||
}
|
||||
}
|
||||
elsif ($typ eq "ucs2")
|
||||
{
|
||||
print F pack("C", 0);
|
||||
print F pack("C", $i);
|
||||
print F pack("C", 0), "\n";
|
||||
}
|
||||
}
|
||||
}
|
||||
close F;
|
||||
}
|
||||
Reference in New Issue
Block a user