3
#################################################################################
4
# Author: Serge Kozlov #
6
# Purpose: The script produces a text file ../data/charset_utf8.txt #
7
# in UTF8 format. Each line contains one UTF8 character #
8
# from the ranges passed to genfile below (0x21-0x07FF, 0x4E00-0x4FFF) #
9
#################################################################################
11
# First range: code points 33..2047 (0x21..0x7FF), requested with type "utf8".
genfile("../data/charset_utf8.txt", 33, 2047, "utf8");
12
# Second range: code points 19968..20479 (0x4E00..0x4FFF), same target file.
# NOTE(review): unlike the first call, the file name here starts with ">".
# Presumably this combines with the mode prefix used by genfile's open() so
# that this call appends to the file instead of truncating it -- confirm
# against genfile's open() before changing either call.
genfile(">../data/charset_utf8.txt", 19968, 20479,"utf8");
15
#genfile("../data/charset_utf8.txt", 33, 2047, "utf8");
24
for ($i = $i_from; $i <= $i_to; $i++)
26
if (($i > 32) && ($i < 65533) && ($i != 65279))
32
print F pack("C", $i), "\n";
34
elsif (($i > 127) && ($i < 2048))
36
$b1 = (($i & 1984) >> 6) + 192;
37
$b2 = ($i & 63) + 128;
38
print F pack("C", $b1);
39
print F pack("C", $b2), "\n";
43
$b1 = (($i & 61440) >> 12) + 224;
44
$b2 = (($i & 4032) >> 6) + 128;
45
$b3 = ($i & 63) + 128;
46
print F pack("C", $b1);
47
print F pack("C", $b2);
48
print F pack("C", $b3), "\n";
51
elsif ($typ eq "ucs2")
54
print F pack("C", $i);
55
print F pack("C", 0), "\n";