blob: 2731136021816df12bea6094af49668d7ee88858 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
|
#!./perl
# Compile-time setup: unless some @INC entry already mentions "blib",
# move into the t/ directory (when one exists) and make ../lib the only
# library search path.
BEGIN {
    if (!grep { /blib/ } @INC) {
        chdir 't' if -d 't';
        @INC = ('../lib');
    }
}
# Autoflush the selected output handle, then announce the 15-test plan.
$| = 1;
print "1..15\n";

use charnames ':full';

# Test 1: a full character name inside a string literal must produce the
# same string as the equivalent octal escape.
print "not " if "Here\N{EXCLAMATION MARK}?" ne "Here\041?";
print "ok 1\n";
{
    use bytes;    # UTEST can switch utf8 on

    # Test 2: with "use bytes" in effect, naming a character above 0xFF by
    # its full name must make the string eval fail, and the error text must
    # mention "above 0xFF".  The test fails if the eval returns true or if
    # $@ does not match.
    $res = eval <<'EOE';
use charnames ":full";
"Here: \N{CYRILLIC SMALL LETTER BE}!";
1
EOE
    if ($res or $@ !~ /above 0xFF/) {
        print "# \$res=$res \$\@='$@'\nnot ";
    }
    print "ok 2\n";

    # print "# \$res=$res \$\@='$@'\n";

    # Test 3: same check through a script-restricted short name; the error
    # must additionally name the character the short name resolved to.
    $res = eval <<'EOE';
use charnames 'cyrillic';
"Here: \N{Be}!";
1
EOE
    if ($res or $@ !~ /CYRILLIC CAPITAL LETTER BE.*above 0xFF/) {
        print "# \$res=$res \$\@='$@'\nnot ";
    }
    print "ok 3\n";
}
# Expected UTF-8 byte sequences, written as octal escapes.
# For a two-byte encoding: if the octal representation of the Unicode
# character is \0xyzt, then the UTF-8 bytes are \3xy\2zt.  (The four-byte
# Deseret value below does not follow this shortcut.)
$encoded_be     = "\320\261";            # U+0431
$encoded_alpha  = "\316\261";            # U+03B1
$encoded_bet    = "\327\221";            # U+05D1
$encoded_deseng = "\360\220\221\215";    # U+1044D
# to_bytes(STRING)
# Returns the first argument run through pack() with the "a*" template.
# The tests in this file compare the result against the hand-written
# UTF-8 byte strings in $encoded_*.
# NOTE(review): this presumably relies on pack "a*" exposing the string's
# internal bytes on the Perl version under test -- confirm before reuse.
sub to_bytes {
    my $string = shift;
    return pack('a*', $string);
}
{
    use charnames ':full';

    # Test 4: a full character name must yield the expected UTF-8 bytes.
    my $full_name_bytes = to_bytes("\N{CYRILLIC SMALL LETTER BE}");
    print "not " if $full_name_bytes ne $encoded_be;
    print "ok 4\n";

    # The pragma is lexical and \N{} is resolved at compile time, so this
    # import must stay between the two tests.
    use charnames qw(cyrillic greek :short);

    # Test 5: script-restricted names (be, alpha) and a "script:name" short
    # form (hebrew:bet) in one literal.
    my $short_name_bytes = to_bytes("\N{be},\N{alpha},\N{hebrew:bet}");
    my $short_name_want  = "$encoded_be,$encoded_alpha,$encoded_bet";
    print "not " if $short_name_bytes ne $short_name_want;
    print "ok 5\n";
}
{
    use charnames ':full';

    # The same character written as a hex escape and as a full name.
    my $by_code = "\x{263a}";
    my $by_name = "\N{WHITE SMILING FACE}";

    # Test 6: both spellings give the same string.
    print "not " if $by_code ne $by_name;
    print "ok 6\n";

    # Tests 7-8: each spelling is exactly one character long.
    print "not " if length($by_code) != 1;
    print "ok 7\n";
    print "not " if length($by_name) != 1;
    print "ok 8\n";

    # Tests 9-10: each spelling formats as the single ordinal 263a.
    print "not " if sprintf("%vx", $by_code) ne "263a";
    print "ok 9\n";
    print "not " if sprintf("%vx", $by_name) ne "263a";
    print "ok 10\n";

    # Tests 11-12: a 0xFF character followed by a named character in the
    # same literal.  The literals stay inline because their parsing is what
    # is being tested.
    print "not " if sprintf("%vx", "\xFF\N{WHITE SMILING FACE}") ne "ff.263a";
    print "ok 11\n";
    print "not " if sprintf("%vx", "\x{ff}\N{WHITE SMILING FACE}") ne "ff.263a";
    print "ok 12\n";
}
{
    use charnames qw(:full);
    use utf8;

    # Test 13: with "use utf8" in effect, the hex escape and the full name
    # must have the same ordinal.
    my $from_hex  = "\x{221b}";
    my $from_name = "\N{CUBE ROOT}";
    print "not " if ord($from_hex) != ord($from_name);
    print "ok 13\n";
}
{
    use charnames qw(:full);
    use utf8;

    # Test 14: a wide character followed by a named character must be the
    # same whether written as one literal or as two concatenated literals.
    my $one_literal  = "\x{100}\N{CENT SIGN}";
    my $two_literals = "\x{100}" . "\N{CENT SIGN}";
    print "not " if $one_literal ne $two_literals;
    print "ok 14\n";
}
{
    use charnames ':full';

    # Test 15 is disabled: it breaks in 5.6.x because the Unicode database
    # is missing "DESERET SMALL LETTER ENG".  After updating to Unicode 3.1,
    # uncomment the check below and remove the "# skip" directive from the
    # result line.
    # print "not "
    #     unless to_bytes("\N{DESERET SMALL LETTER ENG}") eq $encoded_deseng;

    # Report the test as skipped, not as a plain pass, so the output shows
    # that nothing was checked.  A skipped test still counts as "ok".
    print "ok 15 # skip DESERET SMALL LETTER ENG missing from Unicode database\n";
}
|