-
Notifications
You must be signed in to change notification settings - Fork 135
/
length.t
63 lines (45 loc) · 1.99 KB
/
length.t
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
use v6;
use Test;
# L<S32::Str/Str/=item length>
=begin pod
Various length tests (though "length" itself should not be used; the tests
below check .chars and .codes instead).
Don't confuse "length" with the "width" property of Unicode characters.
L<"http://www.unicode.org/unicode/reports/tr11/">
=end pod
# Test count: 1 method-not-found check
#           + 13 table rows x 3 measurements (chars, codes, octets)
#           + 2 standalone .codes checks that follow the table loop.
plan 42;

# Calling .length on a Str must fail with X::Method::NotFound.
throws-like({"moose".length}, X::Method::NotFound, 'Str.length properly unimplemented');

# string literals, for sanity

# L<S32::Str/Str/=item chars>
# Please add test strings in your favorite script, especially if
# it is boustrophedonic or otherwise interesting.
# NOTE: each row added to the table contributes three tests; bump the plan.

# Angle-bracket quoting does not interpolate, so this is a one-element list
# holding the literal text '@stringy' (eight characters once stringified).
my @stringy = <@stringy>;

# Flat list, consumed four items per iteration by the loop below.
my @data = (
    # string               octets  codepoints  chars
    "",                         0,          0,     0,
    "moose",                    5,          5,     5,
    "møøse",                    7,          5,     5,
    "C:\\Program Files",       16,         16,    16,
    ~@stringy,                  8,          8,     8,
    "\x020ac \\x020ac",        11,          9,     9,
    "בדיקה", 10, 5, 5,
    "בדיקה 123", 14, 9, 9,
    "rántottcsirke",           14,         13,    13,
    "aáeéiíoóöőuúüű",          23,         14,    14,
    "AÁEÉIÍOÓÖŐUÚÜŰ",          23,         14,    14,
    "»«",                       4,          2,     2,
    ">><<",                     4,          4,     4,
);

# L<S32::Str/Str/=item chars>
# L<S32::Str/Str/=item codes>
for @data -> $string, $bytes, $codes, $chars {
    is($string.chars, $chars, "'{$string}'.chars");
    is($string.codes, $codes, "'{$string}'.codes");
    # The octets column is checked against the UTF-8 encoding of the string,
    # so the expected byte counts in the table are actually verified.
    is($string.encode('utf8').bytes, $bytes, "'{$string}' UTF-8 octets");
}
# Use a codepoint above 0xFFFF: it must still count as one code, which
# catches mistakes a UTF-16 based implementation might make.
#?rakudo.jvm todo '.codes weirdness on JVM, possibly NYI? RT #124742'
is("\x[E0100]".codes, 1, '.codes on a >0xFFFF char');  # U+E0100 is VARIATION SELECTOR-17

# A grapheme that has no precomposed character in Unicode 5 is expected to
# report two codes.
is("\c[LATIN CAPITAL LETTER A WITH DOT ABOVE, COMBINING DOT BELOW]".codes, 2, '.codes on grapheme without precomposite');
# vim: ft=perl6