xref: /openbsd/gnu/usr.bin/perl/t/op/tr.t (revision 78b63d65)
1# tr.t
2
# Compile-time setup: switch into the t/ directory when one is present and
# restrict the module search path to the in-tree library directory.
BEGIN {
    if (-d 't') {
        chdir 't';
    }
    @INC = ('../lib');
}
7
# Test plan: this script reports 54 numbered results.
print "1..54\n";

$_ = "abcdefghijklmnopqrstuvwxyz";

# 1: the whole lowercase range maps onto the whole uppercase range.
tr/a-z/A-Z/;
print +($_ eq "ABCDEFGHIJKLMNOPQRSTUVWXYZ" ? "" : "not "), "ok 1\n";

# 2: and back again.
tr/A-Z/a-z/;
print +($_ eq "abcdefghijklmnopqrstuvwxyz" ? "" : "not "), "ok 2\n";

# 3: a partial range leaves the characters outside it ('a' and 'z') alone.
tr/b-y/B-Y/;
print +($_ eq "aBCDEFGHIJKLMNOPQRSTUVWXYz" ? "" : "not "), "ok 3\n";
26
# 4: In EBCDIC 'I' is \xc9 and 'J' is \xd1, while 'i' is \x89 and 'j' is
# \x91, so the letter ranges are discontinuous there.  Regardless of the
# platform, the \xca between the two letters must stay untouched (and must
# not become \x8a).
{
    no utf8;
    $_ = "I\xcaJ";

    tr/I-J/i-j/;

    print +($_ eq "i\xcaj" ? "" : "not "), "ok 4\n";
}
39#
40
# 5: tr must cancel IOK and NOK.  Each value is assigned as a number and
# then rewritten as a string (12 -> "32", 1.5 -> "3.5"); the sum is 71 only
# when the numeric value is taken from the rewritten string.
($x = 12) =~ tr/1/3/;
(my $y = 12) =~ tr/1/3/;
($f = 1.5) =~ tr/1/3/;
(my $g = 1.5) =~ tr/1/3/;
print "not " if $x + $y + $f + $g != 71;
print "ok 5\n";

# 6: tr must be harmless when it is not updating its target - see
# [ID 20000511.005].  A counting-only tr is applied to $1, after which a
# substitution that captures again must still produce the right result.
$_ = 'fred';
/([a-z]{2})/;
$1 =~ tr/A-Z//;
s/^(\s*)f/$1F/;
print "not " unless $_ eq 'Fred';
print "ok 6\n";
56
# 7-10: check that tr handles UTF8 strings correctly.  The subjects are
# three-character v-strings whose outer characters are above 255; the
# middle character is 65 in the first pair of tests and 193 in the second
# (the EBCDIC variant).  ord("\t") == 9 is the script's ASCII check.

# 7: no 'a' in the string, so nothing may change.
($x = 256.65.258) =~ tr/a/b/;
print "not " unless $x eq 256.65.258 and length $x == 3;
print "ok 7\n";

# 8: tr/A/B/ changes the middle character only where 'A' is chr(65).
$x =~ tr/A/B/;
print "not "
    unless $x eq (ord("\t") == 9 ? 256.66.258 : 256.65.258)
       and length $x == 3;
print "ok 8\n";

# EBCDIC variants of the above tests
# 9: again no 'a' to replace.
($x = 256.193.258) =~ tr/a/b/;
print "not " unless $x eq 256.193.258 and length $x == 3;
print "ok 9\n";

# 10: here the middle character changes only on the non-ASCII branch.
$x =~ tr/A/B/;
print "not "
    unless $x eq (ord("\t") == 9 ? 256.193.258 : 256.194.258)
       and length $x == 3;
print "ok 10\n";
81
# 11-17: wide (UTF8) characters in the search list, the replacement list
# and the subject string.
#
# Every non-ASCII character below is spelled as an \x{...} escape or as a
# v-string, so no source-encoding pragma is needed.  An earlier version
# wrapped "use utf8" in a runtime "if"; because "use" is processed at
# compile time and the pragma is scoped to its enclosing block, that
# statement could never influence these tests and has been dropped, along
# with two scratch variables that were assigned but never read.
{
    # 11 - changing UTF8 characters in a UTF8 string, same length.
    $x = 200.300.400;
    $x =~ tr/\x{12c}/\x{190}/;
    printf "not (%vd) ", $x if $x ne 200.400.400 or length $x != 3;
    print "ok 11\n";

    # 12 - changing UTF8 characters in UTF8 string, more bytes.
    $x = 200.300.400;
    $x =~ tr/\x{12c}/\x{be8}/;
    printf "not (%vd) ", $x if $x ne 200.3048.400 or length $x != 3;
    print "ok 12\n";

    # 13 - introducing UTF8 characters to non-UTF8 string.
    $x = 100.125.60;
    $x =~ tr/\x{64}/\x{190}/;
    printf "not (%vd) ", $x if $x ne 400.125.60 or length $x != 3;
    print "ok 13\n";

    # 14 - removing UTF8 characters from UTF8 string
    $x = 400.125.60;
    $x =~ tr/\x{190}/\x{64}/;
    printf "not (%vd) ", $x if $x ne 100.125.60 or length $x != 3;
    print "ok 14\n";

    # 15 - counting UTF8 chars in UTF8 string
    $x = 400.125.60.400;
    $y = $x =~ tr/\x{190}/\x{190}/;
    print "not " if $y != 2;
    print "ok 15\n";

    # 16 - counting non-UTF8 chars in UTF8 string
    $x = 60.400.125.60.400;
    $y = $x =~ tr/\x{3c}/\x{3c}/;
    print "not " if $y != 2;
    print "ok 16\n";

    # 17 - counting UTF8 chars in non-UTF8 string
    $x = 200.125.60;
    $y = $x =~ tr/\x{190}/\x{190}/;
    print "not " if $y != 0;
    print "ok 17\n";
}
129
# 18: a range that runs straight into a second hyphen (tr/a-z-9//) is
# ambiguous and must be rejected when compiled.  Perls older than 5.7.0
# are let off.
$_ = "abcdefghijklmnopqrstuvwxyz";
eval "tr/a-z-9/ /";
print "not "
    unless $@ =~ /^Ambiguous range in transliteration operator/
        || $^V lt v5.7.0;
print "ok 18\n";

# 19-21: Make sure leading and trailing hyphens still work
$_ = "car-rot9";
tr/-a-m/./;
print "not " unless $_ eq '..r.rot9';
print "ok 19\n";

$_ = "car-rot9";
tr/a-m-/./;
print "not " unless $_ eq '..r.rot9';
print "ok 20\n";

$_ = "car-rot9";
tr/-a-m-/./;
print "not " unless $_ eq '..r.rot9';
print "ok 21\n";

# 22-24: single characters and several ranges mixed in one search list.
$_ = "abcdefghijklmnop";
tr/ae-hn/./;
print "not " unless $_ eq '.bcd....ijklm.op';
print "ok 22\n";

$_ = "abcdefghijklmnop";
tr/a-cf-kn-p/./;
print "not " unless $_ eq '...de......lm...';
print "ok 23\n";

$_ = "abcdefghijklmnop";
tr/a-ceg-ikm-o/./;
print "not " unless $_ eq '...d.f...j.l...p';
print "ok 24\n";

# 25: Test reversed range check
# 20000705 MJD
eval "tr/m-d/ /";
print "not "
    unless $@ =~ /^Invalid \[\] range "m-d" in transliteration operator/
        || $^V lt v5.7.0;
print "ok 25\n";
166
# 26: an updating tr on a read-only value must die.
eval '$1 =~ tr/x/y/';
print "not " unless $@ =~ /^Modification of a read-only value attempted/;
print "ok 26\n";

# 27: a counting-only tr on a read-only value is allowed.
'abcdef' =~ /(bcd)/;
print "not " if eval('$1 =~ tr/abcd//') != 3;
print "ok 27\n";

# 28: a constant on the left-hand side is fine when tr only counts.
print "not " if eval('"123" =~ tr/12//') != 2;
print "ok 28\n";

# 29: a constant on the left-hand side is rejected when tr would update.
eval '"123" =~ tr/1/1/';
print "not "
    unless $@ =~ m|^Can't modify constant item in transliteration \(tr///\)|;
print "ok 29\n";
183
# v300 (0x12c) is UTF-8-encoded as 196 172 (0xc4 0xac)
# v400 (0x190) is UTF-8-encoded as 198 144 (0xc6 0x90)
#
# The subjects below therefore mix a wide character with the characters
# whose code points equal the bytes of its encoding.

# 30-33: Transliterate a byte to a byte, all four ways (each side written
# either as \xNN or as \x{NN}).

($a = v300.196.172.300.196.172) =~ tr/\xc4/\xc5/;
print "not " if $a ne v300.197.172.300.197.172;
print "ok 30\n";

($a = v300.196.172.300.196.172) =~ tr/\xc4/\x{c5}/;
print "not " if $a ne v300.197.172.300.197.172;
print "ok 31\n";

($a = v300.196.172.300.196.172) =~ tr/\x{c4}/\xc5/;
print "not " if $a ne v300.197.172.300.197.172;
print "ok 32\n";

($a = v300.196.172.300.196.172) =~ tr/\x{c4}/\x{c5}/;
print "not " if $a ne v300.197.172.300.197.172;
print "ok 33\n";

# 34: Transliterate a byte to a wide character.

($a = v300.196.172.300.196.172) =~ tr/\xc4/\x{12d}/;
print "not " if $a ne v300.301.172.300.301.172;
print "ok 34\n";

# 35: Transliterate a wide character to a byte.

($a = v300.196.172.300.196.172) =~ tr/\x{12c}/\xc3/;
print "not " if $a ne v195.196.172.195.196.172;
print "ok 35\n";

# 36: Transliterate a wide character to a wide character.

($a = v300.196.172.300.196.172) =~ tr/\x{12c}/\x{12d}/;
print "not " if $a ne v301.196.172.301.196.172;
print "ok 36\n";

# 37: Transliterate both ways.

($a = v300.196.172.300.196.172) =~ tr/\xc4\x{12c}/\x{12d}\xc3/;
print "not " if $a ne v195.301.172.195.301.172;
print "ok 37\n";

# 38: Transliterate all (four) ways.

($a = v300.196.172.300.196.172.400.198.144) =~
    tr/\xac\xc4\x{12c}\x{190}/\xad\x{12d}\xc5\x{191}/;
print "not " if $a ne v197.301.173.197.301.173.401.198.144;
print "ok 38\n";
235
# 39-40: Transliterate and count - tr returns the number of characters it
# replaced, for a byte-sized and for a wide search character.

print "not "
    if (($a = v300.196.172.300.196.172) =~ tr/\xc4/\xc5/) != 2;
print "ok 39\n";

print "not "
    if (($a = v300.196.172.300.196.172) =~ tr/\x{12c}/\x{12d}/) != 2;
print "ok 40\n";

# 41-42: Transliterate with complement (/c): everything except the listed
# character is replaced.

($a = v300.196.172.300.196.172) =~ tr/\xc4/\x{12d}/c;
print "not " if $a ne v301.196.301.301.196.301;
print "ok 41\n";

($a = v300.196.172.300.196.172) =~ tr/\x{12c}/\xc5/c;
print "not " if $a ne v300.197.197.300.197.197;
print "ok 42\n";

# 43-44: Transliterate with deletion (/d).

($a = v300.196.172.300.196.172) =~ tr/\xc4//d;
print "not " if $a ne v300.172.300.172;
print "ok 43\n";

($a = v300.196.172.300.196.172) =~ tr/\x{12c}//d;
print "not " if $a ne v196.172.196.172;
print "ok 44\n";
265
# 45-46: Transliterate with squeeze (/s): runs of the same replaced
# character collapse into one; untouched characters are not squeezed.

($a = v196.196.172.300.300.196.172) =~ tr/\xc4/\xc5/s;
print "not " if $a ne v197.172.300.300.197.172;
print "ok 45\n";

($a = v196.172.300.300.196.172.172) =~ tr/\x{12c}/\x{12d}/s;
print "not " if $a ne v196.172.301.196.172.172;
print "ok 46\n";

# 47-49: Tricky cases by Simon Cozens.  The subject contains 196 and 172,
# the two bytes that encode v300, but not v300 itself, so a search for
# \x{12c} must leave it unchanged.

($a = v196.172.200) =~ tr/\x{12c}/a/;
print "not " if sprintf("%vd", $a) ne '196.172.200';
print "ok 47\n";

($a = v196.172.200) =~ tr/\x{12c}/\x{12c}/;
print "not " if sprintf("%vd", $a) ne '196.172.200';
print "ok 48\n";

($a = v196.172.200) =~ tr/\x{12c}//d;
print "not " if sprintf("%vd", $a) ne '196.172.200';
print "ok 49\n";

# 50-51: UTF8 range - a wide range mapped onto a byte range and back.

($a = v300.196.172.302.197.172) =~ tr/\x{12c}-\x{130}/\xc0-\xc4/;
print "not " if $a ne v192.196.172.194.197.172;
print "ok 50\n";

($a = v300.196.172.302.197.172) =~ tr/\xc4-\xc8/\x{12c}-\x{130}/;
print "not " if $a ne v300.300.172.302.301.172;
print "ok 51\n";
299
# misc

# 52: deleting 'R' and '_' from "R0_001" leaves a string hex() reads as 1.
($a = "R0_001") =~ tr/R_//d;
print "not " unless hex($a) == 1;
print "ok 52\n";

# 53: y/// applied through nested map/for aliases changes the array
# element itself.
@a = (1,2);
map { y/1/./ for $_ } @a;
print "not " unless "@a" eq ". 2";
print "ok 53\n";

# 54: appending '' makes the loop work on a copy, so the array must stay
# as it was.
@a = (1,2);
map { y/1/./ for $_.'' } @a;
print "not " unless "@a" eq "1 2";
print "ok 54\n";
312