1/*
2 * This test is for ICU collations.
3 */
4
/*
 * Skip guard: abandon the whole script unless the server encoding is UTF8
 * and pg_collation holds at least one ICU collation (collprovider = 'i').
 * The boolean is stored in the psql variable skip_test via \gset and then
 * consumed by \if.  NOT EXISTS is used because only presence matters, not
 * the number of matching rows.
 */
SELECT getdatabaseencoding() <> 'UTF8'
       OR NOT EXISTS (SELECT 1 FROM pg_collation WHERE collprovider = 'i')
       AS skip_test \gset
\if :skip_test
\quit
\endif
12
-- This script contains non-ASCII literals; fix the client encoding to UTF8.
SET client_encoding = 'UTF8';

-- All objects below are created through this schema via search_path.
CREATE SCHEMA collate_tests;
SET search_path TO collate_tests;
17
18
-- Base fixture: text column with the English ICU collation.
CREATE TABLE collate_test1
(
    a int,
    b text COLLATE "en-x-icu" NOT NULL
);

\d collate_test1

-- The next three definitions all reuse the name collate_test_fail; judging
-- by that name, each one is expected to be rejected.
CREATE TABLE collate_test_fail
(
    a int,
    b text COLLATE "ja_JP.eucjp-x-icu"
);

CREATE TABLE collate_test_fail
(
    a int,
    b text COLLATE "foo-x-icu"
);

-- COLLATE attached to an int column
CREATE TABLE collate_test_fail
(
    a int COLLATE "en-x-icu",
    b text
);

-- LIKE copy of collate_test1; \d displays the resulting definition
CREATE TABLE collate_test_like
(
    LIKE collate_test1
);

\d collate_test_like

-- Same shape as collate_test1, with Swedish ICU and "C" collations.
CREATE TABLE collate_test2
(
    a int,
    b text COLLATE "sv-x-icu"
);

CREATE TABLE collate_test3
(
    a int,
    b text COLLATE "C"
);

-- Load identical rows into all three tables
INSERT INTO collate_test1
    VALUES (1, 'abc'), (2, 'äbc'), (3, 'bbc'), (4, 'ABC');
INSERT INTO collate_test2
    SELECT * FROM collate_test1;
INSERT INTO collate_test3
    SELECT * FROM collate_test1;

-- Comparisons that rely on each column's declared collation
SELECT * FROM collate_test1
    WHERE b >= 'bbc';
SELECT * FROM collate_test2
    WHERE b >= 'bbc';
SELECT * FROM collate_test3
    WHERE b >= 'bbc';
SELECT * FROM collate_test3
    WHERE b >= 'BBC';

-- Explicit COLLATE on the column, on the constant, and on both sides
-- (the last query puts two different explicit collations on one comparison)
SELECT * FROM collate_test1
    WHERE b COLLATE "C" >= 'bbc';
SELECT * FROM collate_test1
    WHERE b >= 'bbc' COLLATE "C";
SELECT * FROM collate_test1
    WHERE b COLLATE "C" >= 'bbc' COLLATE "C";
SELECT * FROM collate_test1
    WHERE b COLLATE "C" >= 'bbc' COLLATE "en-x-icu";
70
71
-- Domains carrying a collation: one over text, one over int.
CREATE DOMAIN testdomain_sv AS text
    COLLATE "sv-x-icu";
CREATE DOMAIN testdomain_i AS int
    COLLATE "sv-x-icu"; -- fails

-- Column typed with the domain, no column-level COLLATE
CREATE TABLE collate_test4
(
    a int,
    b testdomain_sv
);
INSERT INTO collate_test4
    SELECT * FROM collate_test1;
SELECT a, b
    FROM collate_test4
    ORDER BY b;

-- Column typed with the domain plus an explicit column-level COLLATE
CREATE TABLE collate_test5
(
    a int,
    b testdomain_sv COLLATE "en-x-icu"
);
INSERT INTO collate_test5
    SELECT * FROM collate_test1;
SELECT a, b
    FROM collate_test5
    ORDER BY b;
87
88
-- Sort each table by its collated column
SELECT a, b
    FROM collate_test1
    ORDER BY b;
SELECT a, b
    FROM collate_test2
    ORDER BY b;
SELECT a, b
    FROM collate_test3
    ORDER BY b;

-- Sort key overridden with an explicit collation
SELECT a, b
    FROM collate_test1
    ORDER BY b COLLATE "C";

-- star expansion
SELECT *
    FROM collate_test1
    ORDER BY b;
SELECT *
    FROM collate_test2
    ORDER BY b;
SELECT *
    FROM collate_test3
    ORDER BY b;

-- constant expression folding (the column alias states the expected result)
SELECT 'bbc' COLLATE "en-x-icu" > 'äbc' COLLATE "en-x-icu"
    AS "true";
SELECT 'bbc' COLLATE "sv-x-icu" > 'äbc' COLLATE "sv-x-icu"
    AS "false";
103
-- upper/lower

-- x uses the English ICU collation, y the Turkish one
CREATE TABLE collate_test10
(
    a int,
    x text COLLATE "en-x-icu",
    y text COLLATE "tr-x-icu"
);

INSERT INTO collate_test10
    VALUES (1, 'hij', 'hij'), (2, 'HIJ', 'HIJ');

-- Case conversion using each column's own collation
SELECT a,
       lower(x), lower(y),
       upper(x), upper(y),
       initcap(x), initcap(y)
    FROM collate_test10;
-- Case conversion with the collation overridden to "C"
SELECT a, lower(x COLLATE "C"), lower(y COLLATE "C")
    FROM collate_test10;

-- Sorting on the result of a collation-aware function
SELECT a, x, y
    FROM collate_test10
    ORDER BY lower(y), a;
118
-- LIKE/ILIKE

-- Exact, prefix and substring patterns, case-sensitive then case-insensitive
SELECT * FROM collate_test1
    WHERE b LIKE 'abc';
SELECT * FROM collate_test1
    WHERE b LIKE 'abc%';
SELECT * FROM collate_test1
    WHERE b LIKE '%bc%';
SELECT * FROM collate_test1
    WHERE b ILIKE 'abc';
SELECT * FROM collate_test1
    WHERE b ILIKE 'abc%';
SELECT * FROM collate_test1
    WHERE b ILIKE '%bc%';

-- ILIKE under English vs. Turkish collations; each column alias states the
-- expected result
SELECT 'Türkiye' COLLATE "en-x-icu" ILIKE '%KI%'
    AS "true";
SELECT 'Türkiye' COLLATE "tr-x-icu" ILIKE '%KI%'
    AS "false";

SELECT 'bıt' ILIKE 'BIT' COLLATE "en-x-icu"
    AS "false";
SELECT 'bıt' ILIKE 'BIT' COLLATE "tr-x-icu"
    AS "true";

-- The following actually exercises the selectivity estimation for ILIKE.
SELECT relname
    FROM pg_class
    WHERE relname ILIKE 'abc%';
136
-- regular expressions

-- Anchored, prefix and unanchored matches, case-sensitive (~) then
-- case-insensitive (~*)
SELECT * FROM collate_test1
    WHERE b ~ '^abc$';
SELECT * FROM collate_test1
    WHERE b ~ '^abc';
SELECT * FROM collate_test1
    WHERE b ~ 'bc';
SELECT * FROM collate_test1
    WHERE b ~* '^abc$';
SELECT * FROM collate_test1
    WHERE b ~* '^abc';
SELECT * FROM collate_test1
    WHERE b ~* 'bc';

-- Sample strings covering letters, digits, punctuation, blanks and
-- accented characters, classified below by bracket expression
CREATE TABLE collate_test6
(
    a int,
    b text COLLATE "en-x-icu"
);
INSERT INTO collate_test6
    VALUES (1, 'abc'), (2, 'ABC'), (3, '123'), (4, 'ab1'),
           (5, 'a1!'), (6, 'a c'), (7, '!.;'), (8, '   '),
           (9, 'äbç'), (10, 'ÄBÇ');
SELECT b,
       b ~ '^[[:alpha:]]+$' AS is_alpha,
       b ~ '^[[:upper:]]+$' AS is_upper,
       b ~ '^[[:lower:]]+$' AS is_lower,
       b ~ '^[[:digit:]]+$' AS is_digit,
       b ~ '^[[:alnum:]]+$' AS is_alnum,
       b ~ '^[[:graph:]]+$' AS is_graph,
       b ~ '^[[:print:]]+$' AS is_print,
       b ~ '^[[:punct:]]+$' AS is_punct,
       b ~ '^[[:space:]]+$' AS is_space
    FROM collate_test6;

-- Case-insensitive regex under English vs. Turkish collations
SELECT 'Türkiye' COLLATE "en-x-icu" ~* 'KI'
    AS "true";
SELECT 'Türkiye' COLLATE "tr-x-icu" ~* 'KI'
    AS "true";  -- true with ICU

SELECT 'bıt' ~* 'BIT' COLLATE "en-x-icu"
    AS "false";
SELECT 'bıt' ~* 'BIT' COLLATE "tr-x-icu"
    AS "false";  -- false with ICU

-- The following actually exercises the selectivity estimation for ~*.
SELECT relname
    FROM pg_class
    WHERE relname ~* '^abc';
173
174
175/* not run by default because it requires tr_TR system locale
176-- to_char
177
178SET lc_time TO 'tr_TR';
179SELECT to_char(date '2010-04-01', 'DD TMMON YYYY');
180SELECT to_char(date '2010-04-01', 'DD TMMON YYYY' COLLATE "tr-x-icu");
181*/
182
183
-- backwards parsing

-- Views with COLLATE in a WHERE clause, in ORDER BY, and wrapped around a
-- parenthesized expression; their stored definitions are read back below.
CREATE VIEW collview1 AS
    SELECT * FROM collate_test1 WHERE b COLLATE "C" >= 'bbc';
CREATE VIEW collview2 AS
    SELECT a, b FROM collate_test1 ORDER BY b COLLATE "C";
CREATE VIEW collview3 AS
    SELECT a, lower((x || x) COLLATE "C") FROM collate_test10;

SELECT table_name, view_definition
    FROM information_schema.views
    WHERE table_name LIKE 'collview%'
    ORDER BY 1;
192
193
-- collation propagation in various expression types

-- COALESCE
SELECT a, coalesce(b, 'foo')
    FROM collate_test1 ORDER BY 2;
SELECT a, coalesce(b, 'foo')
    FROM collate_test2 ORDER BY 2;
SELECT a, coalesce(b, 'foo')
    FROM collate_test3 ORDER BY 2;
SELECT a, lower(coalesce(x, 'foo')), lower(coalesce(y, 'foo'))
    FROM collate_test10;

-- GREATEST
SELECT a, b, greatest(b, 'CCC')
    FROM collate_test1 ORDER BY 3;
SELECT a, b, greatest(b, 'CCC')
    FROM collate_test2 ORDER BY 3;
SELECT a, b, greatest(b, 'CCC')
    FROM collate_test3 ORDER BY 3;
SELECT a, x, y, lower(greatest(x, 'foo')), lower(greatest(y, 'foo'))
    FROM collate_test10;

-- NULLIF
SELECT a, nullif(b, 'abc')
    FROM collate_test1 ORDER BY 2;
SELECT a, nullif(b, 'abc')
    FROM collate_test2 ORDER BY 2;
SELECT a, nullif(b, 'abc')
    FROM collate_test3 ORDER BY 2;
SELECT a, lower(nullif(x, 'foo')), lower(nullif(y, 'foo'))
    FROM collate_test10;

-- CASE
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END
    FROM collate_test1 ORDER BY 2;
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END
    FROM collate_test2 ORDER BY 2;
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END
    FROM collate_test3 ORDER BY 2;

-- Casts to a domain declared without a collation, and to testdomain_sv
CREATE DOMAIN testdomain AS text;
SELECT a, b::testdomain
    FROM collate_test1 ORDER BY 2;
SELECT a, b::testdomain
    FROM collate_test2 ORDER BY 2;
SELECT a, b::testdomain
    FROM collate_test3 ORDER BY 2;
SELECT a, b::testdomain_sv
    FROM collate_test3 ORDER BY 2;
SELECT a, lower(x::testdomain), lower(y::testdomain)
    FROM collate_test10;

-- Aggregates
SELECT min(b), max(b)
    FROM collate_test1;
SELECT min(b), max(b)
    FROM collate_test2;
SELECT min(b), max(b)
    FROM collate_test3;

SELECT array_agg(b ORDER BY b)
    FROM collate_test1;
SELECT array_agg(b ORDER BY b)
    FROM collate_test2;
SELECT array_agg(b ORDER BY b)
    FROM collate_test3;

-- Set operations whose two arms read the same table
SELECT a, b FROM collate_test1
UNION ALL
SELECT a, b FROM collate_test1
ORDER BY 2;
SELECT a, b FROM collate_test2
UNION
SELECT a, b FROM collate_test2
ORDER BY 2;
SELECT a, b FROM collate_test3 WHERE a < 4
INTERSECT
SELECT a, b FROM collate_test3 WHERE a > 1
ORDER BY 2;
SELECT a, b FROM collate_test3
EXCEPT
SELECT a, b FROM collate_test3 WHERE a < 2
ORDER BY 2;

-- Set operations mixing collate_test1 ("en-x-icu") with collate_test3 ("C")
SELECT a, b FROM collate_test1
UNION ALL
SELECT a, b FROM collate_test3
ORDER BY 2; -- fail
SELECT a, b FROM collate_test1
UNION ALL
SELECT a, b FROM collate_test3; -- ok
SELECT a, b FROM collate_test1
UNION
SELECT a, b FROM collate_test3
ORDER BY 2; -- fail
SELECT a, b COLLATE "C" FROM collate_test1
UNION
SELECT a, b FROM collate_test3
ORDER BY 2; -- ok
SELECT a, b FROM collate_test1
INTERSECT
SELECT a, b FROM collate_test3
ORDER BY 2; -- fail
SELECT a, b FROM collate_test1
EXCEPT
SELECT a, b FROM collate_test3
ORDER BY 2; -- fail

CREATE TABLE test_u AS
    SELECT a, b FROM collate_test1
    UNION ALL
    SELECT a, b FROM collate_test3; -- fail

-- ideally this would be a parse-time error, but for now it must be run-time:
SELECT x < y FROM collate_test10; -- fail
SELECT x || y FROM collate_test10; -- ok, because || is not collation aware
SELECT x, y FROM collate_test10 ORDER BY x || y; -- not so ok

-- collation mismatch between recursive and non-recursive term
WITH RECURSIVE foo(x) AS
(
    SELECT x FROM (VALUES('a' COLLATE "en-x-icu"),('b')) t(x)
    UNION ALL
    SELECT (x || 'c') COLLATE "de-x-icu" FROM foo WHERE length(x) < 10
)
SELECT * FROM foo;
255
256
-- casting

-- COLLATE placed inside the CAST target type
SELECT CAST('42' AS text COLLATE "C");

-- Cast of each collated column to varchar, then sort on the cast result
SELECT a, CAST(b AS varchar)
    FROM collate_test1
    ORDER BY 2;
SELECT a, CAST(b AS varchar)
    FROM collate_test2
    ORDER BY 2;
SELECT a, CAST(b AS varchar)
    FROM collate_test3
    ORDER BY 2;
264
265
-- propagation of collation in SQL functions (inlined and non-inlined cases)
-- and plpgsql functions too

-- Three spellings of "$1 < $2"; the bodies are kept exactly as written
-- because the inlined / non-inlined distinction depends on their shape.
CREATE FUNCTION mylt (text, text)
    RETURNS boolean
    LANGUAGE sql
    AS $$ select $1 < $2 $$;

CREATE FUNCTION mylt_noninline (text, text)
    RETURNS boolean
    LANGUAGE sql
    AS $$ select $1 < $2 limit 1 $$;

CREATE FUNCTION mylt_plpgsql (text, text)
    RETURNS boolean
    LANGUAGE plpgsql
    AS $$ begin return $1 < $2; end $$;

-- Compare every pair of collate_test1 values with the operator and with
-- each function, using the column collation
SELECT a.b AS a,
       b.b AS b,
       a.b < b.b AS lt,
       mylt(a.b, b.b),
       mylt_noninline(a.b, b.b),
       mylt_plpgsql(a.b, b.b)
    FROM collate_test1 a, collate_test1 b
    ORDER BY a.b, b.b;

-- Same comparison with an explicit "C" collation on the second argument
SELECT a.b AS a,
       b.b AS b,
       a.b < b.b COLLATE "C" AS lt,
       mylt(a.b, b.b COLLATE "C"),
       mylt_noninline(a.b, b.b COLLATE "C"),
       mylt_plpgsql(a.b, b.b COLLATE "C")
    FROM collate_test1 a, collate_test1 b
    ORDER BY a.b, b.b;
288
289
-- collation override in plpgsql

-- First version: both local variables are declared without a collation.
CREATE FUNCTION mylt2 (x text, y text)
    RETURNS boolean
    LANGUAGE plpgsql
AS $$
declare
  xx text := x;
  yy text := y;
begin
  return xx < yy;
end
$$;

-- Column aliases (t / f) state the expected results
SELECT mylt2('a', 'B' COLLATE "en-x-icu") AS t,
       mylt2('a', 'B' COLLATE "C") AS f;

-- Second version: xx is declared with an explicit "POSIX" collation.
CREATE OR REPLACE FUNCTION mylt2 (x text, y text)
    RETURNS boolean
    LANGUAGE plpgsql
AS $$
declare
  xx text COLLATE "POSIX" := x;
  yy text := y;
begin
  return xx < yy;
end
$$;

SELECT mylt2('a', 'B') AS f;
SELECT mylt2('a', 'B' COLLATE "C") AS fail; -- conflicting collations
SELECT mylt2('a', 'B' COLLATE "POSIX") AS f;
316
317
-- polymorphism

-- Sort values that have passed through array_agg() and unnest()
SELECT *
    FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test1))
    ORDER BY 1;
SELECT *
    FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test2))
    ORDER BY 1;
SELECT *
    FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test3))
    ORDER BY 1;

-- Polymorphic SQL function that returns its argument
CREATE FUNCTION dup (anyelement)
    RETURNS anyelement
    AS 'select $1'
    LANGUAGE sql;

SELECT a, dup(b)
    FROM collate_test1
    ORDER BY 2;
SELECT a, dup(b)
    FROM collate_test2
    ORDER BY 2;
SELECT a, dup(b)
    FROM collate_test3
    ORDER BY 2;
330
331
-- indexes

-- Index on the bare column, with a per-column COLLATE, and on expressions
CREATE INDEX collate_test1_idx1
    ON collate_test1 (b);
CREATE INDEX collate_test1_idx2
    ON collate_test1 (b COLLATE "C");
CREATE INDEX collate_test1_idx3
    ON collate_test1 ((b COLLATE "C")); -- this is different grammatically
CREATE INDEX collate_test1_idx4
    ON collate_test1 (((b||'foo') COLLATE "POSIX"));

-- COLLATE applied to the int column a
CREATE INDEX collate_test1_idx5
    ON collate_test1 (a COLLATE "C"); -- fail
CREATE INDEX collate_test1_idx6
    ON collate_test1 ((a COLLATE "C")); -- fail

-- Read the index definitions back
SELECT relname, pg_get_indexdef(oid)
    FROM pg_class
    WHERE relname LIKE 'collate_test%_idx%'
    ORDER BY 1;

-- ILIKE plans and results with sequential scans disabled
SET enable_seqscan TO off;
EXPLAIN (COSTS OFF)
SELECT * FROM collate_test1 WHERE b ILIKE 'abc';
SELECT * FROM collate_test1 WHERE b ILIKE 'abc';
EXPLAIN (COSTS OFF)
SELECT * FROM collate_test1 WHERE b ILIKE 'ABC';
SELECT * FROM collate_test1 WHERE b ILIKE 'ABC';
RESET enable_seqscan;
352
353
-- schema manipulation commands

CREATE ROLE regress_test_role;
CREATE SCHEMA test_schema;

-- The locale name is read from the server setting and spliced in through
-- dynamic SQL, to cope with varying names for encodings:
DO $$
BEGIN
  EXECUTE 'CREATE COLLATION test0 (provider = icu, locale = ' ||
          quote_literal(current_setting('lc_collate')) || ');';
END
$$;
CREATE COLLATION test0 FROM "C"; -- fail, duplicate name
DO $$
BEGIN
  EXECUTE 'CREATE COLLATION test1 (provider = icu, lc_collate = ' ||
          quote_literal(current_setting('lc_collate')) ||
          ', lc_ctype = ' ||
          quote_literal(current_setting('lc_ctype')) || ');';
END
$$;
CREATE COLLATION test3 (provider = icu, lc_collate = 'en_US.utf8'); -- fail, need lc_ctype
CREATE COLLATION testx (provider = icu, locale = 'nonsense'); /* never fails with ICU */  DROP COLLATION testx;

-- Copy from an existing collation; "nonsense" is not created in this script
CREATE COLLATION test4 FROM nonsense;
CREATE COLLATION test5 FROM test0;

SELECT collname
    FROM pg_collation
    WHERE collname LIKE 'test%'
    ORDER BY 1;

-- Rename
ALTER COLLATION test1 RENAME TO test11;
ALTER COLLATION test0 RENAME TO test11; -- fail
ALTER COLLATION test1 RENAME TO test22; -- fail

-- Change owner and schema; role "nonsense" is not created in this script
ALTER COLLATION test11 OWNER TO regress_test_role;
ALTER COLLATION test11 OWNER TO nonsense;
ALTER COLLATION test11 SET SCHEMA test_schema;

COMMENT ON COLLATION test0 IS 'US English';

-- Show name, schema and comment of the test collations
SELECT collname, nspname, obj_description(pg_collation.oid, 'pg_collation')
    FROM pg_collation
         JOIN pg_namespace ON (collnamespace = pg_namespace.oid)
    WHERE collname LIKE 'test%'
    ORDER BY 1;

-- Drop
DROP COLLATION test0, test_schema.test11, test5;
DROP COLLATION test0; -- fail
DROP COLLATION IF EXISTS test0;

SELECT collname
    FROM pg_collation
    WHERE collname LIKE 'test%';

DROP SCHEMA test_schema;
DROP ROLE regress_test_role;
406
407
-- ALTER

-- Exercise REFRESH VERSION on a predefined ICU collation
ALTER COLLATION "en-x-icu"
    REFRESH VERSION;
411
412
-- dependencies

CREATE COLLATION test0 FROM "C";

-- Objects that reference test0: table column, domain, composite type
-- attribute, view expression and index column
CREATE TABLE collate_dep_test1
(
    a int,
    b text COLLATE test0
);
CREATE DOMAIN collate_dep_dom1 AS text
    COLLATE test0;
CREATE TYPE collate_dep_test2 AS
(
    x int,
    y text COLLATE test0
);
CREATE VIEW collate_dep_test3 AS
    SELECT text 'foo' COLLATE test0 AS foo;
CREATE TABLE collate_dep_test4t
(
    a int,
    b text
);
CREATE INDEX collate_dep_test4i
    ON collate_dep_test4t (b COLLATE test0);

DROP COLLATION test0 RESTRICT; -- fail
DROP COLLATION test0 CASCADE;

-- Show what is left of the table and the composite type after the cascade
\d collate_dep_test1
\d collate_dep_test2

DROP TABLE collate_dep_test1, collate_dep_test4t;
DROP TYPE collate_dep_test2;
432
-- test range types and collations

-- Two text range types that differ only in their collation
CREATE TYPE textrange_c AS RANGE (subtype=text, collation="C");
CREATE TYPE textrange_en_us AS RANGE (subtype=text, collation="en-x-icu");

-- Containment of 'b' in the range 'A'..'Z' under each collation
SELECT textrange_c('A','Z') @> 'b'::text;
SELECT textrange_en_us('A','Z') @> 'b'::text;

DROP TYPE textrange_c;
DROP TYPE textrange_en_us;
443
444
-- test ICU collation customization

-- test the attributes handled by icu_set_collation_attributes()

-- Each SELECT evaluates the same pair of strings under the root collation
-- ("und-x-icu") and under the customized collation.

-- colStrength / colCaseLevel
CREATE COLLATION testcoll_ignore_accents
    (provider = icu, locale = '@colStrength=primary;colCaseLevel=yes');
SELECT 'aaá' > 'AAA' COLLATE "und-x-icu",
       'aaá' < 'AAA' COLLATE testcoll_ignore_accents;

-- colBackwards
CREATE COLLATION testcoll_backwards
    (provider = icu, locale = '@colBackwards=yes');
SELECT 'coté' < 'côte' COLLATE "und-x-icu",
       'coté' > 'côte' COLLATE testcoll_backwards;

-- colCaseFirst
CREATE COLLATION testcoll_lower_first
    (provider = icu, locale = '@colCaseFirst=lower');
CREATE COLLATION testcoll_upper_first
    (provider = icu, locale = '@colCaseFirst=upper');
SELECT 'aaa' < 'AAA' COLLATE testcoll_lower_first,
       'aaa' > 'AAA' COLLATE testcoll_upper_first;

-- colAlternate
CREATE COLLATION testcoll_shifted
    (provider = icu, locale = '@colAlternate=shifted');
SELECT 'de-luge' < 'deanza' COLLATE "und-x-icu",
       'de-luge' > 'deanza' COLLATE testcoll_shifted;

-- colNumeric
CREATE COLLATION testcoll_numeric
    (provider = icu, locale = '@colNumeric=yes');
SELECT 'A-21' > 'A-123' COLLATE "und-x-icu",
       'A-21' < 'A-123' COLLATE testcoll_numeric;

-- colNumeric given the value "lower"; the collation name suggests an error
-- is expected
CREATE COLLATION testcoll_error1
    (provider = icu, locale = '@colNumeric=lower');

-- test that attributes not handled by icu_set_collation_attributes()
-- (handled by ucol_open() directly) also work
CREATE COLLATION testcoll_de_phonebook
    (provider = icu, locale = 'de@collation=phonebook');
SELECT 'Goldmann' < 'Götz' COLLATE "de-x-icu",
       'Goldmann' > 'Götz' COLLATE testcoll_de_phonebook;
471
472
-- nondeterministic collations

-- Same (empty) locale, differing only in the deterministic flag
CREATE COLLATION ctest_det
    (provider = icu, locale = '', deterministic = true);
CREATE COLLATION ctest_nondet
    (provider = icu, locale = '', deterministic = false);

CREATE TABLE test6
(
    a int,
    b text
);
-- same string in different normal forms
INSERT INTO test6
    VALUES (1, U&'\00E4bc');
INSERT INTO test6
    VALUES (2, U&'\0061\0308bc');
SELECT * FROM test6;
SELECT * FROM test6
    WHERE b = 'äbc' COLLATE ctest_det;
SELECT * FROM test6
    WHERE b = 'äbc' COLLATE ctest_nondet;

-- same with arrays
CREATE TABLE test6a
(
    a int,
    b text[]
);
INSERT INTO test6a
    VALUES (1, ARRAY[U&'\00E4bc']);
INSERT INTO test6a
    VALUES (2, ARRAY[U&'\0061\0308bc']);
SELECT * FROM test6a;
SELECT * FROM test6a
    WHERE b = ARRAY['äbc'] COLLATE ctest_det;
SELECT * FROM test6a
    WHERE b = ARRAY['äbc'] COLLATE ctest_nondet;
493
-- Collation pair used by the rest of the script: case_sensitive is created
-- with the default (deterministic) setting, case_insensitive with
-- secondary strength and deterministic = false.
CREATE COLLATION case_sensitive (provider = icu, locale = '');
CREATE COLLATION case_insensitive (provider = icu, locale = '@colStrength=secondary', deterministic = false);

SELECT 'abc' <= 'ABC' COLLATE case_sensitive, 'abc' >= 'ABC' COLLATE case_sensitive;
SELECT 'abc' <= 'ABC' COLLATE case_insensitive, 'abc' >= 'ABC' COLLATE case_insensitive;

-- Case-sensitive fixtures: test1cs and test2cs share only 'ghi' exactly;
-- test3cs holds both 'abc' and 'ABC'.
CREATE TABLE test1cs (x text COLLATE case_sensitive);
CREATE TABLE test2cs (x text COLLATE case_sensitive);
CREATE TABLE test3cs (x text COLLATE case_sensitive);
INSERT INTO test1cs VALUES ('abc'), ('def'), ('ghi');
INSERT INTO test2cs VALUES ('ABC'), ('ghi');
INSERT INTO test3cs VALUES ('abc'), ('ABC'), ('def'), ('ghi');

-- Equality and pattern matching
SELECT x FROM test3cs WHERE x = 'abc';
SELECT x FROM test3cs WHERE x <> 'abc';
SELECT x FROM test3cs WHERE x LIKE 'a%';
SELECT x FROM test3cs WHERE x ILIKE 'a%';
SELECT x FROM test3cs WHERE x SIMILAR TO 'a%';
SELECT x FROM test3cs WHERE x ~ 'a';

-- Set operations.  Every query carries ORDER BY x so the output order does
-- not depend on how the set operation is executed; test1cs EXCEPT test2cs
-- in particular returns more than one row.
SELECT x FROM test1cs UNION SELECT x FROM test2cs ORDER BY x;
SELECT x FROM test2cs UNION SELECT x FROM test1cs ORDER BY x;
SELECT x FROM test1cs INTERSECT SELECT x FROM test2cs ORDER BY x;
SELECT x FROM test2cs INTERSECT SELECT x FROM test1cs ORDER BY x;
SELECT x FROM test1cs EXCEPT SELECT x FROM test2cs ORDER BY x;
SELECT x FROM test2cs EXCEPT SELECT x FROM test1cs ORDER BY x;

-- DISTINCT, grouping and window functions
SELECT DISTINCT x FROM test3cs ORDER BY x;
SELECT count(DISTINCT x) FROM test3cs;
SELECT x, count(*) FROM test3cs GROUP BY x ORDER BY x;
SELECT x, row_number() OVER (ORDER BY x), rank() OVER (ORDER BY x) FROM test3cs ORDER BY x;

-- Uniqueness: 'abc' and 'ABC' are distinct values under case_sensitive
CREATE UNIQUE INDEX ON test1cs (x);  -- ok
INSERT INTO test1cs VALUES ('ABC');  -- ok
CREATE UNIQUE INDEX ON test3cs (x);  -- ok

-- string_to_array() with a null-string argument that differs in case from
-- the input
SELECT string_to_array('ABC,DEF,GHI' COLLATE case_sensitive, ',', 'abc');
SELECT string_to_array('ABCDEFGHI' COLLATE case_sensitive, NULL, 'b');
528
-- Case-insensitive counterparts of the case-sensitive fixtures
CREATE TABLE test1ci
(
    x text COLLATE case_insensitive
);
CREATE TABLE test2ci
(
    x text COLLATE case_insensitive
);
CREATE TABLE test3ci
(
    x text COLLATE case_insensitive
);
CREATE INDEX ON test3ci (x text_pattern_ops);  -- error
INSERT INTO test1ci
    VALUES ('abc'), ('def'), ('ghi');
INSERT INTO test2ci
    VALUES ('ABC'), ('ghi');
INSERT INTO test3ci
    VALUES ('abc'), ('ABC'), ('def'), ('ghi');

-- Equality and pattern matching
SELECT x FROM test3ci
    WHERE x = 'abc';
SELECT x FROM test3ci
    WHERE x <> 'abc';
SELECT x FROM test3ci
    WHERE x LIKE 'a%';
SELECT x FROM test3ci
    WHERE x ILIKE 'a%';
SELECT x FROM test3ci
    WHERE x SIMILAR TO 'a%';
SELECT x FROM test3ci
    WHERE x ~ 'a';

-- Set operations, each written with both operand orders
SELECT x FROM test1ci
UNION
SELECT x FROM test2ci
ORDER BY x;
SELECT x FROM test2ci
UNION
SELECT x FROM test1ci
ORDER BY x;
SELECT x FROM test1ci
INTERSECT
SELECT x FROM test2ci
ORDER BY x;
SELECT x FROM test2ci
INTERSECT
SELECT x FROM test1ci
ORDER BY x;
SELECT x FROM test1ci
EXCEPT
SELECT x FROM test2ci;
SELECT x FROM test2ci
EXCEPT
SELECT x FROM test1ci;

-- DISTINCT, grouping and window functions
SELECT DISTINCT x
    FROM test3ci
    ORDER BY x;
SELECT count(DISTINCT x)
    FROM test3ci;
SELECT x, count(*)
    FROM test3ci
    GROUP BY x
    ORDER BY x;
SELECT x,
       row_number() OVER (ORDER BY x),
       rank() OVER (ORDER BY x)
    FROM test3ci
    ORDER BY x;

-- Uniqueness
CREATE UNIQUE INDEX ON test1ci (x);  -- ok
INSERT INTO test1ci
    VALUES ('ABC');  -- error
CREATE UNIQUE INDEX ON test3ci (x);  -- error

-- string_to_array() with a null-string argument that differs in case from
-- the input
SELECT string_to_array('ABC,DEF,GHI' COLLATE case_insensitive, ',', 'abc');
SELECT string_to_array('ABCDEFGHI' COLLATE case_insensitive, NULL, 'b');
558
-- bpchar

-- The case-insensitive scenario again, with char(3) columns
CREATE TABLE test1bpci
(
    x char(3) COLLATE case_insensitive
);
CREATE TABLE test2bpci
(
    x char(3) COLLATE case_insensitive
);
CREATE TABLE test3bpci
(
    x char(3) COLLATE case_insensitive
);
CREATE INDEX ON test3bpci (x bpchar_pattern_ops);  -- error
INSERT INTO test1bpci
    VALUES ('abc'), ('def'), ('ghi');
INSERT INTO test2bpci
    VALUES ('ABC'), ('ghi');
INSERT INTO test3bpci
    VALUES ('abc'), ('ABC'), ('def'), ('ghi');

-- Equality and pattern matching
SELECT x FROM test3bpci
    WHERE x = 'abc';
SELECT x FROM test3bpci
    WHERE x <> 'abc';
SELECT x FROM test3bpci
    WHERE x LIKE 'a%';
SELECT x FROM test3bpci
    WHERE x ILIKE 'a%';
SELECT x FROM test3bpci
    WHERE x SIMILAR TO 'a%';
SELECT x FROM test3bpci
    WHERE x ~ 'a';

-- Set operations, each written with both operand orders
SELECT x FROM test1bpci
UNION
SELECT x FROM test2bpci
ORDER BY x;
SELECT x FROM test2bpci
UNION
SELECT x FROM test1bpci
ORDER BY x;
SELECT x FROM test1bpci
INTERSECT
SELECT x FROM test2bpci
ORDER BY x;
SELECT x FROM test2bpci
INTERSECT
SELECT x FROM test1bpci
ORDER BY x;
SELECT x FROM test1bpci
EXCEPT
SELECT x FROM test2bpci;
SELECT x FROM test2bpci
EXCEPT
SELECT x FROM test1bpci;

-- DISTINCT, grouping and window functions
SELECT DISTINCT x
    FROM test3bpci
    ORDER BY x;
SELECT count(DISTINCT x)
    FROM test3bpci;
SELECT x, count(*)
    FROM test3bpci
    GROUP BY x
    ORDER BY x;
SELECT x,
       row_number() OVER (ORDER BY x),
       rank() OVER (ORDER BY x)
    FROM test3bpci
    ORDER BY x;

-- Uniqueness
CREATE UNIQUE INDEX ON test1bpci (x);  -- ok
INSERT INTO test1bpci
    VALUES ('ABC');  -- error
CREATE UNIQUE INDEX ON test3bpci (x);  -- error

-- string_to_array() on char(n) input
SELECT string_to_array('ABC,DEF,GHI'::char(11) COLLATE case_insensitive, ',', 'abc');
SELECT string_to_array('ABCDEFGHI'::char(9) COLLATE case_insensitive, NULL, 'b');
589
-- This tests the issue described in match_pattern_prefix().  In the
-- absence of that check, the case_insensitive tests below would
-- return no rows where they should logically return one.
CREATE TABLE test4c
(
    x text COLLATE "C"
);
INSERT INTO test4c
    VALUES ('abc');
CREATE INDEX ON test4c (x);

-- Run the LIKE queries with sequential scans disabled
SET enable_seqscan TO off;
SELECT x FROM test4c
    WHERE x LIKE 'ABC' COLLATE case_sensitive;  -- ok, no rows
SELECT x FROM test4c
    WHERE x LIKE 'ABC%' COLLATE case_sensitive;  -- ok, no rows
SELECT x FROM test4c
    WHERE x LIKE 'ABC' COLLATE case_insensitive;  -- error
SELECT x FROM test4c
    WHERE x LIKE 'ABC%' COLLATE case_insensitive;  -- error
RESET enable_seqscan;
602
-- Unicode special case: different variants of Greek lower case sigma.
-- A naive implementation like citext that just does lower(x) =
-- lower(y) will do the wrong thing here, because lower('Σ') is 'σ'
-- but upper('ς') is 'Σ'.
SELECT 'ὀδυσσεύς' = 'ὈΔΥΣΣΕΎΣ'
    COLLATE case_sensitive;
SELECT 'ὀδυσσεύς' = 'ὈΔΥΣΣΕΎΣ'
    COLLATE case_insensitive;

-- name vs. text comparison operators
-- (each comparison is written with the name column on either side)
SELECT relname
    FROM pg_class
    WHERE relname = 'PG_CLASS'::text COLLATE case_insensitive;
SELECT relname
    FROM pg_class
    WHERE 'PG_CLASS'::text = relname COLLATE case_insensitive;

SELECT typname
    FROM pg_type
    WHERE typname LIKE 'int_'
      AND typname <> 'INT2'::text COLLATE case_insensitive
    ORDER BY typname;
SELECT typname
    FROM pg_type
    WHERE typname LIKE 'int_'
      AND 'INT2'::text <> typname COLLATE case_insensitive
    ORDER BY typname;
618
-- test case adapted from subselect.sql
-- Row-wise NOT IN where the first column of each table is case-insensitive
-- and the second columns contain NULLs.
CREATE TEMP TABLE outer_text
(
    f1 text COLLATE case_insensitive,
    f2 text
);
INSERT INTO outer_text
    VALUES ('a', 'a');
INSERT INTO outer_text
    VALUES ('b', 'a');
INSERT INTO outer_text
    VALUES ('A', NULL);
INSERT INTO outer_text
    VALUES ('B', NULL);

CREATE TEMP TABLE inner_text
(
    c1 text COLLATE case_insensitive,
    c2 text
);
INSERT INTO inner_text
    VALUES ('a', NULL);

SELECT *
    FROM outer_text
    WHERE (f1, f2) NOT IN (SELECT * FROM inner_text);
630
-- accents
CREATE COLLATION ignore_accents
    (provider = icu, locale = '@colStrength=primary;colCaseLevel=yes', deterministic = false);

-- Four spellings of "cote" that differ only in accents
CREATE TABLE test4
(
    a int,
    b text
);
INSERT INTO test4
    VALUES (1, 'cote'), (2, 'côte'), (3, 'coté'), (4, 'côté');

-- No COLLATE clause on the comparison
SELECT * FROM test4
    WHERE b = 'cote';
SELECT * FROM test4
    WHERE b = 'cote' COLLATE ignore_accents;
SELECT * FROM test4
    WHERE b = 'Cote' COLLATE ignore_accents;  -- still case-sensitive
SELECT * FROM test4
    WHERE b = 'Cote' COLLATE case_insensitive;
640
-- foreign keys (should use collation of primary key)

-- PK is case-sensitive, FK is case-insensitive
CREATE TABLE test10pk
(
    x text COLLATE case_sensitive PRIMARY KEY
);
INSERT INTO test10pk
    VALUES ('abc'), ('def'), ('ghi');
CREATE TABLE test10fk
(
    x text COLLATE case_insensitive
        REFERENCES test10pk (x) ON UPDATE CASCADE ON DELETE CASCADE
);
INSERT INTO test10fk
    VALUES ('abc');  -- ok
INSERT INTO test10fk
    VALUES ('ABC');  -- error
INSERT INTO test10fk
    VALUES ('xyz');  -- error
SELECT * FROM test10pk;
SELECT * FROM test10fk;
-- restrict update even though the values are "equal" in the FK table
UPDATE test10fk
    SET x = 'ABC'
    WHERE x = 'abc';  -- error
SELECT * FROM test10fk;
-- Delete the referenced key, then show both tables (FK is ON DELETE CASCADE)
DELETE FROM test10pk
    WHERE x = 'abc';
SELECT * FROM test10pk;
SELECT * FROM test10fk;

-- PK is case-insensitive, FK is case-sensitive
CREATE TABLE test11pk
(
    x text COLLATE case_insensitive PRIMARY KEY
);
INSERT INTO test11pk
    VALUES ('abc'), ('def'), ('ghi');
CREATE TABLE test11fk
(
    x text COLLATE case_sensitive
        REFERENCES test11pk (x) ON UPDATE CASCADE ON DELETE CASCADE
);
INSERT INTO test11fk
    VALUES ('abc');  -- ok
INSERT INTO test11fk
    VALUES ('ABC');  -- ok
INSERT INTO test11fk
    VALUES ('xyz');  -- error
SELECT * FROM test11pk;
SELECT * FROM test11fk;
-- cascade update even though the values are "equal" in the PK table
UPDATE test11pk
    SET x = 'ABC'
    WHERE x = 'abc';
SELECT * FROM test11fk;
-- Delete the referenced key, then show both tables (FK is ON DELETE CASCADE)
DELETE FROM test11pk
    WHERE x = 'abc';
SELECT * FROM test11pk;
SELECT * FROM test11fk;
674
-- partitioning

-- LIST partitioning on a case-insensitive text key
CREATE TABLE test20
(
    a int,
    b text COLLATE case_insensitive
) PARTITION BY LIST (b);
CREATE TABLE test20_1 PARTITION OF test20
    FOR VALUES IN ('abc');
INSERT INTO test20
    VALUES (1, 'abc');
INSERT INTO test20
    VALUES (2, 'ABC');
SELECT * FROM test20_1;

-- RANGE partitioning on a case-insensitive text key
CREATE TABLE test21
(
    a int,
    b text COLLATE case_insensitive
) PARTITION BY RANGE (b);
CREATE TABLE test21_1 PARTITION OF test21
    FOR VALUES FROM ('ABC') TO ('DEF');
INSERT INTO test21
    VALUES (1, 'abc');
INSERT INTO test21
    VALUES (2, 'ABC');
SELECT * FROM test21_1;

-- HASH partitioning on a case-sensitive text key
CREATE TABLE test22
(
    a int,
    b text COLLATE case_sensitive
) PARTITION BY HASH (b);
CREATE TABLE test22_0 PARTITION OF test22
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test22_1 PARTITION OF test22
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test22
    VALUES (1, 'def');
INSERT INTO test22
    VALUES (2, 'DEF');
-- they end up in different partitions
SELECT (SELECT count(*) FROM test22_0) = (SELECT count(*) FROM test22_1);

-- same with arrays
CREATE TABLE test22a
(
    a int,
    b text[] COLLATE case_sensitive
) PARTITION BY HASH (b);
CREATE TABLE test22a_0 PARTITION OF test22a
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test22a_1 PARTITION OF test22a
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test22a
    VALUES (1, ARRAY['def']);
INSERT INTO test22a
    VALUES (2, ARRAY['DEF']);
-- they end up in different partitions
SELECT (SELECT count(*) FROM test22a_0) = (SELECT count(*) FROM test22a_1);

-- HASH partitioning on a case-insensitive text key
CREATE TABLE test23
(
    a int,
    b text COLLATE case_insensitive
) PARTITION BY HASH (b);
CREATE TABLE test23_0 PARTITION OF test23
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test23_1 PARTITION OF test23
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test23
    VALUES (1, 'def');
INSERT INTO test23
    VALUES (2, 'DEF');
-- they end up in the same partition (but it's platform-dependent which one)
SELECT (SELECT count(*) FROM test23_0) <> (SELECT count(*) FROM test23_1);

-- same with arrays
CREATE TABLE test23a
(
    a int,
    b text[] COLLATE case_insensitive
) PARTITION BY HASH (b);
CREATE TABLE test23a_0 PARTITION OF test23a
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test23a_1 PARTITION OF test23a
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test23a
    VALUES (1, ARRAY['def']);
INSERT INTO test23a
    VALUES (2, ARRAY['DEF']);
-- they end up in the same partition (but it's platform-dependent which one)
SELECT (SELECT count(*) FROM test23a_0) <> (SELECT count(*) FROM test23a_1);

-- The LIST / RANGE / HASH scenarios again, with char(3) keys
CREATE TABLE test30
(
    a int,
    b char(3) COLLATE case_insensitive
) PARTITION BY LIST (b);
CREATE TABLE test30_1 PARTITION OF test30
    FOR VALUES IN ('abc');
INSERT INTO test30
    VALUES (1, 'abc');
INSERT INTO test30
    VALUES (2, 'ABC');
SELECT * FROM test30_1;

CREATE TABLE test31
(
    a int,
    b char(3) COLLATE case_insensitive
) PARTITION BY RANGE (b);
CREATE TABLE test31_1 PARTITION OF test31
    FOR VALUES FROM ('ABC') TO ('DEF');
INSERT INTO test31
    VALUES (1, 'abc');
INSERT INTO test31
    VALUES (2, 'ABC');
SELECT * FROM test31_1;

CREATE TABLE test32
(
    a int,
    b char(3) COLLATE case_sensitive
) PARTITION BY HASH (b);
CREATE TABLE test32_0 PARTITION OF test32
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test32_1 PARTITION OF test32
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test32
    VALUES (1, 'def');
INSERT INTO test32
    VALUES (2, 'DEF');
-- they end up in different partitions
SELECT (SELECT count(*) FROM test32_0) = (SELECT count(*) FROM test32_1);

CREATE TABLE test33
(
    a int,
    b char(3) COLLATE case_insensitive
) PARTITION BY HASH (b);
CREATE TABLE test33_0 PARTITION OF test33
    FOR VALUES WITH (MODULUS 2, REMAINDER 0);
CREATE TABLE test33_1 PARTITION OF test33
    FOR VALUES WITH (MODULUS 2, REMAINDER 1);
INSERT INTO test33
    VALUES (1, 'def');
INSERT INTO test33
    VALUES (2, 'DEF');
-- they end up in the same partition (but it's platform-dependent which one)
SELECT (SELECT count(*) FROM test33_0) <> (SELECT count(*) FROM test33_1);
749
750
-- cleanup
-- Messages below WARNING are suppressed only around the cascaded drop.
RESET search_path;
SET client_min_messages = warning;
DROP SCHEMA collate_tests CASCADE;
RESET client_min_messages;

-- leave a collation for pg_upgrade test
-- (created after search_path was reset, so outside the dropped schema)
CREATE COLLATION coll_icu_upgrade
    FROM "und-x-icu";
759