mirror of https://github.com/postgres/postgres
Windows can enumerate the locales that are either installed or supported by calling EnumSystemLocalesEx(), similar to what is already done in the READ_LOCALE_A_OUTPUT switch. We can refactor some of the logic already used in that switch into a new function create_collation_from_locale(). The enumerated locales have BCP 47 shape, that is with a hyphen between language and territory, instead of POSIX's underscore. The created collations will retain the BCP 47 shape, but we will also create a POSIX alias, so xx-YY will have an xx_YY alias. A new test collate.windows.win1252 is added that is like collate.linux.utf8. Author: Juan Jose Santamaria Flecha <juanjo.santamaria@gmail.com> Reviewed-by: Dmitry Koval <d.koval@postgrespro.ru> Reviewed-by: Peter Eisentraut <peter.eisentraut@enterprisedb.com> Discussion: https://www.postgresql.org/message-id/flat/0050ec23-34d9-2765-9015-98c04f0e18ac@postgrespro.rupull/111/head
parent
33ab0a2a52
commit
bf03cfd162
File diff suppressed because it is too large
Load Diff
@ -0,0 +1,13 @@ |
||||
/* |
||||
* This test is meant to run on Windows systems that has successfully |
||||
* run pg_import_system_collations(). Also, the database must have |
||||
* WIN1252 encoding, because of the locales' own encodings. Because |
||||
* of this, some test are lost from UTF-8 version, such as Turkish |
||||
* dotted and undotted 'i'. |
||||
*/ |
||||
SELECT getdatabaseencoding() <> 'WIN1252' OR |
||||
(SELECT count(*) FROM pg_collation WHERE collname IN ('de_DE', 'en_US', 'sv_SE') AND collencoding = pg_char_to_encoding('WIN1252')) <> 3 OR |
||||
(version() !~ 'Visual C\+\+' AND version() !~ 'mingw32' AND version() !~ 'windows') |
||||
AS skip_test \gset |
||||
\if :skip_test |
||||
\quit |
||||
@ -0,0 +1,423 @@ |
||||
/* |
||||
* This test is meant to run on Windows systems that has successfully |
||||
* run pg_import_system_collations(). Also, the database must have |
||||
* WIN1252 encoding, because of the locales' own encodings. Because |
||||
* of this, some test are lost from UTF-8 version, such as Turkish |
||||
* dotted and undotted 'i'. |
||||
*/ |
||||
SELECT getdatabaseencoding() <> 'WIN1252' OR |
||||
(SELECT count(*) FROM pg_collation WHERE collname IN ('de_DE', 'en_US', 'sv_SE') AND collencoding = pg_char_to_encoding('WIN1252')) <> 3 OR |
||||
(version() !~ 'Visual C\+\+' AND version() !~ 'mingw32' AND version() !~ 'windows') |
||||
AS skip_test \gset |
||||
\if :skip_test |
||||
\quit |
||||
\endif |
||||
|
||||
SET client_encoding TO WIN1252; |
||||
|
||||
CREATE SCHEMA collate_tests; |
||||
SET search_path = collate_tests; |
||||
|
||||
|
||||
CREATE TABLE collate_test1 ( |
||||
a int, |
||||
b text COLLATE "en_US" NOT NULL |
||||
); |
||||
|
||||
\d collate_test1 |
||||
|
||||
CREATE TABLE collate_test_fail ( |
||||
a int, |
||||
b text COLLATE "ja_JP.eucjp" |
||||
); |
||||
|
||||
CREATE TABLE collate_test_fail ( |
||||
a int, |
||||
b text COLLATE "foo" |
||||
); |
||||
|
||||
CREATE TABLE collate_test_fail ( |
||||
a int COLLATE "en_US", |
||||
b text |
||||
); |
||||
|
||||
CREATE TABLE collate_test_like ( |
||||
LIKE collate_test1 |
||||
); |
||||
|
||||
\d collate_test_like |
||||
|
||||
CREATE TABLE collate_test2 ( |
||||
a int, |
||||
b text COLLATE "sv_SE" |
||||
); |
||||
|
||||
CREATE TABLE collate_test3 ( |
||||
a int, |
||||
b text COLLATE "C" |
||||
); |
||||
|
||||
INSERT INTO collate_test1 VALUES (1, 'abc'), (2, 'äbc'), (3, 'bbc'), (4, 'ABC'); |
||||
INSERT INTO collate_test2 SELECT * FROM collate_test1; |
||||
INSERT INTO collate_test3 SELECT * FROM collate_test1; |
||||
|
||||
SELECT * FROM collate_test1 WHERE b >= 'bbc'; |
||||
SELECT * FROM collate_test2 WHERE b >= 'bbc'; |
||||
SELECT * FROM collate_test3 WHERE b >= 'bbc'; |
||||
SELECT * FROM collate_test3 WHERE b >= 'BBC'; |
||||
|
||||
SELECT * FROM collate_test1 WHERE b COLLATE "C" >= 'bbc'; |
||||
SELECT * FROM collate_test1 WHERE b >= 'bbc' COLLATE "C"; |
||||
SELECT * FROM collate_test1 WHERE b COLLATE "C" >= 'bbc' COLLATE "C"; |
||||
SELECT * FROM collate_test1 WHERE b COLLATE "C" >= 'bbc' COLLATE "en_US"; |
||||
|
||||
|
||||
CREATE DOMAIN testdomain_sv AS text COLLATE "sv_SE"; |
||||
CREATE DOMAIN testdomain_i AS int COLLATE "sv_SE"; -- fails |
||||
CREATE TABLE collate_test4 ( |
||||
a int, |
||||
b testdomain_sv |
||||
); |
||||
INSERT INTO collate_test4 SELECT * FROM collate_test1; |
||||
SELECT a, b FROM collate_test4 ORDER BY b; |
||||
|
||||
CREATE TABLE collate_test5 ( |
||||
a int, |
||||
b testdomain_sv COLLATE "en_US" |
||||
); |
||||
INSERT INTO collate_test5 SELECT * FROM collate_test1; |
||||
SELECT a, b FROM collate_test5 ORDER BY b; |
||||
|
||||
|
||||
SELECT a, b FROM collate_test1 ORDER BY b; |
||||
SELECT a, b FROM collate_test2 ORDER BY b; |
||||
SELECT a, b FROM collate_test3 ORDER BY b; |
||||
|
||||
SELECT a, b FROM collate_test1 ORDER BY b COLLATE "C"; |
||||
|
||||
-- star expansion |
||||
SELECT * FROM collate_test1 ORDER BY b; |
||||
SELECT * FROM collate_test2 ORDER BY b; |
||||
SELECT * FROM collate_test3 ORDER BY b; |
||||
|
||||
-- constant expression folding |
||||
SELECT 'bbc' COLLATE "en_US" > 'äbc' COLLATE "en_US" AS "true"; |
||||
SELECT 'bbc' COLLATE "sv_SE" > 'äbc' COLLATE "sv_SE" AS "false"; |
||||
|
||||
-- LIKE/ILIKE |
||||
|
||||
SELECT * FROM collate_test1 WHERE b LIKE 'abc'; |
||||
SELECT * FROM collate_test1 WHERE b LIKE 'abc%'; |
||||
SELECT * FROM collate_test1 WHERE b LIKE '%bc%'; |
||||
SELECT * FROM collate_test1 WHERE b ILIKE 'abc'; |
||||
SELECT * FROM collate_test1 WHERE b ILIKE 'abc%'; |
||||
SELECT * FROM collate_test1 WHERE b ILIKE '%bc%'; |
||||
|
||||
|
||||
-- The following actually exercises the selectivity estimation for ILIKE. |
||||
SELECT relname FROM pg_class WHERE relname ILIKE 'abc%'; |
||||
|
||||
-- regular expressions |
||||
|
||||
SELECT * FROM collate_test1 WHERE b ~ '^abc$'; |
||||
SELECT * FROM collate_test1 WHERE b ~ '^abc'; |
||||
SELECT * FROM collate_test1 WHERE b ~ 'bc'; |
||||
SELECT * FROM collate_test1 WHERE b ~* '^abc$'; |
||||
SELECT * FROM collate_test1 WHERE b ~* '^abc'; |
||||
SELECT * FROM collate_test1 WHERE b ~* 'bc'; |
||||
|
||||
CREATE TABLE collate_test6 ( |
||||
a int, |
||||
b text COLLATE "en_US" |
||||
); |
||||
INSERT INTO collate_test6 VALUES (1, 'abc'), (2, 'ABC'), (3, '123'), (4, 'ab1'), |
||||
(5, 'a1!'), (6, 'a c'), (7, '!.;'), (8, ' '), |
||||
(9, 'äbç'), (10, 'ÄBÇ'); |
||||
SELECT b, |
||||
b ~ '^[[:alpha:]]+$' AS is_alpha, |
||||
b ~ '^[[:upper:]]+$' AS is_upper, |
||||
b ~ '^[[:lower:]]+$' AS is_lower, |
||||
b ~ '^[[:digit:]]+$' AS is_digit, |
||||
b ~ '^[[:alnum:]]+$' AS is_alnum, |
||||
b ~ '^[[:graph:]]+$' AS is_graph, |
||||
b ~ '^[[:print:]]+$' AS is_print, |
||||
b ~ '^[[:punct:]]+$' AS is_punct, |
||||
b ~ '^[[:space:]]+$' AS is_space |
||||
FROM collate_test6; |
||||
|
||||
|
||||
-- The following actually exercises the selectivity estimation for ~*. |
||||
SELECT relname FROM pg_class WHERE relname ~* '^abc'; |
||||
|
||||
|
||||
-- to_char |
||||
|
||||
SET lc_time TO 'de_DE'; |
||||
SELECT to_char(date '2010-03-01', 'DD TMMON YYYY'); |
||||
SELECT to_char(date '2010-03-01', 'DD TMMON YYYY' COLLATE "de_DE"); |
||||
|
||||
-- to_date |
||||
|
||||
SELECT to_date('01 MÄR 2010', 'DD TMMON YYYY'); |
||||
SELECT to_date('01 Mär 2010', 'DD TMMON YYYY'); |
||||
SELECT to_date('1234567890ab 2010', 'TMMONTH YYYY'); -- fail |
||||
|
||||
|
||||
-- backwards parsing |
||||
|
||||
CREATE VIEW collview1 AS SELECT * FROM collate_test1 WHERE b COLLATE "C" >= 'bbc'; |
||||
CREATE VIEW collview2 AS SELECT a, b FROM collate_test1 ORDER BY b COLLATE "C"; |
||||
|
||||
SELECT table_name, view_definition FROM information_schema.views |
||||
WHERE table_name LIKE 'collview%' ORDER BY 1; |
||||
|
||||
|
||||
-- collation propagation in various expression types |
||||
|
||||
SELECT a, coalesce(b, 'foo') FROM collate_test1 ORDER BY 2; |
||||
SELECT a, coalesce(b, 'foo') FROM collate_test2 ORDER BY 2; |
||||
SELECT a, coalesce(b, 'foo') FROM collate_test3 ORDER BY 2; |
||||
|
||||
SELECT a, b, greatest(b, 'CCC') FROM collate_test1 ORDER BY 3; |
||||
SELECT a, b, greatest(b, 'CCC') FROM collate_test2 ORDER BY 3; |
||||
SELECT a, b, greatest(b, 'CCC') FROM collate_test3 ORDER BY 3; |
||||
|
||||
SELECT a, nullif(b, 'abc') FROM collate_test1 ORDER BY 2; |
||||
SELECT a, nullif(b, 'abc') FROM collate_test2 ORDER BY 2; |
||||
SELECT a, nullif(b, 'abc') FROM collate_test3 ORDER BY 2; |
||||
|
||||
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END FROM collate_test1 ORDER BY 2; |
||||
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END FROM collate_test2 ORDER BY 2; |
||||
SELECT a, CASE b WHEN 'abc' THEN 'abcd' ELSE b END FROM collate_test3 ORDER BY 2; |
||||
|
||||
CREATE DOMAIN testdomain AS text; |
||||
SELECT a, b::testdomain FROM collate_test1 ORDER BY 2; |
||||
SELECT a, b::testdomain FROM collate_test2 ORDER BY 2; |
||||
SELECT a, b::testdomain FROM collate_test3 ORDER BY 2; |
||||
SELECT a, b::testdomain_sv FROM collate_test3 ORDER BY 2; |
||||
|
||||
SELECT min(b), max(b) FROM collate_test1; |
||||
SELECT min(b), max(b) FROM collate_test2; |
||||
SELECT min(b), max(b) FROM collate_test3; |
||||
|
||||
SELECT array_agg(b ORDER BY b) FROM collate_test1; |
||||
SELECT array_agg(b ORDER BY b) FROM collate_test2; |
||||
SELECT array_agg(b ORDER BY b) FROM collate_test3; |
||||
|
||||
SELECT a, b FROM collate_test1 UNION ALL SELECT a, b FROM collate_test1 ORDER BY 2; |
||||
SELECT a, b FROM collate_test2 UNION SELECT a, b FROM collate_test2 ORDER BY 2; |
||||
SELECT a, b FROM collate_test3 WHERE a < 4 INTERSECT SELECT a, b FROM collate_test3 WHERE a > 1 ORDER BY 2; |
||||
SELECT a, b FROM collate_test3 EXCEPT SELECT a, b FROM collate_test3 WHERE a < 2 ORDER BY 2; |
||||
|
||||
SELECT a, b FROM collate_test1 UNION ALL SELECT a, b FROM collate_test3 ORDER BY 2; -- fail |
||||
SELECT a, b FROM collate_test1 UNION ALL SELECT a, b FROM collate_test3; -- ok |
||||
SELECT a, b FROM collate_test1 UNION SELECT a, b FROM collate_test3 ORDER BY 2; -- fail |
||||
SELECT a, b COLLATE "C" FROM collate_test1 UNION SELECT a, b FROM collate_test3 ORDER BY 2; -- ok |
||||
SELECT a, b FROM collate_test1 INTERSECT SELECT a, b FROM collate_test3 ORDER BY 2; -- fail |
||||
SELECT a, b FROM collate_test1 EXCEPT SELECT a, b FROM collate_test3 ORDER BY 2; -- fail |
||||
|
||||
CREATE TABLE test_u AS SELECT a, b FROM collate_test1 UNION ALL SELECT a, b FROM collate_test3; -- fail |
||||
|
||||
-- collation mismatch between recursive and non-recursive term |
||||
WITH RECURSIVE foo(x) AS |
||||
(SELECT x FROM (VALUES('a' COLLATE "en_US"),('b')) t(x) |
||||
UNION ALL |
||||
SELECT (x || 'c') COLLATE "de_DE" FROM foo WHERE length(x) < 10) |
||||
SELECT * FROM foo; |
||||
|
||||
|
||||
-- casting |
||||
|
||||
SELECT CAST('42' AS text COLLATE "C"); |
||||
|
||||
SELECT a, CAST(b AS varchar) FROM collate_test1 ORDER BY 2; |
||||
SELECT a, CAST(b AS varchar) FROM collate_test2 ORDER BY 2; |
||||
SELECT a, CAST(b AS varchar) FROM collate_test3 ORDER BY 2; |
||||
|
||||
|
||||
-- propagation of collation in SQL functions (inlined and non-inlined cases) |
||||
-- and plpgsql functions too |
||||
|
||||
CREATE FUNCTION mylt (text, text) RETURNS boolean LANGUAGE sql |
||||
AS $$ select $1 < $2 $$; |
||||
|
||||
CREATE FUNCTION mylt_noninline (text, text) RETURNS boolean LANGUAGE sql |
||||
AS $$ select $1 < $2 limit 1 $$; |
||||
|
||||
CREATE FUNCTION mylt_plpgsql (text, text) RETURNS boolean LANGUAGE plpgsql |
||||
AS $$ begin return $1 < $2; end $$; |
||||
|
||||
SELECT a.b AS a, b.b AS b, a.b < b.b AS lt, |
||||
mylt(a.b, b.b), mylt_noninline(a.b, b.b), mylt_plpgsql(a.b, b.b) |
||||
FROM collate_test1 a, collate_test1 b |
||||
ORDER BY a.b, b.b; |
||||
|
||||
SELECT a.b AS a, b.b AS b, a.b < b.b COLLATE "C" AS lt, |
||||
mylt(a.b, b.b COLLATE "C"), mylt_noninline(a.b, b.b COLLATE "C"), |
||||
mylt_plpgsql(a.b, b.b COLLATE "C") |
||||
FROM collate_test1 a, collate_test1 b |
||||
ORDER BY a.b, b.b; |
||||
|
||||
|
||||
-- collation override in plpgsql |
||||
|
||||
CREATE FUNCTION mylt2 (x text, y text) RETURNS boolean LANGUAGE plpgsql AS $$ |
||||
declare |
||||
xx text := x; |
||||
yy text := y; |
||||
begin |
||||
return xx < yy; |
||||
end |
||||
$$; |
||||
|
||||
SELECT mylt2('a', 'B' collate "en_US") as t, mylt2('a', 'B' collate "C") as f; |
||||
|
||||
CREATE OR REPLACE FUNCTION |
||||
mylt2 (x text, y text) RETURNS boolean LANGUAGE plpgsql AS $$ |
||||
declare |
||||
xx text COLLATE "POSIX" := x; |
||||
yy text := y; |
||||
begin |
||||
return xx < yy; |
||||
end |
||||
$$; |
||||
|
||||
SELECT mylt2('a', 'B') as f; |
||||
SELECT mylt2('a', 'B' collate "C") as fail; -- conflicting collations |
||||
SELECT mylt2('a', 'B' collate "POSIX") as f; |
||||
|
||||
|
||||
-- polymorphism |
||||
|
||||
SELECT * FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test1)) ORDER BY 1; |
||||
SELECT * FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test2)) ORDER BY 1; |
||||
SELECT * FROM unnest((SELECT array_agg(b ORDER BY b) FROM collate_test3)) ORDER BY 1; |
||||
|
||||
CREATE FUNCTION dup (anyelement) RETURNS anyelement |
||||
AS 'select $1' LANGUAGE sql; |
||||
|
||||
SELECT a, dup(b) FROM collate_test1 ORDER BY 2; |
||||
SELECT a, dup(b) FROM collate_test2 ORDER BY 2; |
||||
SELECT a, dup(b) FROM collate_test3 ORDER BY 2; |
||||
|
||||
|
||||
-- indexes |
||||
|
||||
CREATE INDEX collate_test1_idx1 ON collate_test1 (b); |
||||
CREATE INDEX collate_test1_idx2 ON collate_test1 (b COLLATE "C"); |
||||
CREATE INDEX collate_test1_idx3 ON collate_test1 ((b COLLATE "C")); -- this is different grammatically |
||||
CREATE INDEX collate_test1_idx4 ON collate_test1 (((b||'foo') COLLATE "POSIX")); |
||||
|
||||
CREATE INDEX collate_test1_idx5 ON collate_test1 (a COLLATE "C"); -- fail |
||||
CREATE INDEX collate_test1_idx6 ON collate_test1 ((a COLLATE "C")); -- fail |
||||
|
||||
SELECT relname, pg_get_indexdef(oid) FROM pg_class WHERE relname LIKE 'collate_test%_idx%' ORDER BY 1; |
||||
|
||||
|
||||
-- schema manipulation commands |
||||
|
||||
CREATE ROLE regress_test_role; |
||||
CREATE SCHEMA test_schema; |
||||
|
||||
-- We need to do this this way to cope with varying names for encodings: |
||||
do $$ |
||||
BEGIN |
||||
EXECUTE 'CREATE COLLATION test0 (locale = ' || |
||||
quote_literal(current_setting('lc_collate')) || ');'; |
||||
END |
||||
$$; |
||||
CREATE COLLATION test0 FROM "C"; -- fail, duplicate name |
||||
CREATE COLLATION IF NOT EXISTS test0 FROM "C"; -- ok, skipped |
||||
CREATE COLLATION IF NOT EXISTS test0 (locale = 'foo'); -- ok, skipped |
||||
do $$ |
||||
BEGIN |
||||
EXECUTE 'CREATE COLLATION test1 (lc_collate = ' || |
||||
quote_literal(current_setting('lc_collate')) || |
||||
', lc_ctype = ' || |
||||
quote_literal(current_setting('lc_ctype')) || ');'; |
||||
END |
||||
$$; |
||||
CREATE COLLATION test3 (lc_collate = 'en_US.utf8'); -- fail, need lc_ctype |
||||
CREATE COLLATION testx (locale = 'nonsense'); -- fail |
||||
|
||||
CREATE COLLATION test4 FROM nonsense; |
||||
CREATE COLLATION test5 FROM test0; |
||||
|
||||
SELECT collname FROM pg_collation WHERE collname LIKE 'test%' ORDER BY 1; |
||||
|
||||
ALTER COLLATION test1 RENAME TO test11; |
||||
ALTER COLLATION test0 RENAME TO test11; -- fail |
||||
ALTER COLLATION test1 RENAME TO test22; -- fail |
||||
|
||||
ALTER COLLATION test11 OWNER TO regress_test_role; |
||||
ALTER COLLATION test11 OWNER TO nonsense; |
||||
ALTER COLLATION test11 SET SCHEMA test_schema; |
||||
|
||||
COMMENT ON COLLATION test0 IS 'US English'; |
||||
|
||||
SELECT collname, nspname, obj_description(pg_collation.oid, 'pg_collation') |
||||
FROM pg_collation JOIN pg_namespace ON (collnamespace = pg_namespace.oid) |
||||
WHERE collname LIKE 'test%' |
||||
ORDER BY 1; |
||||
|
||||
DROP COLLATION test0, test_schema.test11, test5; |
||||
DROP COLLATION test0; -- fail |
||||
DROP COLLATION IF EXISTS test0; |
||||
|
||||
SELECT collname FROM pg_collation WHERE collname LIKE 'test%'; |
||||
|
||||
DROP SCHEMA test_schema; |
||||
DROP ROLE regress_test_role; |
||||
|
||||
|
||||
-- ALTER |
||||
|
||||
ALTER COLLATION "en_US" REFRESH VERSION; |
||||
|
||||
-- also test for database while we are here |
||||
SELECT current_database() AS datname \gset |
||||
ALTER DATABASE :"datname" REFRESH COLLATION VERSION; |
||||
|
||||
|
||||
-- dependencies |
||||
|
||||
CREATE COLLATION test0 FROM "C"; |
||||
|
||||
CREATE TABLE collate_dep_test1 (a int, b text COLLATE test0); |
||||
CREATE DOMAIN collate_dep_dom1 AS text COLLATE test0; |
||||
CREATE TYPE collate_dep_test2 AS (x int, y text COLLATE test0); |
||||
CREATE VIEW collate_dep_test3 AS SELECT text 'foo' COLLATE test0 AS foo; |
||||
CREATE TABLE collate_dep_test4t (a int, b text); |
||||
CREATE INDEX collate_dep_test4i ON collate_dep_test4t (b COLLATE test0); |
||||
|
||||
DROP COLLATION test0 RESTRICT; -- fail |
||||
DROP COLLATION test0 CASCADE; |
||||
|
||||
\d collate_dep_test1 |
||||
\d collate_dep_test2 |
||||
|
||||
DROP TABLE collate_dep_test1, collate_dep_test4t; |
||||
DROP TYPE collate_dep_test2; |
||||
|
||||
-- test range types and collations |
||||
|
||||
create type textrange_c as range(subtype=text, collation="C"); |
||||
create type textrange_en_us as range(subtype=text, collation="en_US"); |
||||
|
||||
select textrange_c('A','Z') @> 'b'::text; |
||||
select textrange_en_us('A','Z') @> 'b'::text; |
||||
|
||||
drop type textrange_c; |
||||
drop type textrange_en_us; |
||||
|
||||
|
||||
-- nondeterministic collations |
||||
-- (not supported with libc provider) |
||||
|
||||
CREATE COLLATION ctest_det (locale = 'en_US', deterministic = true); |
||||
CREATE COLLATION ctest_nondet (locale = 'en_US', deterministic = false); |
||||
|
||||
|
||||
-- cleanup |
||||
SET client_min_messages TO warning; |
||||
DROP SCHEMA collate_tests CASCADE; |
||||
Loading…
Reference in new issue