From 17ec2c5dfa8dc6fee3df749d214238d34ee681c9 Mon Sep 17 00:00:00 2001 From: Peter Eisentraut Date: Wed, 23 Aug 2023 11:23:42 +0200 Subject: [PATCH] doc: Add more ICU rules examples In particular, add an example EBCDIC collation. Author: Daniel Verite Discussion: https://www.postgresql.org/message-id/flat/35cc1684-e516-4a01-a256-351632d47066@manitou-mail.org --- doc/src/sgml/charset.sgml | 58 +++++++++++++++++++++++++- doc/src/sgml/ref/create_collation.sgml | 13 ++---- doc/src/sgml/ref/create_database.sgml | 4 +- 3 files changed, 62 insertions(+), 13 deletions(-) diff --git a/doc/src/sgml/charset.sgml b/doc/src/sgml/charset.sgml index dd092fddd61..25febcac4c0 100644 --- a/doc/src/sgml/charset.sgml +++ b/doc/src/sgml/charset.sgml @@ -1481,7 +1481,7 @@ SELECT 'x-y' = 'x_y' COLLATE level4; -- false - Examples + Collation Settings Examples @@ -1530,6 +1530,62 @@ SELECT 'x-y' = 'x_y' COLLATE level4; -- false + + ICU Tailoring Rules + + + If the options provided by the collation settings shown above are not + sufficient, the order of collation elements can be changed with tailoring + rules, whose syntax is detailed in the ICU documentation. + + + + This small example creates a collation based on the root locale with a + tailoring rule: + +CREATE COLLATION custom (provider = icu, locale = 'und', rules = '&V << w <<< W'); + + + With this rule, the letter W is sorted after + V, but is treated as a secondary difference similar to an + accent. Rules like this are contained in the locale definitions of some + languages. (Of course, if a locale definition already contains the + desired rules, then they don't need to be specified again explicitly.) + + + + Here is a more complex example. The following statement sets up a + collation named ebcdic with rules to sort US-ASCII + characters in the order of the EBCDIC encoding. + + +CREATE COLLATION ebcdic (provider = icu, locale = 'und', +rules = $$ +& ' ' < '.' < '<' < '(' < '+' < \| +< '&' < '!' < '$' < '*' < ')' < ';' +< '-' < '/' < ',' < '%' < '_' < '>' < '?'
+< '`' < ':' < '#' < '@' < \' < '=' < '"' +<*a-r < '~' <*s-z < '^' < '[' < ']' +< '{' <*A-I < '}' <*J-R < '\' <*S-Z <*0-9 +$$); + +SELECT c +FROM (VALUES ('a'), ('b'), ('A'), ('B'), ('1'), ('2'), ('!'), ('^')) AS x(c) +ORDER BY c COLLATE ebcdic; + c +--- + ! + a + b + ^ + A + B + 1 + 2 + + + + External References for ICU diff --git a/doc/src/sgml/ref/create_collation.sgml b/doc/src/sgml/ref/create_collation.sgml index b86a9bbb9ce..5cf9777764b 100644 --- a/doc/src/sgml/ref/create_collation.sgml +++ b/doc/src/sgml/ref/create_collation.sgml @@ -165,9 +165,8 @@ CREATE COLLATION [ IF NOT EXISTS ] name FROM Specifies additional collation rules to customize the behavior of the - collation. This is supported for ICU only. See - for details on the syntax. + collation. This is supported for ICU only. See the ICU Tailoring Rules section for details. @@ -257,12 +256,8 @@ CREATE COLLATION german_phonebook (provider = icu, locale = 'de-u-co-phonebk'); - With this rule, the letter W is sorted after - V, but is treated as a secondary difference similar to an - accent. Rules like this are contained in the locale definitions of some - languages. (Of course, if a locale definition already contains the desired - rules, then they don't need to be specified again explicitly.) See the ICU - documentation for further details and examples on the rules syntax. + See the ICU Tailoring Rules section for further details and examples + on the rules syntax. diff --git a/doc/src/sgml/ref/create_database.sgml b/doc/src/sgml/ref/create_database.sgml index b2c8aef1ad2..ce7317f81ba 100644 --- a/doc/src/sgml/ref/create_database.sgml +++ b/doc/src/sgml/ref/create_database.sgml @@ -232,9 +232,7 @@ CREATE DATABASE name Specifies additional collation rules to customize the behavior of the default collation of this database. This is supported for ICU only. - See - for details on the syntax. + See the ICU Tailoring Rules section for details.