mirror of
				https://github.com/postgres/postgres.git
				synced 2025-11-03 09:13:20 +03:00 
			
		
		
		
	The tests of unaccent rely on UTF8 characters, and unlike any other test suite in the tree (fuzzystrmatch, citext, hstore, etc.), they would fail if run on a database that does not support UTF8 encoding. This commit fixes the tests of unaccent so that they are skipped when run on a database without UTF8 support, using the same method as the other test suites based on \if, getdatabaseencoding() and an alternate output file. This has been broken for a long time, but nobody has complained about that either, so no backpatch is done. This can be reproduced with something like REGRESS_OPTS="--no-locale --encoding=sql_ascii", for instance. To defend against that, this module's Makefile and meson.build enforced a UTF8 encoding without locales, but that did not offer protection against options given by REGRESS_OPTS. This switch makes this regression test suite more consistent with all the others, as well. Reviewed-by: Peter Eisentraut Discussion: https://postgr.es/m/ZIq1HUnIV2ksW85x@paquier.xyz
		
			
				
	
	
		
			43 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			SQL
		
	
	
	
	
	
			
		
		
	
	
			43 lines
		
	
	
		
			1.2 KiB
		
	
	
	
		
			SQL
		
	
	
	
	
	
/*
 * This test must be run in a database with UTF-8 encoding,
 * because other encodings don't support all the characters used.
 */

-- Evaluate the encoding check on the server and store the boolean result
-- in the psql variable skip_test; when it is true the script quits here,
-- before any statement containing non-ASCII input is sent.
SELECT getdatabaseencoding() <> 'UTF8'
       AS skip_test \gset
\if :skip_test
\quit
\endif

CREATE EXTENSION unaccent;

-- Declare the literals sent by this script as UTF8-encoded.
SET client_encoding TO 'UTF8';

-- One-argument form of unaccent().
SELECT unaccent('foobar');
SELECT unaccent('ёлка');
SELECT unaccent('ЁЖИК');
SELECT unaccent('˃˖˗˜');
SELECT unaccent('À');  -- Remove combining diacritical 0x0300
SELECT unaccent('℃℉'); -- degree signs
SELECT unaccent('℗'); -- sound recording copyright

-- Two-argument form: the same inputs, naming the 'unaccent' dictionary
-- explicitly as the first argument.
SELECT unaccent('unaccent', 'foobar');
SELECT unaccent('unaccent', 'ёлка');
SELECT unaccent('unaccent', 'ЁЖИК');
SELECT unaccent('unaccent', '˃˖˗˜');
SELECT unaccent('unaccent', 'À');
SELECT unaccent('unaccent', '℃℉');
SELECT unaccent('unaccent', '℗');

-- The same inputs again, passed through ts_lexize() with the 'unaccent'
-- dictionary.
SELECT ts_lexize('unaccent', 'foobar');
SELECT ts_lexize('unaccent', 'ёлка');
SELECT ts_lexize('unaccent', 'ЁЖИК');
SELECT ts_lexize('unaccent', '˃˖˗˜');
SELECT ts_lexize('unaccent', 'À');
SELECT ts_lexize('unaccent', '℃℉');
SELECT ts_lexize('unaccent', '℗');

-- Controversial case.  Black-Letter Capital H (U+210C) is translated by
-- Latin-ASCII.xml as 'x', but it should be 'H'.
SELECT unaccent('ℌ');