Convert unaccent tests to UTF-8

This makes it easier to add new tests that are specific to Unicode
features.  The files were previously in KOI8-R.

Discussion: https://www.postgresql.org/message-id/8506.1545111362@sss.pgh.pa.us
This commit is contained in:
Peter Eisentraut 2019-01-02 18:36:05 +01:00
parent 1707a0d2aa
commit b6f3649bba
2 changed files with 20 additions and 20 deletions

View File

@ -6,23 +6,23 @@ SELECT getdatabaseencoding();
UTF8
(1 row)
SET client_encoding TO 'KOI8';
SET client_encoding TO 'UTF8';
SELECT unaccent('foobar');
unaccent
----------
foobar
(1 row)
SELECT unaccent('ёлка');
SELECT unaccent('ёлка');
unaccent
----------
елка
елка
(1 row)
SELECT unaccent('ЁЖИК');
SELECT unaccent('ЁЖИК');
unaccent
----------
ЕЖИК
ЕЖИК
(1 row)
SELECT unaccent('unaccent', 'foobar');
@ -31,16 +31,16 @@ SELECT unaccent('unaccent', 'foobar');
foobar
(1 row)
SELECT unaccent('unaccent', 'ёлка');
SELECT unaccent('unaccent', 'ёлка');
unaccent
----------
елка
елка
(1 row)
SELECT unaccent('unaccent', 'ЁЖИК');
SELECT unaccent('unaccent', 'ЁЖИК');
unaccent
----------
ЕЖИК
ЕЖИК
(1 row)
SELECT ts_lexize('unaccent', 'foobar');
@ -49,15 +49,15 @@ SELECT ts_lexize('unaccent', 'foobar');
(1 row)
SELECT ts_lexize('unaccent', 'ёлка');
SELECT ts_lexize('unaccent', 'ёлка');
ts_lexize
-----------
{елка}
{елка}
(1 row)
SELECT ts_lexize('unaccent', 'ЁЖИК');
SELECT ts_lexize('unaccent', 'ЁЖИК');
ts_lexize
-----------
{ЕЖИК}
{ЕЖИК}
(1 row)

View File

@ -3,16 +3,16 @@ CREATE EXTENSION unaccent;
-- must have a UTF8 database
SELECT getdatabaseencoding();
SET client_encoding TO 'KOI8';
SET client_encoding TO 'UTF8';
SELECT unaccent('foobar');
SELECT unaccent('ёлка');
SELECT unaccent('ЁЖИК');
SELECT unaccent('ёлка');
SELECT unaccent('ЁЖИК');
SELECT unaccent('unaccent', 'foobar');
SELECT unaccent('unaccent', 'ёлка');
SELECT unaccent('unaccent', 'ЁЖИК');
SELECT unaccent('unaccent', 'ёлка');
SELECT unaccent('unaccent', 'ЁЖИК');
SELECT ts_lexize('unaccent', 'foobar');
SELECT ts_lexize('unaccent', 'ёлка');
SELECT ts_lexize('unaccent', 'ЁЖИК');
SELECT ts_lexize('unaccent', 'ёлка');
SELECT ts_lexize('unaccent', 'ЁЖИК');