mirror of
https://git.postgresql.org/git/postgresql.git
synced 2024-10-05 10:16:52 +02:00
a290378a37
This modernized version of Soundex works significantly better than the original, particularly for non-English names. Dag Lem, reviewed by quite a few people along the way Discussion: https://postgr.es/m/yger1atbgfy.fsf@sid.nimrod.no
62 lines
1.2 KiB
Plaintext
62 lines
1.2 KiB
Plaintext
/*
|
|
* This test must be run in a database with UTF-8 encoding,
|
|
* because other encodings don't support all the characters used.
|
|
*/
|
|
SELECT getdatabaseencoding() <> 'UTF8'
|
|
AS skip_test \gset
|
|
\if :skip_test
|
|
\quit
|
|
\endif
|
|
set client_encoding = utf8;
|
|
-- CREATE EXTENSION IF NOT EXISTS fuzzystrmatch;
|
|
-- Accents
|
|
SELECT daitch_mokotoff('Müller');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{689000}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('Schäfer');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{479000}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('Straßburg');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{294795}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('Éregon');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{095600}
|
|
(1 row)
|
|
|
|
-- Special characters added at https://www.jewishgen.org/InfoFiles/Soundex.html
|
|
SELECT daitch_mokotoff('gąszczu');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{564000,540000}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('brzęczy');
|
|
daitch_mokotoff
|
|
-------------------------------
|
|
{794640,794400,746400,744000}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('ţamas');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{364000,464000}
|
|
(1 row)
|
|
|
|
SELECT daitch_mokotoff('țamas');
|
|
daitch_mokotoff
|
|
-----------------
|
|
{364000,464000}
|
|
(1 row)
|
|
|