wordpress-develop/tests/phpunit/tests/formatting/removeAccents.php
Sergey Biryukov 2d5f6833fb I18N: Add a $locale parameter for remove_accents().
This highlights the fact that `remove_accents()` is locale-aware and makes it easier to utilize the function with different locales without having to use `switch_to_locale()` or the `locale` filter.

Additionally, this commit relaxes the check for character replacements in German locales to include formal and informal variants of any `de_*` locale, even if WordPress does not have a native translation for some of them yet.

Props malthert, johnbillion, knutsp, ocean90, SergeyBiryukov.
Fixes #54415.

git-svn-id: https://develop.svn.wordpress.org/trunk@52809 602fd350-edb4-49c9-b593-d223f7449a82
2022-02-28 15:40:15 +00:00

113 lines
4.2 KiB
PHP
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?php
/**
 * Tests for remove_accents().
 *
 * Each test feeds a string of accented or otherwise non-ASCII characters to
 * remove_accents() and compares the result with a literal expected string.
 *
 * @group formatting
 *
 * @covers ::remove_accents
 */
class Tests_Formatting_RemoveAccents extends WP_UnitTestCase {

	/**
	 * A string made only of unaccented ASCII letters is returned unchanged.
	 */
	public function test_remove_accents_simple() {
		$this->assertSame( 'abcdefghijkl', remove_accents( 'abcdefghijkl' ) );
	}

	/**
	 * Letters from the Latin-1 Supplement block are replaced with ASCII letters.
	 *
	 * @ticket 9591
	 */
	public function test_remove_accents_latin1_supplement() {
		$input    = 'ªºÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ';
		$expected = 'aoAAAAAAAECEEEEIIIIDNOOOOOOUUUUYTHsaaaaaaaeceeeeiiiidnoooooouuuuythy';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents replaces Latin-1 Supplement' );
	}

	/**
	 * Letters from the Latin Extended-A block are replaced with ASCII letters.
	 */
	public function test_remove_accents_latin_extended_a() {
		/*
		 * The input lists U+0100 through U+017F in code point order, one code point
		 * per character. In particular it must contain the precomposed characters
		 * U+0103..U+0105 (a-breve, A-ogonek, a-ogonek), U+0132/U+0133 (IJ ligatures)
		 * and U+0149 (n preceded by apostrophe); transcoding or Unicode normalization
		 * of this literal silently replaces them and makes the comparison fail.
		 */
		$input    = 'ĀāĂăĄąĆćĈĉĊċČčĎďĐđĒēĔĕĖėĘęĚěĜĝĞğĠġĢģĤĥĦħĨĩĪīĬĭĮįİıĲĳĴĵĶķĸĹĺĻļĽľĿŀŁłŃńŅņŇňŉŊŋŌōŎŏŐőŒœŔŕŖŗŘřŚśŜŝŞşŠšŢţŤťŦŧŨũŪūŬŭŮůŰűŲųŴŵŶŷŸŹźŻżŽžſ';
		$expected = 'AaAaAaCcCcCcCcDdDdEeEeEeEeEeGgGgGgGgHhHhIiIiIiIiIiIJijJjKkkLlLlLlLlLlNnNnNnnNnOoOoOoOEoeRrRrRrSsSsSsSsTtTtTtUuUuUuUuUuUuWwYyYZzZzZzs';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents replaces Latin Extended A' );
	}

	/**
	 * S and T with comma below (Latin Extended-B) are replaced with plain S and T.
	 */
	public function test_remove_accents_latin_extended_b() {
		$this->assertSame( 'SsTt', remove_accents( 'ȘșȚț' ), 'remove_accents replaces Latin Extended B' );
	}

	/**
	 * The euro sign becomes 'E' and the pound sign becomes an empty string.
	 */
	public function test_remove_accents_euro_pound_signs() {
		$this->assertSame( 'E', remove_accents( '€' ), 'remove_accents replaces euro sign' );
		$this->assertSame( '', remove_accents( '£' ), 'remove_accents replaces pound sign' );
	}

	/**
	 * Non-UTF-8 (ISO-8859-1) input read from a fixture file is transliterated as well.
	 */
	public function test_remove_accents_iso8859() {
		// File is Latin1-encoded.
		$fixture = DIR_TESTDATA . '/formatting/remove_accents.01.input.txt';

		// Surrounding whitespace (e.g. a trailing newline) is not part of the test data.
		$input    = trim( file_get_contents( $fixture ) );
		$expected = 'EfSZszYcYuAAAAAACEEEEIIIINOOOOOOUUUUYaaaaaaceeeeiiiinoooooouuuuyyOEoeAEDHTHssaedhth';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents from ISO-8859-1 text' );
	}

	/**
	 * Vowels carrying one or more diacritics are reduced to the bare vowel.
	 *
	 * @ticket 17738
	 */
	public function test_remove_accents_vowels_diacritic() {
		// Vowels with diacritic.
		// Unmarked.
		$this->assertSame( 'OoUu', remove_accents( 'ƠơƯư' ) );

		// Grave accent.
		$this->assertSame( 'AaAaEeOoOoUuYy', remove_accents( 'ẦầẰằỀềỒồỜờỪừỲỳ' ) );

		// Hook.
		$this->assertSame( 'AaAaAaEeEeIiOoOoOoUuUuYy', remove_accents( 'ẢảẨẩẲẳẺẻỂểỈỉỎỏỔổỞởỦủỬửỶỷ' ) );

		// Tilde.
		$this->assertSame( 'AaAaEeEeOoOoUuYy', remove_accents( 'ẪẫẴẵẼẽỄễỖỗỠỡỮữỸỹ' ) );

		// Acute accent.
		$this->assertSame( 'AaAaEeOoOoUu', remove_accents( 'ẤấẮắẾếỐốỚớỨứ' ) );

		// Dot below.
		$this->assertSame( 'AaAaAaEeEeIiOoOoOoUuUuYy', remove_accents( 'ẠạẬậẶặẸẹỆệỊịỌọỘộỢợỤụỰựỴỵ' ) );
	}

	/**
	 * Tone-marked vowels used in Hanyu Pinyin are reduced to the bare vowel.
	 *
	 * @ticket 20772
	 */
	public function test_remove_accents_hanyu_pinyin() {
		// Vowels with diacritic (Chinese, Hanyu Pinyin).
		// Macron.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'āēīōūǖĀĒĪŌŪǕ' ) );

		// Acute accent.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'áéíóúǘÁÉÍÓÚǗ' ) );

		// Caron.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'ǎěǐǒǔǚǍĚǏǑǓǙ' ) );

		// Grave accent.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'àèìòùǜÀÈÌÒÙǛ' ) );

		// Unmarked.
		$this->assertSame( 'aaeiouuAEIOUU', remove_accents( 'aɑeiouüAEIOUÜ' ) );
	}

	/**
	 * With the 'de_DE' locale, umlauts are expanded to two letters and eszett to 'ss'.
	 *
	 * @ticket 3782
	 */
	public function test_remove_accents_germanic_umlauts() {
		$this->assertSame( 'AeOeUeaeoeuess', remove_accents( 'ÄÖÜäöüß', 'de_DE' ) );
	}

	/**
	 * With the 'da_DK' locale, the Danish letters are expanded to two-letter sequences.
	 *
	 * @ticket 23907
	 */
	public function test_remove_danish_accents() {
		$this->assertSame( 'AeOeAaaeoeaa', remove_accents( 'ÆØÅæøå', 'da_DK' ) );
	}

	/**
	 * With the 'ca' locale, 'l·l' collapses to 'll'; when no locale is passed the
	 * middle dot is expected to be kept. The 'ŀ' character becomes 'l' in both cases.
	 *
	 * @ticket 37086
	 */
	public function test_remove_catalan_middot() {
		$this->assertSame( 'allallalla', remove_accents( 'al·lallaŀla', 'ca' ) );
		$this->assertSame( 'al·lallalla', remove_accents( 'al·lallaŀla' ) );
	}

	/**
	 * With the 'sr_RS' locale, the crossed D is transcribed as 'DJ'/'dj'; when no
	 * locale is passed it is expected to become a plain 'D'/'d'.
	 *
	 * @ticket 38078
	 */
	public function test_transcribe_serbian_crossed_d() {
		$this->assertSame( 'DJdj', remove_accents( 'Đđ', 'sr_RS' ) );
		$this->assertSame( 'Dd', remove_accents( 'Đđ' ) );
	}
}