wordpress-develop/tests/phpunit/tests/formatting/RemoveAccents.php
Gary Pendergast 8f95800d52 Code is Poetry.
WordPress' code just... wasn't.
This is now dealt with.

Props jrf, pento, netweb, GaryJ, jdgrimes, westonruter, Greg Sherwood from PHPCS, and everyone who's ever contributed to WPCS and PHPCS.
Fixes #41057.



git-svn-id: https://develop.svn.wordpress.org/trunk@42343 602fd350-edb4-49c9-b593-d223f7449a82
2017-11-30 23:09:33 +00:00

147 lines
5.1 KiB
PHP
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

<?php
/**
 * Tests for remove_accents().
 *
 * Every test feeds a string of accented characters to remove_accents() and
 * compares the result against the expected transliteration. Comparisons use
 * assertSame() so that strings are matched strictly (no loose/numeric
 * string comparison, which matters for the empty-string expectation).
 *
 * @group formatting
 *
 * @covers ::remove_accents
 */
class Tests_Formatting_RemoveAccents extends WP_UnitTestCase {

	/**
	 * Plain ASCII input is expected to come back unchanged.
	 */
	public function test_remove_accents_simple() {
		$this->assertSame( 'abcdefghijkl', remove_accents( 'abcdefghijkl' ) );
	}

	/**
	 * Latin-1 Supplement letters are expected to be replaced by ASCII equivalents.
	 *
	 * @ticket 9591
	 */
	public function test_remove_accents_latin1_supplement() {
		$input    = 'ªºÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ';
		$expected = 'aoAAAAAAAECEEEEIIIIDNOOOOOOUUUUYTHsaaaaaaaeceeeeiiiidnoooooouuuuythy';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents replaces Latin-1 Supplement' );
	}

	/**
	 * Latin Extended-A letters are expected to be replaced by ASCII equivalents.
	 *
	 * The input is the consecutive code point range U+0100 through U+017F;
	 * the expected string lists the replacement for each code point in order
	 * (two characters for the IJ and OE ligatures).
	 */
	public function test_remove_accents_latin_extended_a() {
		$input    = 'ĀāĂăĄąĆćĈĉĊċČčĎďĐđĒēĔĕĖėĘęĚěĜĝĞğĠġĢģĤĥĦħĨĩĪīĬĭĮįİıĲĳĴĵĶķĸĹĺĻļĽľĿŀŁłŃńŅņŇňŉŊŋŌōŎŏŐőŒœŔŕŖŗŘřŚśŜŝŞşŠšŢţŤťŦŧŨũŪūŬŭŮůŰűŲųŴŵŶŷŸŹźŻżŽžſ';
		$expected = 'AaAaAaCcCcCcCcDdDdEeEeEeEeEeGgGgGgGgHhHhIiIiIiIiIiIJijJjKkkLlLlLlLlLlNnNnNnnNnOoOoOoOEoeRrRrRrSsSsSsSsTtTtTtUuUuUuUuUuUuWwYyYZzZzZzs';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents replaces Latin Extended A' );
	}

	/**
	 * S and T with comma below (Latin Extended-B) are expected to lose the comma.
	 */
	public function test_remove_accents_latin_extended_b() {
		$this->assertSame( 'SsTt', remove_accents( 'ȘșȚț' ), 'remove_accents replaces Latin Extended B' );
	}

	/**
	 * The euro sign is expected to become "E"; the pound sign is expected to be dropped.
	 */
	public function test_remove_accents_euro_pound_signs() {
		$this->assertSame( 'E', remove_accents( '€' ), 'remove_accents replaces euro sign' );
		$this->assertSame( '', remove_accents( '£' ), 'remove_accents replaces pound sign' );
	}

	/**
	 * Non-UTF-8 input read from a fixture file is expected to be transliterated too.
	 */
	public function test_remove_accents_iso8859() {
		// File is Latin1 encoded.
		$file     = DIR_TESTDATA . '/formatting/remove_accents.01.input.txt';
		$input    = trim( file_get_contents( $file ) );
		$expected = 'EfSZszYcYuAAAAAACEEEEIIIINOOOOOOUUUUYaaaaaaceeeeiiiinoooooouuuuyyOEoeAEDHTHssaedhth';

		$this->assertSame( $expected, remove_accents( $input ), 'remove_accents from ISO-8859-1 text' );
	}

	/**
	 * Vowels carrying (stacked) diacritics are expected to be reduced to the bare vowel.
	 *
	 * @ticket 17738
	 */
	public function test_remove_accents_vowels_diacritic() {
		// Unmarked.
		$this->assertSame( 'OoUu', remove_accents( 'ƠơƯư' ) );
		// Grave accent.
		$this->assertSame( 'AaAaEeOoOoUuYy', remove_accents( 'ẦầẰằỀềỒồỜờỪừỲỳ' ) );
		// Hook.
		$this->assertSame( 'AaAaAaEeEeIiOoOoOoUuUuYy', remove_accents( 'ẢảẨẩẲẳẺẻỂểỈỉỎỏỔổỞởỦủỬửỶỷ' ) );
		// Tilde.
		$this->assertSame( 'AaAaEeEeOoOoUuYy', remove_accents( 'ẪẫẴẵẼẽỄễỖỗỠỡỮữỸỹ' ) );
		// Acute accent.
		$this->assertSame( 'AaAaEeOoOoUu', remove_accents( 'ẤấẮắẾếỐốỚớỨứ' ) );
		// Dot below.
		$this->assertSame( 'AaAaAaEeEeIiOoOoOoUuUuYy', remove_accents( 'ẠạẬậẶặẸẹỆệỊịỌọỘộỢợỤụỰựỴỵ' ) );
	}

	/**
	 * Vowels with tone marks as used in Hanyu Pinyin are expected to be reduced to the bare vowel.
	 *
	 * @ticket 20772
	 */
	public function test_remove_accents_hanyu_pinyin() {
		// Macron.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'āēīōūǖĀĒĪŌŪǕ' ) );
		// Acute accent.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'áéíóúǘÁÉÍÓÚǗ' ) );
		// Caron.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'ǎěǐǒǔǚǍĚǏǑǓǙ' ) );
		// Grave accent.
		$this->assertSame( 'aeiouuAEIOUU', remove_accents( 'àèìòùǜÀÈÌÒÙǛ' ) );
		// Unmarked.
		$this->assertSame( 'aaeiouuAEIOUU', remove_accents( 'aɑeiouüAEIOUÜ' ) );
	}

	/**
	 * 'locale' filter callback that forces the German locale.
	 *
	 * @return string Locale code.
	 */
	public function _remove_accents_germanic_umlauts_cb() {
		return 'de_DE';
	}

	/**
	 * With the German locale, umlauts are expected to be expanded (e.g. "Ae") and eszett to become "ss".
	 *
	 * @ticket 3782
	 */
	public function test_remove_accents_germanic_umlauts() {
		$locale_filter = array( $this, '_remove_accents_germanic_umlauts_cb' );

		// Detach the filter before asserting so a failing assertion cannot leave it hooked.
		add_filter( 'locale', $locale_filter );
		$actual = remove_accents( 'ÄÖÜäöüß' );
		remove_filter( 'locale', $locale_filter );

		$this->assertSame( 'AeOeUeaeoeuess', $actual );
	}

	/**
	 * 'locale' filter callback that forces the Danish locale.
	 *
	 * @return string Locale code.
	 */
	public function _set_locale_to_danish() {
		return 'da_DK';
	}

	/**
	 * With the Danish locale, the letters ae, o-slash and a-ring are expected to be expanded to two letters.
	 *
	 * @ticket 23907
	 */
	public function test_remove_danish_accents() {
		$locale_filter = array( $this, '_set_locale_to_danish' );

		// Detach the filter before asserting so a failing assertion cannot leave it hooked.
		add_filter( 'locale', $locale_filter );
		$actual = remove_accents( 'ÆØÅæøå' );
		remove_filter( 'locale', $locale_filter );

		$this->assertSame( 'AeOeAaaeoeaa', $actual );
	}

	/**
	 * 'locale' filter callback that forces the Catalan locale.
	 *
	 * @return string Locale code.
	 */
	public function _set_locale_to_catalan() {
		return 'ca';
	}

	/**
	 * With the Catalan locale, the middle dot in "l·l" is expected to be dropped;
	 * without it, the middle dot is expected to be kept.
	 *
	 * @ticket 37086
	 */
	public function test_remove_catalan_middot() {
		$locale_filter = array( $this, '_set_locale_to_catalan' );

		// Collect both results first so the filter is detached before any assertion can fail.
		add_filter( 'locale', $locale_filter );
		$with_catalan_locale = remove_accents( 'al·lallaŀla' );
		remove_filter( 'locale', $locale_filter );
		$with_default_locale = remove_accents( 'al·lallaŀla' );

		$this->assertSame( 'allallalla', $with_catalan_locale );
		$this->assertSame( 'al·lallalla', $with_default_locale );
	}

	/**
	 * 'locale' filter callback that forces the Serbian locale.
	 *
	 * @return string Locale code.
	 */
	public function _set_locale_to_serbian() {
		return 'sr_RS';
	}

	/**
	 * With the Serbian locale, the crossed D is expected to be transcribed as "DJ"/"dj";
	 * without it, as plain "D"/"d".
	 *
	 * @ticket 38078
	 */
	public function test_transcribe_serbian_crossed_d() {
		$locale_filter = array( $this, '_set_locale_to_serbian' );

		// Collect both results first so the filter is detached before any assertion can fail.
		add_filter( 'locale', $locale_filter );
		$with_serbian_locale = remove_accents( 'Đđ' );
		remove_filter( 'locale', $locale_filter );
		$with_default_locale = remove_accents( 'Đđ' );

		$this->assertSame( 'DJdj', $with_serbian_locale );
		$this->assertSame( 'Dd', $with_default_locale );
	}
}