From ad57ef6314ec3fd4e50d2caedc1d1d103f4f7db5 Mon Sep 17 00:00:00 2001 From: Jb Audras Date: Thu, 25 May 2023 13:12:55 +0000 Subject: [PATCH] Formatting: Add support for schwa in remove_accents(). MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit This changeset adds support for the schwa character. Ə (U+018F, Latin Extended-B) and ə (U+0259, IPA Extensions) are used in several languages such as Azerbaijani, as well as in gender-neutral Italian. Props suleymankenar, audrasjb, przemekhernik. Fixes #57609. git-svn-id: https://develop.svn.wordpress.org/trunk@55858 602fd350-edb4-49c9-b593-d223f7449a82 --- src/wp-includes/formatting.php | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/src/wp-includes/formatting.php b/src/wp-includes/formatting.php index d71ab2d6c1..58cc0ec69b 100644 --- a/src/wp-includes/formatting.php +++ b/src/wp-includes/formatting.php @@ -1440,6 +1440,8 @@ function utf8_uri_encode( $utf8_string, $length = 0, $encode_ascii_characters = * * | Code | Glyph | Replacement | Description | * | -------- | ----- | ----------- | ----------------------------------------- | + * | U+018F | Ə | E | Latin capital letter Ə | + * | U+0259 | ə | e | Latin small letter ə | * | U+0218 | Ș | S | Latin capital letter S with comma below | * | U+0219 | ș | s | Latin small letter s with comma below | * | U+021A | Ț | T | Latin capital letter T with comma below | @@ -1805,6 +1807,8 @@ function remove_accents( $text, $locale = '' ) { 'ž' => 'z', 'ſ' => 's', // Decompositions for Latin Extended-B. + 'Ə' => 'E', + 'ə' => 'e', 'Ș' => 'S', 'ș' => 's', 'Ț' => 'T',