* @ingroup Language
*/
class LanguageJa extends Language {
- function wordSegmentation( $string ) {
+ function segmentByWord( $string ) {
// The -/+ pair above is patch markup: the method keeps its single $string
// parameter and is renamed from wordSegmentation to segmentByWord.
// Strip known punctuation ?
// $s = preg_replace( '/\xe3\x80[\x80-\xbf]/', '', $s ); # U3000-303f
// (The preg_replace line above is commented out, so it never runs.)
// NOTE(review): in the lines visible here no live statement assigns $s and
// $string is never read, so this returns an undefined variable. Presumably
// the statements that build $s from $string were dropped from this excerpt;
// confirm against the full file before relying on the return value.
return $s;
}
- function normalizeForSearch( $string ) {
- // First pass $string through self::convertDoubleWidth() to deal with double-width roman characters
- $s = self::convertDoubleWidth( $string );
-
- # Then let the parent implementation do general case folding and UTF-8 armoring, and return its result
- return parent::normalizeForSearch( $s );
- }
-
# Italic is not appropriate for Japanese script
# Unfortunately most browsers do not recognise this, and render <em> as italic
function emphasize( $text ) {