<?php
class SInflection
{
private static $plural_rules = array
(
'/(fish)$/i' => '\1\2', # fish
'/(x|ch|ss|sh)$/' => '\1es', # search, switch, fix, box, process, address
'/series$/' => '\1series',
'/([^aeiouy]|qu)ies$/' => '\1y',
'/([^aeiouy]|qu)y$/' => '\1ies', # query, ability, agency
'/(?:([^f])fe|([lr])f)$/' => '\1\2ves', # half, safe, wife
'/sis$/' => 'ses', # basis, diagnosis
'/([ti])um$/' => '\1a', # datum, medium
'/person$/' => 'people', # person, salesperson
'/man$/' => 'men', # man, woman, spokesman
'/child$/' => 'children', # child
'/(alias|status)$/i' => '\1es',
'/s$/' => 's', # no change (compatibility)
'/$/' => 's'
);
private static $singular_rules = array
(
'/(f)ish$/i' => '\1\2ish',
'/(x|ch|ss)es$/' => '\1',
'/movies$/' => 'movie',
'/series$/' => 'series',
'/([^aeiouy]|qu)ies$/' => '\1y',
'/([lr])ves$/' => '\1f',
'/([^f])ves$/' => '\1fe',
'/(analy|ba|diagno|parenthe|progno|synop|the)ses$/' => '\1sis',
'/([ti])a$/' => '\1um',
'/people$/' => 'person',
'/men$/' => 'man',
'/(alias|status)es$/i' => '\1',
'/children$/' => 'child',
'/news$/' => 'news',
'/s$/' => ''
);
/**
* UTF-8 lookup table for lower case accented letters
*
* This lookuptable defines replacements for accented characters from the ASCII-7
* range. This are lower case letters only.
*
* @author Andreas Gohr <hide@address.com>
*/
private static $utf8_lower_accents = array
(
'à ' => 'a', 'ô' => 'o', 'd' => 'd', '?' => 'f', 'ë' => 'e', 'š' => 's', 'o' => 'o',
'Ã' => 'ss', 'a' => 'a', 'r' => 'r', '?' => 't', 'n' => 'n', 'a' => 'a', 'k' => 'k',
's' => 's', '?' => 'y', 'n' => 'n', 'l' => 'l', 'h' => 'h', '?' => 'p', 'ó' => 'o',
'ú' => 'u', 'e' => 'e', 'é' => 'e', 'ç' => 'c', '?' => 'w', 'c' => 'c', 'õ' => 'o',
'?' => 's', 'ø' => 'o', 'g' => 'g', 't' => 't', '?' => 's', 'e' => 'e', 'c' => 'c',
's' => 's', 'î' => 'i', 'u' => 'u', 'c' => 'c', 'e' => 'e', 'w' => 'w', '?' => 't',
'u' => 'u', 'c' => 'c', 'ö' => 'oe', 'è' => 'e', 'y' => 'y', 'a' => 'a', 'l' => 'l',
'u' => 'u', 'u' => 'u', 's' => 's', 'g' => 'g', 'l' => 'l', 'Æ' => 'f', 'ž' => 'z',
'?' => 'w', '?' => 'b', 'å' => 'a', 'ì' => 'i', 'ï' => 'i', '?' => 'd', 't' => 't',
'r' => 'r', 'ä' => 'ae', 'Ã' => 'i', 'r' => 'r', 'ê' => 'e', 'ü' => 'ue', 'ò' => 'o',
'e' => 'e', 'ñ' => 'n', 'n' => 'n', 'h' => 'h', 'g' => 'g', 'd' => 'd', 'j' => 'j',
'ÿ' => 'y', 'u' => 'u', 'u' => 'u', 'u' => 'u', 't' => 't', 'ý' => 'y', 'o' => 'o',
'â' => 'a', 'l' => 'l', '?' => 'w', 'z' => 'z', 'i' => 'i', 'ã' => 'a', 'g' => 'g',
'?' => 'm', 'o' => 'o', 'i' => 'i', 'ù' => 'u', 'i' => 'i', 'z' => 'z', 'á' => 'a',
'û' => 'u', 'þ' => 'th', 'ð' => 'dh', 'æ' => 'ae', 'µ' => 'u',
);
/**
* UTF-8 lookup table for upper case accented letters
*
* This lookuptable defines replacements for accented characters from the ASCII-7
* range. This are upper case letters only.
*
* @author Andreas Gohr <hide@address.com>
*/
private static $utf8_upper_accents = array
(
'Ã' => 'A', 'Ã' => 'O', 'D' => 'D', '?' => 'F', 'Ã' => 'E', 'Å ' => 'S', 'O' => 'O',
'A' => 'A', 'R' => 'R', '?' => 'T', 'N' => 'N', 'A' => 'A', 'K' => 'K',
'S' => 'S', '?' => 'Y', 'N' => 'N', 'L' => 'L', 'H' => 'H', '?' => 'P', 'Ã' => 'O',
'Ã' => 'U', 'E' => 'E', 'Ã' => 'E', 'Ã' => 'C', '?' => 'W', 'C' => 'C', 'Ã' => 'O',
'?' => 'S', 'Ã' => 'O', 'G' => 'G', 'T' => 'T', '?' => 'S', 'E' => 'E', 'C' => 'C',
'S' => 'S', 'Ã' => 'I', 'U' => 'U', 'C' => 'C', 'E' => 'E', 'W' => 'W', '?' => 'T',
'U' => 'U', 'C' => 'C', 'Ã' => 'Oe', 'Ã' => 'E', 'Y' => 'Y', 'A' => 'A', 'L' => 'L',
'U' => 'U', 'U' => 'U', 'S' => 'S', 'G' => 'G', 'L' => 'L', 'Æ' => 'F', 'Ž' => 'Z',
'?' => 'W', '?' => 'B', 'Ã
' => 'A', 'Ã' => 'I', 'Ã' => 'I', '?' => 'D', 'T' => 'T',
'R' => 'R', 'Ã' => 'Ae', 'Ã' => 'I', 'R' => 'R', 'Ã' => 'E', 'Ã' => 'Ue', 'Ã' => 'O',
'E' => 'E', 'Ã' => 'N', 'N' => 'N', 'H' => 'H', 'G' => 'G', 'Ã' => 'D', 'J' => 'J',
'Ÿ' => 'Y', 'U' => 'U', 'U' => 'U', 'U' => 'U', 'T' => 'T', 'Ã' => 'Y', 'O' => 'O',
'Ã' => 'A', 'L' => 'L', '?' => 'W', 'Z' => 'Z', 'I' => 'I', 'Ã' => 'A', 'G' => 'G',
'?' => 'M', 'O' => 'O', 'I' => 'I', 'Ã' => 'U', 'I' => 'I', 'Z' => 'Z', 'Ã' => 'A',
'Ã' => 'U', 'Ã' => 'Th', 'Ã' => 'Dh', 'Ã' => 'Ae',
);
public static function add_singular_rule($regex, $singular)
{
self::$singular_rules = array($regex => $singular) + self::$singular_rules;
}
public static function add_plural_rule($regex, $plural)
{
self::$plural_rules = array($regex => $plural) + self::$plural_rules;
}
/**
* Returns the plural form of the <var>$word</var> argument.
*/
public static function pluralize($word)
{
foreach (self::$plural_rules as $rule => $replace)
{
if (preg_match($rule, $word))
return preg_replace($rule, $replace, $word);
}
return $word;
}
/**
* Returns the singular form of the <var>$word</var> argument.
*/
public static function singularize($word)
{
foreach (self::$singular_rules as $rule => $replace)
{
if (preg_match($rule, $word))
return preg_replace($rule, $replace, $word);
}
return $word;
}
/**
* Makes an underscored, lowercase form from the <var>$camel_cased_word</var> argument.
*
* Example : <code>SInflection::underscore('ActionController'); // => 'action_controller'</code>
*/
public static function underscore($camel_cased_word)
{
return strtolower(preg_replace('/([a-z\d])([A-Z])/', '\1_\2',
preg_replace('/([A-Z]+)([A-Z][a-z])/', '\1_\2', $camel_cased_word)));
}
/**
* Replaces underscores with dashes in the <var>$underscore_word</var> string.
*
* Example : <code>SInflection::dasherize('action_controller'); // => 'action-controller'</code>
*/
public static function dasherize($underscore_word)
{
return preg_replace('/_/', '-', $underscore_word);
}
/**
* Converts the <var>$underscore_word</var> argument to UpperCamelCase style.
*
* Example : <code>SInflection::camelize('action_controller'); // => 'ActionController'</code>
*/
public static function camelize($underscore_word)
{
return preg_replace('/(^|_)(.)/e', "strtoupper('\\2')", $underscore_word);
}
/**
* Capitalizes the first word, turns underscores into spaces and strips _id.
*
* Example : <code>
* SInflection::humanize('date_of_birth'); // => 'Date of birth'
* SInflection::humanize('user_id'); // => 'User'
* </code>
*/
public static function humanize($word)
{
return ucfirst(preg_replace('/_/', ' ', preg_replace('/_id/', '', $word)));
}
/**
* Transforms a sentence into an underscored wiki page name.
*
* Example : <code>SInflection::wikify('Hello world'); // => 'hello_world'</code>
*/
public static function wikify($sentence)
{
return strtolower(preg_replace('/\W/', '', preg_replace('/\s/', '_', $sentence)));
}
/**
* Transforms a sentence into a URL-usable string.
*
* Example : <code>SInflection::urlize('Hello world'); // => 'hello-world'</code>
*/
public static function urlize($sentence)
{
$sentence = self::deaccent($sentence);
$sentence = preg_replace('/[^a-z0-9_-\s]/','',strtolower($sentence));
$sentence = preg_replace('/[\s]+/',' ',trim($sentence));
$sentence = str_replace(' ','-',$sentence);
return $sentence;
}
/**
* Sanitizes an upload's filename by removing non-alphanumeric characters, deaccenting and
* replacing spaces by underscores.
*
* Example : <code>SInflection::sanitize_filename('Compte rendu réunion.doc'); // => 'compte_rendu_reunion.doc'</code>
*/
public static function sanitize_filename($filename)
{
$filename = self::deaccent($filename);
$filename = preg_replace('/[^a-z0-9_\.-\s]/','',strtolower($filename));
$filename = preg_replace('/[\s]+/',' ',trim($filename));
$filename = str_replace(' ','_',$filename);
return $filename;
}
/**
* Replace accented UTF-8 characters by unaccented ASCII-7 equivalents
*
* Use the optional parameter to just deaccent lower ($case = -1) or upper ($case = 1)
* letters. Default is to deaccent both cases ($case = 0)
*
* @author Andreas Gohr <hide@address.com>
*/
public static function deaccent($string, $case=0)
{
if ($case <= 0)
$string = str_replace(array_keys(self::$utf8_lower_accents), array_values(self::$utf8_lower_accents), $string);
if ($case >= 0)
$string = str_replace(array_keys(self::$utf8_upper_accents), array_values(self::$utf8_upper_accents), $string);
return $string;
}
}
?>