Detect whether a string contains non-ascii multibyte sequences in the UTF-8 range
static public utf8_is_valid ( $str ) : boolean | ||
$str | string input string | |
Результат | boolean |
/** * Sanitize a variable. * Removes leading and trailing whitespace, normalizes all characters to UTF-8. * @param $var string * @return string */ static function cleanVar($var) { // only normalize strings that are not UTF-8 already, and when the system is using UTF-8 if (Config::getVar('i18n', 'charset_normalization') == 'On' && strtolower_codesafe(Config::getVar('i18n', 'client_charset')) == 'utf-8' && !PKPString::utf8_is_valid($var)) { $var = PKPString::utf8_normalize($var); // convert HTML entities into valid UTF-8 characters (do not transcode) $var = html_entity_decode($var, ENT_COMPAT, 'UTF-8'); // strip any invalid UTF-8 sequences $var = PKPString::utf8_bad_strip($var); $var = htmlspecialchars($var, ENT_NOQUOTES, 'UTF-8', false); } // strip any invalid ASCII control characters $var = PKPString::utf8_strip_ascii_ctrl($var); return trim($var); }