• 设为首页
  • 点击收藏
  • 手机版
    手机扫一扫访问
    迪恩网络手机版
  • 关注官方公众号
    微信扫一扫关注
    迪恩网络公众号

PHP normalizer_normalize函数代码示例

原作者: [db:作者] 来自: [db:来源] 收藏 邀请

本文整理汇总了PHP中normalizer_normalize函数的典型用法代码示例。如果您正苦于以下问题:PHP normalizer_normalize函数的具体用法?PHP normalizer_normalize怎么用?PHP normalizer_normalize使用的例子?那么恭喜您, 这里精选的函数代码示例或许可以为您提供帮助。



在下文中一共展示了normalizer_normalize函数的20个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于我们的系统推荐出更棒的PHP代码示例。

示例1: cleanChars

 private static function cleanChars($book)
 {
     foreach ($book as $key => $value) {
         $value = normalizer_normalize($value, \Normalizer::FORM_C);
         $value = preg_replace('/\\x{009c}/u', '', $value);
         $value = preg_replace('/\\x{0098}/u', '', $value);
         //debug (json_encode($value));
         $book[$key] = $value;
     }
     return $book;
 }
开发者ID:matthiasmoritz,项目名称:exlibris-openlibrary,代码行数:11,代码来源:Dnb.php


示例2: clean

 public static function clean($string)
 {
     $string = filter_var($string, FILTER_SANITIZE_STRING, FILTER_FLAG_NO_ENCODE_QUOTES);
     // Ensure bytestream is valid
     if (!mb_check_encoding($string, 'UTF-8')) {
         throw new \InvalidArgumentException('Invalid unicode input.');
     }
     // Clean and normalise unicode
     $string = iconv('UTF-8', 'UTF-8//IGNORE', $string);
     $string = normalizer_normalize($string);
     // Strip control characters
     $string = preg_replace('~\\p{C}+~u', '', $string);
     return $string;
 }
开发者ID:tuimedia,项目名称:forum,代码行数:14,代码来源:StringCleaner.php


示例3: normalizeEncoding

 /**
  * Normalizes the encoding of a string (UTF8 NFD to NFC).
  *
  * On HFS+ filesystem (OS X) filenames are stored in UTF8 NFD while all other filesystems are
  * using UTF8 NFC. NFC is more common in general.
  *
  * @param string $string Input string
  *
  * @return string
  */
 public static function normalizeEncoding($string)
 {
     static $normalizer;
     if (null === $normalizer) {
         if (function_exists('normalizer_normalize')) {
             $normalizer = function ($string) {
                 return normalizer_normalize($string, Normalizer::FORM_C);
             };
         } else {
             $normalizer = function ($string) {
                 return str_replace(["Ä", "ä", "Ö", "ö", "Ü", "ü"], ['Ä', 'ä', 'Ö', 'ö', 'Ü', 'ü'], $string);
             };
         }
     }
     return $normalizer($string);
 }
开发者ID:redaxo,项目名称:redaxo,代码行数:26,代码来源:string.php


示例4: strip_diacriticals

function strip_diacriticals($in)
{
    if (function_exists('transliterator_transliterate')) {
        // PHP 5.4 + intl
        return transliterator_transliterate('Any-Latin; Latin-ASCII', $in);
    }
    if (function_exists('normalizer_normalize')) {
        // PHP 5.3 + intl
        return normalizer_normalize(preg_replace('/\\p{Mn}+/u', '', normalizer_normalize($in, Normalizer::FORM_D)), Normalizer::FORM_C);
    }
    if (function_exists('iconv') && ICONV_IMPL == 'glibc') {
        return iconv('UTF-8', 'ASCII//TRANSLIT', $in);
    }
    // version incomplète (limitée au latin1)
    $patterns = array('~&([A-za-z])(?:grave|acute|circ|tilde|uml|ring|cedil|slash|caron);~' => '\\1', '~&([A-za-z]{2})lig;~' => '\\1', '~&[^;]+;~' => '');
    $out = htmlentities($in, ENT_NOQUOTES, 'UTF-8');
    $out = preg_replace(array_keys($patterns), array_values($patterns), $out);
    return $out;
}
开发者ID:jacquesmattheij,项目名称:SRS,代码行数:19,代码来源:learn.php


示例5: remove_accents

 /**
  * Enhanced 'remove_accents'. If the php Normalizer extension installed, use it.
  *
  * @since 1.0.0
  *
  * @see remove_accents()
  *
  * @param string $string Text that might have accent characters
  * @return string Filtered string with replaced "nice" characters.
  */
 public function remove_accents($string)
 {
     if (function_exists('normalizer_normalize')) {
         if (!normalizer_is_normalized($string, Normalizer::FORM_C)) {
             $string = normalizer_normalize($string, Normalizer::FORM_C);
         }
     }
     return remove_accents($string);
 }
开发者ID:barryceelen,项目名称:wp-pimp-my-ride,代码行数:19,代码来源:class-pimp-my-ride.php


示例6: encodeRelativeDescriptorString

 public static function encodeRelativeDescriptorString($str)
 {
     if (function_exists('normalizer_normalize')) {
         $str = normalizer_normalize($str);
     }
     $str = Z_Unicode::convertCharStr2UTF8($str);
     // convertNumbers2Char($str, 'hex')
     $str = preg_replace_callback("/([A-Fa-f0-9]{2})/", function ($matches) {
         return Z_Unicode::hex2char($matches[0]);
     }, str_replace(" ", "", $str));
     return $str;
 }
开发者ID:selenus,项目名称:dataserver,代码行数:12,代码来源:Attachments.inc.php


示例7: normalize

 /**
  * Remove all unwanted caracters
  *
  * @param string $text
  *
  * @return string
  */
 public function normalize($text)
 {
     return preg_replace('/\\pM*/u', '', normalizer_normalize($text, \Normalizer::FORM_D));
 }
开发者ID:TMSolution,项目名称:ETSPaymentDotpayBundle,代码行数:11,代码来源:String.php


示例8: hasNormalizerSupport

 /**
  * Tests that "normalizer_normalize" exists and works
  *
  * @return bool
  */
 public static function hasNormalizerSupport()
 {
     static $ret = null;
     if (null === $ret) {
         $form_c = "Å";
         // 'LATIN CAPITAL LETTER A WITH RING ABOVE' (U+00C5)
         $form_d = "Å";
         // A followed by 'COMBINING RING ABOVE' (U+030A)
         $ret = function_exists('normalizer_normalize') && $form_c === normalizer_normalize($form_d);
     }
     return $ret;
 }
开发者ID:tjcaverly,项目名称:Elgg,代码行数:17,代码来源:Translit.php


示例9: searchable

 function searchable($text, $lang = false)
 {
     global $cfg;
     if (function_exists('normalizer_normalize')) {
         // Normalize text input :: remove diacritics and such
         $text = normalizer_normalize($text, Normalizer::FORM_C);
     } else {
         // As a lightweight compatiblity, use a lightweight C
         // normalizer with diacritic removal, thanks
         // http://ahinea.com/en/tech/accented-translate.html
         $tr = array("ä" => "a", "ñ" => "n", "ö" => "o", "ü" => "u", "ÿ" => "y");
         $text = strtr($text, $tr);
     }
     // Decompose compatible versions of characters (ä => ae)
     $tr = array("ß" => "ss", "Æ" => "AE", "æ" => "ae", "IJ" => "IJ", "ij" => "ij", "Œ" => "OE", "œ" => "oe", "Ð" => "D", "Đ" => "D", "ð" => "d", "đ" => "d", "Ħ" => "H", "ħ" => "h", "ı" => "i", "ĸ" => "k", "Ŀ" => "L", "Ł" => "L", "ŀ" => "l", "ł" => "l", "Ŋ" => "N", "ʼn" => "n", "ŋ" => "n", "Ø" => "O", "ø" => "o", "ſ" => "s", "Þ" => "T", "Ŧ" => "T", "þ" => "t", "ŧ" => "t", "ä" => "ae", "ö" => "oe", "ü" => "ue", "Ä" => "AE", "Ö" => "OE", "Ü" => "UE");
     $text = strtr($text, $tr);
     // Drop separated diacritics
     $text = preg_replace('/\\p{M}/u', '', $text);
     // Drop extraneous whitespace
     $text = preg_replace('/(\\s)\\s+/u', '$1', $text);
     // Drop leading and trailing whitespace
     $text = trim($text);
     if (false && class_exists('IntlBreakIterator')) {
         // Split by word boundaries
         if ($tokenizer = IntlBreakIterator::createWordInstance($lang ?: ($cfg ? $cfg->getSystemLanguage() : 'en_US'))) {
             $tokenizer->setText($text);
             $tokens = array();
             foreach ($tokenizer as $token) {
                 $tokens[] = $token;
             }
             $text = implode(' ', $tokens);
         }
     } else {
         // Approximate word boundaries from Unicode chart at
         // http://www.unicode.org/reports/tr29/#Word_Boundaries
         // Punt for now
     }
     return $text;
 }
开发者ID:gizur,项目名称:osticket,代码行数:39,代码来源:class.format.php


示例10: safe_normalize

    /**
     * Normalise a UTf-8 string to FORM_C, avoiding the pitfalls in PHP's
     * normalizer_normalize function.
     * @param string $string the input string.
     * @return string the normalised string.
     */
    protected static function safe_normalize($string) {
        if ($string === '') {
            return '';
        }

        if (!function_exists('normalizer_normalize')) {
            return $string;
        }

        $normalised = normalizer_normalize($string, Normalizer::FORM_C);
        if (is_null($normalised)) {
            // An error occurred in normalizer_normalize, but we have no idea what.
            debugging('Failed to normalise string: ' . $string, DEBUG_DEVELOPER);
            return $string; // Return the original string, since it is the best we have.
        }

        return $normalised;
    }
开发者ID:ncsu-delta,项目名称:moodle,代码行数:24,代码来源:question.php


示例11: apply

 /**
  *
  * @see \X501\StringPrep\StringPrep::prepare()
  * @param string $string UTF-8 encoded string
  * @return string
  */
 public function apply($string)
 {
     return normalizer_normalize($string, \Normalizer::NFKC);
 }
开发者ID:sop,项目名称:x501,代码行数:10,代码来源:NormalizeStep.php


示例12: normalizeValue

 protected static function normalizeValue($value) {
     return isset($value) ? preg_replace('/(\p{M})/ui', '', normalizer_normalize($value, Normalizer::FORM_D)) : NULL;
 }
开发者ID:reisystems-india,项目名称:GovDashboard-Community,代码行数:3,代码来源:AbstractDimensionLookupHandler.php


示例13: fewer_specials

function fewer_specials($w, $strip = "̄")
{
    $w = normalizer_normalize($w, Normalizer::FORM_D);
    $w = str_replace("æ", "ae", $w);
    $w = str_replace("œ", "oe", $w);
    $w = str_replace("Æ", "ae", $w);
    $w = str_replace("Œ", "oe", $w);
    $w = str_replace($strip, "", $w);
    return $w;
}
开发者ID:NasalMusician,项目名称:Pantheum,代码行数:10,代码来源:display.php


示例14: normalize

 /**
  * Normalize the given UTF-8 string
  *
  * @see http://stackoverflow.com/a/7934397/99923
  * @param string $string to normalize
  * @param int $form to normalize as
  * @return string
  */
 public static function normalize($string, $form = Normalizer::FORM_KD)
 {
     return normalizer_normalize($string, $form);
 }
开发者ID:xeoncross,项目名称:kit,代码行数:12,代码来源:Core.php


示例15: normalize_keyword

function normalize_keyword($keyword)
{
    global $normalize_keywords, $keywords_remove_diacritics;
    //Normalize the text if function available
    if ($normalize_keywords && function_exists('normalizer_normalize')) {
        $keyword = normalizer_normalize($keyword);
    }
    if ($keywords_remove_diacritics) {
        $keyword = remove_accents($keyword);
    }
    return $keyword;
}
开发者ID:perryrothjohnson,项目名称:resourcespace,代码行数:12,代码来源:language_functions.php


示例16: normalize

 /**
  * Remove all unwanted characters and unset the optional data, if it is too long.
  *
  * @param array $additionalData
  *
  * @return array
  */
 public static function normalize(array $additionalData)
 {
     foreach ($additionalData as $key => $value) {
         $additionalData[$key] = preg_replace('/\\pM*/u', '', normalizer_normalize($value, \Normalizer::FORM_D));
         if (strlen($additionalData[$key]) > self::getAdditionalDataMaxLength($key)) {
             unset($additionalData[$key]);
         }
     }
     return $additionalData;
 }
开发者ID:valiton-forks,项目名称:ETSPaymentOgoneBundle,代码行数:17,代码来源:OgoneGatewayPlugin.php


示例17: normalizeNFC

 /**
  * Normalize the note to Unicode NFC.
  *
  * @param  string  The original note
  *
  * @return string The normalized note
  */
 public function normalizeNFC($note)
 {
     return normalizer_normalize($note, Normalizer::FORM_C);
 }
开发者ID:jonnybarnes,项目名称:indieweb,代码行数:11,代码来源:NotePrep.php


示例18: sil_dictionary_custom_join

function sil_dictionary_custom_join($join)
{
    global $wp_query, $wpdb;
    $search_table_name = SEARCHTABLE;
    /*
     * The query I'm going for will hopefully end up looking something like this
     * example:
     * SELECT id, language_code, relevance, post_title
     * FROM wp_posts p
     * JOIN (
     *	SELECT post_id, language_code, MAX(relevance) AS relevance, search_strings
     *	FROM sil_multilingual_search
     *	WHERE search_strings like '%sleeping%'
     *	GROUP BY post_id, language_code
     *	ORDER BY relevance DESC
     *	) sil_multilingual_search ON sil_multilingual_search.post_id = p.id
     * ORDER BY relevance DESC, post_title;
     */
    mb_internal_encoding("UTF-8");
    if (!empty($wp_query->query_vars['s'])) {
        //search string gets trimmed and normalized to NFC
        if (class_exists("Normalizer", $autoload = false)) {
            $search = normalizer_normalize(trim($wp_query->query_vars['s']), Normalizer::FORM_C);
        } else {
            $search = trim($wp_query->query_vars['s']);
        }
        $key = $_GET['key'];
        if (!isset($key)) {
            $key = $wp_query->query_vars['langcode'];
        }
        $partialsearch = $_GET['partialsearch'];
        if (!isset($_GET['partialsearch'])) {
            $partialsearch = get_option("include_partial_words");
        }
        if (strlen($search) == 0 && $_GET['tax'] > 1) {
            $partialsearch = 1;
        }
        $subquery_where = "";
        if (strlen(trim($key)) > 0) {
            $subquery_where .= " WHERE " . $search_table_name . ".language_code = '{$key}' ";
        }
        $subquery_where .= empty($subquery_where) ? " WHERE " : " AND ";
        if (isset($wp_query->query_vars['letter'])) {
            $letter = trim($wp_query->query_vars['letter']);
            $noletters = trim($wp_query->query_vars['noletters']);
            //by default we use collate utf8_bin and à, ä, etc. are handled as different letters
            $collate = "COLLATE 'UTF8_BIN'";
            if (get_option('IncludeCharactersWithDiacritics') == 1) {
                $collate = "";
            }
            $subquery_where .= "(" . $search_table_name . ".search_strings LIKE '" . addslashes($letter) . "%' " . $collate . " OR " . $search_table_name . ".search_strings LIKE '" . addslashes(strtoupper($letter)) . "%' " . $collate . " OR " . $search_table_name . ".search_strings LIKE '" . addslashes("-" . $letter) . "%' " . $collate . ") " . " AND relevance >= 95 AND language_code = '{$key}' ";
            $arrNoLetters = explode(",", $noletters);
            foreach ($arrNoLetters as $noLetter) {
                if (strlen($noLetter) > 0) {
                    $subquery_where .= " AND " . $search_table_name . ".search_strings NOT LIKE '" . $noLetter . "%' " . $collate . " AND " . $search_table_name . ".search_strings NOT LIKE '" . strtoupper($noLetter) . "%' " . $collate;
                }
            }
        } else {
            if (is_CJK($search) || mb_strlen($search) > 3 || $partialsearch == 1) {
                $subquery_where .= $search_table_name . ".search_strings LIKE '%" . addslashes($search) . "%'";
            } else {
                if (mb_strlen($search) > 1) {
                    $subquery_where .= $search_table_name . ".search_strings REGEXP '[[:<:]]" . addslashes($search) . "[[:>:]]'";
                }
            }
        }
        //if($_GET['tax'] < 1)
        //{
        $subquery = " (SELECT post_id, language_code, MAX(relevance) AS relevance, search_strings, sortorder " . "FROM " . $search_table_name . $subquery_where . " GROUP BY post_id, language_code, search_strings " . " ORDER BY relevance DESC) ";
        $join = " JOIN " . $subquery . $search_table_name . " ON {$wpdb->posts}.ID = " . $search_table_name . ".post_id ";
        //}
    }
    $tax = 0;
    if (isset($_GET['tax'])) {
        $tax = $_GET['tax'];
    }
    if ($tax > 1 || strlen($wp_query->query_vars['semdomain']) > 0) {
        $join .= " LEFT JOIN {$wpdb->term_relationships} ON {$wpdb->posts}.ID = {$wpdb->term_relationships}.object_id ";
        $join .= " INNER JOIN {$wpdb->term_taxonomy} ON {$wpdb->term_relationships}.term_taxonomy_id = {$wpdb->term_taxonomy}.term_id ";
        if (get_option("useSemDomainNumbers") == 1) {
            $join .= " INNER JOIN {$wpdb->terms} ON {$wpdb->term_relationships}.term_taxonomy_id = {$wpdb->terms}.term_id ";
        }
    }
    return $join;
}
开发者ID:rick-maclean,项目名称:sil-dictionary-webonaryRicks,代码行数:85,代码来源:dictionary-search.php


示例19: no_specials2

function no_specials2($w, $extras = "1-9/; ,\\n")
{
    $w = normalizer_normalize($w, Normalizer::FORM_D);
    /*$w = str_replace("æ", "ae", $w);
    	$w = str_replace("œ", "oe", $w);
    	$w = str_replace("Æ", "ae", $w);
    	$w = str_replace("Œ", "oe", $w);
    	$w = str_replace("þ", "th", $w);
    	$w = str_replace("Þ", "th", $w);
    	$w = str_replace("ð", "th", $w);
    	$w = str_replace("Ð", "th", $w);
    	/*/
    $w = transliterator_transliterate('Any-Latin; Latin-ASCII', $w);
    # TODO: use more on this function
    /**/
    $w = preg_replace("#[^\\p{L}{$extras}]#ui", "", $w);
    return $w;
}
开发者ID:NasalMusician,项目名称:Pantheum,代码行数:18,代码来源:string.php


示例20: toNFKD

 /**
  * Convert a UTF-8 string to normal form KD, compatibility decomposition.
  * This may cause irreversible information loss, use judiciously.
  * Fast return for pure ASCII strings.
  *
  * @param $string String: a valid UTF-8 string. Input is not validated.
  * @return string a UTF-8 string in normal form KD
  */
 static function toNFKD($string)
 {
     if (NORMALIZE_INTL) {
         return normalizer_normalize($string, Normalizer::FORM_KD);
     } elseif (NORMALIZE_ICU) {
         return utf8_normalize($string, UNORM_NFKD);
     } elseif (preg_match('/[\\x80-\\xff]/', $string)) {
         return UtfNormal::NFKD($string);
     } else {
         return $string;
     }
 }
开发者ID:GodelDesign,项目名称:Godel,代码行数:20,代码来源:UtfNormal.php



注:本文中的normalizer_normalize函数示例整理自Github/MSDocs等源码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。


鲜花

握手

雷人

路过

鸡蛋
该文章已有0人参与评论

请发表评论

全部评论

专题导读
上一篇:
PHP not函数代码示例发布时间:2022-05-15
下一篇:
PHP normalize_whitespace函数代码示例发布时间:2022-05-15
热门推荐
阅读排行榜

扫描微信二维码

查看手机版网站

随时了解更新最新资讯

139-2527-9053

在线客服(服务时间 9:00~18:00)

在线QQ客服
地址:深圳市南山区西丽大学城创智工业园
电邮:jeky_zhao#qq.com
移动电话:139-2527-9053

Powered by 互联科技 X3.4© 2001-2213 极客世界.|Sitemap