php中文支援函數

/**
 * Convert full-width characters in a string to their half-width ASCII
 * counterparts.
 *
 * Handles full-width digits, Latin letters (letter case is preserved), the
 * ideographic space, brackets, quotes and common CJK punctuation, plus the
 * symbols % + - ( ) $ @ # ^ & *.
 *
 * Some punctuation is deliberately not mapped one-to-one; these entries are
 * carried over unchanged from the original table:
 *   - '，' and '、' become '.', and '；' becomes ','
 *   - '…', '～' and '—' become '-'
 *   - '‘' and '’' become '`'
 * NOTE(review): the comma-to-period mapping looks intended for normalising
 * numeric input - confirm before changing it.
 *
 * @access public
 * @param  string $str String to convert.
 * @return string The converted string.
 */
function make_semiangle($str)
{
    // Every key appears exactly once. The earlier table listed '”', '‘', '’'
    // and '、' twice, and PHP silently keeps only the last value for a
    // duplicated key, so the first entries never took effect.
    $arr = array(
        // Digits
        '０' => '0', '１' => '1', '２' => '2', '３' => '3', '４' => '4',
        '５' => '5', '６' => '6', '７' => '7', '８' => '8', '９' => '9',

        // Upper-case letters (kept upper-case)
        'Ａ' => 'A', 'Ｂ' => 'B', 'Ｃ' => 'C', 'Ｄ' => 'D', 'Ｅ' => 'E',
        'Ｆ' => 'F', 'Ｇ' => 'G', 'Ｈ' => 'H', 'Ｉ' => 'I', 'Ｊ' => 'J',
        'Ｋ' => 'K', 'Ｌ' => 'L', 'Ｍ' => 'M', 'Ｎ' => 'N', 'Ｏ' => 'O',
        'Ｐ' => 'P', 'Ｑ' => 'Q', 'Ｒ' => 'R', 'Ｓ' => 'S', 'Ｔ' => 'T',
        'Ｕ' => 'U', 'Ｖ' => 'V', 'Ｗ' => 'W', 'Ｘ' => 'X', 'Ｙ' => 'Y',
        'Ｚ' => 'Z',

        // Lower-case letters
        'ａ' => 'a', 'ｂ' => 'b', 'ｃ' => 'c', 'ｄ' => 'd', 'ｅ' => 'e',
        'ｆ' => 'f', 'ｇ' => 'g', 'ｈ' => 'h', 'ｉ' => 'i', 'ｊ' => 'j',
        'ｋ' => 'k', 'ｌ' => 'l', 'ｍ' => 'm', 'ｎ' => 'n', 'ｏ' => 'o',
        'ｐ' => 'p', 'ｑ' => 'q', 'ｒ' => 'r', 'ｓ' => 's', 'ｔ' => 't',
        'ｕ' => 'u', 'ｖ' => 'v', 'ｗ' => 'w', 'ｘ' => 'x', 'ｙ' => 'y',
        'ｚ' => 'z',

        // Brackets
        '（' => '(', '）' => ')', '〔' => '[', '〕' => ']', '【' => '[',
        '】' => ']', '〖' => '[', '〗' => ']', '｛' => '{', '｝' => '}',
        '《' => '<', '》' => '>',

        // Quotes. The opening double quote used to become '[' while the
        // closing one became '"'; both now map to '"'.
        '“' => '"', '”' => '"', '‘' => '`', '’' => '`', '〃' => '"',

        // Punctuation and symbols
        '％' => '%', '＋' => '+', '—' => '-', '－' => '-', '～' => '-',
        '：' => ':', '。' => '.', '，' => '.', '、' => '.', '；' => ',',
        '？' => '?', '！' => '!', '…' => '-', '‖' => '|', '｜' => '|',
        '　' => ' ', '＄' => '$', '＠' => '@', '＃' => '#', '＾' => '^',
        '＆' => '&', '＊' => '*',
    );

    // strtr() with an array performs all replacements in a single pass, so a
    // replaced character is never re-examined.
    return strtr($str, $arr);
}

php中文截取字元串

<?php

/**
 * Character-aware substring for UTF-8 and double-byte (GB2312-style) text.
 *
 * Usage: cut_str(string, length, start, encoding)
 *
 * UTF-8 mode: $start and $sublen are counted in characters. "..." is appended
 * only when characters remain after the returned slice.
 *
 * Any other encoding: the string is treated as double-byte text. $start and
 * $sublen are doubled and applied as byte offsets, so a 2-byte character
 * counts as one unit and an ASCII character as half a unit. "..." is appended
 * whenever the result is shorter (in bytes) than the input.
 *
 * @param  string $string String to cut.
 * @param  int    $sublen Number of units to keep.
 * @param  int    $start  Offset of the first unit to keep (default 0).
 * @param  string $code   Encoding name, compared case-insensitively
 *                        (default 'utf-8').
 * @return string The extracted piece, possibly followed by "...".
 */
function cut_str($string, $sublen, $start = 0, $code = 'utf-8') {
    // Case-insensitive so that 'UTF-8' does not fall through to the
    // double-byte branch.
    if (strtolower($code) === 'utf-8') {
        // One alternative per UTF-8 sequence length (1 to 4 bytes). PCRE
        // interprets the \x escapes and matches byte-wise because the
        // pattern has no /u modifier.
        $pa = '/[\x01-\x7f]'
            . '|[\xc2-\xdf][\x80-\xbf]'
            . '|\xe0[\xa0-\xbf][\x80-\xbf]'
            . '|[\xe1-\xef][\x80-\xbf][\x80-\xbf]'
            . '|\xf0[\x90-\xbf][\x80-\xbf][\x80-\xbf]'
            . '|[\xf1-\xf7][\x80-\xbf][\x80-\xbf][\x80-\xbf]/';

        preg_match_all($pa, $string, $t_string);

        $piece = join('', array_slice($t_string[0], $start, $sublen));

        if (count($t_string[0]) - $start > $sublen) {
            return $piece . "...";
        }

        return $piece;
    }

    // Double-byte branch: work in byte offsets.
    $start  = $start * 2;
    $sublen = $sublen * 2;
    $strlen = strlen($string);
    $tmpstr = '';

    for ($i = 0; $i < $strlen; $i++) {
        // A byte above 129 is treated as the lead byte of a 2-byte character.
        $isLead = ord(substr($string, $i, 1)) > 129;

        if ($i >= $start && $i < ($start + $sublen)) {
            $tmpstr .= substr($string, $i, $isLead ? 2 : 1);
        }

        // Skip the trail byte so it is never examined as a character start.
        if ($isLead) {
            $i++;
        }
    }

    if (strlen($tmpstr) < $strlen) {
        $tmpstr .= "...";
    }

    return $tmpstr;
}

// Example: cut a mixed ASCII/Chinese sample string through the 'gb2312' path.
$str = 'abcd需要截取的字元串';

print cut_str($str, 1, 0, 'gb2312');

/**
 * Truncate a string to a display budget and append a suffix (UTF-8 / GBK).
 *
 * Strings whose byte length is already <= $length are returned untouched.
 * Otherwise a fixed set of HTML entities is decoded before measuring and
 * re-encoded in the result, so an entity is never cut in half.
 *
 * UTF-8 mode: the budget is intval($length - strlen($dot) - $length / 3).
 * Tab, line feed and printable ASCII cost 1 each, every multi-byte character
 * costs 2, and any other byte costs nothing.
 *
 * Any other charset: the text is treated as double-byte and at most
 * $length - strlen($dot) - 1 bytes are kept.
 *
 * @param  string $string  String to truncate.
 * @param  int    $length  Maximum length budget.
 * @param  string $charset Encoding name, compared case-insensitively
 *                         (default 'utf-8').
 * @param  string $dot     Suffix appended to a truncated string.
 * @return string The original string, or the truncated string plus $dot.
 */
function str_cut($string, $length, $charset = 'utf-8', $dot = '...') {
    $strlen = strlen($string);

    if ($strlen <= $length) {
        return $string;
    }

    // Decode the known entities so each counts as one character. A plain
    // space is first swapped for the placeholder '∵' because '&nbsp;' is
    // decoded to a plain space in the same call.
    $string = str_replace(
        array(' ', '&nbsp;', '&amp;', '&quot;', '&#039;', '&ldquo;', '&rdquo;', '&mdash;', '&lt;', '&gt;', '&middot;', '&hellip;'),
        array('∵', ' ', '&', '"', "'", '“', '”', '—', '<', '>', '·', '…'),
        $string
    );

    $strcut = '';

    if (strtolower($charset) == 'utf-8') {
        $length = intval($length - strlen($dot) - $length / 3);

        // $n   = byte offset
        // $tn  = byte width of the last character read
        // $noc = accumulated cost
        $n = $tn = $noc = 0;
        $total = strlen($string);

        while ($n < $total) {
            $t = ord($string[$n]);

            if ($t == 9 || $t == 10 || (32 <= $t && $t <= 126)) {
                $tn = 1; $n++; $noc++;
            } elseif (194 <= $t && $t <= 223) {
                $tn = 2; $n += 2; $noc += 2;
            } elseif (224 <= $t && $t <= 239) {
                $tn = 3; $n += 3; $noc += 2;
            } elseif (240 <= $t && $t <= 247) {
                $tn = 4; $n += 4; $noc += 2;
            } elseif (248 <= $t && $t <= 251) {
                $tn = 5; $n += 5; $noc += 2;
            } elseif ($t == 252 || $t == 253) {
                $tn = 6; $n += 6; $noc += 2;
            } else {
                // Control or stray continuation byte: skipped at no cost.
                $n++;
            }

            if ($noc >= $length) {
                break;
            }
        }

        // The last character overshot the budget: drop it again.
        if ($noc > $length) {
            $n -= $tn;
        }

        $strcut = substr($string, 0, $n);

        // Re-encode what was decoded above. A space that came from '&nbsp;'
        // stays a plain space on this path, as in the original tables.
        $strcut = str_replace(
            array('∵', '&', '"', "'", '“', '”', '—', '<', '>', '·', '…'),
            array(' ', '&amp;', '&quot;', '&#039;', '&ldquo;', '&rdquo;', '&mdash;', '&lt;', '&gt;', '&middot;', '&hellip;'),
            $strcut
        );
    } else {
        // NOTE(review): this path reads any byte > 127 as the lead of a
        // 2-byte character. The multi-byte literals below are only 2 bytes
        // wide if this source file is saved in that legacy encoding - confirm.
        $dotlen = strlen($dot);
        $maxi = $length - $dotlen - 1;
        $total = strlen($string);

        $search_arr = array('&', ' ', '"', "'", '“', '”', '—', '<', '>', '·', '…', '∵');
        $replace_arr = array('&amp;', '&nbsp;', '&quot;', '&#039;', '&ldquo;', '&rdquo;', '&mdash;', '&lt;', '&gt;', '&middot;', '&hellip;', ' ');
        $search_flip = array_flip($search_arr);

        // Entity decoding may have made the string shorter than $maxi, so
        // the loop is also bounded by the real length.
        for ($i = 0; $i < $maxi && $i < $total; $i++) {
            if (ord($string[$i]) > 127 && $i + 1 < $total) {
                $current_str = $string[$i] . $string[++$i];
            } else {
                $current_str = $string[$i];
            }

            if (isset($search_flip[$current_str])) {
                $current_str = $replace_arr[$search_flip[$current_str]];
            }

            $strcut .= $current_str;
        }
    }

    return $strcut . $dot;
}

php中文字元串翻轉

通常情況下，翻轉一個字元串只需要 strrev() 函數就可以了；但有時需要處理的字元串含有中文，這時用 strrev() 會出現亂碼，所以我們需要自定義一個函數來處理含中文的字元串。

/**
 * Reverse a string character by character without splitting multi-byte
 * characters.
 *
 * Valid UTF-8 input is reversed code point by code point. Input that is not
 * valid UTF-8 is treated as legacy double-byte text (GBK-style): a byte above
 * 127 is paired with the byte that follows it.
 *
 * @param  string $str String to reverse.
 * @return string The reversed string ('' for empty input).
 */
function cstrrev($str)
{
    $str = (string) $str;

    if ($str === '') {
        return '';
    }

    // preg_match() with the /u modifier returns 1 only when the subject is
    // well-formed UTF-8; on malformed input it returns false.
    if (preg_match('//u', $str) === 1) {
        $chars = preg_split('//u', $str, -1, PREG_SPLIT_NO_EMPTY);

        return join('', array_reverse($chars));
    }

    // Legacy double-byte fallback.
    $arr = array();
    $len = strlen($str);
    $i = 0;

    while ($i < $len) {
        if (ord($str[$i]) > 127 && $i + 1 < $len) {
            $arr[] = substr($str, $i, 2);
            $i += 2;
        } else {
            // ASCII byte, or a dangling lead byte at the very end.
            $arr[] = $str[$i];
            $i++;
        }
    }

    return join('', array_reverse($arr));
}

# Usage:

$str = '中文.look!';

print cstrrev($str);

# Expected output: !kool.文中

str_replace

/**
 * Character-aligned str_replace() for multi-byte text.
 *
 * Haystack and needle are both split into characters of the given charset,
 * and the needle is only matched on character boundaries. In double-byte
 * encodings this stops a match from starting on the trail byte of one
 * character and ending on the lead byte of the next. Matches are replaced
 * left to right and do not overlap.
 *
 * @param  string $needle   Text to search for.
 * @param  string $str      Replacement text.
 * @param  string $haystack Text to search in.
 * @param  string $charset  One of 'utf-8', 'gb2312', 'gbk', 'big5'
 *                          (case-insensitive, default 'utf-8').
 * @return string The haystack with every aligned occurrence replaced; the
 *                haystack itself when the needle is empty or longer than it.
 * @throws InvalidArgumentException When $charset is not supported.
 */
function str_replace_cn($needle, $str, $haystack, $charset = "utf-8"){
    // One "character" per charset. The big5 entry previously had a malformed
    // class ("\xa1-\xfe]" without its opening bracket), so trail bytes
    // 0xA1-0xFE were never recognised.
    $re = array(
        'utf-8'  => '[\x01-\x7f]|[\xc2-\xdf][\x80-\xbf]|[\xe0-\xef][\x80-\xbf]{2}|[\xf0-\xff][\x80-\xbf]{3}',
        'gb2312' => '[\x01-\x7f]|[\xb0-\xf7][\xa0-\xfe]',
        'gbk'    => '[\x01-\x7f]|[\x81-\xfe][\x40-\xfe]',
        'big5'   => '[\x01-\x7f]|[\x81-\xfe](?:[\x40-\x7e]|[\xa1-\xfe])',
    );

    $key = strtolower((string) $charset);

    if (!isset($re[$key])) {
        throw new InvalidArgumentException('Unsupported charset: ' . $charset);
    }

    // The trailing catch-all keeps any byte the charset pattern rejects as a
    // one-byte unit, so nothing is dropped when the pieces are re-joined.
    $pattern = '/' . $re[$key] . '|[\x00-\xff]/';

    preg_match_all($pattern, (string) $haystack, $found);
    $hay = $found[0];

    preg_match_all($pattern, (string) $needle, $found);
    $ndl = $found[0];

    $hayLen = count($hay);
    $ndlLen = count($ndl);

    // Nothing can match: empty needle, or needle longer than the haystack.
    if ($ndlLen === 0 || $ndlLen > $hayLen) {
        return $haystack;
    }

    $result = '';
    $i = 0;

    while ($i < $hayLen) {
        // Compare the first character cheaply before slicing, and never look
        // past the end of the haystack.
        if ($hay[$i] === $ndl[0]
            && $i + $ndlLen <= $hayLen
            && array_slice($hay, $i, $ndlLen) === $ndl
        ) {
            $result .= $str;
            $i += $ndlLen;
        } else {
            $result .= $hay[$i];
            $i++;
        }
    }

    return $result;
}

/**
 * Convert a string from one character encoding to another.
 *
 * Uses mb_convert_encoding() when available and iconv() otherwise. The
 * script is terminated with die() when neither extension is loaded.
 *
 * @param  string      $input           String to convert.
 * @param  string|null $_output_charset Target encoding; falls back to
 *                                      $_input_charset when null.
 * @param  string      $_input_charset  Encoding of $input.
 * @return mixed $input unchanged when it is empty/null or both charsets are
 *               the same (case-insensitively); otherwise the result of the
 *               conversion function.
 */
function charsetencode($input, $_output_charset, $_input_charset) {
    if (!isset($_output_charset)) {
        $_output_charset = $_input_charset;
    }

    // Nothing to convert. Charset names are compared case-insensitively so
    // that 'UTF-8' and 'utf-8' count as the same encoding.
    if ($input == null || strcasecmp((string) $_input_charset, (string) $_output_charset) === 0) {
        return $input;
    }

    if (function_exists("mb_convert_encoding")) {
        return mb_convert_encoding($input, $_output_charset, $_input_charset);
    }

    if (function_exists("iconv")) {
        return iconv($_input_charset, $_output_charset, $input);
    }

    die("sorry, you have no libs support for charset change.");
}

/**
 * Convert a string from $_input_charset to $_output_charset.
 *
 * Counterpart of charsetencode() with the two charset parameters in the
 * opposite order. Uses mb_convert_encoding() when available and iconv()
 * otherwise. The script is terminated with die() when neither extension is
 * loaded.
 *
 * NOTE(review): only the first and last statements of this function survived
 * in the source; the middle was rebuilt to mirror charsetencode() - confirm
 * against the original implementation.
 *
 * @param  string      $input           String to convert.
 * @param  string|null $_input_charset  Encoding of $input; falls back to
 *                                      $_output_charset when null.
 * @param  string      $_output_charset Target encoding.
 * @return mixed $input unchanged when it is empty/null or both charsets are
 *               the same (case-insensitively); otherwise the result of the
 *               conversion function.
 */
function charsetdecode($input, $_input_charset, $_output_charset) {
    // The earlier fallback assigned $_input_charset to itself, which did
    // nothing; a missing input charset now defaults to the output charset.
    if (!isset($_input_charset)) {
        $_input_charset = $_output_charset;
    }

    if ($input == null || strcasecmp((string) $_input_charset, (string) $_output_charset) === 0) {
        return $input;
    }

    if (function_exists("mb_convert_encoding")) {
        return mb_convert_encoding($input, $_output_charset, $_input_charset);
    }

    if (function_exists("iconv")) {
        return iconv($_input_charset, $_output_charset, $input);
    }

    die("sorry, you have no libs support for charset changes.");
}

sfds

php中文支援函數

繼續閱讀

Java String.format方法的簡單使用

neo4j之cypher使用文檔

GitHub連夜封殺！這份阿裡 10W 字内部 Java 字面試手冊到底有多強？

Cloud Studio初體驗

spark/scala關于【資源檔案】加載方法概述外部檔案加載方案測試資源檔案打包入jar包中小結

NOSQL安全攻擊

mybatis_入門程式Mybatis入門

AOP程式設計_Android優雅權限架構(1)概念基礎，2021金三銀四前言正文大綱正文

php 去掉字元串的最後一個字元及截取原字元串1,2,3,4,5,6,

Effective Java 8:通用程式設計

php——水印

OOM三種類型

工廠模式-三種類型

【遞歸】高效率求2的n次幂

win10本地scala和spark安裝安裝scala安裝spark

scala (3) Function 和 Method