In order to do the database Pinyin keyword search Think of the product name generation Pinyin as the key word into the database, so the Internet to collect information to complete a such thing
/**
* Chinese Pinyin Conversion class
* @author Julian.song
* Part of the code source with the Internet, the copyright belongs to the original author all
*/
Class pinyin{
Public Function __construct ()
{
}
/**
* Convert string to Pinyin
* @param $string ASCII code
* @param $charset Code
*/
Public Function Getpinyin ($string, $charset = ' gb2312 ')
{
$dataKey = "a|ai|an|ang|ao|ba|bai|ban|bang|bao|bei|ben|beng|bi|bian|biao|bie|bin|bing|bo|bu|ca|cai|can|cang|cao| Ce|ceng|cha ".
"|chai|chan|chang|chao|che|chen|cheng|chi|chong|chou|chu|chuai|chuan|chuang|chui|chun|chuo|ci|cong|cou|cu|".
"Cuan|cui|cun|cuo|da|dai|dan|dang|dao|de|deng|di|dian|diao|die|ding|diu|dong|dou|du|duan|dui|dun|duo|e|en|er".
"|fa|fan|fang|fei|fen|feng|fo|fou|fu|ga|gai|gan|gang|gao|ge|gei|gen|geng|gong|gou|gu|gua|guai|guan|guang|gui".
"|gun|guo|ha|hai|han|hang|hao|he|hei|hen|heng|hong|hou|hu|hua|huai|huan|huang|hui|hun|huo|ji|jia|jian|jiang".
"|jiao|jie|jin|jing|jiong|jiu|ju|juan|jue|jun|ka|kai|kan|kang|kao|ke|ken|keng|kong|kou|ku|kua|kuai|kuan|kuang" .
"|kui|kun|kuo|la|lai|lan|lang|lao|le|lei|leng|li|lia|lian|liang|liao|lie|lin|ling|liu|long|lou|lu|lv|luan|lue" .
"|lun|luo|ma|mai|man|mang|mao|me|mei|men|meng|mi|mian|miao|mie|min|ming|miu|mo|mou|mu|na|nai|nan|nang|nao|ne".
"|nei|nen|neng|ni|nian|niang|niao|nie|nin|ning|niu|nong|nu|nv|nuan|nue|nuo|o|ou|pa|pai|pan|pang|pao|pei|pen".
"|peng|pi|pian|piao|pie|pin|ping|po|pu|qi|qia|qian|qiang|qiao|qie|qin|qing|qiong|qiu|qu|quan|que|qun|ran|rang" .
"|rao|re|ren|reng|ri|rong|rou|ru|ruan|rui|run|ruo|sa|sai|san|sang|sao|se|sen|seng|sha|shai|shan|shang|shao|".
"She|shen|sheng|shi|shou|shu|shua|shuai|shuan|shuang|shui|shun|shuo|si|song|sou|su|suan|sui|sun|suo|ta|tai|".
"Tan|tang|tao|te|teng|ti|tian|tiao|tie|ting|tong|tou|tu|tuan|tui|tun|tuo|wa|wai|wan|wang|wei|wen|weng|wo|wu".
"|xi|xia|xian|xiang|xiao|xie|xin|xing|xiong|xiu|xu|xuan|xue|xun|ya|yan|yang|yao|ye|yi|yin|ying|yo|yong|you".
"|yu|yuan|yue|yun|za|zai|zan|zang|zao|ze|zei|zen|zeng|zha|zhai|zhan|zhang|zhao|zhe|zhen|zheng|zhi|zhong|".
"Zhou|zhu|zhua|zhuai|zhuan|zhuang|zhui|zhun|zhuo|zi|zong|zou|zu|zuan|zui|zun|zuo";
$dataValue = " -20319|-20317|-20304|-20295|-20292|-20283|-20265|-20257|-20242|-20230|-20051|-20036|-20032|-20026| -20002|-19990 ".
"|-19986|-19982|-19976|-19805|-19784|-19775|-19774|-19763|-19756|-19751|-19746|-19741|-19739|-19728|-19725".
"|-19715|-19540|-19531|-19525|-19515|-19500|-19484|-19479|-19467|-19289|-19288|-19281|-19275|-19270|-19263".
"|-19261|-19249|-19243|-19242|-19238|-19235|-19227|-19224|-19218|-19212|-19038|-19023|-19018|-19006|-19003".
"|-18996|-18977|-18961|-18952|-18783|-18774|-18773|-18763|-18756|-18741|-18735|-18731|-18722|-18710|-18697".
"|-18696|-18526|-18518|-18501|-18490|-18478|-18463|-18448|-18447|-18446|-18239|-18237|-18231|-18220|-18211".
"|-18201|-18184|-18183|-18181|-18012|-17997|-17988|-17970|-17964|-17961|-17950|-17947|-17931|-17928|-17922".
"|-17759|-17752|-17733|-17730|-17721|-17703|-17701|-17697|-17692|-17683|-17676|-17496|-17487|-17482|-17468".
"|-17454|-17433|-17427|-17417|-17202|-17185|-16983|-16970|-16942|-16915|-16733|-16708|-16706|-16689|-16664".
"|-16657|-16647|-16474|-16470|-16465|-16459|-16452|-16448|-16433|-16429|-16427|-16423|-16419|-16412|-16407".
"|-16403|-16401|-16393|-16220|-16216|-16212|-16205|-16202|-16187|-16180|-16171|-16169|-16158|-16155|-15959".
"|-15958|-15944|-15933|-15920|-15915|-15903|-15889|-15878|-15707|-15701|-15681|-15667|-15661|-15659|-15652".
"|-15640|-15631|-15625|-15454|-15448|-15436|-15435|-15419|-15416|-15408|-15394|-15385|-15377|-15375|-15369".
"|-15363|-15362|-15183|-15180|-15165|-15158|-15153|-15150|-15149|-15144|-15143|-15141|-15140|-15139|-15128".
"|-15121|-15119|-15117|-15110|-15109|-14941|-14937|-14933|-14930|-14929|-14928|-14926|-14922|-14921|-14914".
"|-14908|-14902|-14894|-14889|-14882|-14873|-14871|-14857|-14678|-14674|-14670|-14668|-14663|-14654|-14645".
"|-14630|-14594|-14429|-14407|-14399|-14384|-14379|-14368|-14355|-14353|-14345|-14170|-14159|-14151|-14149".
"|-14145|-14140|-14137|-14135|-14125|-14123|-14122|-14112|-14109|-14099|-14097|-14094|-14092|-14090|-14087".
"|-14083|-13917|-13914|-13910|-13907|-13906|-13905|-13896|-13894|-13878|-13870|-13859|-13847|-13831|-13658".
"|-13611|-13601|-13406|-13404|-13400|-13398|-13395|-13391|-13387|-13383|-13367|-13359|-13356|-13343|-13340".
"|-13329|-13326|-13318|-13147|-13138|-13120|-13107|-13096|-13095|-13091|-13076|-13068|-13063|-13060|-12888".
"|-12875|-12871|-12860|-12858|-12852|-12849|-12838|-12831|-12829|-12812|-12802|-12607|-12597|-12594|-12585".
"|-12556|-12359|-12346|-12320|-12300|-12120|-12099|-12089|-12074|-12067|-12058|-12039|-11867|-11861|-11847".
"|-11831|-11798|-11781|-11604|-11589|-11536|-11358|-11340|-11339|-11324|-11303|-11097|-11077|-11067|-11055".
"|-11052|-11045|-11041|-11038|-11024|-11020|-11019|-11018|-11014|-10838|-10832|-10815|-10800|-10790|-10780".
"|-10764|-10587|-10544|-10533|-10519|-10331|-10329|-10328|-10322|-10315|-10309|-10307|-10296|-10281|-10274".
"|-10270|-10262|-10260|-10256|-10254";
$tDataKey = Explode (' | ', $dataKey);
$tDataValue = Explode (' | ', $dataValue);
$data = (php_version>= ' 5.0 ')? Array_combine ($tDataKey, $tDataValue): $this->arraycombine ($tDataKey, $tDataValue);
Arsort ($data);
Reset ($data);
if ($charset! = ' gb2312 ') $string = $this->utf82gb2312 ($string);
$res = ";
for ($i =0; $i < p="">
{
$ASC = Ord (substr ($string, $i, 1));
if ($asc >160) {$q = Ord (substr ($string, + + $i, 1)), $ASC = $asc *256 + $q-65536;}
$res. = $this->asc2pinyin ($ASC, $data);
}
Return Preg_replace ("/[^a-z0-9]*/", ", $res);
}
/**
* Convert ASCII code to the corresponding pinyin
* @param $asc ASCII code
* @param $data ASCII code pinyin character comparison table
*/
Public Function Asc2pinyin ($ASC, $data)
{
if ($asc >0 && $asc <160) return Chr ($ASC);
ElseIf ($asc <-20319 | | $asc >-10247) return ";
else {
foreach ($data as $k = + $v) {if ($v <= $asc) break;}
return $k;
}
}
/**
* Converts the encoding of UFT8 characters to GB2312
* @param $char
*/
Public Function utf82gb2312 ($char)
{
$string = ";
if ($char < 0x80) $string. = $char;
ElseIf ($char < 0x800)
{
$string. = Chr (0xC0 | $char >>6);
$string. = Chr (0x80 | $char & 0x3F);
}elseif ($char < 0x10000) {
$string. = Chr (0xE0 | $char >>12);
$string. = Chr (0x80 | $char >>6 & 0x3F);
$string. = Chr (0x80 | $char & 0x3F);
} elseif ($char < 0x200000) {
$string. = Chr (0xF0 | $char >>18);
$string. = Chr (0x80 | $char >>12 & 0x3F);
$string. = Chr (0x80 | $char >>6 & 0x3F);
$string. = Chr (0x80 | $char & 0x3F);
}
Return Iconv (' UTF-8 ', ' Gb2312//ignore ', $string);
}
/**
* Compare arrays
* @param $arr 1 Array 1
* @param $arr 2 Array 2
*/
Public Function Arraycombine ($arr 1, $arr 2)
{
for ($i =0; $i
return $res;
}
/**
* Get pinyin initials of Chinese characters
* @param $str string
*/
Public Function getinitial ($STR, $charset) {
if ($charset = = "UTF-8") $str = $this->utf82gb2312 ($STR);
$ASC = Ord (substr ($str, 0, 1));
if ($asc < 160) {//Non-Chinese
if ($asc >= && $asc <= 57) {
return Chr ($ASC); Digital
} elseif ($asc >= && $ASC <= 90) {
return Chr ($ASC); A--z
} elseif ($asc >= && $asc <= 122) {
Return Chr ($ASC-32); A--z
} else {
Return '-'; Other
}
} else {//Chinese
$ASC = $ASC * + ord (substr ($STR, 1, 1));
Get Pinyin First Letter A--z
if ($asc >= 176161 && $asc < 176197) {
Return ' A ';
} elseif ($asc >= 176197 && $asc < 178193) {
Return ' B ';
} elseif ($asc >= 178193 && $asc < 180238) {
Return ' C ';
} elseif ($asc >= 180238 && $asc < 182234) {
Return ' D ';
} elseif ($asc >= 182234 && $asc < 183162) {
Return ' E ';
} elseif ($asc >= 183162 && $asc < 184193) {
Return ' F ';
} elseif ($asc >= 184193 && $asc < 185254) {
Return ' G ';
} elseif ($asc >= 185254 && $asc < 187247) {
Return ' H ';
} elseif ($asc >= 187247 && $asc < 191166) {
Return ' J ';
} elseif ($asc >= 191166 && $asc < 192172) {
Return ' K ';
} elseif ($asc >= 192172 && $asc < 194232) {
Return ' L ';
} elseif ($asc >= 194232 && $asc < 196195) {
Return ' M ';
} elseif ($asc >= 196195 && $asc < 197182) {
Return ' N ';
} elseif ($asc >= 197182 && $asc < 197190) {
Return ' O ';
} elseif ($asc >= 197190 && $asc < 198218) {
Return ' P ';
} elseif ($asc >= 198218 && $asc < 200187) {
Return ' Q ';
} elseif ($asc >= 200187 && $asc < 200246) {
Return ' R ';
} elseif ($asc >= 200246 && $asc < 203250) {
Return ' S ';
} elseif ($asc >= 203250 && $asc < 205218) {
Return ' T ';
} elseif ($asc >= 205218 && $asc < 206244) {
Return ' W ';
} elseif ($asc >= 206244 && $asc < 209185) {
Return ' X ';
} elseif ($asc >= 209185 && $asc < 212209) {
Return ' Y ';
} elseif ($asc >= 212209) {
Return ' Z ';
} else {
Return '-';
}
}
}
/**
* Splitting strings into arrays
* @param $str string
* @param $charset Code
*/
Public Function Mbstringtoarray ($STR, $charset) {
$strlen =mb_strlen ($STR);
while ($strlen) {
$array []=mb_substr ($str, 0,1, $charset);
$str =mb_substr ($str, 1, $strlen, $charset);
$strlen =mb_strlen ($STR);
}
return $array;
}
Public Function Getinitials ($STR, $charset) {
$initials = "";
foreach ($this->mbstringtoarray ($str, $charset) as $char) {
$initials. = $this->getinitial ($char, $charset);
}
return $initials;
}
}
This article is from the "Dabailiang" blog
http://www.bkjia.com/PHPjc/478599.html www.bkjia.com true http://www.bkjia.com/PHPjc/478599.html techarticle in order to do the database Pinyin keyword search Think of the product name generation Pinyin as the key word into the database, so the Internet to collect information to complete a such thing? php/** * Pinyin ...