The first letter of Chinese characters in php to pinyin. PHP obtains the first letter of pinyin.
After running the program, some characters in the string cannot be converted. If you enter these words separately, you can directly convert them to read the first letter of the alphabet.
It won't work in the string. The program code is as follows:
Function getfirstchar ($ s0 ){
$ Fchar = ord ($ s0 {0 });
If ($ fchar> = ord ("a") and $ fchar <= ord ("Z") return strtoupper ($ s0 {0 });
$ S1 = iconv ("UTF-8", "gb2312", $ s0 );
$ S2 = iconv ("gb2312", "UTF-8", $ s1 );
If ($ s2 = $ s0) {$ s = $ s1;} else {$ s = $ s0 ;}
$ Asc = ord ($ s {0}) * 256 + ord ($ s {1})-65536;
If ($ asc >=- 20319 and $ asc <=-20284) return "";
If ($ asc >=- 20283 and $ asc <=-19776) return "B ";
If ($ asc >=- 19775 and $ asc <=-19219) return "C ";
If ($ asc >=- 19218 and $ asc <=-18711) return "D ";
If ($ asc >=- 18710 and $ asc <=-18527) return "E ";
If ($ asc >=- 18526 and $ asc <=-18240) return "F ";
If ($ asc >=- 18239 and $ asc <=-17923) return "G ";
If ($ asc >=- 17922 and $ asc <=-17418) return "H ";
If ($ asc >=- 17417 and $ asc <=-16475) return "J ";
If ($ asc >=- 16474 and $ asc <=-16213) return "K ";
If ($ asc >=- 16212 and $ asc <=-15641) return "L ";
If ($ asc >=- 15640 and $ asc <=-15166) return "M ";
If ($ asc >=- 15165 and $ asc <=-14923) return "N ";
If ($ asc >=- 14922 and $ asc <=-14915) return "O ";
If ($ asc >=- 14914 and $ asc <=- 14631) return "P ";
If ($ asc >=- 14630 and $ asc <=-14150) return "Q ";
If ($ asc >=- 14149 and $ asc <=-14091) return "R ";
If ($ asc >=- 14090 and $ asc <=-13319) return "S ";
If ($ asc >=- 13318 and $ asc <=-12839) return "T ";
If ($ asc >=- 12838 and $ asc <=-12557) return "W ";
If ($ asc >=- 12556 and $ asc <=-11848) return "X ";
If ($ asc >=- 11847 and $ asc <=-11056) return "Y ";
If ($ asc >=- 11055 and $ asc <=- 10247) return "Z ";
Return null;
}
Function pinyin1 ($ zh ){
$ Ret = "";
$ S1 = iconv ("UTF-8", "gb2312", $ zh );
$ S2 = iconv ("gb2312", "UTF-8", $ s1 );
If ($ s2 = $ zh) {$ zh = $ s1 ;}
For ($ I = 0; $ I <strlen ($ zh); $ I ++ ){
$ S1 = substr ($ zh, $ I, 1 );
$ P = ord ($ s1 );
If ($ p & gt; 160 ){
$ S2 = substr ($ zh, $ I ++, 2 );
$ Ret. = getfirstchar ($ s2 );
} Else {
$ Ret. = $ s1;
}
}
Return $ ret;
}
Echo "Postal Road Primary School ";
Echo pinyin1 ('postal Road Primary School ');
?>
Output result: YZLX, Postal Road Primary School
Enter a small character separately. you can use getfirstchar ("small") to convert it successfully.
Reply to discussion (solution)
Your algorithm is only applicable to the gb2312 primary font library.
No need for study
Dictionary provided by qq
0x80) {$ c = $ str [$ I]. $ str [$ I + 1]; $ I ++; if (isset ($ pinyins [$ c]) {if (! $ Ishead AND $ ucfirst) {$ restr. = ucfirst ($ pinyins [$ c]);} elseif (! $ Ishead AND! $ Ucfirst) {$ restr. = '_'. $ pinyins [$ c];} else {$ restr. = $ pinyins [$ c] [0] ;}} else {$ restr. = "_" ;}} else if (preg_match ("/[a-z0-9]/", $ str [$ I]) {$ restr. = $ str [$ I];} else {$ restr. = "_" ;}} if ($ restr [0] ==' _ ') {return substr ($ restr, 1) ;}else {return $ restr ;}} /* End of file pinyin_helper.php * // * Location. /application/helpers/pinyin_helper.php */
Function Pinyin ($ _ String, $ _ Code = 'gb2312 ') {$ _ DataKey = "a | ai | an | ang | ao | ba | bai | ban | bang | bao | bei | ben | beng | bi | bian | biao | bie | bin | bing | bo | bu | ca | cai | can | cang | cao | ce | ceng | cha ". "| chai | chan | chang | chao | che | chen | cheng | chi | chong | chou | chu | chuai | chuan | chuang | chui | chun | chuo | ci | cong | cou | cu | ". "cuan | cui | cun | cuo | da | dai | dan | dang | dao | de | deng | di | dian | diao | die | ding | diu | dong | dou | du | duan | dui | dun | duo | e | en | er ". "| fa | fan | f Ang | fei | fen | feng | fo | fou | fu | ga | gai | gan | gang | gao | ge | gei | gen | geng | gong | gou | gu | gua | guai | guan | guang | gui ". "| gun | guo | ha | hai | han | hang | hao | he | hei | hen | heng | hong | hou | hu | hua | huai | huan | huang | hui | hun | huo | ji | jia | jian | jiang ". "| jiao | jie | jin | jing | jiong | jiu | ju | juan | jue | jun | ka | kai | kan | kang | kao | ke | ken | keng | kong | kou | ku | kua | kuai | kuan | kuang ". "| kui | kun | kuo | la | lai | lan | lang | lao | le | lei | leng | li | lia | lian | liang | liao | lie | lin | Ling | liu | long | lou | lu | lv | luan | lue ". "| lun | luo | ma | mai | man | mang | mao | me | mei | men | meng | mi | mian | miao | mie | min | ming | miu | mo | mou | mu | na | nai | nan | nang | nao | ne ". "| nei | nen | neng | ni | nian | niang | niao | nie | nin | ning | niu | nong | nu | nv | nuan | nue | nuo | o | ou | pa | pai | pan | pang | pao | pei | pen ". "| peng | pi | pian | piao | pie | pin | ping | po | pu | qi | qia | qian | qiang | qiao | qie | qin | qing | qiong | qiu | qu | quan | que | qun | ran | rang ". "| rao | re | ren | reng | ri | rong | rou | ru | Ruan | rui | run | ruo | sa | sai | san | sang | sao | se | sen | seng | sha | shai | shan | shang | shao | ". "she | shen | sheng | shi | shou | shu | shuai | shuan | shuang | shui | shun | shuo | si | song | sou | su | suan | sui | sun | suo | ta | tai | ". "tan | tang | tao | te | teng | ti | tian | tiao | tie | ting | tong | tou | tu | tuan | tui | tun | tuo | wa | wai | wan | wang | wei | wen | weng | wo | wu ". "| xi | xia | xian | xiang | xiao | xie | xin | xing | xiong | xiu | xu | xuan | xue | xun | ya | yan | yang | yao | ye | yi | yin | ying | yo | yong | You ". "| yu | yuan | yue | yun | za | zai | zan | zang | zao | ze | zei | zen | zeng | zha | zhai | zhan | zhang | zhao | zhe | zhen | zheng | zhi | zhong | ". "zhou | zhu | zhua | zhuai | zhuan | zhuang | zhui | zhun | zhuo | zi | zong | zou | zu | zuan | zui | zun | zuo "; $ _ DataValue = "-20319 |-20317 |-20304 |-20295 |-20292 |-20283 |-20265 |-20257 |-20242 |-20230 |-20051 |-20036 |-|-20032 |-20026 |-20002 |-19990 ". "|-19986 |-19982 |-19976 |-19805 |-19784 |-19775 |-19774 |-19763 |-19756 |-19751 |-1 9746 |-19741 |-19739 |-19728 |-19725 ". "|-19715 |-19540 |-19531 |-19525 |-19515 |-19500 |-19484 |-19479 |-19467 |-19289 |-19288 |-19281 |-19275 |-|-19270 |-19263 ". "|-19261 |-19249 |-19243 |-19242 |-19238 |-19235 |-19227 |-19224 |-19218 |-19212 |-19038 |-19023 |-19018 |-|-19006 |-19003 ". "|-18996 |-18977 |-18961 |-18952 |-18783 |-18774 |-18773 |-18763 |-18756 |-18741 |-18735 |-18731 |-18722 |-|-18710 |-18697 ". "|-18696 |-18526 |-18518 |-18501 |-18490 |- 18478 |-18463 |-18448 |-18447 |-18446 |-18239 |-18237 |-18231 |-18220 |-18211 ". "|-18201 |-18184 |-18183 |-18181 |-18012 |-17997 |-17988 |-17970 |-17964 |-17961 |-17950 |-17947 |-17931 |-|-17928 |-17922 ". "|-17759 |-17752 |-17733 |-17730 |-17721 |-17703 |-17701 |-17697 |-17692 |-17683 |-17676 |-17496 |-17487 |-|-17482 |-17468 ". "|-17454 |-17433 |-17427 |-17417 |-17202 |-17185 |-16983 |-16970 |-16942 |-16915 |-16733 |-16708 |-16706 |-|-16689 |-16664 ". "| -16657 |-16647 |-16474 |-16470 |-16465 |-16459 |-16452 |-16448 |-16433 |-16429 |-16427 |-16423 |-16419 |- 16412 |-16407 ". "|-16403 |-16401 |-16393 |-16220 |-16216 |-16212 |-16205 |-16202 |-16187 |-16180 |-16171 |-16169 |-16158 |-|-16155 |-15959 ". "|-15958 |-15944 |-15933 |-15920 |-15915 |-15903 |-15889 |-15878 |-15707 |-15701 |-15681 |-15667 |-15661 |-|-15659 |-15652 ". "|-15640 |-15631 |-15625 |-15454 |-15448 |-15436 |-15435 |-15419 |-15416 |-15408 |-15 394 |-15385 |-15377 |-15375 |-15369 ". "|-15363 |-15362 |-15183 |-15180 |-15165 |-15158 |-15153 |-15150 |-15149 |-15144 |-15143 |-15141 |-15140 |-|-15139 |-15128 ". "|-15121 |-15119 |-15117 |-15110 |-15109 |-14941 |-14937 |-14933 |-14930 |-14929 |-14928 |-14926 |-14922 |-|-14921 |-14914 ". "|-14908 |-14902 |-14894 |-14889 |-14882 |-14873 |-14871 |-14857 |-14678 |-14674 |-14670 |-14668 |-14663 |-|-14654 |-14645 ". "|-14630 |-14594 |-14429 |-14407 |-14399 |-1 4384 |-14379 |-14368 |-14355 |-14353 |-14345 |-14170 |-14159 |-14151 |-14149 ". "|-14145 |-14140 |-14137 |-14135 |-14125 |-14123 |-14122 |-14112 |-14109 |-14099 |-14097 |-14094 |-14092 |-|-14090 |-14087 ". "|-14083 |-13917 |-13914 |-13910 |-13907 |-13906 |-13905 |-13896 |-13894 |-13878 |-13870 |-13859 |-13847 |-|-13831 |-13658 ". "|-13611 |-13601 |-13406 |-13404 |-13400 |-13398 |-13395 |-13391 |-13387 |-13383 |-13367 |-13359 |-13356 |-|-13343 |-13340 ". "|- 13329 |-13326 |-13318 |-13147 |-13138 |-13120 |-13107 |-13096 |-13095 |-13091 |-13076 |-13068 |-13063 |-13060 |-|-12888 ". "|-12875 |-12871 |-12860 |-12858 |-12852 |-12849 |-12838 |-12831 |-12829 |-12812 |-12802 |-12607 |-12597 |-|-12594 |-12585 ". "|-12556 |-12359 |-12346 |-12320 |-12300 |-12120 |-12099 |-12089 |-12074 |-12067 |-12058 |-12039 |-11867 |-|-11861 |-11847 ". "|-11831 |-11798 |-11781 |-11604 |-11589 |-11536 |-11358 |-11340 |-11339 |-11324 |-113 |- 03 |-11097 |-11077 |-11067 |-11055 ". "|-11052 |-11045 |-11041 |-11038 |-11024 |-11020 |-11019 |-11018 |-11014 |-10838 |-10832 |-10815 |-10800 |-|-10790 |-10780 ". "|-10764 |-10587 |-10544 |-10533 |-10519 |-10331 |-10329 |-10328 |-10322 |-10315 |-10309 |-10307 |-10296 |-|-10281 |-10274 ". "|-10270 |-10262 |-10260 |-10256 |-10254"; $ _ TDataKey = explode ('|', $ _ DataKey ); $ _ TDataValue = explode ('|', $ _ DataValue); $ _ Data = (php_VERSION> = '5. 0 ')? Array_combine ($ _ TDataKey, $ _ TDataValue): _ Array_Combine ($ _ TDataKey, $ _ TDataValue); arsort ($ _ Data); reset ($ _ Data ); if ($ _ Code! = 'Gb2312') $ _ String = _ U2_Utf8_Gb ($ _ String); $ _ Res = ''; for ($ I = 0; $ I
160) {$ _ Q = ord (substr ($ _ String, ++ $ I, 1 )); $ _ P = $ _ P * 256 + $ _ Q-65536;} $ _ Res. = _ Pinyin ($ _ P, $ _ Data);} return preg_replace ("/[^ a-z0-9] */", '', $ _ Res );} function _ Pinyin ($ _ Num, $ _ Data) {if ($ _ Num> 0 & $ _ Num <160) return chr ($ _ Num ); elseif ($ _ Num <-20319 | $ _ Num>-10247) return ''; else {foreach ($ _ Data as $ k => $ v) {if ($ v <= $ _ Num) break;} return $ k;} function _ U2_Utf8_Gb ($ _ C) {$ _ String = ''; if ($ _ C <0x80) $ _ String. = $ _ C; elseif ($ _ C <0x800) {$ _ String. = chr (0xC0 | $ _ C> 6); $ _ String. = chr (0x80 | $ _ C & 0x3F);} elseif ($ _ C <0x10000) {$ _ String. = chr (0xE0 | $ _ C> 12); $ _ String. = chr (0x80 | $ _ C> 6 & 0x3F); $ _ String. = chr (0x80 | $ _ C & 0x3F);} elseif ($ _ C <0x200000) {$ _ String. = chr (0xF0 | $ _ C> 18); $ _ String. = chr (0x80 | $ _ C> 12 & 0x3F); $ _ String. = chr (0x80 | $ _ C> 6 & 0x3F); $ _ String. = chr (0x80 | $ _ C & 0x3F);} return iconv ('utf-8', 'gb2312 ', $ _ String );} function _ Array_Combine ($ _ Arr1, $ _ Arr2) {for ($ I = 0; $ I
Thank you. Try Me
Dictionary provided by qq
Where can I find a dictionary... Can I change the bat address in the source code?
Pinyin. dat search
Http://www.baidu.com? Wd = pinyin. dat & ie = UTF-8