Class for converting Chinese characters to PinYin (C #):
//// <Summary> <br/> // convert Chinese characters to PinYin <br/> /// </Summary> <br/> public class chs2py <br/ >{< br/> Private Static int [] pyvalue = new int [] {-20319, -20317,-20304,-20295,-20292,-20283,-20265,-20257,-20242,-20230,-20051,-20036,-20032,-20026, <br/>-20002,-19990,-19986,-19982,-19976,-19805,-19784,-19775,-19774,-19763,-19756,-19751, -19746,-19741,-19739,-19728, <br/>-19725,-19715,-19540,-19531,-19525,-19515,-19500, -19479,-19467,-19289,-19288,-19281,-19275,-19270,-19263, <br/>-19261,-19249,-19243,-19242, -19238,-19235,-19227,-19224,-19218,-19212,-19038,-19023,-19018,-19006,-19003,-18996, <br/>-18977,-18961,-18952,-18783,-18774,-18773,-18763,-18756,-18741,-18735,-18731,-18722, -18710,-18697,-18696,-18526, <br/>-18518,-18501,-18490,-18478,-18463,-18448,-18447, -18239,-18237,-18231,-18220,-18211,-18201,-18184,-18183, <br/>-18181,-18012,-17997,-17988, -17970,-17964,-17961,-17950,-17947,-17931,-17928,-17922,-17759,-17752,-17733,-17730, <br/>-17721,-17703,-17701,-17697,-17692,-17683,-17676,-17496,-17487,-17482,-17468,-17454, -17433,-17427,-17417,-17202, <br/>-17185,-16983,-16970,-16942,-16915,-16733,-16708, -16689,-16664,-16657,-16647,-16474,-16470,-16465,-16459, <br/>-16452,-16448,-16433,-16429, -16427,-16423,-16419,-16412,-16407,-16403,-16401,-16393,-16220,-16216,-16212,-16205, <br/>-16202,-16187,-16180,-16171,-16169,-16158,-16155,-15959,-15958,-15944,-15933,-15920, -15915,-15903,-15889,-15878, <br/>-15707,-15701,-15681,-15667,-15661,-15659,-15652, -15631,-15625,-15454,-15448,-15436,-15435,-15419,-15416, <br/>-15408,-15394,-15385,-15377, -15375,-15369,-15363,-15362,-15183,-15180,-15165,-15158,-15153,-15150,-15149,-15144, <br/>-15143,-15141,-15140,-15139,-15128,-15121,-15119,-15117,-15110,-15109,-14941,-14937, -14933,-14930,-14929,-14928, <br/>-14926,-14922,-14921,-14914,-14908,-14902,-14894, -14882,-14873,-14871,-14857,-14678,-14674,-14670,-14668, <br/>-14663,-14654,-14645,-14630, -14594,-14429,-14407,-14399,-14384,-14379,-14368,-14355,-14353,-14345,-14170,-14159, <br/>-14151,-14149,-14145,-14140,-14137,-14135,-14125,-14123,-14122,-14112,-14109,-14099, -14097,-14094,-14092,-14090, <br/>-14087,-14083,-13917,-13914,-13910,-13907,-13906, -13896,-13894,-13878,-13870,-13859,-13847,-13831,-13658, <br/>-13611,-13601,-13406,-13404, -13400,-13398,-13395,-13391,-13387,-13383,-13367,-13359,-13356,-13343,-13340,-13329, <br/>-13326,-13318,-13147,-13138,-13120,-13107,-13096,-13095,-13091,-13076,-13068,-13063, -13060,-12888,-12875,-12871, <br/>-12860,-12858,-12852,-12849,-12838,-12831,-12829, -12802,-12607,-12597,-12594,-12585,-12556,-12359,-12346, <br/>-12320,-12300,-12120,-12099, -12089,-12074,-12067,-12058,-12039,-11867,-11861,-11847,-11831,-11798,-11781,-11604, <br/>-11589,-11536,-11358,-11340,-11339,-11324,-11303,-11097,-11077,-11067,-11055,-11052, -11045,-11041,-11038,-11024, <br/>-11020,-11019,-11018,-11014,-10838,-10832,-10815, -10790,-10780,-10764,-10587,-10544,-10533,-10519,-10331, <br/>-10329,-10328,-10322,-10315, -10309,-10307,-10296,-10281,-10274,-10270,-10262,-10260,-10256,-10254 }; <br/> Private Static string [] pystr = new string [] {"A", "AI", "an", "Ang", "Ao", "ba ", "bai", "ban", "bang", "Bao", "Bei", "Ben", "Beng", "bi", "Bian", "Biao ", <br/> "bie", "bin", "bing", "Bo", "bu", "ca", "Cai", "can", "Cang ", "Cao", "CE", "Ceng", "cha", "chai", "Chan", "Chang", "Chao", "Che", "Chen ", <br/> "Cheng", "Chi", "Chong", "Chou", "chu", "Chuai", "Chuan", "Chuang", "Chui ", "Chun", "Chuo", "Ci", "Cong", "cou", "Cu", "Cuan", "Cui", <br/> "cun ", "CuO", "da", "Dai", "Dan", "Dang", "Dao", "de", "Deng", "Di", "Dian ", "Diao", "die", "ding", "Diu", "Dong", "dou", "Du", "Duan", <br/> "DUI ", "Dun", "duo", "E", "en", "er", "Fa", "fan", "fang", "fei", "Fen ", "Feng", "FO", "fou", "Fu", "Ga", "Gai", "Gan", "Gang", "Gao ", <br/> "Ge", "gei", "gen", "Geng", "Gong", "gou", "Gu", "Gua", "Guai ", "Guan", "Guang", "Gui", "gun", "Guo", "ha", "Hai", "Han", "hang ", <br/> "hao", "he", "Hei", "Hu", "Heng", "Hong", "Hou", "Hu", "Hua ", "Huai", "Huan", "Huang", "Hui", "hun", "Huo", "Ji", "Jia", "jian ", <br/> "Jiang", "Jiao", "Jie", "Jin", "jing", "jiong", "Jiu", "Ju", "Juan ", "Jue", "Jun", "ka", "Kai", "kan", "Kang", "kao", "Ke", "Ken ", <br/> "Keng", "Kong", "Kou", "ku", "Kua", "Kuai", "Kuan", "Kuang", "Kui ", "Kun", "Kuo", "La", "Lai", "Lan", "Lang", "Lao", "Le", "lei ", <br/> "leng", "Li", "Lia", "Lian", "Liang", "liao", "lie", "Lin", "Ling ", "Liu", "long", "Lou", "Lu", "LV", "Luan", "Lue", "Lun", "Luo ", <br/> "Ma", "Mai", "man", "mang", "Mao", "me", "Mei", "men", "Meng ", "Mi", "Mian", "Miao", "Mie", "min", "Ming", "Miu", "Mo", "MOU", "Mu ", <br/> "Na", "Nai", "Nan", "Nang", "Nao", "ne", "Nei", "Nen", "Neng ", "Ni", "Nian", "Niang", "niao", "Nie", "Nin", "Ning", "niu", "Nong ", <br/> "Nu", "NV", "Nuan", "nue", "nuo", "O", "ou", "Pa", "Pai ", "pan", "Pang", "pao", "Pei", "pen", "peng", "Pi", "pian", "Piao", "pie ", <br/> "pin", "ping", "po", "Pu", "Qi", "QIA", "Qian", "Qiang", "Qiao ", "Qie", "Qin", "Qing", "Qiong", "Qiu", "Qu", "Quan", "que", "Qun ", <br/> "ran", "rang", "Rao", "re", "Ren", "reng", "Ri", "rong", "Rou ", "Ru", "Ruan", "Rui", "run", "RuO", "sa", "sai", "San", "sang ", <br/> "Sao", "se", "Sen", "Seng", "Sha", "Shai", "Shan", "Shang", "shao ", "She", "shen", "Sheng", "Shi", "Shou", "Shu", "Shua", <br/> "Shuai", "Shuan ", "Shuang", "Shui", "Shun", "Shuo", "Si", "Song", "Sou", "Su", "Suan", "Sui ", "Sun", "Suo", "ta", "Tai", <br/> "Tan", "Tang", "Tao", "te", "Teng ", "ti", "Tian", "tiao", "Tie", "ting", "tong", "TOU", "tu", "tuan", "Tui ", "tun", "Tuo", <br/> "wa", "Wai", "Wan", "Wang", "wei", "Wen", "Weng ", "wo", "Wu", "Xi", "xia", "Xian", "Xiang", "Xiao", "xie", "Xin", "Xing ", <br/> "Xiong", "Xiu", "Xu", "Xuan", "Xue", "Xun", "ya", "Yan", "Yang ", "Yao", "Ye", "Yi", "Yin", "ying", "yo", "Yong", "you", <br/> "yu ", "Yuan", "Yue", "Yun", "za", "Zai", "Zan", "Zang", "Zao", "ze", "Zei ", "Zen", "Zeng", "Zha", "Zhai", "Zhan", "Zhang", <br/> "Zhao", "zhe", "Zhen ", "zheng", "Zhi", "Zhong", "Zhou", "zhu", "zhua", "zhuai", "Zhuan", "Zhuang", "Zhui ", "Zhun", "Zhuo", <br/> "zi", "Zong", "zou", "Zu", "Zuan", "Zui", "Zun ", "Zuo" };< br/> Public chs2py () <br/>{< br/> // <br/> // todo: add the constructor logic here <br/> // <br/>}< br/> Public static string convert (string chrstr) <br/>{< br/> byte [] array = new byte [2]; <br/> string returnstr = ""; <br/> int chrasc = 0; <br/> int I1 = 0; <br/> int I2 = 0; <br/> char [] nowchar = chrstr. tochararray (); <br/> for (Int J = 0; j <nowchar. length; j ++) <br/>{< br/> array = system. text. encoding. default. getbytes (nowchar [J]. tostring (); <br/> I1 = (short) (array [0]); <br/> I2 = (short) (array [1]); <br/> chrasc = I1 * 256 + I2-65536; <br/> If (chrasc> 0 & chrasc <160) <br/>{< br/> returnstr + = nowchar [J]; <br/>}< br/> else <br/> {<br/> for (INT I = (pyvalue. length-1); I >=0; I --) <br/>{< br/> If (pyvalue [I] <= chrasc) <br/>{< br/> returnstr + = pystr [I]; <br/> break; <br/>}< br/> return returnstr; <br/>}< br/>}
To obtain the first letter of a Chinese character:
/// <Summary> <br/> // obtain the letter prefix of a Chinese character <br/> /// </Summary> <br/> // <Param name = "HZ"> Chinese characters </param> <br/> // <returns> first Chinese Character </returns> <br/> Public String chinesechartopinyin (string Hz) // obtain the location code of Chinese characters <br/>{< br/> byte [] Sarr = system. text. encoding. default. getbytes (HZ); <br/> int Len = Sarr. length; <br/> If (LEN> 1) <br/>{< br/> byte [] array = new byte [2]; <br/> array = system. text. encoding. default. getbytes (HZ); </P> <p> int I1 = (short) (array [0]-'/0'); <br/> int I2 = (short) (array [1]-'/0'); </P> <p> // Chinese character code in Unicode decoding mode <br/> // array = system. text. encoding. unicode. getbytes (HZ); </P> <p> int TMP = I1 * 256 + I2; <br/> string getpychar = "*"; // If the pinyin Code cannot be found, use the * complement </P> <p> If (TMP> = 45217 & TMP <= 45252) {getpychar = "";} <br/> else if (TMP> = 45253 & TMP <= 45760) {getpychar = "B ";} <br/> else if (TMP> = 45761 & TMP <= 46317) {getpychar = "C ";} <br/> else if (TMP> = 46318 & TMP <= 46825) {getpychar = "D ";} <br/> else if (TMP> = 46826 & TMP <= 47009) {getpychar = "e ";} <br/> else if (TMP> = 47010 & TMP <= 47296) {getpychar = "F ";} <br/> else if (TMP> = 47297 & TMP <= 47613) {getpychar = "G ";} <br/> else if (TMP> = 47614 & TMP <= 48118) {getpychar = "H ";} <br/> else if (TMP> = 48119 & TMP <= 49061) {getpychar = "J ";} <br/> else if (TMP> = 49062 & TMP <= 49323) {getpychar = "K ";} <br/> else if (TMP> = 49324 & TMP <= 49895) {getpychar = "L ";} <br/> else if (TMP> = 49896 & TMP <= 50370) {getpychar = "M ";} <br/> else if (TMP> = 50371 & TMP <= 50613) {getpychar = "N ";} <br/> else if (TMP> = 50614 & TMP <= 50621) {getpychar = "O ";} <br/> else if (TMP> = 50622 & TMP <= 50905) {getpychar = "p ";} <br/> else if (TMP> = 50906 & TMP <= 51386) {getpychar = "Q ";} <br/> else if (TMP> = 51387 & TMP <= 51445) {getpychar = "R ";} <br/> else if (TMP> = 51446 & TMP <= 52217) {getpychar = "S ";} <br/> else if (TMP> = 52218 & TMP <= 52697) {getpychar = "T ";} <br/> else if (TMP> = 52698 & TMP <= 52979) {getpychar = "W ";} <br/> else if (TMP> = 52980 & TMP <= 53640) {getpychar = "X ";} <br/> else if (TMP> = 53689 & TMP <= 54480) {getpychar = "Y ";} <br/> else if (TMP >=54481 & TMP <= 55289) {getpychar = "Z" ;}< br/> return getpychar; <br/>}< br/> else <br/>{< br/> return Hz; <br/>}< br/>}
Copyright Notice
This article is an original work. Please respect the work achievements of the author. Reprinting must maintain the integrity of the article, and the original author "tingsking18" and the main site address must be indicated in the form of a hyperlink, so that other friends can ask and correct.