The problem of converting php Chinese into pinyin initials
& lt? Server-side programming language (abbreviation of professional hypertext preprocessor)
/*
A simple PHP implementation method for converting Chinese characters into pinyin initials.
Requirements:? It can only be Chinese characters in GB23 12 code table.
Convert the pinyin initials corresponding to the character string to uppercase.
Usage:
Echo? Zh2py::conv ('Chinese? People's Republic of China (PRC) (China)'); //Chinese? ZHRMGHG
or
$py? =? New? zh2py
Echo? $ py-& gt; Conv ('Chinese? People's Republic of China (PRC) (China)'); //Chinese? ZHRMGHG
*/
Class? zh2py
{
//According to the Chinese character position table
//We can see that the area from 16-55 is sorted by pinyin letters, so we only need to judge the position code of a Chinese character to know its pinyin initials.
//The first part of the location table is arranged in alphabetical order.
// 16 -55
/*
A ' = & gt0xB0A 1,? B ' = & gt0xB0C5,? c ' = >; 0xB2C 1,? D ' = & gt0xB4EE,? E ' = & gt0xB6EA,? F ' = & gt0xB7A2,? g ' = >; 0xB8C 1,' H ' = & gt0xB9FE,
j ' = >; 0xBBF7,? K ' = & gt0xBFA6,? L ' = & gt0xC0AC,? m ' = >; 0xC2E8,? N ' = & gt0xC4C3,? O ' = & gt0xC5B6,? P ' = & gt0xC5BE,' Q ' = & gt0xC6DA,
R ' = & gt0xC8BB,? S ' = & gt0cx8f 6,? T ' = & gt0xCBFA,? W ' = & gt0xCDDA,? X ' = & gt0xCEF4,? Y ' = & gt0xD 1B9,? Z ' = & gt0xD4D 1
*/
Private? Static electricity $FirstTable? =? Array (
0xB0C5,? 0xB2C 1,? 0xB4EE,? 0xB6EA,? 0xB7A2,? 0xB8C 1,? 0xB9FE,? 0xBBF7,? 0xBFA6,? 0xC0AC,? 0xC2E8,
0xC4C3,? 0xC5B6,? 0xC5BE,? 0xC6DA,? 0xC8BB,? 0cx8f 6,? 0xCBFA,? 0xCDDA,? 0xCEF4,? 0xD 1B9,? 0xD4D 1,0xD7FA
);
Private? Static electricity $FirstLetter? =? ”abcdefghjklmnopqrstwyz”;
//The second part of the location table is irregular, and the letters below are the pinyin initials of the corresponding words in each area. It was compiled through online inquiry, and there may be some mistakes.
//Area 56-Area 87
Private? Static electricity $SecondTable? =? Array (
" cjwgnspgcgnegypbtyyzxykygtzjnmjqmbsgzscyjsyyfpgkbzgydywjkljswkpjqhyjwrdzlsymrypywwcckznkyyg ",
" ttngjeykkzytcjnmcylqlypysfqrpzslwbtgkjfyxjjjtxttsqzycdxxhgcbphffsstybbgmxlpbylbhlx ",
" smzmyjhsojnghdzqyklgjhsgqzhxqgkxzzwyscscjxyeyxadzpmdssmzjzqjyzcjjfwqjbdzbxgznzcphwxhqkmwfbpby ",
" dtjzzkxhylygxfptyjyzpszlfchmqshgmxxsxjyyqdcsbbqbefsjyhwgzkplqbgldlcdtnmayddkssngycsgxlyzaypn ",
" ptsdkdylhgymylcxpycjndqjwxqxxfyjlejpzrxccqwqqsbzkymgplbmjrqcflnymyqmsqyrbcjthzt qfrxqhxmqjcjly ",
" qgjmshzkbswyemylxfsydxwlycjqxsjnqbsctyhbftdcyzdjwyghqfrxwck qkxebptlpxjzsrmebwhjlbjslysmdxlcl ",
" qkxlhxjrzjmf qhxhwywsbhtrxxglhqhfnmgykldyxzpylggsmtcfbajjzyljtyanjgbjplqgszyqyaxbkysecjsznslyzh ",
" zxlzcghpxzhznytdsbcjkdlzayffydlebbgbqyzkxgldnyskjshdlyxbcghhxypkdjmmzngmmclgwzszjfznmlzzthcs ",
" ydbdllscddnlkjykjsycjlkwhqasdknhcsgaghdaashtcplcpqybszmplpcjoqlcdhjysprchnwjnllyyqyywzptczg ",
" wwmzffjqqqyxaclbhkdjxdgmydjxzllsygxkjrywzwyclzmssjzldbydcfcxyhlxchyzjqsqqamnyxpfrkssbjlyxy ",
" syglnscmhcwwmnzjjlxxhchysttxrycyxxbyhcsmxjsznpwgpxxtaybgajcxlyxdcwzocwkccsbnhcpdyznfcytyckx ",
" kybsqkkytqqxfcmhcykelzqbsqyjqcclmthsywhmktlkjlycxwheqqhtqkzpqscfymmdmgbwhwlgsllysdlmxpthmj ",
" hwljzyhzjxktxjlhxrswlwzjcb xmhzqxsdzpsgfcsglsxymjshxpjxwmyqksmyplrthbxftpmhyxlchlhzylxgsssstcl ",
" sldclrpbhzhxyyfhbmgdmycnqqwlqhjcywjzyejjdhpblqxtqkwhlchqxagtlxjxmsljhtzkzjecxjcjnfbycsfywyb ",
" jzgnysdzsqyrsljpclpwxsdwejbjcbnaytwgmpapclyqpclzxsbnmsggfnzjbzsfzyntxhplqkzzwalsbczjxsyzgwk ",
" ypsgxfzfcdkhjgxtlqfsdslqwzkxtmhsbgzmjzrglyjbpmmlmsxlzjqhzyjczydjwfmjkldpmjegxyhylxhlqyqhkycw ",
" cjmyxnatjhycccxzpcqlbzwwytwbqcmlpmyrjcccxfpznzzljplxxyztzlgdltcklyrzzzgqttjhhhjljaxfgjzslcfdqz ",
" lclgjdjzsnzljpjqdcclcjxmyzftsxgcgsbrzxjqctzhgyqtjqqlzjylbcyamcstylpdjbyregklzyzhlyszqlznw ",
" czcllwjqjjjkdgjzolbzppglightgzxyghzmycnqsycyhbgxkamtxyxnbskyzzgjzlqjtfcjxdygjqjpmgwgjjpkqsb ",
" gbmmcjssclpqpqpqdxcdyykypcjdyygywrhjrtgznyqldkljszzgzqzjgdykshpzmtlcpwnjyyzdjcnmwescyglbtzgmss ",
" llyxyxxbsjsbbsgghfjlypmzjnlyywdqshzxtyywhmcyywddbxbbtlmsyyyfsxjcbdxxlhjhfss xzqhfzmzzt qcxzxrtt ",
" djhnryzqqmtqdmgnydxmjgdxcdyzbffallztdltfxmxqzdngwqddbdczjdxbzgsqqdjcmbkzffxmkdmdsyyszcmljdsyn ",
" sprskmkmpcklgtbqtfzswtglypljzhgjjgypzltcsmcnbtjbbqfkdhbyzgkpbbymtdssxtbnpdkleycjnycdykztdhqh ",
" syzsctarrlltkzlgecllkjlqjaqnbdkghpjtzqksecshalqfmgjnlyjbtmlyzxdxjpldlpcqdhzycbzsczsbzmsljflkr ",
" zjsnfrgjhxpdhyjybzgdlqcsezgxlblgyxtwmabchemwyjyzljyhlgndjlslygkdzpzxjyyzlwcxszfgwyydlyhcljs ",
" cmbjhblyzlycblydpdqysxqzbytdkyxjyycnrjmpdjgklcljbctbdblczqrpyxjcjlzcshltoljnmddlngkathqh ",
" jhykheznmshrhqqjchgmfprxhjgdychglyrzqlcyqjymszswlcfqqxyfggyptqwlmcrnfkkfsyylqbmqamm ",
" myxctpshcptxxxzzsmphpshmclmldqfyqxszyjdjjzzhqpdszglstjbckxyqzjsgpsxqzqzrqtbdkyxzkhgflbcsmdldg ",
" dzdblzyycxnncsybzbglzxswmsccmqnjqsbdqsjtxxmbltxzclzcshzxrqjgjylxzfjphymzqqydfqjjlzznzcdgzyg ",
" ctxmzysctlkphtxhtlbjlxxscdqxcbbtjfqzfsltjbtkqbxjljcchczdbzjdzjdccprnpqcjpczlclzdmxmphjsgz ",
" gszzqlylwtjpfsyasmcjbzyycwmytzsjljcqlwzmalbxyfbpnlsfhtgjwejjxxglljstgshjqlzfkcgnnnszfdeqfhbs ",
" aqtgylbxmmygszldydqmjjrgbjttkgdhgkblqkbdmbylxwcxyttybkmrtjzxqjbhlhmjzmqasldcyxyqdlqcafywyxqhz ",
);
Public? Static electricity Function? Utf8_to_gbk($string)// transcoding must be converted into GB23 12 characters. The simple judgment here is not very accurate. You can write one yourself.
{
What if? (mb_check_encoding($string,' gb23 12 '))
Return? $ string
What if? (function_exists('iconv ')。
Return? iconv("utf-8 "," gb23 12//IGNORE ",$ string);
Return? mb_convert_encoding($string,' gb23 12 ',' utf-8 '); ?
}
Public? Static electricity Function? Conv (USD)
{
$str? =? self::utf8 _ to _ gbk($ str);
$len? =? strlen($ str);
$newStr? =? '';
for($ I = 0; ? $ i & lt$len? ; ? ++$i)
{
$H? =? order($ str[$ I]);
$L? =? order($ str[$ I+ 1]);
//Illegal character set
What if? ($H? & lt? 0xB0? ||? $L? & lt? 0xA 1? ||? $H? & gt? 0xF7? ||? $L? ==? 0xFF)
{
$newStr? . =? $ str[$ I];
Continue;
}
What if? ($H? & lt? 0xD8)//($H? & gt=? 0xB0? & amp& amp? $H? & lt=0xD7)// The query text is in the first-level Chinese character area (16-55).
{
$W? =? ($H? & lt& lt? 8)? |? $ L;
foreach(self::$FirstTable? As? $ key => USD value)
{
What if? ($W? & lt? Dollar value)
{
$newStr? . =? self::$ first letter[$ key];
Break;
}
}
}
else//? What if? (H? & gt=? 0xD8? & amp& amp? h? & lt=? 0xF7)// Query Chinese in the secondary Chinese character area (56-87)
$newStr? . =self::$SecondTable[$H? -? 0xd 8][$ L-0xa 1];
++ $ I;
}
Return? $ newStr
}
}
Echo? Zh2py:: conv ('Princess'); //F