China Naming Network - Ziwei Dou Shu - The problem of converting php Chinese into pinyin initials

The problem of converting php Chinese into pinyin initials

There was something wrong with the original code, and I made some changes. Github's original address is chenall/chenall/blob/master/PHP/tools/zh-cn _ to _ pinyin.php.

& lt? Server-side programming language (abbreviation of professional hypertext preprocessor)

/*

A simple PHP implementation method for converting Chinese characters into pinyin initials.

Requirements:? It can only be Chinese characters in GB23 12 code table.

Convert the pinyin initials corresponding to the character string to uppercase.

Usage:

Echo? Zh2py::conv ('Chinese? People's Republic of China (PRC) (China)'); //Chinese? ZHRMGHG

or

$py? =? New? zh2py

Echo? $ py-& gt; Conv ('Chinese? People's Republic of China (PRC) (China)'); //Chinese? ZHRMGHG

*/

Class? zh2py

{

//According to the Chinese character position table

//We can see that the area from 16-55 is sorted by pinyin letters, so we only need to judge the position code of a Chinese character to know its pinyin initials.

//The first part of the location table is arranged in alphabetical order.

// 16 -55

/*

A ' = & gt0xB0A 1,? B ' = & gt0xB0C5,? c ' = >; 0xB2C 1,? D ' = & gt0xB4EE,? E ' = & gt0xB6EA,? F ' = & gt0xB7A2,? g ' = >; 0xB8C 1,' H ' = & gt0xB9FE,

j ' = >; 0xBBF7,? K ' = & gt0xBFA6,? L ' = & gt0xC0AC,? m ' = >; 0xC2E8,? N ' = & gt0xC4C3,? O ' = & gt0xC5B6,? P ' = & gt0xC5BE,' Q ' = & gt0xC6DA,

R ' = & gt0xC8BB,? S ' = & gt0cx8f 6,? T ' = & gt0xCBFA,? W ' = & gt0xCDDA,? X ' = & gt0xCEF4,? Y ' = & gt0xD 1B9,? Z ' = & gt0xD4D 1

*/

Private? Static electricity $FirstTable? =? Array (

0xB0C5,? 0xB2C 1,? 0xB4EE,? 0xB6EA,? 0xB7A2,? 0xB8C 1,? 0xB9FE,? 0xBBF7,? 0xBFA6,? 0xC0AC,? 0xC2E8,

0xC4C3,? 0xC5B6,? 0xC5BE,? 0xC6DA,? 0xC8BB,? 0cx8f 6,? 0xCBFA,? 0xCDDA,? 0xCEF4,? 0xD 1B9,? 0xD4D 1,0xD7FA

);

Private? Static electricity $FirstLetter? =? ”abcdefghjklmnopqrstwyz”;

//The second part of the location table is irregular, and the letters below are the pinyin initials of the corresponding words in each area. It was compiled through online inquiry, and there may be some mistakes.

//Area 56-Area 87

Private? Static electricity $SecondTable? =? Array (

" cjwgnspgcgnegypbtyyzxykygtzjnmjqmbsgzscyjsyyfpgkbzgydywjkljswkpjqhyjwrdzlsymrypywwcckznkyyg ",

" ttngjeykkzytcjnmcylqlypysfqrpzslwbtgkjfyxjjjtxttsqzycdxxhgcbphffsstybbgmxlpbylbhlx ",

" smzmyjhsojnghdzqyklgjhsgqzhxqgkxzzwyscscjxyeyxadzpmdssmzjzqjyzcjjfwqjbdzbxgznzcphwxhqkmwfbpby ",

" dtjzzkxhylygxfptyjyzpszlfchmqshgmxxsxjyyqdcsbbqbefsjyhwgzkplqbgldlcdtnmayddkssngycsgxlyzaypn ",

" ptsdkdylhgymylcxpycjndqjwxqxxfyjlejpzrxccqwqqsbzkymgplbmjrqcflnymyqmsqyrbcjthzt qfrxqhxmqjcjly ",

" qgjmshzkbswyemylxfsydxwlycjqxsjnqbsctyhbftdcyzdjwyghqfrxwck qkxebptlpxjzsrmebwhjlbjslysmdxlcl ",

" qkxlhxjrzjmf qhxhwywsbhtrxxglhqhfnmgykldyxzpylggsmtcfbajjzyljtyanjgbjplqgszyqyaxbkysecjsznslyzh ",

" zxlzcghpxzhznytdsbcjkdlzayffydlebbgbqyzkxgldnyskjshdlyxbcghhxypkdjmmzngmmclgwzszjfznmlzzthcs ",

" ydbdllscddnlkjykjsycjlkwhqasdknhcsgaghdaashtcplcpqybszmplpcjoqlcdhjysprchnwjnllyyqyywzptczg ",

" wwmzffjqqqyxaclbhkdjxdgmydjxzllsygxkjrywzwyclzmssjzldbydcfcxyhlxchyzjqsqqamnyxpfrkssbjlyxy ",

" syglnscmhcwwmnzjjlxxhchysttxrycyxxbyhcsmxjsznpwgpxxtaybgajcxlyxdcwzocwkccsbnhcpdyznfcytyckx ",

" kybsqkkytqqxfcmhcykelzqbsqyjqcclmthsywhmktlkjlycxwheqqhtqkzpqscfymmdmgbwhwlgsllysdlmxpthmj ",

" hwljzyhzjxktxjlhxrswlwzjcb xmhzqxsdzpsgfcsglsxymjshxpjxwmyqksmyplrthbxftpmhyxlchlhzylxgsssstcl ",

" sldclrpbhzhxyyfhbmgdmycnqqwlqhjcywjzyejjdhpblqxtqkwhlchqxagtlxjxmsljhtzkzjecxjcjnfbycsfywyb ",

" jzgnysdzsqyrsljpclpwxsdwejbjcbnaytwgmpapclyqpclzxsbnmsggfnzjbzsfzyntxhplqkzzwalsbczjxsyzgwk ",

" ypsgxfzfcdkhjgxtlqfsdslqwzkxtmhsbgzmjzrglyjbpmmlmsxlzjqhzyjczydjwfmjkldpmjegxyhylxhlqyqhkycw ",

" cjmyxnatjhycccxzpcqlbzwwytwbqcmlpmyrjcccxfpznzzljplxxyztzlgdltcklyrzzzgqttjhhhjljaxfgjzslcfdqz ",

" lclgjdjzsnzljpjqdcclcjxmyzftsxgcgsbrzxjqctzhgyqtjqqlzjylbcyamcstylpdjbyregklzyzhlyszqlznw ",

" czcllwjqjjjkdgjzolbzppglightgzxyghzmycnqsycyhbgxkamtxyxnbskyzzgjzlqjtfcjxdygjqjpmgwgjjpkqsb ",

" gbmmcjssclpqpqpqdxcdyykypcjdyygywrhjrtgznyqldkljszzgzqzjgdykshpzmtlcpwnjyyzdjcnmwescyglbtzgmss ",

" llyxyxxbsjsbbsgghfjlypmzjnlyywdqshzxtyywhmcyywddbxbbtlmsyyyfsxjcbdxxlhjhfss xzqhfzmzzt qcxzxrtt ",

" djhnryzqqmtqdmgnydxmjgdxcdyzbffallztdltfxmxqzdngwqddbdczjdxbzgsqqdjcmbkzffxmkdmdsyyszcmljdsyn ",

" sprskmkmpcklgtbqtfzswtglypljzhgjjgypzltcsmcnbtjbbqfkdhbyzgkpbbymtdssxtbnpdkleycjnycdykztdhqh ",

" syzsctarrlltkzlgecllkjlqjaqnbdkghpjtzqksecshalqfmgjnlyjbtmlyzxdxjpldlpcqdhzycbzsczsbzmsljflkr ",

" zjsnfrgjhxpdhyjybzgdlqcsezgxlblgyxtwmabchemwyjyzljyhlgndjlslygkdzpzxjyyzlwcxszfgwyydlyhcljs ",

" cmbjhblyzlycblydpdqysxqzbytdkyxjyycnrjmpdjgklcljbctbdblczqrpyxjcjlzcshltoljnmddlngkathqh ",

" jhykheznmshrhqqjchgmfprxhjgdychglyrzqlcyqjymszswlcfqqxyfggyptqwlmcrnfkkfsyylqbmqamm ",

" myxctpshcptxxxzzsmphpshmclmldqfyqxszyjdjjzzhqpdszglstjbckxyqzjsgpsxqzqzrqtbdkyxzkhgflbcsmdldg ",

" dzdblzyycxnncsybzbglzxswmsccmqnjqsbdqsjtxxmbltxzclzcshzxrqjgjylxzfjphymzqqydfqjjlzznzcdgzyg ",

" ctxmzysctlkphtxhtlbjlxxscdqxcbbtjfqzfsltjbtkqbxjljcchczdbzjdzjdccprnpqcjpczlclzdmxmphjsgz ",

" gszzqlylwtjpfsyasmcjbzyycwmytzsjljcqlwzmalbxyfbpnlsfhtgjwejjxxglljstgshjqlzfkcgnnnszfdeqfhbs ",

" aqtgylbxmmygszldydqmjjrgbjttkgdhgkblqkbdmbylxwcxyttybkmrtjzxqjbhlhmjzmqasldcyxyqdlqcafywyxqhz ",

);

Public? Static electricity Function? Utf8_to_gbk($string)// transcoding must be converted into GB23 12 characters. The simple judgment here is not very accurate. You can write one yourself.

{

What if? (mb_check_encoding($string,' gb23 12 '))

Return? $ string

What if? (function_exists('iconv ')。

Return? iconv("utf-8 "," gb23 12//IGNORE ",$ string);

Return? mb_convert_encoding($string,' gb23 12 ',' utf-8 '); ?

}

Public? Static electricity Function? Conv (USD)

{

$str? =? self::utf8 _ to _ gbk($ str);

$len? =? strlen($ str);

$newStr? =? '';

for($ I = 0; ? $ i & lt$len? ; ? ++$i)

{

$H? =? order($ str[$ I]);

$L? =? order($ str[$ I+ 1]);

//Illegal character set

What if? ($H? & lt? 0xB0? ||? $L? & lt? 0xA 1? ||? $H? & gt? 0xF7? ||? $L? ==? 0xFF)

{

$newStr? . =? $ str[$ I];

Continue;

}

What if? ($H? & lt? 0xD8)//($H? & gt=? 0xB0? & amp& amp? $H? & lt=0xD7)// The query text is in the first-level Chinese character area (16-55).

{

$W? =? ($H? & lt& lt? 8)? |? $ L;

foreach(self::$FirstTable? As? $ key => USD value)

{

What if? ($W? & lt? Dollar value)

{

$newStr? . =? self::$ first letter[$ key];

Break;

}

}

}

else//? What if? (H? & gt=? 0xD8? & amp& amp? h? & lt=? 0xF7)// Query Chinese in the secondary Chinese character area (56-87)

$newStr? . =self::$SecondTable[$H? -? 0xd 8][$ L-0xa 1];

++ $ I;

}

Return? $ newStr

}

}

Echo? Zh2py:: conv ('Princess'); //F