Home >Backend Development >PHP Tutorial >php-Chinese pinyin initial letter tool class, php-Chinese character tool class_PHP tutorial

php-Chinese pinyin initial letter tool class, php-Chinese character tool class_PHP tutorial

WBOY
WBOYOriginal
2016-07-13 10:12:00874browse

php-Chinese pinyin initial letter tool class, php-Chinese character tool class

<?<span>php


</span><span>/*</span><span>*
* 汉字拼音首字母工具类
*  注: 英文的字串:不变返回(包括数字)    eg .abc123 => abc123
*      中文字符串:返回拼音首字符        eg. 测试字符串 => CSZFC
*      中英混合串: 返回拼音首字符和英文   eg. 我i我j => WIWJ
*  eg.
*  $py = new str2PY();
*  
*  $result = $py->getInitials('周杰伦');
*
*  //获取首字母
*  $result = $py->getFirstString('abc');  //A
*  $resutl = $py->getFirstString("周杰伦"); //Z
*
</span><span>*/</span>

<span>class</span><span> str2py
{

    </span><span>private</span> <span>$_pinyins</span> = <span>array</span><span>(
        </span>176161 => 'A',
        176197 => 'B',
        178193 => 'C',
        180238 => 'D',
        182234 => 'E',
        183162 => 'F',
        184193 => 'G',
        185254 => 'H',
        187247 => 'J',
        191166 => 'K',
        192172 => 'L',
        194232 => 'M',
        196195 => 'N',
        197182 => 'O',
        197190 => 'P',
        198218 => 'Q',
        200187 => 'R',
        200246 => 'S',
        203250 => 'T',
        205218 => 'W',
        206244 => 'X',
        209185 => 'Y',
        212209 => 'Z',<span>
    );
    </span><span>private</span> <span>$_charset</span> = <span>null</span><span>;

    </span><span>/*</span><span>*
     * 构造函数, 指定需要的编码 default: utf-8
     * 支持utf-8, gb2312
     *
     * @param unknown_type $charset
     </span><span>*/</span>
    <span>public</span> <span>function</span> __construct(<span>$charset</span> = 'utf-8'<span>)
    {
        </span><span>$this</span>->_charset = <span>$charset</span><span>;
    }

    </span><span>/*</span><span>*
     * 中文字符串 substr
     *
     * @param string $str
     * @param int    $start
     * @param int    $len
     * @return string
     </span><span>*/</span>
    <span>private</span> <span>function</span> _msubstr(<span>$str</span>, <span>$start</span>, <span>$len</span><span>)
    {
        </span><span>$start</span> = <span>$start</span> * 2<span>;
        </span><span>$len</span> = <span>$len</span> * 2<span>;
        </span><span>$strlen</span> = <span>strlen</span>(<span>$str</span><span>);
        </span><span>$result</span> = ''<span>;
        </span><span>for</span> (<span>$i</span> = 0; <span>$i</span> < <span>$strlen</span>; <span>$i</span>++<span>)
        {
            </span><span>if</span> (<span>$i</span> >= <span>$start</span> && <span>$i</span> < (<span>$start</span> + <span>$len</span><span>))
            {
                </span><span>if</span> (<span>ord</span>(<span>substr</span>(<span>$str</span>, <span>$i</span>, 1)) > 129<span>)
                {
                    </span><span>$result</span> .= <span>substr</span>(<span>$str</span>, <span>$i</span>, 2<span>);
                }
                </span><span>else</span><span>
                {
                    </span><span>$result</span> .= <span>substr</span>(<span>$str</span>, <span>$i</span>, 1<span>);
                }
            }
            </span><span>if</span> (<span>ord</span>(<span>substr</span>(<span>$str</span>, <span>$i</span>, 1)) > 129<span>)
            {
                </span><span>$i</span>++<span>;
            }
        }
        </span><span>return</span> <span>$result</span><span>;
    }

    </span><span>/*</span><span>*
     * 字符串切分为数组 (汉字或者一个字符为单位)
     *
     * @param string $str
     * @return array
     </span><span>*/</span>
    <span>private</span> <span>function</span> _cutWord(<span>$str</span><span>)
    {
        </span><span>$words</span> = <span>array</span><span>();
        </span><span>while</span> (<span>$str</span> != ""<span>)
        {
            </span><span>if</span> (<span>$this</span>->_isAscii(<span>$str</span><span>))
            {</span><span>/*</span><span> 非中文 </span><span>*/</span>
                <span>$words</span>[] = <span>$str</span>[0<span>];
                </span><span>$str</span> = <span>substr</span>(<span>$str</span>, <span>strlen</span>(<span>$str</span>[0<span>]));
            }
            </span><span>else</span><span>
            {
                </span><span>$word</span> = <span>$this</span>->_msubstr(<span>$str</span>, 0, 1<span>);
                </span><span>$words</span>[] = <span>$word</span><span>;
                </span><span>$str</span> = <span>substr</span>(<span>$str</span>, <span>strlen</span>(<span>$word</span><span>));
            }
        }
        </span><span>return</span> <span>$words</span><span>;
    }

    </span><span>/*</span><span>*
     * 判断字符是否是ascii字符
     *
     * @param string $char
     * @return bool
     </span><span>*/</span>
    <span>private</span> <span>function</span> _isAscii(<span>$char</span><span>)
    {
        </span><span>return</span> ( <span>ord</span>(<span>substr</span>(<span>$char</span>, 0, 1)) < 160<span> );
    }

    </span><span>/*</span><span>*
     * 判断字符串前3个字符是否是ascii字符
     *
     * @param string $str
     * @return bool
     </span><span>*/</span>
    <span>private</span> <span>function</span> _isAsciis(<span>$str</span><span>)
    {
        </span><span>$len</span> = <span>strlen</span>(<span>$str</span>) >= 3 ? 3 : 2<span>;
        </span><span>$chars</span> = <span>array</span><span>();
        </span><span>for</span> (<span>$i</span> = 1; <span>$i</span> < <span>$len</span> - 1; <span>$i</span>++<span>)
        {
            </span><span>$chars</span>[] = <span>$this</span>->_isAscii(<span>$str</span>[<span>$i</span>]) ? 'yes' : 'no'<span>;
        }
        </span><span>$result</span> = <span>array_count_values</span>(<span>$chars</span><span>);
        </span><span>if</span> (<span>empty</span>(<span>$result</span>['no'<span>]))
        {
            </span><span>return</span> <span>true</span><span>;
        }
        </span><span>return</span> <span>false</span><span>;
    }

    </span><span>/*</span><span>*
     * 获取中文字串的拼音首字符
     *
     * @param string $str
     * @return string
     </span><span>*/</span>
    <span>public</span> <span>function</span> getInitials(<span>$str</span><span>)
    {
        </span><span>if</span> (<span>empty</span>(<span>$str</span><span>))
            </span><span>return</span> ''<span>;
        </span><span>if</span> (<span>$this</span>->_isAscii(<span>$str</span>[0]) && <span>$this</span>->_isAsciis(<span>$str</span><span>))
        {
            </span><span>return</span> <span>$str</span><span>;
        }
        </span><span>$result</span> = <span>array</span><span>();
        </span><span>if</span> (<span>$this</span>->_charset == 'utf-8'<span>)
        {
            </span><span>$str</span> = <span>iconv</span>('utf-8', 'gb2312', <span>$str</span><span>);
        }
        </span><span>$words</span> = <span>$this</span>->_cutWord(<span>$str</span><span>);
        </span><span>foreach</span> (<span>$words</span> <span>as</span> <span>$word</span><span>)
        {
            </span><span>if</span> (<span>$this</span>->_isAscii(<span>$word</span><span>))
            {</span><span>/*</span><span> 非中文 </span><span>*/</span>
                <span>$result</span>[] = <span>$word</span><span>;
                </span><span>continue</span><span>;
            }
            </span><span>$code</span> = <span>ord</span>(<span>substr</span>(<span>$word</span>, 0, 1)) * 1000 + <span>ord</span>(<span>substr</span>(<span>$word</span>, 1, 1<span>));
            </span><span>/*</span><span> 获取拼音首字母A--Z </span><span>*/</span>
            <span>if</span> ((<span>$i</span> = <span>$this</span>->_search(<span>$code</span>)) != -1<span>)
            {
                </span><span>$result</span>[] = <span>$this</span>->_pinyins[<span>$i</span><span>];
            }
        }
        </span><span>return</span> <span>strtoupper</span>(<span>implode</span>('', <span>$result</span><span>));
    }

    </span><span>/*</span><span>*
     *  20140624 wangtianbao 获取首字母
     *  @param string $str
     *  @return string
     </span><span>*/</span>
    <span>public</span> <span>function</span> getFirstString(<span>$str</span><span>)
    {
        </span><span>//</span><span>先把中文转换成字母</span>
        <span>$new_string</span> = <span>$this</span>->getInitials(<span>$str</span><span>);

        </span><span>if</span> (<span>empty</span>(<span>$new_string</span><span>))
        {
            </span><span>return</span> ''<span>;
        }
        </span><span>else</span><span>
        {
            </span><span>return</span> <span>strtoupper</span>(<span>substr</span>(<span>$new_string</span>, 0, 1<span>));
        }
    }

    </span><span>private</span> <span>function</span> _getChar(<span>$ascii</span><span>)
    {
        </span><span>if</span> (<span>$ascii</span> >= 48 && <span>$ascii</span> <= 57<span>)
        {
            </span><span>return</span> <span>chr</span>(<span>$ascii</span>);  <span>/*</span><span> 数字 </span><span>*/</span><span>
        }
        </span><span>elseif</span> (<span>$ascii</span> >= 65 && <span>$ascii</span> <= 90<span>)
        {
            </span><span>return</span> <span>chr</span>(<span>$ascii</span>);   <span>/*</span><span> A--Z </span><span>*/</span><span>
        }
        </span><span>elseif</span> (<span>$ascii</span> >= 97 && <span>$ascii</span> <= 122<span>)
        {
            </span><span>return</span> <span>chr</span>(<span>$ascii</span> - 32); <span>/*</span><span> a--z </span><span>*/</span><span>
        }
        </span><span>else</span><span>
        {
            </span><span>return</span> '-'; <span>/*</span><span> 其他 </span><span>*/</span><span>
        }
    }

    </span><span>/*</span><span>*
     * 查找需要的汉字内码(gb2312) 对应的拼音字符( 二分法 )
     *
     * @param int $code
     * @return int
     </span><span>*/</span>
    <span>private</span> <span>function</span> _search(<span>$code</span><span>)
    {
        </span><span>$data</span> = <span>array_keys</span>(<span>$this</span>-><span>_pinyins);
        </span><span>$lower</span> = 0<span>;
        </span><span>$upper</span> = <span>sizeof</span>(<span>$data</span>) - 1<span>;
        </span><span>$middle</span> = (int) <span>round</span>((<span>$lower</span> + <span>$upper</span>) / 2<span>);
        </span><span>if</span> (<span>$code</span> < <span>$data</span>[0<span>])
            </span><span>return</span> -1<span>;
        </span><span>for</span><span> (;;)
        {
            </span><span>if</span> (<span>$lower</span> > <span>$upper</span><span>)
            {
                </span><span>return</span> <span>$data</span>[<span>$lower</span> - 1<span>];
            }
            </span><span>$tmp</span> = (int) <span>round</span>((<span>$lower</span> + <span>$upper</span>) / 2<span>);
            </span><span>if</span> (!<span>isset</span>(<span>$data</span>[<span>$tmp</span><span>]))
            {
                </span><span>return</span> <span>$data</span>[<span>$middle</span><span>];
            }
            </span><span>else</span><span>
            {
                </span><span>$middle</span> = <span>$tmp</span><span>;
            }
            </span><span>if</span> (<span>$data</span>[<span>$middle</span>] < <span>$code</span><span>)
            {
                </span><span>$lower</span> = (int) <span>$middle</span> + 1<span>;
            }
            </span><span>else</span> <span>if</span> (<span>$data</span>[<span>$middle</span>] == <span>$code</span><span>)
            {
                </span><span>return</span> <span>$data</span>[<span>$middle</span><span>];
            }
            </span><span>else</span><span>
            {
                </span><span>$upper</span> = (int) <span>$middle</span> - 1<span>;
            }
        }
    }

}</span>

www.bkjia.comtruehttp: //www.bkjia.com/PHPjc/925549.htmlTechArticlephp-the first letter of Chinese pinyin tool class, php-the first letter of Chinese character pinyin? php /* ** the first letter of Chinese pinyin Tool class* Note: English strings: returned unchanged (including numbers) eg .abc123 = abc123* Chinese characters...
Statement:
The content of this article is voluntarily contributed by netizens, and the copyright belongs to the original author. This site does not assume corresponding legal responsibility. If you find any content suspected of plagiarism or infringement, please contact admin@php.cn