1. 程式人生 > 其它 >PHP獲取漢字首字母並分組排序

PHP獲取漢字首字母並分組排序

<?php

class Character
{
    /**
     * 二維陣列根據首字母分組排序
     * @param array  $data      二維陣列
     * @param string $targetKey 首字母的鍵名
     * @return array             根據首字母關聯的二維陣列
     */
    public function groupByInitials(array $data, $targetKey = 'name')
    {
        $data = array_map(function ($item) use ($targetKey) {
            return array_merge($item, [
                'initials' => $this->getInitials($item[$targetKey]),
            ]);
        }, $data);
        $data = $this->sortInitials($data);
        return $data;
    }

    /**
     * 按字母排序
     * @param array $data
     * @return array
     */
    public function sortInitials(array $data)
    {
        $sortData = [];
        foreach ($data as $key => $value) {
            $sortData[$value['initials']][] = $value;
        }
        ksort($sortData);
        return $sortData;
    }

    /**
     * 獲取首字母
     * @param string $str 漢字字串
     * @return string 首字母
     */
    public function getInitials($str)
    {
        if (empty($str)) {
            return '';
        }
        $fchar = ord($str{0});
        if ($fchar >= ord('A') && $fchar <= ord('z')) {
            return strtoupper($str{0});
        }
        $s1 = iconv('UTF-8', 'gb2312', $str);
        $s2 = iconv('gb2312', 'UTF-8', $s1);
        $s = $s2 == $str ? $s1 : $str;
        $asc = ord($s{0}) * 256 + ord($s{1}) - 65536;
        if ($asc >= -20319 && $asc <= -20284) {
            return 'A';
        }
        if ($asc >= -20283 && $asc <= -19776) {
            return 'B';
        }
        if ($asc >= -19775 && $asc <= -19219) {
            return 'C';
        }
        if ($asc >= -19218 && $asc <= -18711) {
            return 'D';
        }
        if ($asc >= -18710 && $asc <= -18527) {
            return 'E';
        }
        if ($asc >= -18526 && $asc <= -18240) {
            return 'F';
        }
        if ($asc >= -18239 && $asc <= -17923) {
            return 'G';
        }
        if ($asc >= -17922 && $asc <= -17418) {
            return 'H';
        }
        if ($asc >= -17417 && $asc <= -16475) {
            return 'J';
        }
        if ($asc >= -16474 && $asc <= -16213) {
            return 'K';
        }
        if ($asc >= -16212 && $asc <= -15641) {
            return 'L';
        }
        if ($asc >= -15640 && $asc <= -15166) {
            return 'M';
        }
        if ($asc >= -15165 && $asc <= -14923) {
            return 'N';
        }
        if ($asc >= -14922 && $asc <= -14915) {
            return 'O';
        }
        if ($asc >= -14914 && $asc <= -14631) {
            return 'P';
        }
        if ($asc >= -14630 && $asc <= -14150) {
            return 'Q';
        }
        if ($asc >= -14149 && $asc <= -14091) {
            return 'R';
        }
        if ($asc >= -14090 && $asc <= -13319) {
            return 'S';
        }
        if ($asc >= -13318 && $asc <= -12839) {
            return 'T';
        }
        if ($asc >= -12838 && $asc <= -12557) {
            return 'W';
        }
        if ($asc >= -12556 && $asc <= -11848) {
            return 'X';
        }
        if ($asc >= -11847 && $asc <= -11056) {
            return 'Y';
        }
        if ($asc >= -11055 && $asc <= -10247) {
            return 'Z';
        }
        return null;
    }
}

//用法示例
// 按首字母排序
$data = [
    ['id' => 1, 'area_name' => '山東'],
    ['id' => 1, 'area_name' => '江蘇'],
    ['id' => 1, 'area_name' => '安徽'],
    ['id' => 1, 'area_name' => '福建'],
    ['id' => 1, 'area_name' => '江西'],
    ['id' => 1, 'area_name' => '廣東'],
    ['id' => 1, 'area_name' => '廣西'],
    ['id' => 1, 'area_name' => '海南'],
    ['id' => 1, 'area_name' => '河南'],
    ['id' => 1, 'area_name' => '湖南'],
    ['id' => 1, 'area_name' => '湖北'],
];
$data = (new Character)->groupByInitials($data, 'area_name');
//輸出結果
$data = array(
    'A' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '安徽',
            'initials'  => 'A'
        )
    ),
    'F' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '福建',
            'initials'  => 'F'
        )
    ),
    'G' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '廣東',
            'initials'  => 'G'
        ),
        1 => array(
            'id'        => 1,
            'area_name' => '廣西',
            'initials'  => 'G'
        )
    ),
    'H' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '海南',
            'initials'  => 'H'
        ),
        1 => array(
            'id'        => 1,
            'area_name' => '河南',
            'initials'  => 'H'
        ),
        2 => array(
            'id'        => 1,
            'area_name' => '湖南',
            'initials'  => 'H'
        ),
        3 => array(
            'id'        => 1,
            'area_name' => '湖北',
            'initials'  => 'H'
        )
    ),
    'J' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '江蘇',
            'initials'  => 'J'
        ),
        1 => array(
            'id'        => 1,
            'area_name' => '江西',
            'initials'  => 'J'
        )
    ),
    'S' => array(
        0 => array(
            'id'        => 1,
            'area_name' => '山東',
            'initials'  => 'S'
        )
    )
);