zoukankan      html  css  js  c++  java
  • java pinyin4j

    pom:

    <dependency>
        <groupId>com.belerweb</groupId>
        <artifactId>pinyin4j</artifactId>
        <version>2.5.1</version>
    </dependency>

    demo:

        public static String getAllPinyin(String hanzi) {
            //输出格式设置
            HanyuPinyinOutputFormat format = new HanyuPinyinOutputFormat();
            /**
             * 输出大小写设置
             * LOWERCASE:输出小写
             * UPPERCASE:输出大写
             */
            format.setCaseType(HanyuPinyinCaseType.LOWERCASE);
    
            /**
             * 输出音标设置
             * WITH_TONE_MARK:直接用音标符(必须设置WITH_U_UNICODE,否则会抛出异常)
             * WITH_TONE_NUMBER:1-4数字表示音标
             * WITHOUT_TONE:没有音标
             */
            format.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
    
            /**
             * 特殊音标ü设置
             *
             * WITH_V:用v表示ü
             * WITH_U_AND_COLON:用"u:"表示ü
             * WITH_U_UNICODE:直接用ü
             */
            format.setVCharType(HanyuPinyinVCharType.WITH_U_UNICODE);
    
            char[] hanYuArr = hanzi.trim().toCharArray();
            StringBuilder pinYin = new StringBuilder();
    
            try {
                for (int i = 0, len = hanYuArr.length; i < len; i++) {
                    //匹配是否是汉字
                    if (Character.toString(hanYuArr[i]).matches("[\u4E00-\u9FA5]+")) {
                        //如果是多音字,返回多个拼音,这里只取第一个
                        String[] pys = PinyinHelper.toHanyuPinyinStringArray(hanYuArr[i], format);
                        pinYin.append(pys[0]).append(" ");
                    } else {
                        pinYin.append(hanYuArr[i]).append(" ");
                    }
                }
            } catch (BadHanyuPinyinOutputFormatCombination badHanyuPinyinOutputFormatCombination) {
                badHanyuPinyinOutputFormatCombination.printStackTrace();
            }
            return pinYin.toString();
        }
    
        public static String getFirstPinYin(String hanyu) {
            HanyuPinyinOutputFormat format = new HanyuPinyinOutputFormat();
            format.setCaseType(HanyuPinyinCaseType.UPPERCASE);
            format.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
    
            StringBuilder firstPinyin = new StringBuilder();
            char[] hanyuArr = hanyu.trim().toCharArray();
            try {
                for (int i = 0, len = hanyuArr.length; i < len; i++) {
                    if (Character.toString(hanyuArr[i]).matches("[\u4E00-\u9FA5]+")) {
                        String[] pys = PinyinHelper.toHanyuPinyinStringArray(hanyuArr[i], format);
                        firstPinyin.append(pys[0].charAt(0));
                    } else {
                        firstPinyin.append(hanyuArr[i]);
                    }
                }
            } catch (BadHanyuPinyinOutputFormatCombination badHanyuPinyinOutputFormatCombination) {
                badHanyuPinyinOutputFormatCombination.printStackTrace();
            }
            return firstPinyin.toString();
        }
  • 相关阅读:
    设备管理器里“SM总线控制器”、“其它PCI桥设备”驱动有问题
    MapReduce实现两表的Join--原理及python和java代码实现
    Calendar类经常用法 日期间的转换 set方法有巨坑
    Java 装饰模式(4.4)
    LoadRunner访问Mysql数据库(转)
    linux下定时执行任务的方法
    docker 常用命令
    Docker exec与Docker attach
    docker容器跨服务器的迁移方式export和save(转)
    cpu时间 / cpu利用率计算
  • 原文地址:https://www.cnblogs.com/dhName/p/14560471.html
Copyright © 2011-2022 走看看