java 将中文数字转为阿拉伯数字

由于项目需求要将中文数字转为阿拉伯数字,找了一些博客有些不满足需求。于是参考了一些博客完成以下代码

import java.math.BigDecimal;
import java.util.Objects;

/**
 * 
 * @author Andy
 * @since 2023-04-23 18:45
 */
public class CNToNumber {

    /**
     * 中文数字
     */
    private static char[] cnArr_a = new char [] {'零','一','二','三','四','五','六','七','八','九'};
    private static char[] cnArr_A = new char [] {'零','壹','贰','叁','肆','伍','陆','柒','捌','玖'};
    private static final String allChineseNum = "零一二三四五六七八九壹贰叁肆伍陆柒捌玖十拾百佰千仟万萬亿";

    /**
     * 中文单位
     */
    private static char[] unit_a = new char [] {'亿','万','千','百','十'};
    private static char[] unit_A = new char [] {'亿','萬','仟','佰','拾'};
    private static final String allChineseUnit = "十拾百佰千仟万萬亿";

    /**
     * 将汉字中的数字转换为阿拉伯数字
     * (例如:三万叁仟零肆拾伍亿零贰佰萬柒仟陆佰零伍)
     *
     * @param chineseNum;
     * @return long
     */
    public static BigDecimal chineseNumToArabicNum(String chineseNum) {
        try {
            // 最终返回的结果
            BigDecimal result = new BigDecimal(0);

            if (chineseNum == null || chineseNum.trim().length() == 0) {
                return result;
            }

            char firstUnit = chineseNum.charAt(0);
            char lastUnit = chineseNum.charAt(chineseNum.length() - 1);

            Boolean appendUnit = true;
            long lastUnitNum = 1;
            if (isCnUnit(firstUnit) && chineseNum.length() > 1) {
                // 两位数
                long firstNum = chnNameValue[chnUnitToValue(String.valueOf(firstUnit))].value;
                if (!isCnUnit(lastUnit) && chineseNum.length() == 2) {
                    long number = chnStringToNumber(String.valueOf(lastUnit));
                    result = result.add(BigDecimal.valueOf(firstNum).add(BigDecimal.valueOf(number)));
                    return result;
                } else if (isCnUnit(lastUnit)) {
                    ChnNameValue chnValue = chnNameValue[chnUnitToValue(String.valueOf(lastUnit))];
                    if (firstNum == 10 && chnValue.secUnit) {
                        chineseNum = "一" + chineseNum;
                    } else {
                        throw new NumberFormatException("中文数字异常");
                    }
                }
            }

            if (isCnUnit(lastUnit)) {
                chineseNum = chineseNum.substring(0, chineseNum.length() - 1);
                lastUnitNum = chnNameValue[chnUnitToValue(String.valueOf(lastUnit))].value;
                appendUnit = chnNameValue[chnUnitToValue(String.valueOf(lastUnit))].secUnit;
            }else if (chineseNum.length() == 1) {
                // 如果长度为1时
                int num = strToNum(chineseNum);
                if (num != -1) {
                    return BigDecimal.valueOf(num);
                } else {
                    return null;
                }
            }

            // 将小写中文数字转为大写中文数字
            for (int i = 0; i < cnArr_a.length; i++) {
                chineseNum = chineseNum.replaceAll(String.valueOf(cnArr_a[i]), String.valueOf(cnArr_A[i]));
            }
            // 将小写单位转为大写单位
            for (int i = 0; i < unit_a.length; i++) {
                chineseNum = chineseNum.replaceAll(String.valueOf(unit_a[i]), String.valueOf(unit_A[i]));
            }

            for (int i = 0; i < unit_A.length; i++) {
                if (chineseNum.trim().length() == 0) {
                    break;
                }
                String unitUpperCase = String.valueOf(unit_A[i]);
                String str = null;
                if (chineseNum.contains(unitUpperCase)) {
                    str = chineseNum.substring(0, chineseNum.lastIndexOf(unitUpperCase) + 1);
                }
                if (str != null && str.trim().length() > 0) {
                    // 下次循环截取的基础字符串
                    chineseNum = chineseNum.replaceAll(str, "");
                    // 单位基础值
                    long unitNum = chnNameValue[chnUnitToValue(unitUpperCase)].value;
                    String temp = str.substring(0, str.length() - 1);
                    long number = chnStringToNumber(temp);
                    result = result.add(BigDecimal.valueOf(number).multiply(BigDecimal.valueOf(unitNum)));
                }
                // 最后一次循环,被传入的数字没有处理完并且没有单位的个位数处理
                if (i + 1 == unit_a.length && !"".equals(chineseNum)) {
                    long number = chnStringToNumber(chineseNum);
                    if (!appendUnit) {
                        number = BigDecimal.valueOf(number).multiply(BigDecimal.valueOf(lastUnitNum)).longValue();
                    }
                    result = result.add(BigDecimal.valueOf(number));
                }
            }
            // 加上单位
            if (appendUnit && lastUnitNum > 1) {
                result = result.multiply(BigDecimal.valueOf(lastUnitNum));
            } else if (lastUnitNum > 0) {
                if (result.compareTo(BigDecimal.ZERO) == BigDecimal.ZERO.intValue()) {
                    result = BigDecimal.ONE;
                    result = result.multiply(BigDecimal.valueOf(lastUnitNum));
                }
            }
            return result;
        } catch (Exception e) {
            e.printStackTrace();
            return null;
        }
    }

    /**
     * 返回中文数字汉字所对应的阿拉伯数字,若str不为中文数字,则返回-1
     *
     * @param string;
     * @return int
     */
    private static int strToNum(String string){
        for(int i = 0;i<cnArr_a.length;i++){
            if (Objects.equals(string,String.valueOf(cnArr_a[i])) || Objects.equals(string,String.valueOf(cnArr_A[i]))){
                return i;
            }
        }
        return -1;
    }

    /**
     * 判断传入的字符串是否全是汉字数字和单位
     *
     * @param chineseStr;
     * @return boolean
     */
    public static boolean isCnNumAll(String chineseStr){
        if (isBlank(chineseStr)){
            return true;
        }
        char [] charArray = chineseStr.toCharArray();
        for(char c : charArray){
            if (!allChineseNum.contains(String.valueOf(c))) {
                return false;
            }
        }
        return true;
    }

    /**
     * 判断字符串是空的
     *
     * @param cs
     * @return
     */
    public static boolean isBlank(CharSequence cs) {
        int strLen;
        if (cs != null && (strLen = cs.length()) != 0) {
            for (int i = 0; i < strLen; ++i) {
                if (!Character.isWhitespace(cs.charAt(i))) {
                    return false;
                }
            }
            return true;
        } else {
            return true;
        }
    }

    /**
     * 判断传入的字符是否是汉字数字和单位
     *
     * @param chineseChar;
     * @return boolean
     */
    public static boolean isCnNum(char chineseChar) {
        if (!allChineseNum.contains(String.valueOf(chineseChar))) {
            return false;
        }else{
            return true;
        }
    }

    /**
     * 判断是否是中文单位
     *
     * @param unitStr;
     * @return boolean
     */
    public static boolean isCnUnit(char unitStr) {
        if (!allChineseUnit.contains(String.valueOf(unitStr))) {
            return false;
        }else{
            return true;
        }
    }

    /**
     * 中文转换成阿拉伯数字,中文字符串除了包括0-9的中文汉字,还包括十,百,千,万等权位。
     * 此处是完成对这些权位的类型定义。
     * name是指这些权位的汉字字符串。
     * value是指权位多对应的数值的大小。诸如:十对应的值的大小为10,百对应为100等
     * secUnit若为true,代表该权位为节权位,即万,亿,万亿等
     */
    public static class ChnNameValue{
        String name;
        long value;
        Boolean secUnit;
        ChnNameValue(String name,long value,Boolean secUnit){
            this.name=name;
            this.value=value;
            this.secUnit=secUnit;
        }
    }

    static ChnNameValue chnNameValue[] = {
            new ChnNameValue("十",10,false),
            new ChnNameValue("拾",10,false),
            new ChnNameValue("百",100,false),
            new ChnNameValue("佰",100,false),
            new ChnNameValue("千",1000,false),
            new ChnNameValue("仟",1000,false),
            new ChnNameValue("万",10000,true),
            new ChnNameValue("萬",10000,true),
            new ChnNameValue("亿",100000000,true)
    };

    /**
     * 返回中文汉字权位在chnNameValue数组中所对应的索引号,若不为中文汉字权位,则返回-1
     *
     * @param str;
     * @return int
     */
    private static int chnUnitToValue(String str){
        for(int i=0;i<chnNameValue.length;i++){
            if(str.equals(chnNameValue[i].name)){
                return i;
            }
        }
        return -1;
    }

    /**
     * 返回中文数字字符串所对应的int类型的阿拉伯数字
     * (千亿/12位数)
     *
     * @param str;
     * @return long
     */
    private static long chnStringToNumber(String str){
        long returnNumber=0;
        long section=0;
        int index=0;
        long number=0;
        while (index<str.length()){
            // 从左向右依次获取对应中文数字,取不到返回-1
            int num = strToNum(str.substring(index,index+1));
            //若num>=0,代表该位置(pos),所对应的是数字不是权位。若小于0,则表示为权位
            if(num >= 0){
                number = num;
                index++;
                //pos是最后一位,直接将number加入到section中。
                if(index>=str.length()){
                    section += number;
                    returnNumber += section;
                    break;
                }
            }else{
                int chnNameValueIndex=chnUnitToValue(str.substring(index,index+1));

                if (chnNameValueIndex == -1) {
                    // 字符串存在除 数字和单位 以外的中文
                    throw new NumberFormatException("字符串存在除 <数字和单位> 以外的中文");
                }

                //chnNameValue[chnNameValueIndex].secUnit==true,表示该位置所对应的权位是节权位,
                if(chnNameValue[chnNameValueIndex].secUnit){
                    section = (section + number) * chnNameValue[chnNameValueIndex].value;
                    returnNumber += section;
                    section=0;
                }else{
                    section += number*chnNameValue[chnNameValueIndex].value;
                }
                index++;
                number=0;
                if(index>=str.length()){
                    returnNumber += section;
                    break;
                }
            }
        }
        return returnNumber;
    }

    public static void main(String[] args) {
        String str = "三万叁仟零肆拾伍亿零贰佰萬柒仟陆佰零伍万";
        String str1 = "三万叁仟零肆拾伍亿零贰佰萬柒仟陆佰零伍";
        String str2 = "三万叁仟零肆拾伍亿零柒仟陆佰零伍";
        String str3 = "三仟零肆十万";
        String str4 = "三万三千";
        String str5 = "三万零四十";
        String str6 = "三万叁仟零肆拾伍亿";
        String str7 = "十";
        String str8 = "十五";
        String str9 = "十万";
        String str10 = "十一万";
        String str11 = "九十一万";
        String str12 = "十亿";
        String str13 = "十五亿";
        String str14 = "一百";
        String str15 = "一百零一";
        String str16 = "一千";
        String str17 = "一千零一";
        String str18 = "一千零一十";
        String str19 = "零";
        String str20 = "一";
        String str21 = "贰";
        String str22 = "万";
        String str23 = "空";
        String str24 = "空万";
        String str25 = "百万";

        System.out.println();
        System.out.println(">>> " + str + " : " + chineseNumToArabicNum(str));
        System.out.println(">>> " + str1 + " : " + chineseNumToArabicNum(str1));
        System.out.println(">>> " + str2 + " : " + chineseNumToArabicNum(str2));
        System.out.println(">>> " + str3 + " : " + chineseNumToArabicNum(str3));
        System.out.println(">>> " + str4 + " : " + chineseNumToArabicNum(str4));
        System.out.println(">>> " + str5 + " : " + chineseNumToArabicNum(str5));
        System.out.println(">>> " + str6 + " : " + chineseNumToArabicNum(str6));
        System.out.println(">>> " + str7 + " : " + chineseNumToArabicNum(str7));
        System.out.println(">>> " + str8 + " : " + chineseNumToArabicNum(str8));
        System.out.println(">>> " + str9 + " : " + chineseNumToArabicNum(str9));
        System.out.println(">>> " + str10 + " : " + chineseNumToArabicNum(str10));
        System.out.println(">>> " + str11 + " : " + chineseNumToArabicNum(str11));
        System.out.println(">>> " + str12 + " : " + chineseNumToArabicNum(str12));
        System.out.println(">>> " + str13 + " : " + chineseNumToArabicNum(str13));
        System.out.println(">>> " + str14 + " : " + chineseNumToArabicNum(str14));
        System.out.println(">>> " + str15 + " : " + chineseNumToArabicNum(str15));
        System.out.println(">>> " + str16 + " : " + chineseNumToArabicNum(str16));
        System.out.println(">>> " + str17 + " : " + chineseNumToArabicNum(str17));
        System.out.println(">>> " + str18 + " : " + chineseNumToArabicNum(str18));
        System.out.println(">>> " + str19 + " : " + chineseNumToArabicNum(str19));
        System.out.println(">>> " + str20 + " : " + chineseNumToArabicNum(str20));
        System.out.println(">>> " + str21 + " : " + chineseNumToArabicNum(str21));
        System.out.println(">>> " + str22 + " : " + chineseNumToArabicNum(str22));
        System.out.println(">>> " + str23 + " : " + chineseNumToArabicNum(str23));
        System.out.println(">>> " + str24 + " : " + chineseNumToArabicNum(str24));
        System.out.println(">>> " + str25 + " : " + chineseNumToArabicNum(str25));
        System.out.println();

    }

}

运行结果

java将中文转换为GBK java将中文转换为数字_java

写的不好,还望包涵
希望对各位有所帮助
如有缺漏,还望个位大神指出