rep1/python37/Lib/site-packages/cn2an/an2cn.py

193 lines
7.7 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

from decimal import Decimal, InvalidOperation
from typing import Union

from proces import preprocess

from . import utils
class An2Cn(object):
    """Convert Arabic numerals (``str``, ``int`` or ``float``) to Chinese numerals.

    Numeral and unit tables are read from ``utils.get_default_conf()`` using
    the keys ``number_{low,up}_an2cn`` and ``unit_{low,up}_order_an2cn``.
    """

    def __init__(self) -> None:
        self.conf = utils.get_default_conf()
        # Characters accepted as digits by the input validation.
        self.all_num = "0123456789"
        self.number_low = self.conf["number_low_an2cn"]
        self.number_up = self.conf["number_up_an2cn"]
        self.mode_list = ["low", "up", "rmb", "direct"]

    def an2cn(self, inputs: Union[str, int, float] = None, mode: str = "low") -> str:
        """Convert an Arabic number to Chinese numerals.

        :param inputs: the Arabic number, as a string or a Python number
        :param mode: ``low`` lower-case numerals, ``up`` upper-case (formal)
            numerals, ``rmb`` formal RMB amount, ``direct`` digit-by-digit
        :return: the Chinese numeral text
        :raises ValueError: if ``inputs`` is empty, ``mode`` is unsupported,
            ``inputs`` contains characters other than digits, ``.`` and ``-``,
            or ``inputs`` is not a well-formed number
        """
        if inputs is None or inputs == "":
            raise ValueError("输入数据为空!")
        if mode not in self.mode_list:
            raise ValueError(f"mode 仅支持 {str(self.mode_list)} ")

        # Numbers are turned into text first. Python normalises them while
        # doing so: 1. -> 1.0, 1.00 -> 1.0, -0 -> 0
        if not isinstance(inputs, str):
            inputs = self.__number_to_string(inputs)

        # Pre-processing:
        # 1. traditional Chinese -> simplified Chinese
        # 2. full-width characters -> half-width characters
        inputs = preprocess(inputs, pipelines=[
            "traditional_to_simplified",
            "full_angle_to_half_angle"
        ])

        # Reject anything that is not a digit, "." or "-".
        self.__check_inputs_is_valid(inputs)

        # Peel off the sign; it is re-attached as a word in front of the result.
        sign = ""
        if inputs[0] == "-":
            sign = "负"
            inputs = inputs[1:]

        if mode == "direct":
            return sign + self.__direct_convert(inputs)

        # Split into integer and fractional parts. A missing fractional part
        # is treated as an empty one, which the converters render as nothing.
        split_result = inputs.split(".")
        if len(split_result) == 1:
            integer_data, decimal_data = split_result[0], ""
        elif len(split_result) == 2:
            integer_data, decimal_data = split_result
        else:
            raise ValueError(f"输入格式错误:{inputs}")

        if mode == "rmb":
            output = self.__rmb_convert(integer_data, decimal_data)
        else:
            output = (self.__integer_convert(integer_data, mode)
                      + self.__decimal_convert(decimal_data, mode))
        return sign + output

    def __rmb_convert(self, integer_data: str, decimal_data: str) -> str:
        """Render an amount as formal RMB text (yuan / jiao / fen).

        Only the first two fractional digits are used; further digits are
        ignored. An all-zero (or absent) fraction yields the "元整" suffix.
        """
        zero = "零"
        int_data = self.__integer_convert(integer_data, "up")
        dec_data = self.__decimal_convert(decimal_data, "up")

        if not dec_data:
            return int_data + "元整"
        if len(dec_data) == 1:
            # A decimal-point marker with no digit after it is unexpected.
            raise ValueError(f"异常输出:{dec_data}")

        # dec_data[0] is the decimal-point marker; the digits follow it.
        jiao = dec_data[1]
        fen = dec_data[2] if len(dec_data) > 2 else zero
        if jiao == zero and fen == zero:
            return int_data + "元整"

        # A zero integer part is omitted entirely (e.g. 0.5 -> "伍角").
        output = "" if int_data == zero else int_data + "元"
        if jiao != zero:
            output += jiao + "角"
        elif output:
            # Zero jiao between a yuan amount and fen is spelled out.
            output += zero
        if fen != zero:
            output += fen + "分"
        return output

    def __direct_convert(self, inputs: str) -> str:
        """Translate ``inputs`` character by character using lower-case numerals."""
        return "".join(
            "点" if d == "." else self.number_low[int(d)]
            for d in inputs
        )

    @staticmethod
    def __number_to_string(number_data: Union[int, float]) -> str:
        """Return ``number_data`` as plain positional-notation text.

        ``str()`` renders small or large floats in scientific notation
        (``str(0.00005) == "5e-05"``); those are expanded to fixed-point
        text. Text that contains an "e" but is not a number (for example
        ``"True"``) is returned unchanged so that input validation can
        reject it.
        """
        string_data = str(number_data)
        if "e" in string_data:
            try:
                string_data = format(Decimal(string_data), "f")
            except InvalidOperation:
                pass
        return string_data

    def __check_inputs_is_valid(self, check_data: str) -> None:
        """Raise ``ValueError`` on the first character that is not a digit, "." or "-"."""
        all_check_keys = self.all_num + ".-"
        for data in check_data:
            if data not in all_check_keys:
                raise ValueError(f"输入的数据不在转化范围内:{data}")

    def __integer_convert(self, integer_data: str, mode: str) -> str:
        """Convert the integer part to Chinese numerals with units.

        :param integer_data: digits of the integer part (leading zeros allowed)
        :param mode: ``low`` or ``up``; selects the numeral and unit tables
        :raises ValueError: if the number has more digits than the unit table
            has entries, or ``integer_data`` is not a valid integer literal
        """
        numeral_list = self.conf[f"number_{mode}_an2cn"]
        unit_list = self.conf[f"unit_{mode}_order_an2cn"]

        # Drop leading zeros, e.g. 007 => 7
        integer_data = str(int(integer_data))

        len_integer_data = len(integer_data)
        if len_integer_data > len(unit_list):
            raise ValueError(f"超出数据范围,最长支持 {len(unit_list)}")

        output_an = ""
        for i, d in enumerate(integer_data):
            digit = int(d)
            position = len_integer_data - i - 1
            if digit:
                output_an += numeral_list[digit] + unit_list[position]
            else:
                # At a four-digit group boundary the group unit is still
                # emitted, even though the digit itself is zero.
                if not position % 4:
                    output_an += numeral_list[digit] + unit_list[position]

                # Emit at most one zero for a run of consecutive zeros.
                if i > 0 and not output_an[-1] == "零":
                    output_an += numeral_list[digit]

        # Collapse the zero / unit artefacts left by the loop above.
        output_an = output_an.replace("零零", "零").replace("零万", "万") \
            .replace("零亿", "亿").replace("亿万", "亿").strip("零")

        # 10-19 are read without the leading "one": "一十二" -> "十二"
        if output_an[:2] in ["一十"]:
            output_an = output_an[1:]

        # Everything was stripped: the integer part is zero (e.g. 0.5).
        if not output_an:
            output_an = "零"

        return output_an

    def __decimal_convert(self, decimal_data: str, o_mode: str) -> str:
        """Convert the fractional digits, prefixed by the decimal-point marker.

        Returns an empty string when ``decimal_data`` is empty. At most 16
        digits are converted; longer input is truncated and a notice is
        printed.
        """
        len_decimal_data = len(decimal_data)

        if len_decimal_data > 16:
            print(f"注意:小数部分长度为 {len_decimal_data} ,将自动截取前 16 位有效精度!")
            decimal_data = decimal_data[:16]

        numeral_list = self.conf[f"number_{o_mode}_an2cn"]
        output_an = "点" if len_decimal_data else ""
        return output_an + "".join(numeral_list[int(data)] for data in decimal_data)