From 26ec83b5f5d5d67e1df9bf2d49b9df1cdd212532 Mon Sep 17 00:00:00 2001 From: tiglog Date: Thu, 21 Sep 2023 20:56:57 +0800 Subject: [PATCH] =?UTF-8?q?imp:=20=E4=BD=BF=E7=94=A8=20unicode=20=E6=A0=87?= =?UTF-8?q?=E5=87=86=E8=B0=83=E6=95=B4=E8=8C=83=E5=9B=B4?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- helper/str_helper.go | 34 +++++++++++++++++++++++++++++----- 1 file changed, 29 insertions(+), 5 deletions(-) diff --git a/helper/str_helper.go b/helper/str_helper.go index 8f83928..385a130 100644 --- a/helper/str_helper.go +++ b/helper/str_helper.go @@ -165,7 +165,9 @@ func Uniq(l int) string { func GetCjkRange(code int) string { var result string - if code >= 0x3400 && code <= 0x4DBF { + if code >= 0x4E00 && code <= 0x9FFF { + result = "CJK" + } else if code >= 0x3400 && code <= 0x4DBF { result = "EXT-A" } else if code >= 0x20000 && code <= 0x2A6DF { result = "EXT-B" @@ -181,12 +183,34 @@ func GetCjkRange(code int) string { result = "EXT-G" } else if code >= 0x31350 && code <= 0x323AF { result = "EXT-H" + } else if code >= 0x2EBF0 && code <= 0x2EE5D { + result = "EXT-I" + } else if code == 0x3007 { + result = "零" + } else if code >= 0x31C0 && code <= 0x631EF { + result = "笔画" + } else if code >= 0x1F600 && code <= 0x1F64F { + result = "表情符号" + } else if code >= 0x1FA00 && code <= 0x1FA6F { + result = "象棋符号" + } else if code >= 0x1F000 && code <= 0x1F02F { + result = "麻将牌" + } else if code >= 0x1F0A0 && code <= 0x1F0FF { + result = "扑克牌" + } else if code >= 0x20A0 && code <= 0x20CF { + result = "货币符号" } else if code >= 0xE000 && code <= 0xF8FF { result = "PUA" - } else if (code >= 0x4e00 && code <= 0x9FFF) || code == 0x3007 { - result = "GBK" - } else { - result = "Other" + } else if code >= 0x2F00 && code <= 0x2FDF { + result = "康熙部首" + } else if code >= 0xF900 && code <= 0xFAD9 { + result = "兼容区" + } else if code >= 0x2F800 && code <= 0x2FA1D { + result = "兼容补充区" + } else if code >= 0x17000 && code <= 0x187F7 { + result = "西夏文" + } else if code >= 0x2FF0 && code <= 0x2FFF { + result = "表意文字描述符" } return result