From 6d422287b4c9438bd2f30674847e8e91636317a0 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Xingchen=20Song=28=E5=AE=8B=E6=98=9F=E8=BE=B0=29?= Date: Mon, 6 Nov 2023 18:44:27 +0800 Subject: [PATCH] =?UTF-8?q?fix(cardinal):=20=E5=AF=B9=E8=BF=9E=E7=BB=AD?= =?UTF-8?q?=E5=9B=9B=E4=B8=AAdigit=E8=BF=9B=E8=A1=8C=E8=BD=AC=E6=8D=A2=20(?= =?UTF-8?q?#134)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * fix(cardinal): translate 4 digits * fix(cardinal): translate 4 digits * fix(cardinal): translate 4 digits --- itn/chinese/data/measure/units_zh.tsv | 1 - itn/chinese/rules/cardinal.py | 2 +- requirements.txt | 2 +- 3 files changed, 2 insertions(+), 3 deletions(-) diff --git a/itn/chinese/data/measure/units_zh.tsv b/itn/chinese/data/measure/units_zh.tsv index 767307f..b227173 100644 --- a/itn/chinese/data/measure/units_zh.tsv +++ b/itn/chinese/data/measure/units_zh.tsv @@ -12,7 +12,6 @@ 艘 套 段 -号 匹 张 座 diff --git a/itn/chinese/rules/cardinal.py b/itn/chinese/rules/cardinal.py index 811cebc..0a5c683 100644 --- a/itn/chinese/rules/cardinal.py +++ b/itn/chinese/rules/cardinal.py @@ -116,7 +116,7 @@ def build_tagger(self): # float number like 1.11 cardinal |= (number + dot + digits.plus) # cardinal string like 110 or 12306 or 13125617878, used in phone - cardinal |= (digits**3 | digits**5 | digits**11) + cardinal |= (digits**3 | digits**4 | digits**5 | digits**11) # cardinal string like 23 if self.enable_standalone_number: if self.enable_0_to_9: diff --git a/requirements.txt b/requirements.txt index 8fb727c..9adbf8f 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,4 +1,4 @@ flake8 importlib_resources -pynini +pynini==2.1.5 pytest