From 2f1f9fae66735b12af015f6d2be9ee647b75150a Mon Sep 17 00:00:00 2001 From: smurak Date: Fri, 12 Aug 2022 16:07:21 +0900 Subject: [PATCH] Improve Japanese support --- dateparser/data/date_translation_data/ja.py | 9 +++++++++ .../date_translation_data/ja.yaml | 5 +++++ tests/test_languages.py | 3 +++ tests/test_search.py | 3 +++ 4 files changed, 20 insertions(+) diff --git a/dateparser/data/date_translation_data/ja.py b/dateparser/data/date_translation_data/ja.py index aacba6f4b..7892b783f 100644 --- a/dateparser/data/date_translation_data/ja.py +++ b/dateparser/data/date_translation_data/ja.py @@ -172,6 +172,9 @@ ], "2 week ago": [ "先々週" + ], + "in 2 day": [ + "明後日" ] }, "relative-type-regex": { @@ -250,6 +253,9 @@ "|", "," ], + "pertain": [ + "の" + ], "ago": [ "前" ], @@ -272,6 +278,9 @@ }, { "(\\d+)時$": "\\1:00" + }, + { + "正午": "12:00" } ] } diff --git a/dateparser_data/supplementary_language_data/date_translation_data/ja.yaml b/dateparser_data/supplementary_language_data/date_translation_data/ja.yaml index 820004d79..77aba4a64 100644 --- a/dateparser_data/supplementary_language_data/date_translation_data/ja.yaml +++ b/dateparser_data/supplementary_language_data/date_translation_data/ja.yaml @@ -4,6 +4,8 @@ sentence_splitter_group : 4 skip: ["約"] +pertain: ["の"] + monday: - (月) tuesday: @@ -73,6 +75,8 @@ relative-type: - 先々週 1 year ago: - 去年 + in 2 day: + - 明後日 simplifications: - (\d+)年(?:\s+)?(\d+)月(?:\s+)?(\d+)日: \1-\2-\3 @@ -80,3 +84,4 @@ simplifications: - (\d+)時(?:\s+)?(\d+)分(?:\s+)?(\d+)秒: \1:\2:\3 - (\d+)時(?:\s+)?(\d+)分: \1:\2 - (\d+)時$: \1:00 + - 正午: '12:00' diff --git a/tests/test_languages.py b/tests/test_languages.py index a9d292d8f..e0688302c 100644 --- a/tests/test_languages.py +++ b/tests/test_languages.py @@ -169,6 +169,8 @@ def setUp(self): param('ja', "2016年3月21日(月) 14時48分", "2016-3-21 monday 14:48"), param('ja', "2016年3月20日(日) 21時40分", "2016-3-20 sunday 21:40"), param('ja', "2016年3月20日 (日) 21時40分", "2016-3-20 sunday 21:40"), + param('ja', "正午", "12:00"), + param('ja', "明日の13時20分", "in 1 day 13:20"), # Hebrew param('he', "20 לאפריל 2012", "20 april 2012"), @@ -1026,6 +1028,7 @@ def test_translation(self, shortname, datetime_string, expected_translation): param('ja', "60秒", "60 second"), param('ja', "3秒前", "3 second ago"), param('ja', "現在", "0 second ago"), + param('ja', "明後日", "in 2 day"), # Hebrew param('he', "אתמול", "1 day ago"), param('he', "אתמול בשעה 3", "1 day ago 3"), diff --git a/tests/test_search.py b/tests/test_search.py index 1ea7b7bff..f6478baf9 100644 --- a/tests/test_search.py +++ b/tests/test_search.py @@ -189,6 +189,9 @@ def check_error_message(self, message): param('ja', "2016年3月21日(月) 14時48分"), param('ja', "2016年3月20日(日) 21時40分"), param('ja', "2016年3月20日 (日) 21時40分"), + param('ja', "正午"), + param('ja', "明後日"), + param('ja', "明後日の正午"), # Hebrew param('he', "20 לאפריל 2012"),