Skip to content

Commit 7636266

Browse files
authored
Improve Japanese support (scrapinghub#1068)
1 parent 0cbf46a commit 7636266

File tree

4 files changed

+20 -0 lines changed

4 files changed

+20 -0 lines changed

dateparser/data/date_translation_data/ja.py

Lines changed: 9 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -172,6 +172,9 @@
172172
],
173173
"2 week ago": [
174174
"先々週"
175+
],
176+
"in 2 day": [
177+
"明後日"
175178
]
176179
},
177180
"relative-type-regex": {
@@ -250,6 +253,9 @@
250253
"|",
251254
","
252255
],
256+
"pertain": [
257+
"の"
258+
],
253259
"ago": [
254260
"前"
255261
],
@@ -272,6 +278,9 @@
272278
},
273279
{
274280
"(\\d+[.,]?\\d*)時$": "\\1:00"
281+
},
282+
{
283+
"正午": "12:00"
275284
}
276285
]
277286
}

dateparser_data/supplementary_language_data/date_translation_data/ja.yaml

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -4,6 +4,8 @@ sentence_splitter_group : 4
44

55
skip: ["約"]
66

7+
pertain: ["の"]
8+
79
monday:
810
- (月)
911
tuesday:
@@ -73,10 +75,13 @@ relative-type:
7375
- 先々週
7476
1 year ago:
7577
- 去年
78+
in 2 day:
79+
- 明後日
7680

7781
simplifications:
7882
- (\d+[.,]?\d*)年(?:\s+)?(\d+[.,]?\d*)月(?:\s+)?(\d+[.,]?\d*)日: \1-\2-\3
7983
- (\d+[.,]?\d*)月(?:\s+)?(\d+[.,]?\d*)日: \1-\2
8084
- (\d+[.,]?\d*)時(?:\s+)?(\d+[.,]?\d*)分(?:\s+)?(\d+[.,]?\d*)秒: \1:\2:\3
8185
- (\d+[.,]?\d*)時(?:\s+)?(\d+[.,]?\d*)分: \1:\2
8286
- (\d+[.,]?\d*)時$: \1:00
87+
- 正午: '12:00'

tests/test_languages.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -191,6 +191,8 @@ def setUp(self):
191191
param('ja', "2016年3月21日(月) 14時48分", "2016-3-21 monday 14:48"),
192192
param('ja', "2016年3月20日(日) 21時40分", "2016-3-20 sunday 21:40"),
193193
param('ja', "2016年3月20日 (日) 21時40分", "2016-3-20 sunday 21:40"),
194+
param('ja', "正午", "12:00"),
195+
param('ja', "明日の13時20分", "in 1 day 13:20"),
194196
195197
# Hebrew
196198
param('he', "20 לאפריל 2012", "20 april 2012"),
@@ -1070,6 +1072,7 @@ def test_translation(self, shortname, datetime_string, expected_translation):
10701072
param('ja', "60秒", "60 second"),
10711073
param('ja', "3秒前", "3 second ago"),
10721074
param('ja', "現在", "0 second ago"),
1075+
param('ja', "明後日", "in 2 day"),
10731076
# Hebrew
10741077
param('he', "אתמול", "1 day ago"),
10751078
param('he', "אתמול בשעה 3", "1 day ago 3"),

tests/test_search.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -189,6 +189,9 @@ def check_error_message(self, message):
189189
param('ja', "2016年3月21日(月) 14時48分"),
190190
param('ja', "2016年3月20日(日) 21時40分"),
191191
param('ja', "2016年3月20日 (日) 21時40分"),
192+
param('ja', "正午"),
193+
param('ja', "明後日"),
194+
param('ja', "明後日の正午"),
192195
193196
# Hebrew
194197
param('he', "20 לאפריל 2012"),

0 commit comments

Comments
 (0)