From 08eb332b4bf623dced21b7c8d3b6bf6d4821bf2c Mon Sep 17 00:00:00 2001 From: Magnus Hagander Date: Fri, 19 Oct 2018 17:48:25 +0200 Subject: [PATCH] Add another strange timezone offset format --- loader/lib/parser.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/loader/lib/parser.py b/loader/lib/parser.py index ac0b2f2..22f91f2 100644 --- a/loader/lib/parser.py +++ b/loader/lib/parser.py @@ -348,6 +348,7 @@ class ArchivesParser(object): _date_multi_re = re.compile(' \(([^\s]+\s[^\s]+(\s+[^\s]+)*|)\)$') _date_multi_re2 = re.compile(' ([\+-]\d{4}) \([^)]+\)$') _date_multiminus_re = re.compile(' -(-\d+)$') + _date_offsetnoplus_re = re.compile(' (\d{4})$') def forgiving_date_decode(self, d): if d.strip() == '': raise IgnorableException("Failed to parse empty date") @@ -390,6 +391,9 @@ class ArchivesParser(object): if self._date_multiminus_re.search(d): d = self._date_multiminus_re.sub(' \\1', d) + if self._date_offsetnoplus_re.search(d): + d = self._date_offsetnoplus_re.sub('+\\1', d) + # We have a number of dates in the format # " +0200 (MET DST)" -- 2.39.5