2023-04-13 07:04:58 +00:00
|
|
|
# Copyright 2010-2023 Kurt McKee <contactme@kurtmckee.org>
|
2023-01-12 01:04:47 +00:00
|
|
|
# Copyright 2002-2008 Mark Pilgrim
|
|
|
|
# All rights reserved.
|
|
|
|
#
|
|
|
|
# This file is a part of feedparser.
|
|
|
|
#
|
|
|
|
# Redistribution and use in source and binary forms, with or without
|
|
|
|
# modification, are permitted provided that the following conditions are met:
|
|
|
|
#
|
|
|
|
# * Redistributions of source code must retain the above copyright notice,
|
|
|
|
# this list of conditions and the following disclaimer.
|
|
|
|
# * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
# this list of conditions and the following disclaimer in the documentation
|
|
|
|
# and/or other materials provided with the distribution.
|
|
|
|
#
|
|
|
|
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 'AS IS'
|
|
|
|
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
# POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
from .w3dtf import _parse_date_w3dtf
|
|
|
|
|
|
|
|
# Unicode strings for Hungarian date strings
|
|
|
|
_hungarian_months = {
|
2023-04-13 07:04:58 +00:00
|
|
|
"janu\u00e1r": "01", # e1 in iso-8859-2
|
|
|
|
"febru\u00e1ri": "02", # e1 in iso-8859-2
|
|
|
|
"m\u00e1rcius": "03", # e1 in iso-8859-2
|
|
|
|
"\u00e1prilis": "04", # e1 in iso-8859-2
|
|
|
|
"m\u00e1ujus": "05", # e1 in iso-8859-2
|
|
|
|
"j\u00fanius": "06", # fa in iso-8859-2
|
|
|
|
"j\u00falius": "07", # fa in iso-8859-2
|
|
|
|
"augusztus": "08",
|
|
|
|
"szeptember": "09",
|
|
|
|
"okt\u00f3ber": "10", # f3 in iso-8859-2
|
|
|
|
"november": "11",
|
|
|
|
"december": "12",
|
2023-01-12 01:04:47 +00:00
|
|
|
}
|
|
|
|
|
2023-04-13 07:04:58 +00:00
|
|
|
_hungarian_date_format_re = re.compile(
|
|
|
|
r"(\d{4})-([^-]+)-(\d{,2})T(\d{,2}):(\d{2})([+-](\d{,2}:\d{2}))"
|
|
|
|
)
|
2023-01-12 01:04:47 +00:00
|
|
|
|
|
|
|
|
|
|
|
def _parse_date_hungarian(date_string):
|
|
|
|
"""Parse a string according to a Hungarian 8-bit date format."""
|
|
|
|
m = _hungarian_date_format_re.match(date_string)
|
|
|
|
if not m or m.group(2) not in _hungarian_months:
|
|
|
|
return None
|
|
|
|
month = _hungarian_months[m.group(2)]
|
|
|
|
day = m.group(3)
|
|
|
|
if len(day) == 1:
|
2023-04-13 07:04:58 +00:00
|
|
|
day = "0" + day
|
2023-01-12 01:04:47 +00:00
|
|
|
hour = m.group(4)
|
|
|
|
if len(hour) == 1:
|
2023-04-13 07:04:58 +00:00
|
|
|
hour = "0" + hour
|
|
|
|
w3dtfdate = f"{m.group(1)}-{month}-{day}T{hour}:{m.group(5)}{m.group(6)}"
|
2023-01-12 01:04:47 +00:00
|
|
|
return _parse_date_w3dtf(w3dtfdate)
|