2023-04-13 07:04:58 +00:00
|
|
|
# Copyright 2010-2023 Kurt McKee <contactme@kurtmckee.org>
|
2023-01-12 01:04:47 +00:00
|
|
|
# Copyright 2002-2008 Mark Pilgrim
|
|
|
|
# All rights reserved.
|
|
|
|
#
|
|
|
|
# This file is a part of feedparser.
|
|
|
|
#
|
|
|
|
# Redistribution and use in source and binary forms, with or without
|
|
|
|
# modification, are permitted provided that the following conditions are met:
|
|
|
|
#
|
|
|
|
# * Redistributions of source code must retain the above copyright notice,
|
|
|
|
# this list of conditions and the following disclaimer.
|
|
|
|
# * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
# this list of conditions and the following disclaimer in the documentation
|
|
|
|
# and/or other materials provided with the distribution.
|
|
|
|
#
|
|
|
|
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 'AS IS'
|
|
|
|
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
# POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
|
|
|
import re
|
|
|
|
|
|
|
|
from .rfc822 import _parse_date_rfc822
|
|
|
|
|
|
|
|
# Unicode strings for Greek date strings
|
|
|
|
_greek_months = {
|
2023-04-13 07:04:58 +00:00
|
|
|
"\u0399\u03b1\u03bd": "Jan", # c9e1ed in iso-8859-7
|
|
|
|
"\u03a6\u03b5\u03b2": "Feb", # d6e5e2 in iso-8859-7
|
|
|
|
"\u039c\u03ac\u03ce": "Mar", # ccdcfe in iso-8859-7
|
|
|
|
"\u039c\u03b1\u03ce": "Mar", # cce1fe in iso-8859-7
|
|
|
|
"\u0391\u03c0\u03c1": "Apr", # c1f0f1 in iso-8859-7
|
|
|
|
"\u039c\u03ac\u03b9": "May", # ccdce9 in iso-8859-7
|
|
|
|
"\u039c\u03b1\u03ca": "May", # cce1fa in iso-8859-7
|
|
|
|
"\u039c\u03b1\u03b9": "May", # cce1e9 in iso-8859-7
|
|
|
|
"\u0399\u03bf\u03cd\u03bd": "Jun", # c9effded in iso-8859-7
|
|
|
|
"\u0399\u03bf\u03bd": "Jun", # c9efed in iso-8859-7
|
|
|
|
"\u0399\u03bf\u03cd\u03bb": "Jul", # c9effdeb in iso-8859-7
|
|
|
|
"\u0399\u03bf\u03bb": "Jul", # c9f9eb in iso-8859-7
|
|
|
|
"\u0391\u03cd\u03b3": "Aug", # c1fde3 in iso-8859-7
|
|
|
|
"\u0391\u03c5\u03b3": "Aug", # c1f5e3 in iso-8859-7
|
|
|
|
"\u03a3\u03b5\u03c0": "Sep", # d3e5f0 in iso-8859-7
|
|
|
|
"\u039f\u03ba\u03c4": "Oct", # cfeaf4 in iso-8859-7
|
|
|
|
"\u039d\u03bf\u03ad": "Nov", # cdefdd in iso-8859-7
|
|
|
|
"\u039d\u03bf\u03b5": "Nov", # cdefe5 in iso-8859-7
|
|
|
|
"\u0394\u03b5\u03ba": "Dec", # c4e5ea in iso-8859-7
|
2023-01-12 01:04:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
_greek_wdays = {
|
2023-04-13 07:04:58 +00:00
|
|
|
"\u039a\u03c5\u03c1": "Sun", # caf5f1 in iso-8859-7
|
|
|
|
"\u0394\u03b5\u03c5": "Mon", # c4e5f5 in iso-8859-7
|
|
|
|
"\u03a4\u03c1\u03b9": "Tue", # d4f1e9 in iso-8859-7
|
|
|
|
"\u03a4\u03b5\u03c4": "Wed", # d4e5f4 in iso-8859-7
|
|
|
|
"\u03a0\u03b5\u03bc": "Thu", # d0e5ec in iso-8859-7
|
|
|
|
"\u03a0\u03b1\u03c1": "Fri", # d0e1f1 in iso-8859-7
|
|
|
|
"\u03a3\u03b1\u03b2": "Sat", # d3e1e2 in iso-8859-7
|
2023-01-12 01:04:47 +00:00
|
|
|
}
|
|
|
|
|
2023-04-13 07:04:58 +00:00
|
|
|
_greek_date_format_re = re.compile(
|
|
|
|
r"([^,]+),\s+(\d{2})\s+([^\s]+)\s+(\d{4})\s+(\d{2}):(\d{2}):(\d{2})\s+([^\s]+)"
|
|
|
|
)
|
2023-01-12 01:04:47 +00:00
|
|
|
|
|
|
|
|
|
|
|
def _parse_date_greek(date_string):
|
|
|
|
"""Parse a string according to a Greek 8-bit date format."""
|
|
|
|
m = _greek_date_format_re.match(date_string)
|
|
|
|
if not m:
|
|
|
|
return
|
|
|
|
wday = _greek_wdays[m.group(1)]
|
|
|
|
month = _greek_months[m.group(3)]
|
2023-04-13 07:04:58 +00:00
|
|
|
rfc822date = (
|
|
|
|
"%(wday)s, %(day)s %(month)s %(year)s %(hour)s:%(minute)s:%(second)s %(offset)s"
|
|
|
|
% {
|
|
|
|
"wday": wday,
|
|
|
|
"day": m.group(2),
|
|
|
|
"month": month,
|
|
|
|
"year": m.group(4),
|
|
|
|
"hour": m.group(5),
|
|
|
|
"minute": m.group(6),
|
|
|
|
"second": m.group(7),
|
|
|
|
"offset": m.group(8),
|
|
|
|
}
|
|
|
|
)
|
2023-01-12 01:04:47 +00:00
|
|
|
return _parse_date_rfc822(rfc822date)
|