168 lines
5.8 KiB
Python
168 lines
5.8 KiB
Python
# pyquarantine is free software: you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
#
|
|
# pyquarantine is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
#
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with pyquarantine. If not, see <http://www.gnu.org/licenses/>.
|
|
#
|
|
|
|
import encodings
|
|
|
|
|
|
#####################################
|
|
# patch pythons email library #
|
|
#####################################
|
|
#
|
|
# https://bugs.python.org/issue27257
|
|
# https://bugs.python.org/issue30988
|
|
#
|
|
# fix: https://github.com/python/cpython/pull/15600
|
|
|
|
import email._header_value_parser
|
|
from email._header_value_parser import TokenList, NameAddr
|
|
from email._header_value_parser import get_display_name, get_angle_addr
|
|
from email._header_value_parser import get_cfws, errors
|
|
from email._header_value_parser import CFWS_LEADER, PHRASE_ENDS
|
|
|
|
|
|
class DisplayName(email._header_value_parser.DisplayName):
|
|
@property
|
|
def display_name(self):
|
|
res = TokenList(self)
|
|
if len(res) == 0:
|
|
return res.value
|
|
if res[0].token_type == 'cfws':
|
|
res.pop(0)
|
|
else:
|
|
if isinstance(res[0], TokenList) and \
|
|
res[0][0].token_type == 'cfws':
|
|
res[0] = TokenList(res[0][1:])
|
|
if res[-1].token_type == 'cfws':
|
|
res.pop()
|
|
else:
|
|
if isinstance(res[-1], TokenList) and \
|
|
res[-1][-1].token_type == 'cfws':
|
|
res[-1] = TokenList(res[-1][:-1])
|
|
return res.value
|
|
|
|
|
|
def get_name_addr(value):
|
|
""" name-addr = [display-name] angle-addr
|
|
|
|
"""
|
|
name_addr = NameAddr()
|
|
# Both the optional display name and the angle-addr can start with cfws.
|
|
leader = None
|
|
if value[0] in CFWS_LEADER:
|
|
leader, value = get_cfws(value)
|
|
if not value:
|
|
raise errors.HeaderParseError(
|
|
"expected name-addr but found '{}'".format(leader))
|
|
if value[0] != '<':
|
|
if value[0] in PHRASE_ENDS:
|
|
raise errors.HeaderParseError(
|
|
"expected name-addr but found '{}'".format(value))
|
|
token, value = get_display_name(value)
|
|
if not value:
|
|
raise errors.HeaderParseError(
|
|
"expected name-addr but found '{}'".format(token))
|
|
if leader is not None:
|
|
if isinstance(token[0], TokenList):
|
|
token[0][:0] = [leader]
|
|
else:
|
|
token[:0] = [leader]
|
|
leader = None
|
|
name_addr.append(token)
|
|
token, value = get_angle_addr(value)
|
|
if leader is not None:
|
|
token[:0] = [leader]
|
|
name_addr.append(token)
|
|
return name_addr, value
|
|
|
|
|
|
setattr(email._header_value_parser, "DisplayName", DisplayName)
|
|
setattr(email._header_value_parser, "get_name_addr", get_name_addr)
|
|
|
|
|
|
# https://bugs.python.org/issue42484
|
|
#
|
|
# fix: https://github.com/python/cpython/pull/24669
|
|
|
|
from email._header_value_parser import DOT, ObsLocalPart, ValueTerminal, get_word
|
|
|
|
|
|
def get_obs_local_part(value):
|
|
""" obs-local-part = word *("." word)
|
|
"""
|
|
obs_local_part = ObsLocalPart()
|
|
last_non_ws_was_dot = False
|
|
while value and (value[0]=='\\' or value[0] not in PHRASE_ENDS):
|
|
if value[0] == '.':
|
|
if last_non_ws_was_dot:
|
|
obs_local_part.defects.append(errors.InvalidHeaderDefect(
|
|
"invalid repeated '.'"))
|
|
obs_local_part.append(DOT)
|
|
last_non_ws_was_dot = True
|
|
value = value[1:]
|
|
continue
|
|
elif value[0]=='\\':
|
|
obs_local_part.append(ValueTerminal(value[0],
|
|
'misplaced-special'))
|
|
value = value[1:]
|
|
obs_local_part.defects.append(errors.InvalidHeaderDefect(
|
|
"'\\' character outside of quoted-string/ccontent"))
|
|
last_non_ws_was_dot = False
|
|
continue
|
|
if obs_local_part and obs_local_part[-1].token_type != 'dot':
|
|
obs_local_part.defects.append(errors.InvalidHeaderDefect(
|
|
"missing '.' between words"))
|
|
try:
|
|
token, value = get_word(value)
|
|
last_non_ws_was_dot = False
|
|
except errors.HeaderParseError:
|
|
if value[0] not in CFWS_LEADER:
|
|
raise
|
|
token, value = get_cfws(value)
|
|
obs_local_part.append(token)
|
|
if not obs_local_part:
|
|
return obs_local_part, value
|
|
if (obs_local_part[0].token_type == 'dot' or
|
|
obs_local_part[0].token_type=='cfws' and
|
|
obs_local_part[1].token_type=='dot'):
|
|
obs_local_part.defects.append(errors.InvalidHeaderDefect(
|
|
"Invalid leading '.' in local part"))
|
|
if (obs_local_part[-1].token_type == 'dot' or
|
|
obs_local_part[-1].token_type=='cfws' and
|
|
obs_local_part[-2].token_type=='dot'):
|
|
obs_local_part.defects.append(errors.InvalidHeaderDefect(
|
|
"Invalid trailing '.' in local part"))
|
|
if obs_local_part.defects:
|
|
obs_local_part.token_type = 'invalid-obs-local-part'
|
|
return obs_local_part, value
|
|
|
|
|
|
setattr(email._header_value_parser, "get_obs_local_part", get_obs_local_part)
|
|
|
|
|
|
#######################################
|
|
# add charset alias for windows-874 #
|
|
#######################################
|
|
#
|
|
# https://bugs.python.org/issue17254
|
|
#
|
|
# fix: https://github.com/python/cpython/pull/10237
|
|
|
|
aliases = encodings.aliases.aliases
|
|
|
|
for alias in ["windows-874", "windows_874"]:
|
|
if alias not in aliases:
|
|
aliases[alias] = "cp874"
|
|
|
|
setattr(encodings.aliases, "aliases", aliases)
|