Fix for a "popular" typo 'iso-5889-1' (intended charset: 'iso-8859-1'), reported by David Guimaraes

This commit is contained in:
Miroslav Stampar 2011-04-16 06:44:29 +00:00
parent 88c76147e1
commit 5e70eac98c

View File

@ -104,6 +104,8 @@ def checkCharEncoding(encoding):
# popular typos/errors # popular typos/errors
if '8858' in encoding: if '8858' in encoding:
encoding = encoding.replace('8858', '8859') # iso-8858 -> iso-8859 encoding = encoding.replace('8858', '8859') # iso-8858 -> iso-8859
elif '5889' in encoding:
encoding = encoding.replace('5889', '8859') # iso-5889 -> iso-8859
elif '2313' in encoding: elif '2313' in encoding:
encoding = encoding.replace('2313', '2312') # gb2313 -> gb2312 encoding = encoding.replace('2313', '2312') # gb2313 -> gb2312
@ -125,7 +127,7 @@ def checkCharEncoding(encoding):
try: try:
codecs.lookup(encoding) codecs.lookup(encoding)
except LookupError: except LookupError:
warnMsg = "unknown charset '%s'. " % encoding warnMsg = "unknown web page charset '%s'. " % encoding
warnMsg += "Please report by e-mail to %s." % ML warnMsg += "Please report by e-mail to %s." % ML
logger.warn(warnMsg) logger.warn(warnMsg)
encoding = UNICODE_ENCODING encoding = UNICODE_ENCODING