Patch for Issue #304

This commit is contained in:
Miroslav Stampar
2012-12-18 09:36:26 +01:00
parent 45d6fdcdc8
commit 2b64c10710
3 changed files with 16 additions and 4 deletions

View File

@@ -231,7 +231,7 @@ def decodePage(page, contentEncoding, contentType):
kb.pageEncoding = conf.charset
# can't do for all responses because we need to support binary files too
if contentType and not isinstance(page, unicode) and any(map(lambda x: x in contentType.lower(), ("text/txt", "text/raw", "text/html", "text/xml"))):
if contentType and not isinstance(page, unicode) and any(map(lambda _: _ in contentType.lower(), ("text/txt", "text/raw", "text/html", "text/xml"))):
# e.g. &#195;&#235;&#224;&#226;&#224;
if "&#" in page:
page = re.sub('&#(\d{1,3});', lambda _: chr(int(_.group(1))) if int(_.group(1)) < 256 else _.group(0), page)