diff --git a/lib/core/common.py b/lib/core/common.py index b133c00f5..a51fbbfe9 100644 --- a/lib/core/common.py +++ b/lib/core/common.py @@ -1286,8 +1286,7 @@ def getFilteredPageContent(page, onlyText=True): retVal = page if isinstance(page, basestring): - retVal = re.sub(r"(?s)|%s" % (r"|<[^>]+>|\t|\n|\r" if onlyText else ""), " ", page) - + retVal = re.sub(r"(?s)||%s" % (r"|<[^>]+>|\t|\n|\r" if onlyText else ""), " ", page) while retVal.find(" ") != -1: retVal = retVal.replace(" ", " ")