Fix for Issue #59

This commit is contained in:
Miroslav Stampar 2012-08-16 11:31:43 +02:00
parent 1af81c0de4
commit 0d8fca30c9

View File

@@ -46,7 +46,7 @@ CHAR_INFERENCE_MARK = "%c"
# matches one printable character: anything outside the control range
# \x00-\x1f and outside \x7f-\xff; the upper excluded range starts at
# \x7f (DEL) so that "~" (\x7e) is still treated as printable
PRINTABLE_CHAR_REGEX = r"[^\x00-\x1f\x7f-\xff]"

# regular expression used for extracting results from google search:
# group 1 is the http(s) target of a "url?<param>=" link, cut off at the
# last "&sa=U" or "&rct=j" marker (group 2) found before the next ">"
GOOGLE_REGEX = r"url\?\w+=(http[^>]+)&(sa=U|rct=j)"

# regular expression used for extracting content from "textual" tags:
# case-insensitive and dot-matches-newline; the named group "result" holds
# the text between the end of the opening tag and the next "<"
TEXT_TAG_REGEX = r"(?si)<(abbr|acronym|b|blockquote|br|center|cite|code|dt|em|font|h\d|i|li|p|pre|q|strong|sub|sup|td|th|title|tt|u)(?!\w).*?>(?P<result>[^<]+)"