Fix (Google is changing the attribute class=r to class="r")

This commit is contained in:
Miroslav Stampar 2010-05-15 21:51:31 +00:00
parent b8a5a54395
commit d20b99ed65

View File

@ -54,7 +54,7 @@ class Google:
matches = [] matches = []
regExpr = "class=r\076\074a href=\042(http[s]*://.+?)\042\sclass=l" regExpr = "class=\042?r\042?\076\074a href=\042(http[s]*://.+?)\042\sclass=\042?l\042?"
matches = re.findall(regExpr, page, re.I | re.M) matches = re.findall(regExpr, page, re.I | re.M)
return matches return matches