2008-12-05 18:34:13 +03:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
"""
|
|
|
|
$Id$
|
|
|
|
|
2010-10-14 18:41:14 +04:00
|
|
|
Copyright (c) 2006-2010 sqlmap developers (http://sqlmap.sourceforge.net/)
|
2010-10-15 03:18:29 +04:00
|
|
|
See the file 'doc/COPYING' for copying permission
|
2008-12-05 18:34:13 +03:00
|
|
|
"""
|
|
|
|
|
|
|
|
import re
|
|
|
|
|
2010-10-12 23:41:29 +04:00
|
|
|
from lib.core.common import getFilteredPageContent
|
2010-09-13 17:31:01 +04:00
|
|
|
from lib.core.common import preparePageForLineComparison
|
2010-10-25 18:06:56 +04:00
|
|
|
from lib.core.common import wasLastRequestError
|
2008-12-05 18:34:13 +03:00
|
|
|
from lib.core.data import conf
|
2010-09-13 17:31:01 +04:00
|
|
|
from lib.core.data import kb
|
2009-02-09 13:28:03 +03:00
|
|
|
from lib.core.data import logger
|
2009-04-22 15:48:07 +04:00
|
|
|
from lib.core.session import setMatchRatio
|
2008-12-05 18:34:13 +03:00
|
|
|
|
2010-09-16 13:32:09 +04:00
|
|
|
def _removeExcludedContent(page):
    """
    Returns page without the content the user asked to exclude
    (conf.eString and matches of conf.eRegexp)
    """

    # String to be excluded before calculating page hash (only its first
    # occurrence is dropped)
    if conf.eString and conf.eString in page:
        start = page.index(conf.eString)
        page = page[:start] + page[start + len(conf.eString):]

    # Regular expression matches to be excluded before calculating page
    # hash. The whole match is removed: feeding re.findall() results to
    # page.index() breaks as soon as the expression contains capturing
    # groups, because findall() then yields group text (or tuples)
    # instead of the matched text
    if conf.eRegexp:
        page = re.compile(conf.eRegexp, re.I | re.M).sub("", page)

    return page


def _removeDynamicContent(page):
    """
    Returns page with the content delimited by the kb.dynamicMarkings
    (prefix, postfix) pairs removed, keeping the delimiters themselves
    """

    # NOTE(review): prefix/postfix are interpolated into the expression
    # as they are - presumably they are stored already escaped; confirm
    # against the code that fills kb.dynamicMarkings
    for prefix, postfix in kb.dynamicMarkings:
        if prefix is None:
            page = re.sub('(?s)^.+%s' % postfix, postfix, page)
        elif postfix is None:
            page = re.sub('(?s)%s.+$' % prefix, prefix, page)
        else:
            page = re.sub('(?s)%s.+%s' % (prefix, postfix), '%s%s' % (prefix, postfix), page)

    return page


def _calculateRatio(page, pageLength):
    """
    Returns the similarity ratio between the page and the first sequence
    of conf.seqMatcher, holding kb.locks.seqLock (when set) meanwhile
    """

    # Read the lock once so that acquire and release always refer to the
    # same object
    seqLock = kb.locks.seqLock

    if seqLock:
        seqLock.acquire()

    try:
        if not conf.eRegexp and not conf.eString and kb.nullConnection and pageLength:
            # Only the length is compared: the ratio between the shorter
            # and the longer of the two lengths
            ratio = 1. * pageLength / len(conf.seqMatcher.a)

            if ratio > 1.:
                ratio = 1. / ratio
        else:
            conf.seqMatcher.set_seq2(page if not conf.textOnly else getFilteredPageContent(page))
            ratio = round(conf.seqMatcher.ratio(), 3)
    finally:
        # Release even if the calculation raised (e.g. division by zero
        # on an empty first sequence), otherwise every other thread
        # waiting on the lock would hang
        if seqLock:
            seqLock.release()

    return ratio


def _initMatchRatio(ratio):
    """
    Sets conf.matchRatio, if not set yet, out of conf.thold or the given
    ratio and stores it by calling setMatchRatio()
    """

    if conf.matchRatio is not None:
        return

    if conf.thold:
        conf.matchRatio = conf.thold

    elif kb.pageStable and 0.6 < ratio < 1:
        logger.debug("setting match ratio to %.3f" % ratio)
        conf.matchRatio = ratio

    elif not kb.pageStable or ratio < 0.6:
        logger.debug("setting match ratio to default value 0.900")
        conf.matchRatio = 0.900

    # For a stable page with a ratio of exactly 0.6 or not lower than 1
    # no branch above applies and the match ratio is left unset
    if conf.matchRatio is not None:
        setMatchRatio()


def comparison(page, headers=None, getSeqMatcher=False, pageLength=None):
    """
    Compares the given page content against the first sequence of
    conf.seqMatcher and tells whether it is to be considered matching

    @param page: HTTP response page content. NOTE(review): seems it can
    be empty/None when only pageLength is known (kb.nullConnection) -
    confirm against the callers
    @param headers: not used by this function
    @param getSeqMatcher: if True the ratio itself is returned
    @param pageLength: length of the page, calculated out of page when
    not provided

    @return: result of the conf.string / conf.regexp lookup when one of
    them is set, otherwise the ratio when getSeqMatcher is True, False
    when wasLastRequestError() is true, otherwise whether the ratio is
    higher than conf.matchRatio
    """

    # The exclusions are no-ops on an empty page and would fail on None
    if page:
        page = _removeExcludedContent(page)

    # String to match in page when the query is valid
    if conf.string:
        return conf.string in page

    # Regular expression to match in page when the query is valid
    if conf.regexp:
        return re.search(conf.regexp, page, re.I | re.M) is not None

    # Dynamic content to be excluded before calculating page hash
    if page:
        page = _removeDynamicContent(page)

    if not pageLength and page:
        pageLength = len(page)

    ratio = _calculateRatio(page, pageLength)

    # If the url is stable and we did not set yet the match ratio and the
    # current injected value changes the url page content
    _initMatchRatio(ratio)

    # If it has been requested to return the ratio and not a comparison
    # response
    if getSeqMatcher:
        return ratio

    # In case of an DBMS error page return False
    if wasLastRequestError():
        return False

    # No match ratio could be chosen yet: Python 2 orders None below any
    # number, hence the comparison used to be implicitly True
    if conf.matchRatio is None:
        return True

    # If the url is not stable it returns sequence matcher between the
    # first untouched HTTP response page content and this content
    return ratio > conf.matchRatio
|