sqlmap/lib/parse/html.py

63 lines
1.6 KiB
Python
Raw Normal View History

2008-10-15 19:38:22 +04:00
#!/usr/bin/env python
"""
2008-10-15 19:56:32 +04:00
$Id$
2008-10-15 19:38:22 +04:00
Copyright (c) 2006-2010 sqlmap developers (http://sqlmap.sourceforge.net/)
2010-10-15 03:18:29 +04:00
See the file 'doc/COPYING' for copying permission
2008-10-15 19:38:22 +04:00
"""
import re
from xml.sax.handler import ContentHandler
from lib.core.common import checkFile
2010-04-16 23:57:00 +04:00
from lib.core.common import parseXmlFile
2008-10-15 19:38:22 +04:00
from lib.core.common import sanitizeStr
from lib.core.data import kb
from lib.core.data import paths
2008-10-15 19:38:22 +04:00
class htmlHandler(ContentHandler):
    """
    SAX content handler that matches an HTML page against the regular
    expressions carried by the <error> elements of the XML file being
    parsed, in order to fingerprint the back-end database management
    system

    The public attribute 'dbms' holds the value of the most recently
    seen <dbms> element at the time an <error> expression last matched
    the page, or None if no expression matched
    """

    def __init__(self, page):
        """
        Store the page to be inspected; 'page' must be a string usable
        as the subject of re.search()
        """

        # Initialise the base handler as well so that its own state
        # (the document locator) exists before a parser attaches one
        ContentHandler.__init__(self)

        self.__dbms = None
        self.__page = page

        self.dbms = None

    def startElement(self, name, attrs):
        """
        Track the current <dbms> value and test every <error> regular
        expression (case-insensitively) against the stored page
        """

        if name == "dbms":
            self.__dbms = attrs.get("value")

        elif name == "error":
            regexp = attrs.get("regexp")

            # An <error> element without a regexp has nothing to match;
            # skip it rather than let re.search() raise a TypeError
            if regexp is None:
                return

            if re.search(regexp, self.__page, re.I):
                self.dbms = self.__dbms

                # Remember the matching page paired with the value of
                # kb.lastRequestUID at the time of the match
                kb.lastErrorPage = (kb.lastRequestUID, self.__page)
2008-10-15 19:38:22 +04:00
2008-11-17 03:13:49 +03:00
def htmlParser(page):
    """
    Fingerprint the back-end database management system by running the
    sanitized HTML page through htmlHandler while parsing the XML file
    referenced by paths.ERRORS_XML

    Returns the DBMS value found by the handler (None when the handler
    found nothing); a non-empty value is also recorded once in
    kb.htmlFp
    """

    signaturesFile = paths.ERRORS_XML
    checkFile(signaturesFile)

    handler = htmlHandler(sanitizeStr(page))
    parseXmlFile(signaturesFile, handler)

    dbms = handler.dbms

    # Keep kb.htmlFp free of duplicates and of empty values
    if dbms and dbms not in kb.htmlFp:
        kb.htmlFp.append(dbms)

    return dbms