sqlmap/lib/utils/har.py

230 lines
7.5 KiB
Python
Raw Normal View History

2017-07-03 17:55:24 +03:00
#!/usr/bin/env python
"""
2018-01-02 02:48:10 +03:00
Copyright (c) 2006-2018 sqlmap developers (http://sqlmap.org/)
2017-10-11 15:50:46 +03:00
See the file 'LICENSE' for copying permission
2017-07-03 17:55:24 +03:00
"""
import base64
import BaseHTTPServer
2017-07-04 13:14:17 +03:00
import datetime
2017-07-03 17:55:24 +03:00
import httplib
import re
import StringIO
2017-07-04 13:14:17 +03:00
import time
2017-07-03 17:55:24 +03:00
2017-07-05 15:07:21 +03:00
from lib.core.bigarray import BigArray
2017-07-03 17:55:24 +03:00
from lib.core.settings import VERSION
2017-07-04 13:14:17 +03:00
# Reference: https://dvcs.w3.org/hg/webperf/raw-file/tip/specs/HAR/Overview.html
# http://www.softwareishard.com/har/viewer/
2017-07-03 17:55:24 +03:00
class HTTPCollectorFactory:
def __init__(self, harFile=False):
self.harFile = harFile
def create(self):
2017-07-04 13:14:17 +03:00
return HTTPCollector()
2017-07-03 17:55:24 +03:00
class HTTPCollector:
def __init__(self):
2017-07-05 15:07:21 +03:00
self.messages = BigArray()
self.extendedArguments = {}
def setExtendedArguments(self, arguments):
self.extendedArguments = arguments
2017-07-03 17:55:24 +03:00
2017-07-04 13:14:17 +03:00
def collectRequest(self, requestMessage, responseMessage, startTime=None, endTime=None):
self.messages.append(RawPair(requestMessage, responseMessage,
startTime=startTime, endTime=endTime,
extendedArguments=self.extendedArguments))
2017-07-03 17:55:24 +03:00
def obtain(self):
return {"log": {
"version": "1.2",
"creator": {"name": "sqlmap", "version": VERSION},
"entries": [pair.toEntry().toDict() for pair in self.messages],
}}
class RawPair:
def __init__(self, request, response, startTime=None, endTime=None, extendedArguments=None):
2017-07-03 17:55:24 +03:00
self.request = request
self.response = response
2017-07-04 13:14:17 +03:00
self.startTime = startTime
self.endTime = endTime
self.extendedArguments = extendedArguments or {}
2017-07-03 17:55:24 +03:00
def toEntry(self):
return Entry(request=Request.parse(self.request), response=Response.parse(self.response),
startTime=self.startTime, endTime=self.endTime,
extendedArguments=self.extendedArguments)
2017-07-03 17:55:24 +03:00
class Entry:
def __init__(self, request, response, startTime, endTime, extendedArguments):
2017-07-03 17:55:24 +03:00
self.request = request
self.response = response
2017-07-04 13:14:17 +03:00
self.startTime = startTime or 0
self.endTime = endTime or 0
self.extendedArguments = extendedArguments
2017-07-03 17:55:24 +03:00
def toDict(self):
out = {
2017-07-03 17:55:24 +03:00
"request": self.request.toDict(),
"response": self.response.toDict(),
2017-07-04 13:14:17 +03:00
"cache": {},
"timings": {
"send": -1,
"wait": -1,
"receive": -1,
},
2017-07-04 13:14:17 +03:00
"time": int(1000 * (self.endTime - self.startTime)),
"startedDateTime": "%s%s" % (datetime.datetime.fromtimestamp(self.startTime).isoformat(), time.strftime("%z")) if self.startTime else None
2017-07-03 17:55:24 +03:00
}
out.update(self.extendedArguments)
return out
2017-07-03 17:55:24 +03:00
class Request:
def __init__(self, method, path, httpVersion, headers, postBody=None, raw=None, comment=None):
self.method = method
self.path = path
self.httpVersion = httpVersion
self.headers = headers or {}
self.postBody = postBody
2017-07-04 13:14:17 +03:00
self.comment = comment.strip() if comment else comment
2017-07-03 17:55:24 +03:00
self.raw = raw
@classmethod
def parse(cls, raw):
request = HTTPRequest(raw)
return cls(method=request.command,
path=request.path,
httpVersion=request.request_version,
headers=request.headers,
postBody=request.rfile.read(),
comment=request.comment,
raw=raw)
@property
def url(self):
host = self.headers.get("Host", "unknown")
return "http://%s%s" % (host, self.path)
def toDict(self):
out = {
"httpVersion": self.httpVersion,
"method": self.method,
"url": self.url,
"headers": [dict(name=key.capitalize(), value=value) for key, value in self.headers.items()],
2017-07-04 13:14:17 +03:00
"cookies": [],
"queryString": [],
"headersSize": -1,
"bodySize": -1,
2017-07-03 17:55:24 +03:00
"comment": self.comment,
}
if self.postBody:
contentType = self.headers.get("Content-Type")
out["postData"] = {
"mimeType": contentType,
"text": self.postBody.rstrip("\r\n"),
}
return out
class Response:
extract_status = re.compile(r'\((\d{3}) (.*)\)')
def __init__(self, httpVersion, status, statusText, headers, content, raw=None, comment=None):
self.raw = raw
self.httpVersion = httpVersion
self.status = status
self.statusText = statusText
self.headers = headers
self.content = content
2017-07-04 13:14:17 +03:00
self.comment = comment.strip() if comment else comment
2017-07-03 17:55:24 +03:00
@classmethod
def parse(cls, raw):
altered = raw
comment = ""
2017-07-03 17:55:24 +03:00
if altered.startswith("HTTP response [") or altered.startswith("HTTP redirect ["):
2017-07-03 17:55:24 +03:00
io = StringIO.StringIO(raw)
first_line = io.readline()
parts = cls.extract_status.search(first_line)
status_line = "HTTP/1.0 %s %s" % (parts.group(1), parts.group(2))
remain = io.read()
2017-07-04 13:14:17 +03:00
altered = status_line + "\r\n" + remain
2017-07-03 17:55:24 +03:00
comment = first_line
response = httplib.HTTPResponse(FakeSocket(altered))
response.begin()
try:
content = response.read(-1)
except httplib.IncompleteRead:
2017-07-04 13:14:17 +03:00
content = raw[raw.find("\r\n\r\n") + 4:].rstrip("\r\n")
2017-07-03 17:55:24 +03:00
return cls(httpVersion="HTTP/1.1" if response.version == 11 else "HTTP/1.0",
status=response.status,
statusText=response.reason,
headers=response.msg,
content=content,
comment=comment,
raw=raw)
def toDict(self):
content = {
"mimeType": self.headers.get("Content-Type"),
"text": self.content,
2017-07-04 13:14:17 +03:00
"size": len(self.content or "")
2017-07-03 17:55:24 +03:00
}
binary = set(['\0', '\1'])
if any(c in binary for c in self.content):
content["encoding"] = "base64"
content["text"] = base64.b64encode(self.content)
return {
"httpVersion": self.httpVersion,
"status": self.status,
"statusText": self.statusText,
"headers": [dict(name=key.capitalize(), value=value) for key, value in self.headers.items() if key.lower() != "uri"],
2017-07-04 13:14:17 +03:00
"cookies": [],
2017-07-03 17:55:24 +03:00
"content": content,
2017-07-04 13:14:17 +03:00
"headersSize": -1,
"bodySize": -1,
"redirectURL": "",
2017-07-03 17:55:24 +03:00
"comment": self.comment,
}
class FakeSocket:
# Original source:
# https://stackoverflow.com/questions/24728088/python-parse-http-response-string
def __init__(self, response_text):
self._file = StringIO.StringIO(response_text)
def makefile(self, *args, **kwargs):
return self._file
class HTTPRequest(BaseHTTPServer.BaseHTTPRequestHandler):
# Original source:
# https://stackoverflow.com/questions/4685217/parse-raw-http-headers
def __init__(self, request_text):
self.comment = None
self.rfile = StringIO.StringIO(request_text)
self.raw_requestline = self.rfile.readline()
if self.raw_requestline.startswith("HTTP request ["):
self.comment = self.raw_requestline
self.raw_requestline = self.rfile.readline()
self.error_code = self.error_message = None
self.parse_request()
def send_error(self, code, message):
self.error_code = code
self.error_message = message