#!/usr/bin/env python3

# Requires Python 3+

'''
This script reads a raw HTTP request and writes to stdout a Python
script. The generated script sends the same (or a very similar)
request using the standard httplib/http.client library, or optionally
using the more user friendly python-requests library.

Certainly if you have a raw request, you could simply send it via TCP
sockets, but if for some reason the server behaves oddly with flow control,
insists on using gzip/deflate encoding, insists on using chunked encoding,
or any number of other annoying things, then using an HTTP library is a
lot more convenient. This script attempts to make that conversion easy.


Copyright (C) 2011-2013 Virtual Security Research, LLC
Author: Timothy D. Morgan

This program is free software: you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License, version 3,
as published by the Free Software Foundation.

This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.

You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
'''


import sys
import argparse


# Headers dealing with content negotiation, transfer encoding and connection
# longevity.  They are not copied into the generated script; the Host value
# is still used to fill in the host/port settings.
SKIPPED_HEADERS = frozenset([
    'accept', 'accept-language', 'accept-encoding', 'accept-charset',
    'connection', 'keep-alive', 'host', 'content-length',
    'proxy-connection',
])

# Number of request-body bytes placed on each generated source line.
BODY_CHUNK_SIZE = 40

# Indentation of follow-up body chunks; lines them up under "    body = (".
BODY_INDENT = ' ' * 12


# ---------------------------------------------------------------------------
# Templates for the generated scripts.  "%s" slots are filled with repr()s of
# the parsed request; "%%" yields a literal "%" in the generated code.
# ---------------------------------------------------------------------------

REQUESTS_PREAMBLE = '''#!/usr/bin/env python3

import sys
try:
    import requests
except ImportError:
    sys.stderr.write('ERROR: Could not import requests module. Ensure it is installed.\\n')
    sys.stderr.write('       Under Debian, the package name is "python3-requests".\\n')
    sys.exit(1)


# TODO: ensure the host, port, and SSL settings are correct.
host = %s
port = %s
protocol = %s
'''

REQUESTS_SEND = '''
session = requests.Session()
# TODO: use "data" to supply any parameters to be included in the request
def sendRequest(session, data=None):
    method = %s
    path = %s
    headers = %s
    url = "%%s://%%s:%%d%%s" %% (protocol,host,port,path)
    body = (%s)

    return session.request(method, url, headers=headers, data=body)
'''

REQUESTS_FETCH = '''

def fetch(data):
    global session
    ret_val = None

    # TODO: customize code here to retrieve what you need from the response(s)
    # For information on the response object's interface, see:
    #   http://docs.python-requests.org/en/latest/api/#requests.Response
    response = sendRequest(session, data)
    print(response.headers)
    print(repr(response.content))

    return ret_val

data = ''
fetch(data)
'''

HTTPCLIENT_PREAMBLE = '''#!/usr/bin/env python3

import sys
import http.client as httpc


# TODO: ensure the host, port, and SSL settings are correct.
host = %s
port = %s
use_ssl = %s
'''

HTTPCLIENT_SEND = '''
# TODO: use "data" to supply any parameters to be included in the request
def sendRequest(connection, data=None):
    method = %s
    path = %s
    body = (%s)

    connection.putrequest(method, path)
'''

HTTPCLIENT_FETCH = '''
    if len(body) > 0:
        connection.putheader('Content-Length', len(body))
    connection.endheaders()
    connection.send(body)

    return connection.getresponse()


def newConnection():
    if use_ssl:
        return httpc.HTTPSConnection(host, port)
    else:
        return httpc.HTTPConnection(host, port)


def fetch(data):
    ret_val = None
    connection = newConnection()

    # TODO: customize code here to retrieve what you need from the response(s)
    # For information on the response object's interface, see:
    #   https://docs.python.org/3/library/http.client.html#httpresponse-objects
    response = sendRequest(connection, data)
    print(response.getheaders())
    print(repr(response.read()))

    connection.close()
    return ret_val

data = ''
fetch(data)
'''


def bopen(f):
    """Open the file named *f* for binary reading.

    Used as the argparse ``type=`` callable for the request file.  An
    unreadable path is reported as an argparse usage error instead of an
    uncaught traceback.
    """
    try:
        return open(f, 'rb')
    except OSError as err:
        raise argparse.ArgumentTypeError("can't open %r: %s" % (f, err))


def build_parser():
    """Return the command-line argument parser for this script."""
    parser = argparse.ArgumentParser(
        description='A script which accepts an HTTP request and prints out a'
        ' generated Python script which sends a similar request. This is useful'
        ' when one wants to automate sending a large number of requests to a'
        ' particular page or application.'
        ' For more information, see: http://code.google.com/p/bletchley/wiki/Overview')
    parser.add_argument(
        'requestfile', type=bopen, nargs='?', default=sys.stdin.buffer,
        help='A file containing an HTTP request. Defaults to stdin if omitted.')
    parser.add_argument(
        '--requests', action='store_true', help='Generate a script that uses the'
        ' python-requests module rather than httplib/http.client (experimental).')
    return parser


def split_request(input_req):
    """Split raw request bytes into ``(raw_headers, body)``.

    The header block ends at the first blank line, written either as
    CRLF CRLF or as LF LF.  Whichever separator occurs *first* is used, so
    that a CRLF CRLF sequence inside the body of an LF-delimited request is
    not mistaken for the end of the headers.  With no blank line at all the
    whole input is treated as headers and the body is empty.
    """
    candidates = []
    for separator in (b'\r\n\r\n', b'\n\n'):
        position = input_req.find(separator)
        if position >= 0:
            candidates.append((position, separator))
    if not candidates:
        return input_req, b''
    position, separator = min(candidates)
    return input_req[:position], input_req[position + len(separator):]


def parse_request_line(line):
    """Return ``(method, path)`` from the first line of the request.

    The HTTP version is optional and ignored, since the generated script
    never uses it.  Raises ValueError when the method or path is missing.
    """
    fields = line.rstrip('\r').split(' ', 2)
    if len(fields) < 2 or not fields[0] or not fields[1]:
        raise ValueError('Malformed request line: %r' % line)
    return fields[0], fields[1]


def parse_host(value):
    """Split a Host header value into ``(host, port)``.

    *port* is None when the value carries no (or an empty) port.  Bracketed
    IPv6 literals such as ``[::1]:8080`` keep their brackets in *host*.
    Raises ValueError when the port is not a decimal integer.
    """
    hostname, colon, port_text = value.rpartition(':')
    # A ']' after the last colon means that colon sits inside an IPv6 literal.
    if not colon or ']' in port_text:
        return value, None
    if not port_text:
        return hostname, None
    try:
        return hostname, int(port_text, 10)
    except ValueError:
        raise ValueError('Invalid port in Host header: %r' % value) from None


def parse_headers(lines):
    """Parse header lines into ``(headers, host, port)``.

    *headers* is a list of ``(name, [value, continuation, ...])`` tuples for
    every header not listed in SKIPPED_HEADERS, in their original order.
    *host* and *port* come from the Host header and default to ``'TODO'``
    and ``80``.  Parsing stops at the first empty line.  Raises ValueError
    for a header line without a colon or a Host header with a bad port.
    """
    host = 'TODO'
    port = 80
    headers = []
    # Whether the most recent header was kept; continuation lines belonging
    # to a skipped header must be dropped rather than glued onto whichever
    # header happens to be last in the list.
    last_kept = False

    for raw_line in lines:
        line = raw_line.rstrip('\r')
        if not line:
            break

        # Handle header line continuations
        if line[0] in ' \t':
            if last_kept:
                # The leading whitespace only marks the fold; the HTTP
                # library adds its own when sending the continuation.
                headers[-1][1].append(line.lstrip(' \t'))
            continue

        name, colon, value = line.partition(':')
        if not colon:
            raise ValueError('Malformed header line (no colon): %r' % line)
        value = value.lstrip(' ')

        lowered = name.lower()
        last_kept = lowered not in SKIPPED_HEADERS
        if last_kept:
            headers.append((name, [value]))

        if lowered == 'host':
            host, host_port = parse_host(value)
            if host_port is not None:
                port = host_port

    return headers, host, port


def parse_request(input_req):
    """Parse raw request bytes into a dict describing the request.

    Keys: ``method``, ``path``, ``headers`` (see parse_headers), ``body``
    (bytes), ``host``, ``port``, ``use_ssl`` and ``protocol``.  SSL is
    assumed exactly when the port is 443.  Raises ValueError on a malformed
    request line or header.
    """
    raw_headers, body = split_request(input_req)
    # Latin-1 maps every byte to one code point and is what http.client
    # encodes header values with, so header bytes round-trip unchanged and
    # decoding can never fail.
    header_lines = raw_headers.decode('latin-1').split('\n')
    method, path = parse_request_line(header_lines[0])
    headers, host, port = parse_headers(header_lines[1:])
    use_ssl = (port == 443)
    return {
        'method': method,
        'path': path,
        'headers': headers,
        'body': body,
        'host': host,
        'port': port,
        'use_ssl': use_ssl,
        'protocol': 'https' if use_ssl else 'http',
    }


def format_body(body):
    """Render *body* as Python source: adjacent bytes literals, one per line.

    The result is meant to sit inside the parentheses of ``body = (...)`` in
    the generated script.  An empty body renders as ``b''``.
    """
    chunks = [repr(body[start:start + BODY_CHUNK_SIZE])
              for start in range(0, len(body), BODY_CHUNK_SIZE)]
    return ('\n' + BODY_INDENT).join(chunks) or "b''"


def generate_requests_script(request):
    """Return the source of a python-requests based script for *request*."""
    headers = dict(request['headers'])
    # XXX: We don't currently support exactly formatted header
    #      continuations with python requests, but this should be
    #      semantically equivalent.
    for name in headers:
        headers[name] = ' '.join(headers[name])

    sections = [
        REQUESTS_PREAMBLE % (repr(request['host']), repr(request['port']),
                             repr(request['protocol'])),
        REQUESTS_SEND % (repr(request['method']), repr(request['path']),
                         repr(headers), format_body(request['body'])),
        REQUESTS_FETCH,
    ]
    return '\n'.join(sections) + '\n'


def generate_httpclient_script(request):
    """Return the source of an http.client based script for *request*."""
    sections = [
        HTTPCLIENT_PREAMBLE % (repr(request['host']), repr(request['port']),
                               repr(request['use_ssl'])),
        HTTPCLIENT_SEND % (repr(request['method']), repr(request['path']),
                           format_body(request['body'])),
    ]
    for name, values in request['headers']:
        # putheader() takes continuation lines as extra positional arguments.
        arguments = ', '.join(repr(item) for item in [name] + values)
        sections.append('    connection.putheader(%s)' % arguments)
    sections.append(HTTPCLIENT_FETCH)
    return '\n'.join(sections) + '\n'


def main(argv=None):
    """Read the request, write the generated script to stdout.

    *argv* defaults to the process arguments.  Returns the exit status:
    0 on success, 1 when the request cannot be parsed.
    """
    args = build_parser().parse_args(argv)
    try:
        input_req = args.requestfile.read()
    finally:
        # Close files we opened ourselves, but leave stdin alone.
        if args.requestfile is not sys.stdin.buffer:
            args.requestfile.close()

    try:
        request = parse_request(input_req)
    except ValueError as err:
        sys.stderr.write('ERROR: %s\n' % err)
        return 1

    if args.requests:
        script = generate_requests_script(request)
    else:
        script = generate_httpclient_script(request)
    sys.stdout.write(script)
    return 0


if __name__ == '__main__':
    sys.exit(main())