2012-02-23 02:52:01 +00:00
|
|
|
# Copyright (C) 2012 Aldo Cortesi
|
|
|
|
#
|
|
|
|
# This program is free software: you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
2010-02-16 04:09:07 +00:00
|
|
|
"""
|
|
|
|
A simple proxy server implementation, which always reads all of a server
|
|
|
|
response into memory, performs some transformation, and then writes it back
|
2011-07-16 09:47:06 +00:00
|
|
|
to the client.
|
2010-02-16 04:09:07 +00:00
|
|
|
"""
|
2011-08-18 21:22:25 +00:00
|
|
|
import sys, os, string, socket, time
|
2011-08-03 10:38:23 +00:00
|
|
|
import shutil, tempfile, threading
|
2011-02-19 23:53:42 +00:00
|
|
|
import optparse, SocketServer, ssl
|
2012-04-23 21:43:14 +00:00
|
|
|
import utils, flow, certutils, version, wsgi
|
2012-06-13 06:16:47 +00:00
|
|
|
from OpenSSL import SSL
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
|
|
|
|
class ProxyError(Exception):
|
|
|
|
def __init__(self, code, msg):
|
|
|
|
self.code, self.msg = code, msg
|
|
|
|
|
|
|
|
def __str__(self):
|
|
|
|
return "ProxyError(%s, %s)"%(self.code, self.msg)
|
|
|
|
|
|
|
|
|
2011-09-09 02:49:34 +00:00
|
|
|
class ProxyConfig:
|
2012-05-23 21:09:03 +00:00
|
|
|
def __init__(self, certfile = None, ciphers = None, cacert = None, clientcerts = None, cert_wait_time=0, upstream_cert=False, body_size_limit = None, reverse_proxy=None):
|
2011-02-08 17:00:59 +00:00
|
|
|
self.certfile = certfile
|
2011-02-08 15:58:38 +00:00
|
|
|
self.ciphers = ciphers
|
2011-02-08 17:00:59 +00:00
|
|
|
self.cacert = cacert
|
2012-05-23 21:09:03 +00:00
|
|
|
self.clientcerts = clientcerts
|
2011-02-20 00:29:41 +00:00
|
|
|
self.certdir = None
|
2011-06-27 04:10:17 +00:00
|
|
|
self.cert_wait_time = cert_wait_time
|
2012-02-27 22:37:48 +00:00
|
|
|
self.upstream_cert = upstream_cert
|
2011-09-09 03:27:31 +00:00
|
|
|
self.body_size_limit = body_size_limit
|
2012-02-18 01:45:22 +00:00
|
|
|
self.reverse_proxy = reverse_proxy
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
|
2012-02-19 21:34:32 +00:00
|
|
|
def read_headers(fp):
|
|
|
|
"""
|
|
|
|
Read a set of headers from a file pointer. Stop once a blank line
|
|
|
|
is reached. Return a ODict object.
|
|
|
|
"""
|
|
|
|
ret = []
|
|
|
|
name = ''
|
|
|
|
while 1:
|
|
|
|
line = fp.readline()
|
|
|
|
if not line or line == '\r\n' or line == '\n':
|
|
|
|
break
|
|
|
|
if line[0] in ' \t':
|
|
|
|
# continued header
|
|
|
|
ret[-1][1] = ret[-1][1] + '\r\n ' + line.strip()
|
|
|
|
else:
|
|
|
|
i = line.find(':')
|
|
|
|
# We're being liberal in what we accept, here.
|
|
|
|
if i > 0:
|
|
|
|
name = line[:i]
|
|
|
|
value = line[i+1:].strip()
|
|
|
|
ret.append([name, value])
|
2012-02-19 22:29:36 +00:00
|
|
|
return flow.ODictCaseless(ret)
|
2012-02-19 21:34:32 +00:00
|
|
|
|
|
|
|
|
2011-09-09 02:49:34 +00:00
|
|
|
def read_chunked(fp, limit):
|
2010-11-12 15:01:17 +00:00
|
|
|
content = ""
|
2011-09-09 02:49:34 +00:00
|
|
|
total = 0
|
2010-11-12 15:01:17 +00:00
|
|
|
while 1:
|
2011-09-09 02:49:34 +00:00
|
|
|
line = fp.readline(128)
|
2010-11-12 15:01:17 +00:00
|
|
|
if line == "":
|
|
|
|
raise IOError("Connection closed")
|
|
|
|
if line == '\r\n' or line == '\n':
|
|
|
|
continue
|
2011-09-09 02:49:34 +00:00
|
|
|
try:
|
|
|
|
length = int(line,16)
|
|
|
|
except ValueError:
|
|
|
|
# FIXME: Not strictly correct - this could be from the server, in which
|
|
|
|
# case we should send a 502.
|
|
|
|
raise ProxyError(400, "Invalid chunked encoding length: %s"%line)
|
2010-11-12 15:01:17 +00:00
|
|
|
if not length:
|
|
|
|
break
|
2011-09-09 02:49:34 +00:00
|
|
|
total += length
|
|
|
|
if limit is not None and total > limit:
|
|
|
|
msg = "HTTP Body too large."\
|
|
|
|
" Limit is %s, chunked content length was at least %s"%(limit, total)
|
|
|
|
raise ProxyError(509, msg)
|
2010-11-12 15:01:17 +00:00
|
|
|
content += fp.read(length)
|
2011-09-09 02:49:34 +00:00
|
|
|
line = fp.readline(5)
|
2010-11-12 15:01:17 +00:00
|
|
|
if line != '\r\n':
|
|
|
|
raise IOError("Malformed chunked body")
|
|
|
|
while 1:
|
|
|
|
line = fp.readline()
|
|
|
|
if line == "":
|
|
|
|
raise IOError("Connection closed")
|
|
|
|
if line == '\r\n' or line == '\n':
|
|
|
|
break
|
|
|
|
return content
|
2011-07-16 09:47:06 +00:00
|
|
|
|
2010-11-12 15:01:17 +00:00
|
|
|
|
2012-06-10 04:49:59 +00:00
|
|
|
def has_chunked_encoding(headers):
|
|
|
|
for i in headers["transfer-encoding"]:
|
|
|
|
for j in i.split(","):
|
|
|
|
if j.lower() == "chunked":
|
|
|
|
return True
|
|
|
|
return False
|
|
|
|
|
|
|
|
|
|
|
|
def read_http_body(rfile, headers, all, limit):
|
|
|
|
if has_chunked_encoding(headers):
|
2011-09-09 02:49:34 +00:00
|
|
|
content = read_chunked(rfile, limit)
|
2011-07-14 03:59:27 +00:00
|
|
|
elif "content-length" in headers:
|
2011-09-09 02:49:34 +00:00
|
|
|
try:
|
|
|
|
l = int(headers["content-length"][0])
|
|
|
|
except ValueError:
|
|
|
|
# FIXME: Not strictly correct - this could be from the server, in which
|
|
|
|
# case we should send a 502.
|
|
|
|
raise ProxyError(400, "Invalid content-length header: %s"%headers["content-length"])
|
|
|
|
if limit is not None and l > limit:
|
|
|
|
raise ProxyError(509, "HTTP Body too large. Limit is %s, content-length was %s"%(limit, l))
|
|
|
|
content = rfile.read(l)
|
2010-11-12 15:01:17 +00:00
|
|
|
elif all:
|
2011-09-09 02:49:34 +00:00
|
|
|
content = rfile.read(limit if limit else None)
|
2010-11-12 15:01:17 +00:00
|
|
|
else:
|
2011-02-16 02:10:00 +00:00
|
|
|
content = ""
|
2010-11-12 15:01:17 +00:00
|
|
|
return content
|
|
|
|
|
|
|
|
|
2012-06-03 13:04:57 +00:00
|
|
|
def parse_http_protocol(s):
|
|
|
|
if not s.startswith("HTTP/"):
|
|
|
|
return None
|
|
|
|
major, minor = s.split('/')[1].split('.')
|
|
|
|
major = int(major)
|
|
|
|
minor = int(minor)
|
|
|
|
return major, minor
|
|
|
|
|
|
|
|
|
|
|
|
def parse_init_connect(line):
|
|
|
|
try:
|
|
|
|
method, url, protocol = string.split(line)
|
|
|
|
except ValueError:
|
|
|
|
return None
|
|
|
|
if method != 'CONNECT':
|
|
|
|
return None
|
|
|
|
try:
|
|
|
|
host, port = url.split(":")
|
|
|
|
except ValueError:
|
|
|
|
return None
|
|
|
|
port = int(port)
|
2012-06-09 22:31:04 +00:00
|
|
|
httpversion = parse_http_protocol(protocol)
|
|
|
|
if not httpversion:
|
2012-06-03 13:04:57 +00:00
|
|
|
return None
|
2012-06-09 22:31:04 +00:00
|
|
|
return host, port, httpversion
|
2012-06-03 13:04:57 +00:00
|
|
|
|
|
|
|
|
|
|
|
def parse_init_proxy(line):
|
|
|
|
try:
|
|
|
|
method, url, protocol = string.split(line)
|
|
|
|
except ValueError:
|
|
|
|
return None
|
|
|
|
parts = utils.parse_url(url)
|
|
|
|
if not parts:
|
|
|
|
return None
|
|
|
|
scheme, host, port, path = parts
|
2012-06-09 22:31:04 +00:00
|
|
|
httpversion = parse_http_protocol(protocol)
|
|
|
|
if not httpversion:
|
2012-06-03 13:04:57 +00:00
|
|
|
return None
|
2012-06-09 22:31:04 +00:00
|
|
|
return method, scheme, host, port, path, httpversion
|
2012-06-03 13:04:57 +00:00
|
|
|
|
|
|
|
|
|
|
|
def parse_init_http(line):
|
2012-06-09 22:31:04 +00:00
|
|
|
"""
|
|
|
|
Returns (method, url, httpversion)
|
|
|
|
"""
|
2012-06-03 13:04:57 +00:00
|
|
|
try:
|
|
|
|
method, url, protocol = string.split(line)
|
|
|
|
except ValueError:
|
|
|
|
return None
|
|
|
|
if not (url.startswith("/") or url == "*"):
|
|
|
|
return None
|
2012-06-09 22:31:04 +00:00
|
|
|
httpversion = parse_http_protocol(protocol)
|
|
|
|
if not httpversion:
|
2012-06-03 13:04:57 +00:00
|
|
|
return None
|
2012-06-09 22:31:04 +00:00
|
|
|
return method, url, httpversion
|
2012-06-03 13:04:57 +00:00
|
|
|
|
|
|
|
|
2012-06-10 04:49:59 +00:00
|
|
|
def request_connection_close(httpversion, headers):
|
2010-02-16 04:09:07 +00:00
|
|
|
"""
|
2012-06-10 04:49:59 +00:00
|
|
|
Checks the request to see if the client connection should be closed.
|
2010-02-16 04:09:07 +00:00
|
|
|
"""
|
2012-06-09 22:10:46 +00:00
|
|
|
if "connection" in headers:
|
|
|
|
for value in ",".join(headers['connection']).split(","):
|
|
|
|
value = value.strip()
|
|
|
|
if value == "close":
|
|
|
|
return True
|
|
|
|
elif value == "keep-alive":
|
|
|
|
return False
|
|
|
|
# HTTP 1.1 connections are assumed to be persistent
|
2012-06-09 22:31:04 +00:00
|
|
|
if httpversion == (1, 1):
|
2012-06-09 22:10:46 +00:00
|
|
|
return False
|
|
|
|
return True
|
2012-01-20 23:43:00 +00:00
|
|
|
|
2011-07-31 22:41:12 +00:00
|
|
|
|
2012-06-10 04:49:59 +00:00
|
|
|
def response_connection_close(httpversion, headers):
|
|
|
|
"""
|
|
|
|
Checks the response to see if the client connection should be closed.
|
|
|
|
"""
|
|
|
|
if request_connection_close(httpversion, headers):
|
|
|
|
return True
|
|
|
|
elif not has_chunked_encoding(headers) and "content-length" in headers:
|
|
|
|
return True
|
|
|
|
return False
|
|
|
|
|
|
|
|
|
|
|
|
def read_http_body_request(rfile, wfile, headers, httpversion, limit):
|
2012-06-10 04:02:48 +00:00
|
|
|
if "expect" in headers:
|
|
|
|
# FIXME: Should be forwarded upstream
|
|
|
|
expect = ",".join(headers['expect'])
|
|
|
|
if expect == "100-continue" and httpversion >= (1, 1):
|
|
|
|
wfile.write('HTTP/1.1 100 Continue\r\n')
|
|
|
|
wfile.write('Proxy-agent: %s\r\n'%version.NAMEVERSION)
|
|
|
|
wfile.write('\r\n')
|
|
|
|
del headers['expect']
|
2012-06-10 04:49:59 +00:00
|
|
|
return read_http_body(rfile, headers, False, limit)
|
2012-06-10 04:02:48 +00:00
|
|
|
|
|
|
|
|
2010-02-16 04:09:07 +00:00
|
|
|
class FileLike:
|
|
|
|
def __init__(self, o):
|
|
|
|
self.o = o
|
|
|
|
|
|
|
|
def __getattr__(self, attr):
|
|
|
|
return getattr(self.o, attr)
|
|
|
|
|
|
|
|
def flush(self):
|
|
|
|
pass
|
2012-06-13 06:16:47 +00:00
|
|
|
|
2010-09-05 13:04:22 +00:00
|
|
|
def read(self, length):
|
2010-09-05 23:21:51 +00:00
|
|
|
result = ''
|
|
|
|
while len(result) < length:
|
2011-06-23 05:00:55 +00:00
|
|
|
try:
|
|
|
|
data = self.o.read(length)
|
|
|
|
except AttributeError:
|
|
|
|
break
|
2012-06-13 06:16:47 +00:00
|
|
|
except SSL.ZeroReturnError:
|
|
|
|
break
|
2010-09-05 23:21:51 +00:00
|
|
|
if not data:
|
|
|
|
break
|
|
|
|
result += data
|
|
|
|
return result
|
|
|
|
|
2012-06-13 06:16:47 +00:00
|
|
|
def write(self, v):
|
|
|
|
self.o.sendall(v)
|
|
|
|
|
2012-03-08 22:10:21 +00:00
|
|
|
def readline(self, size = None):
|
2010-02-16 04:09:07 +00:00
|
|
|
result = ''
|
2012-03-08 22:10:21 +00:00
|
|
|
bytes_read = 0
|
2010-02-16 04:09:07 +00:00
|
|
|
while True:
|
2012-03-08 22:10:21 +00:00
|
|
|
if size is not None and bytes_read >= size:
|
|
|
|
break
|
2010-02-16 04:09:07 +00:00
|
|
|
ch = self.read(1)
|
2012-03-08 22:10:21 +00:00
|
|
|
bytes_read += 1
|
2010-02-16 04:09:07 +00:00
|
|
|
if not ch:
|
|
|
|
break
|
|
|
|
else:
|
|
|
|
result += ch
|
|
|
|
if ch == '\n':
|
|
|
|
break
|
|
|
|
return result
|
|
|
|
|
|
|
|
|
2011-08-03 10:38:23 +00:00
|
|
|
class RequestReplayThread(threading.Thread):
|
2012-02-18 01:45:22 +00:00
|
|
|
def __init__(self, config, flow, masterq):
|
|
|
|
self.config, self.flow, self.masterq = config, flow, masterq
|
2011-08-03 10:38:23 +00:00
|
|
|
threading.Thread.__init__(self)
|
|
|
|
|
|
|
|
def run(self):
|
|
|
|
try:
|
2012-06-09 20:13:50 +00:00
|
|
|
r = self.flow.request
|
|
|
|
server = ServerConnection(self.config, r.scheme, r.host, r.port)
|
|
|
|
server.send(r)
|
|
|
|
response = server.read_response(r)
|
2011-08-03 11:02:33 +00:00
|
|
|
response._send(self.masterq)
|
2011-08-03 10:38:23 +00:00
|
|
|
except ProxyError, v:
|
|
|
|
err = flow.Error(self.flow.request, v.msg)
|
2011-08-03 11:02:33 +00:00
|
|
|
err._send(self.masterq)
|
2011-08-03 10:38:23 +00:00
|
|
|
|
2011-02-02 23:16:03 +00:00
|
|
|
|
2010-02-16 04:09:07 +00:00
|
|
|
class ServerConnection:
|
2012-06-09 20:13:50 +00:00
|
|
|
def __init__(self, config, scheme, host, port):
|
|
|
|
self.config, self.scheme, self.host, self.port = config, scheme, host, port
|
2012-04-02 04:19:00 +00:00
|
|
|
self.cert = None
|
2012-04-23 21:43:14 +00:00
|
|
|
self.sock, self.rfile, self.wfile = None, None, None
|
2010-02-16 04:09:07 +00:00
|
|
|
self.connect()
|
2012-06-10 04:02:48 +00:00
|
|
|
self.requestcount = 0
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
def connect(self):
|
|
|
|
try:
|
2010-11-12 15:01:17 +00:00
|
|
|
addr = socket.gethostbyname(self.host)
|
2010-02-16 04:09:07 +00:00
|
|
|
server = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
|
2010-11-12 15:01:17 +00:00
|
|
|
if self.scheme == "https":
|
2012-05-23 21:09:03 +00:00
|
|
|
if self.config.clientcerts:
|
|
|
|
clientcert = os.path.join(self.config.clientcerts, self.host) + ".pem"
|
|
|
|
if not os.path.exists(clientcert):
|
|
|
|
clientcert = None
|
|
|
|
else:
|
|
|
|
clientcert = None
|
|
|
|
server = ssl.wrap_socket(server, certfile = clientcert)
|
2010-11-12 15:01:17 +00:00
|
|
|
server.connect((addr, self.port))
|
2012-04-02 04:19:00 +00:00
|
|
|
if self.scheme == "https":
|
|
|
|
self.cert = server.getpeercert(True)
|
2010-02-16 04:09:07 +00:00
|
|
|
except socket.error, err:
|
2011-09-09 02:49:34 +00:00
|
|
|
raise ProxyError(502, 'Error connecting to "%s": %s' % (self.host, err))
|
2012-04-23 21:43:14 +00:00
|
|
|
self.sock = server
|
2010-02-16 04:09:07 +00:00
|
|
|
self.rfile, self.wfile = server.makefile('rb'), server.makefile('wb')
|
|
|
|
|
2012-06-09 20:13:50 +00:00
|
|
|
def send(self, request):
|
2012-06-10 04:02:48 +00:00
|
|
|
self.requestcount += 1
|
2010-02-16 04:09:07 +00:00
|
|
|
try:
|
2012-06-09 20:13:50 +00:00
|
|
|
d = request._assemble()
|
2012-05-16 03:42:58 +00:00
|
|
|
if not d:
|
|
|
|
raise ProxyError(502, "Incomplete request could not not be readied for transmission.")
|
|
|
|
self.wfile.write(d)
|
2010-02-16 04:09:07 +00:00
|
|
|
self.wfile.flush()
|
|
|
|
except socket.error, err:
|
2012-06-09 20:13:50 +00:00
|
|
|
raise ProxyError(502, 'Error sending data to "%s": %s' % (request.host, err))
|
2010-02-16 04:09:07 +00:00
|
|
|
|
2012-06-09 20:13:50 +00:00
|
|
|
def read_response(self, request):
|
2010-11-12 15:01:17 +00:00
|
|
|
line = self.rfile.readline()
|
|
|
|
if line == "\r\n" or line == "\n": # Possible leftover from previous message
|
|
|
|
line = self.rfile.readline()
|
|
|
|
if not line:
|
|
|
|
raise ProxyError(502, "Blank server response.")
|
|
|
|
parts = line.strip().split(" ", 2)
|
2011-09-25 21:44:43 +00:00
|
|
|
if len(parts) == 2: # handle missing message gracefully
|
|
|
|
parts.append("")
|
2010-02-16 04:09:07 +00:00
|
|
|
if not len(parts) == 3:
|
2010-11-12 15:01:17 +00:00
|
|
|
raise ProxyError(502, "Invalid server response: %s."%line)
|
2010-02-16 04:09:07 +00:00
|
|
|
proto, code, msg = parts
|
2012-06-10 01:27:43 +00:00
|
|
|
httpversion = parse_http_protocol(proto)
|
|
|
|
if httpversion is None:
|
|
|
|
raise ProxyError(502, "Invalid HTTP version: %s."%httpversion)
|
2011-09-04 19:47:47 +00:00
|
|
|
try:
|
|
|
|
code = int(code)
|
|
|
|
except ValueError:
|
|
|
|
raise ProxyError(502, "Invalid server response: %s."%line)
|
2012-02-19 21:34:32 +00:00
|
|
|
headers = read_headers(self.rfile)
|
2010-11-12 15:01:17 +00:00
|
|
|
if code >= 100 and code <= 199:
|
|
|
|
return self.read_response()
|
2012-06-09 20:13:50 +00:00
|
|
|
if request.method == "HEAD" or code == 204 or code == 304:
|
2011-02-16 03:43:35 +00:00
|
|
|
content = ""
|
2010-02-16 04:09:07 +00:00
|
|
|
else:
|
2012-06-10 04:49:59 +00:00
|
|
|
content = read_http_body(self.rfile, headers, True, self.config.body_size_limit)
|
2012-06-10 01:27:43 +00:00
|
|
|
return flow.Response(request, httpversion, code, msg, headers, content, self.cert)
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
def terminate(self):
|
|
|
|
try:
|
|
|
|
if not self.wfile.closed:
|
|
|
|
self.wfile.flush()
|
2012-04-23 21:43:14 +00:00
|
|
|
self.sock.close()
|
2010-02-16 04:09:07 +00:00
|
|
|
except IOError:
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
|
|
|
class ProxyHandler(SocketServer.StreamRequestHandler):
|
2011-02-19 23:53:42 +00:00
|
|
|
def __init__(self, config, request, client_address, server, q):
|
2010-02-16 04:09:07 +00:00
|
|
|
self.mqueue = q
|
2012-06-10 04:02:48 +00:00
|
|
|
self.config = config
|
2012-06-09 22:10:46 +00:00
|
|
|
self.server_conn = None
|
2012-06-10 04:02:48 +00:00
|
|
|
self.proxy_connect_state = None
|
2010-02-16 04:09:07 +00:00
|
|
|
SocketServer.StreamRequestHandler.__init__(self, request, client_address, server)
|
|
|
|
|
|
|
|
def handle(self):
|
2011-08-03 10:38:23 +00:00
|
|
|
cc = flow.ClientConnect(self.client_address)
|
2011-08-03 11:02:33 +00:00
|
|
|
cc._send(self.mqueue)
|
2012-06-10 04:02:48 +00:00
|
|
|
while self.handle_request(cc) and not cc.close:
|
|
|
|
pass
|
|
|
|
cc.close = True
|
2011-08-03 10:38:23 +00:00
|
|
|
cd = flow.ClientDisconnect(cc)
|
2011-08-03 11:02:33 +00:00
|
|
|
cd._send(self.mqueue)
|
2010-11-12 15:01:17 +00:00
|
|
|
self.finish()
|
|
|
|
|
2012-06-10 04:02:48 +00:00
|
|
|
def server_connect(self, scheme, host, port):
|
|
|
|
sc = self.server_conn
|
|
|
|
if sc and (scheme, host, port) != (sc.scheme, sc.host, sc.port):
|
|
|
|
sc.terminate()
|
|
|
|
self.server_conn = None
|
|
|
|
if not self.server_conn:
|
|
|
|
self.server_conn = ServerConnection(self.config, scheme, host, port)
|
|
|
|
|
2010-11-12 15:01:17 +00:00
|
|
|
def handle_request(self, cc):
|
2010-02-16 04:09:07 +00:00
|
|
|
try:
|
2012-06-10 04:02:48 +00:00
|
|
|
request, err = None, None
|
2011-07-23 01:37:06 +00:00
|
|
|
try:
|
|
|
|
request = self.read_request(cc)
|
|
|
|
except IOError, v:
|
|
|
|
raise IOError, "Reading request: %s"%v
|
2010-11-12 15:01:17 +00:00
|
|
|
if request is None:
|
|
|
|
return
|
2011-07-23 01:37:06 +00:00
|
|
|
cc.requestcount += 1
|
2011-02-16 09:37:04 +00:00
|
|
|
|
2012-04-23 21:43:14 +00:00
|
|
|
app = self.server.apps.get(request)
|
|
|
|
if app:
|
|
|
|
app.serve(request, self.wfile)
|
2010-11-12 12:18:42 +00:00
|
|
|
else:
|
2012-04-23 21:43:14 +00:00
|
|
|
request = request._send(self.mqueue)
|
|
|
|
if request is None:
|
|
|
|
return
|
|
|
|
|
|
|
|
if isinstance(request, flow.Response):
|
|
|
|
response = request
|
|
|
|
request = False
|
|
|
|
response = response._send(self.mqueue)
|
|
|
|
else:
|
2012-06-09 20:13:50 +00:00
|
|
|
if self.config.reverse_proxy:
|
|
|
|
scheme, host, port = self.config.reverse_proxy
|
|
|
|
else:
|
2012-06-09 22:10:46 +00:00
|
|
|
scheme, host, port = request.scheme, request.host, request.port
|
2012-06-10 04:02:48 +00:00
|
|
|
self.server_connect(scheme, host, port)
|
|
|
|
self.server_conn.send(request)
|
2012-04-23 21:43:14 +00:00
|
|
|
try:
|
2012-06-10 04:02:48 +00:00
|
|
|
response = self.server_conn.read_response(request)
|
2012-04-23 21:43:14 +00:00
|
|
|
except IOError, v:
|
|
|
|
raise IOError, "Reading response: %s"%v
|
|
|
|
response = response._send(self.mqueue)
|
|
|
|
if response is None:
|
2012-06-10 04:02:48 +00:00
|
|
|
self.server_conn.terminate()
|
2010-11-12 12:18:42 +00:00
|
|
|
if response is None:
|
2012-04-23 21:43:14 +00:00
|
|
|
return
|
|
|
|
self.send_response(response)
|
2012-06-10 04:49:59 +00:00
|
|
|
if request_connection_close(request.httpversion, request.headers):
|
|
|
|
return
|
|
|
|
# We could keep the client connection when the server
|
|
|
|
# connection needs to go away. However, we want to mimic
|
|
|
|
# behaviour as closely as possible to the client, so we
|
|
|
|
# disconnect.
|
|
|
|
if response_connection_close(response.httpversion, response.headers):
|
2012-06-10 04:02:48 +00:00
|
|
|
return
|
2011-07-23 01:37:06 +00:00
|
|
|
except IOError, v:
|
|
|
|
cc.connection_error = v
|
2010-02-16 04:09:07 +00:00
|
|
|
except ProxyError, e:
|
2011-07-23 01:37:06 +00:00
|
|
|
cc.connection_error = "%s: %s"%(e.code, e.msg)
|
|
|
|
if request:
|
2011-08-03 10:38:23 +00:00
|
|
|
err = flow.Error(request, e.msg)
|
2011-08-03 11:02:33 +00:00
|
|
|
err._send(self.mqueue)
|
2011-07-23 01:37:06 +00:00
|
|
|
self.send_error(e.code, e.msg)
|
2012-06-10 04:02:48 +00:00
|
|
|
else:
|
|
|
|
return True
|
2010-02-16 04:09:07 +00:00
|
|
|
|
2012-02-27 02:05:45 +00:00
|
|
|
def find_cert(self, host, port):
|
2011-02-19 23:53:42 +00:00
|
|
|
if self.config.certfile:
|
|
|
|
return self.config.certfile
|
2011-02-08 17:00:59 +00:00
|
|
|
else:
|
2012-02-27 02:05:45 +00:00
|
|
|
sans = []
|
2012-02-27 22:37:48 +00:00
|
|
|
if self.config.upstream_cert:
|
2012-03-04 21:22:47 +00:00
|
|
|
cert = certutils.get_remote_cert(host, port)
|
|
|
|
sans = cert.altnames
|
|
|
|
host = cert.cn
|
2012-02-29 00:20:53 +00:00
|
|
|
ret = certutils.dummy_cert(self.config.certdir, self.config.cacert, host, sans)
|
2011-06-27 04:10:17 +00:00
|
|
|
time.sleep(self.config.cert_wait_time)
|
2011-02-19 23:53:42 +00:00
|
|
|
if not ret:
|
2011-09-09 02:49:34 +00:00
|
|
|
raise ProxyError(502, "mitmproxy: Unable to generate dummy cert.")
|
2011-02-19 23:53:42 +00:00
|
|
|
return ret
|
2011-02-08 17:00:59 +00:00
|
|
|
|
2012-06-03 08:54:11 +00:00
|
|
|
def convert_to_ssl(self, cert):
|
2012-06-13 06:16:47 +00:00
|
|
|
ctx = SSL.Context(SSL.SSLv23_METHOD)
|
|
|
|
ctx.use_privatekey_file(self.config.certfile or self.config.cacert)
|
|
|
|
ctx.use_certificate_file(cert)
|
|
|
|
self.connection = SSL.Connection(ctx, self.connection)
|
|
|
|
self.connection.set_accept_state()
|
|
|
|
#kwargs = dict(
|
|
|
|
# certfile = cert,
|
|
|
|
# keyfile = self.config.certfile or self.config.cacert,
|
|
|
|
# server_side = True,
|
|
|
|
# ssl_version = ssl.PROTOCOL_SSLv23,
|
|
|
|
# do_handshake_on_connect = True,
|
|
|
|
#)
|
|
|
|
#if sys.version_info[1] > 6:
|
|
|
|
# kwargs["ciphers"] = self.config.ciphers
|
|
|
|
#self.connection = ssl.wrap_socket(self.connection, **kwargs)
|
2012-06-03 08:54:11 +00:00
|
|
|
self.rfile = FileLike(self.connection)
|
|
|
|
self.wfile = FileLike(self.connection)
|
|
|
|
|
2011-02-03 01:51:32 +00:00
|
|
|
def read_request(self, client_conn):
|
2010-11-12 15:01:17 +00:00
|
|
|
line = self.rfile.readline()
|
|
|
|
if line == "\r\n" or line == "\n": # Possible leftover from previous message
|
|
|
|
line = self.rfile.readline()
|
|
|
|
if line == "":
|
|
|
|
return None
|
2012-06-09 09:27:43 +00:00
|
|
|
|
|
|
|
if self.config.reverse_proxy:
|
|
|
|
scheme, host, port = self.config.reverse_proxy
|
2012-06-09 22:31:04 +00:00
|
|
|
method, path, httpversion = parse_init_http(line)
|
2012-06-09 09:27:43 +00:00
|
|
|
headers = read_headers(self.rfile)
|
2012-06-10 04:02:48 +00:00
|
|
|
content = read_http_body_request(
|
2012-06-10 04:49:59 +00:00
|
|
|
self.rfile, self.wfile, headers, httpversion, self.config.body_size_limit
|
2012-06-10 04:02:48 +00:00
|
|
|
)
|
2012-06-09 22:46:22 +00:00
|
|
|
return flow.Request(client_conn, httpversion, host, port, "http", method, path, headers, content)
|
2012-06-09 09:27:43 +00:00
|
|
|
else:
|
2012-06-10 04:02:48 +00:00
|
|
|
if line.startswith("CONNECT"):
|
|
|
|
host, port, httpversion = parse_init_connect(line)
|
|
|
|
# FIXME: Discard additional headers sent to the proxy. Should I expose
|
|
|
|
# these to users?
|
|
|
|
while 1:
|
|
|
|
d = self.rfile.readline()
|
|
|
|
if d == '\r\n' or d == '\n':
|
|
|
|
break
|
|
|
|
self.wfile.write(
|
|
|
|
'HTTP/1.1 200 Connection established\r\n' +
|
|
|
|
('Proxy-agent: %s\r\n'%version.NAMEVERSION) +
|
|
|
|
'\r\n'
|
|
|
|
)
|
|
|
|
self.wfile.flush()
|
|
|
|
certfile = self.find_cert(host, port)
|
|
|
|
self.convert_to_ssl(certfile)
|
|
|
|
self.proxy_connect_state = (host, port, httpversion)
|
|
|
|
line = self.rfile.readline(line)
|
|
|
|
|
|
|
|
if self.proxy_connect_state:
|
|
|
|
host, port, httpversion = self.proxy_connect_state
|
|
|
|
method, path, httpversion = parse_init_http(line)
|
|
|
|
headers = read_headers(self.rfile)
|
|
|
|
content = read_http_body_request(
|
2012-06-10 04:49:59 +00:00
|
|
|
self.rfile, self.wfile, headers, httpversion, self.config.body_size_limit
|
2012-06-10 04:02:48 +00:00
|
|
|
)
|
|
|
|
return flow.Request(client_conn, httpversion, host, port, "https", method, path, headers, content)
|
|
|
|
else:
|
|
|
|
method, scheme, host, port, path, httpversion = parse_init_proxy(line)
|
|
|
|
headers = read_headers(self.rfile)
|
|
|
|
content = read_http_body_request(
|
2012-06-10 04:49:59 +00:00
|
|
|
self.rfile, self.wfile, headers, httpversion, self.config.body_size_limit
|
2012-06-10 04:02:48 +00:00
|
|
|
)
|
|
|
|
return flow.Request(client_conn, httpversion, host, port, scheme, method, path, headers, content)
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
def send_response(self, response):
|
2012-05-16 03:42:58 +00:00
|
|
|
d = response._assemble()
|
|
|
|
if not d:
|
|
|
|
raise ProxyError(502, "Incomplete response could not not be readied for transmission.")
|
|
|
|
self.wfile.write(d)
|
2010-02-16 04:09:07 +00:00
|
|
|
self.wfile.flush()
|
|
|
|
|
|
|
|
def terminate(self, connection, wfile, rfile):
|
2011-01-27 00:32:24 +00:00
|
|
|
self.request.close()
|
2010-02-16 04:09:07 +00:00
|
|
|
try:
|
|
|
|
if not getattr(wfile, "closed", False):
|
|
|
|
wfile.flush()
|
|
|
|
connection.close()
|
|
|
|
except IOError:
|
|
|
|
pass
|
|
|
|
|
|
|
|
def finish(self):
|
|
|
|
self.terminate(self.connection, self.wfile, self.rfile)
|
|
|
|
|
|
|
|
def send_error(self, code, body):
|
2011-01-27 01:19:48 +00:00
|
|
|
try:
|
|
|
|
import BaseHTTPServer
|
|
|
|
response = BaseHTTPServer.BaseHTTPRequestHandler.responses[code][0]
|
2010-11-12 15:01:17 +00:00
|
|
|
self.wfile.write("HTTP/1.1 %s %s\r\n" % (code, response))
|
2012-04-23 21:43:14 +00:00
|
|
|
self.wfile.write("Server: %s\r\n"%version.NAMEVERSION)
|
2010-11-12 15:01:17 +00:00
|
|
|
self.wfile.write("Connection: close\r\n")
|
2011-01-27 01:19:48 +00:00
|
|
|
self.wfile.write("Content-type: text/html\r\n")
|
|
|
|
self.wfile.write("\r\n")
|
|
|
|
self.wfile.write('<html><head>\n<title>%d %s</title>\n</head>\n'
|
|
|
|
'<body>\n%s\n</body>\n</html>' % (code, response, body))
|
|
|
|
self.wfile.flush()
|
2011-06-23 05:00:55 +00:00
|
|
|
except:
|
2011-01-27 01:19:48 +00:00
|
|
|
pass
|
2010-02-16 04:09:07 +00:00
|
|
|
|
|
|
|
|
2011-03-12 00:47:37 +00:00
|
|
|
class ProxyServerError(Exception): pass
|
|
|
|
|
2010-02-16 04:09:07 +00:00
|
|
|
ServerBase = SocketServer.ThreadingTCPServer
|
2011-02-10 01:56:14 +00:00
|
|
|
ServerBase.daemon_threads = True # Terminate workers when main thread terminates
|
2010-02-16 04:09:07 +00:00
|
|
|
class ProxyServer(ServerBase):
|
2011-01-27 01:19:48 +00:00
|
|
|
request_queue_size = 20
|
2010-02-16 04:09:07 +00:00
|
|
|
allow_reuse_address = True
|
2012-04-02 01:24:51 +00:00
|
|
|
bound = True
|
2011-02-19 23:53:42 +00:00
|
|
|
def __init__(self, config, port, address=''):
|
2011-03-12 00:47:37 +00:00
|
|
|
"""
|
|
|
|
Raises ProxyServerError if there's a startup problem.
|
|
|
|
"""
|
2011-02-19 23:53:42 +00:00
|
|
|
self.config, self.port, self.address = config, port, address
|
2011-03-12 00:47:37 +00:00
|
|
|
try:
|
|
|
|
ServerBase.__init__(self, (address, port), ProxyHandler)
|
|
|
|
except socket.error, v:
|
|
|
|
raise ProxyServerError('Error starting proxy server: ' + v.strerror)
|
2010-02-16 04:09:07 +00:00
|
|
|
self.masterq = None
|
2011-02-20 00:29:41 +00:00
|
|
|
self.certdir = tempfile.mkdtemp(prefix="mitmproxy")
|
|
|
|
config.certdir = self.certdir
|
2012-04-23 21:43:14 +00:00
|
|
|
self.apps = wsgi.AppRegistry()
|
2010-02-16 04:09:07 +00:00
|
|
|
|
2012-04-02 01:24:51 +00:00
|
|
|
def start_slave(self, klass, masterq):
|
|
|
|
slave = klass(masterq, self)
|
|
|
|
slave.start()
|
|
|
|
|
2010-02-16 04:09:07 +00:00
|
|
|
def set_mqueue(self, q):
|
|
|
|
self.masterq = q
|
|
|
|
|
|
|
|
def finish_request(self, request, client_address):
|
2011-02-19 23:53:42 +00:00
|
|
|
self.RequestHandlerClass(self.config, request, client_address, self, self.masterq)
|
2010-02-16 04:09:07 +00:00
|
|
|
|
2011-02-19 23:12:55 +00:00
|
|
|
def shutdown(self):
|
|
|
|
ServerBase.shutdown(self)
|
2011-09-10 21:06:46 +00:00
|
|
|
try:
|
|
|
|
shutil.rmtree(self.certdir)
|
|
|
|
except OSError:
|
|
|
|
pass
|
2011-02-19 23:12:55 +00:00
|
|
|
|
2011-02-19 23:53:42 +00:00
|
|
|
|
2012-04-02 01:24:51 +00:00
|
|
|
class DummyServer:
|
|
|
|
bound = False
|
|
|
|
def __init__(self, config):
|
|
|
|
self.config = config
|
|
|
|
|
|
|
|
def start_slave(self, klass, masterq):
|
|
|
|
pass
|
|
|
|
|
|
|
|
def shutdown(self):
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
2011-02-19 23:53:42 +00:00
|
|
|
# Command-line utils
|
|
|
|
def certificate_option_group(parser):
|
|
|
|
group = optparse.OptionGroup(parser, "SSL")
|
|
|
|
group.add_option(
|
|
|
|
"--cert", action="store",
|
|
|
|
type = "str", dest="cert", default=None,
|
|
|
|
help = "User-created SSL certificate file."
|
|
|
|
)
|
|
|
|
group.add_option(
|
|
|
|
"--ciphers", action="store",
|
|
|
|
type = "str", dest="ciphers", default=None,
|
|
|
|
help = "SSL ciphers."
|
|
|
|
)
|
2012-05-23 21:09:03 +00:00
|
|
|
group.add_option(
|
|
|
|
"--client-certs", action="store",
|
|
|
|
type = "str", dest = "clientcerts", default=None,
|
|
|
|
help = "Client certificate directory."
|
|
|
|
)
|
2011-02-19 23:53:42 +00:00
|
|
|
parser.add_option_group(group)
|
|
|
|
|
|
|
|
|
2011-09-09 03:27:31 +00:00
|
|
|
def process_proxy_options(parser, options):
|
2011-02-19 23:53:42 +00:00
|
|
|
if options.cert:
|
|
|
|
options.cert = os.path.expanduser(options.cert)
|
|
|
|
if not os.path.exists(options.cert):
|
|
|
|
parser.error("Manually created certificate does not exist: %s"%options.cert)
|
2011-03-18 03:45:31 +00:00
|
|
|
|
|
|
|
cacert = os.path.join(options.confdir, "mitmproxy-ca.pem")
|
|
|
|
cacert = os.path.expanduser(cacert)
|
|
|
|
if not os.path.exists(cacert):
|
2012-02-29 00:20:53 +00:00
|
|
|
certutils.dummy_ca(cacert)
|
2011-02-19 23:53:42 +00:00
|
|
|
if getattr(options, "cache", None) is not None:
|
|
|
|
options.cache = os.path.expanduser(options.cache)
|
2011-09-09 03:27:31 +00:00
|
|
|
body_size_limit = utils.parse_size(options.body_size_limit)
|
2012-02-18 01:45:22 +00:00
|
|
|
|
|
|
|
if options.reverse_proxy:
|
|
|
|
rp = utils.parse_proxy_spec(options.reverse_proxy)
|
|
|
|
if not rp:
|
|
|
|
parser.error("Invalid reverse proxy specification: %s"%options.reverse_proxy)
|
|
|
|
else:
|
|
|
|
rp = None
|
|
|
|
|
2012-05-23 21:09:03 +00:00
|
|
|
if options.clientcerts:
|
|
|
|
options.clientcerts = os.path.expanduser(options.clientcerts)
|
|
|
|
if not os.path.exists(options.clientcerts) or not os.path.isdir(options.clientcerts):
|
|
|
|
parser.error("Client certificate directory does not exist or is not a directory: %s"%options.clientcerts)
|
|
|
|
|
2011-09-09 02:49:34 +00:00
|
|
|
return ProxyConfig(
|
2011-02-19 23:53:42 +00:00
|
|
|
certfile = options.cert,
|
2011-03-18 03:45:31 +00:00
|
|
|
cacert = cacert,
|
2012-05-23 21:09:03 +00:00
|
|
|
clientcerts = options.clientcerts,
|
2011-06-27 04:10:17 +00:00
|
|
|
ciphers = options.ciphers,
|
2011-09-09 03:27:31 +00:00
|
|
|
cert_wait_time = options.cert_wait_time,
|
2012-02-16 14:33:27 +00:00
|
|
|
body_size_limit = body_size_limit,
|
2012-02-27 22:37:48 +00:00
|
|
|
upstream_cert = options.upstream_cert,
|
2012-02-18 01:45:22 +00:00
|
|
|
reverse_proxy = rp
|
2011-02-19 23:53:42 +00:00
|
|
|
)
|