mitmproxy/netlib/wsgi.py

164 lines
5.5 KiB
Python
Raw Normal View History

2014-08-16 13:53:07 +00:00
from __future__ import (absolute_import, print_function, division)
2015-09-20 22:44:17 +00:00
from io import BytesIO, StringIO
import urllib
import time
import traceback
2015-09-20 16:12:55 +00:00
import six
2015-09-20 22:44:17 +00:00
from six.moves import urllib
2015-09-20 16:12:55 +00:00
2015-09-20 22:44:17 +00:00
from netlib.utils import always_bytes, native
2015-09-05 16:15:47 +00:00
from . import http, tcp
2012-06-18 22:42:25 +00:00
2015-04-09 00:09:33 +00:00
class ClientConn(object):
def __init__(self, address):
self.address = tcp.Address.wrap(address)
2015-04-09 00:09:33 +00:00
class Flow(object):
def __init__(self, address, request):
self.client_conn = ClientConn(address)
self.request = request
2015-04-09 00:09:33 +00:00
class Request(object):
2015-09-20 22:44:17 +00:00
def __init__(self, scheme, method, path, http_version, headers, body):
self.scheme, self.method, self.path = scheme, method, path
2015-07-19 16:17:30 +00:00
self.headers, self.body = headers, body
2015-09-20 22:44:17 +00:00
self.http_version = http_version
2012-06-18 22:42:25 +00:00
def date_time_string():
"""Return the current date and time formatted for a message header."""
WEEKS = ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun']
MONTHS = [
None,
'Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun',
'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'
]
2012-06-18 22:42:25 +00:00
now = time.time()
2015-06-18 13:32:52 +00:00
year, month, day, hh, mm, ss, wd, y_, z_ = time.gmtime(now)
2012-06-18 22:42:25 +00:00
s = "%s, %02d %3s %4d %02d:%02d:%02d GMT" % (
WEEKS[wd],
day, MONTHS[month], year,
hh, mm, ss
)
2012-06-18 22:42:25 +00:00
return s
2015-04-09 00:09:33 +00:00
class WSGIAdaptor(object):
2012-06-18 22:42:25 +00:00
def __init__(self, app, domain, port, sversion):
self.app, self.domain, self.port, self.sversion = app, domain, port, sversion
def make_environ(self, flow, errsoc, **extra):
2015-09-20 22:44:17 +00:00
path = native(flow.request.path)
if '?' in path:
path_info, query = native(path).split('?', 1)
2012-06-18 22:42:25 +00:00
else:
2015-09-20 22:44:17 +00:00
path_info = path
2012-06-18 22:42:25 +00:00
query = ''
environ = {
'wsgi.version': (1, 0),
2015-09-20 22:44:17 +00:00
'wsgi.url_scheme': native(flow.request.scheme),
2015-09-20 16:12:55 +00:00
'wsgi.input': BytesIO(flow.request.body or b""),
'wsgi.errors': errsoc,
'wsgi.multithread': True,
'wsgi.multiprocess': False,
'wsgi.run_once': False,
'SERVER_SOFTWARE': self.sversion,
2015-09-20 22:44:17 +00:00
'REQUEST_METHOD': native(flow.request.method),
'SCRIPT_NAME': '',
2015-09-20 22:44:17 +00:00
'PATH_INFO': urllib.parse.unquote(path_info),
'QUERY_STRING': query,
2015-09-20 22:44:17 +00:00
'CONTENT_TYPE': native(flow.request.headers.get('Content-Type', '')),
'CONTENT_LENGTH': native(flow.request.headers.get('Content-Length', '')),
'SERVER_NAME': self.domain,
'SERVER_PORT': str(self.port),
2015-09-20 22:44:17 +00:00
'SERVER_PROTOCOL': native(flow.request.http_version),
2012-06-18 22:42:25 +00:00
}
environ.update(extra)
if flow.client_conn.address:
2015-09-20 22:44:17 +00:00
environ["REMOTE_ADDR"] = native(flow.client_conn.address.host)
environ["REMOTE_PORT"] = flow.client_conn.address.port
2012-06-18 22:42:25 +00:00
for key, value in flow.request.headers.items():
2015-09-20 22:44:17 +00:00
key = 'HTTP_' + native(key).upper().replace('-', '_')
2012-06-18 22:42:25 +00:00
if key not in ('HTTP_CONTENT_TYPE', 'HTTP_CONTENT_LENGTH'):
environ[key] = value
return environ
def error_page(self, soc, headers_sent, s):
"""
Make a best-effort attempt to write an error page. If headers are
already sent, we just bung the error into the page.
"""
2015-09-20 16:12:55 +00:00
c = b"""
2012-06-18 22:42:25 +00:00
<html>
<h1>Internal Server Error</h1>
<pre>%s"</pre>
</html>
2015-09-20 22:44:17 +00:00
""".strip() % s.encode()
2012-06-18 22:42:25 +00:00
if not headers_sent:
2015-09-20 16:12:55 +00:00
soc.write(b"HTTP/1.1 500 Internal Server Error\r\n")
soc.write(b"Content-Type: text/html\r\n")
soc.write(b"Content-Length: %s\r\n" % len(c))
soc.write(b"\r\n")
2012-06-18 22:42:25 +00:00
soc.write(c)
def serve(self, request, soc, **env):
2012-06-18 22:42:25 +00:00
state = dict(
response_started=False,
headers_sent=False,
status=None,
headers=None
2012-06-18 22:42:25 +00:00
)
2012-06-18 22:42:25 +00:00
def write(data):
if not state["headers_sent"]:
2015-09-20 22:44:17 +00:00
soc.write(b"HTTP/1.1 %s\r\n" % state["status"].encode())
2015-09-05 16:15:47 +00:00
headers = state["headers"]
if 'server' not in headers:
headers["Server"] = self.sversion
if 'date' not in headers:
headers["Date"] = date_time_string()
2015-09-20 16:12:55 +00:00
soc.write(bytes(headers))
soc.write(b"\r\n")
2012-06-18 22:42:25 +00:00
state["headers_sent"] = True
2012-06-26 02:49:23 +00:00
if data:
soc.write(data)
2012-06-18 22:42:25 +00:00
soc.flush()
def start_response(status, headers, exc_info=None):
if exc_info:
2015-09-20 22:44:17 +00:00
if state["headers_sent"]:
six.reraise(*exc_info)
2012-06-18 22:42:25 +00:00
elif state["status"]:
raise AssertionError('Response already started')
state["status"] = status
2015-09-20 22:44:17 +00:00
state["headers"] = http.Headers([[always_bytes(k), always_bytes(v)] for k,v in headers])
if exc_info:
self.error_page(soc, state["headers_sent"], traceback.format_tb(exc_info[2]))
state["headers_sent"] = True
2012-06-18 22:42:25 +00:00
2015-09-20 22:44:17 +00:00
errs = six.BytesIO()
2012-06-18 22:42:25 +00:00
try:
dataiter = self.app(
self.make_environ(request, errs, **env), start_response
)
2012-06-18 22:42:25 +00:00
for i in dataiter:
write(i)
if not state["headers_sent"]:
2015-09-20 16:12:55 +00:00
write(b"")
2015-09-05 16:15:47 +00:00
except Exception as e:
2012-06-18 22:42:25 +00:00
try:
s = traceback.format_exc()
2015-09-20 22:44:17 +00:00
errs.write(s.encode("utf-8", "replace"))
2012-06-18 22:42:25 +00:00
self.error_page(soc, state["headers_sent"], s)
except Exception: # pragma: no cover
pass
2012-06-18 22:42:25 +00:00
return errs.getvalue()