mitmproxy/test/http/http1/test_protocol.py

467 lines
14 KiB
Python
Raw Normal View History

2015-09-15 17:12:15 +00:00
from io import BytesIO
2015-04-20 23:19:00 +00:00
import textwrap
2015-09-15 17:12:15 +00:00
from http.http1.protocol import _parse_authority_form
from netlib.exceptions import HttpSyntaxException, HttpReadDisconnect, HttpException
2012-06-18 21:42:32 +00:00
2015-09-15 17:12:15 +00:00
from netlib import http, tcp, tutils
2015-09-05 16:15:47 +00:00
from netlib.http import semantics, Headers
2015-09-15 17:12:15 +00:00
from netlib.http.http1 import HTTP1Protocol, read_message_body, read_request, \
read_message_body_chunked, expected_http_body_size
2015-08-01 12:49:15 +00:00
from ... import tservers
2012-06-23 03:07:42 +00:00
2015-08-05 19:32:53 +00:00
class NoContentLengthHTTPHandler(tcp.BaseHandler):
    """Connection handler that answers with a response lacking Content-Length.

    The reply is a bare status line, the empty line that closes the header
    section, and then raw payload bytes with no announced length.
    """

    def handle(self):
        # Everything after the first empty line is payload.
        reply = "HTTP/1.1 200 OK\r\n\r\nbar\r\n\r\n"
        self.wfile.write(reply)
        self.wfile.flush()
def mock_protocol(data=b''):
    """Build an HTTP1Protocol wired to in-memory streams.

    `data` is the content made available on the read side; the write side
    starts out empty.

    The default is a bytes literal because io.BytesIO rejects text as initial
    content on Python 3. On Python 2, b'' and '' are the same value, so
    existing callers are unaffected.
    """
    rfile = BytesIO(data)
    wfile = BytesIO()
    return HTTP1Protocol(rfile=rfile, wfile=wfile)
2015-07-16 20:56:34 +00:00
2015-08-05 19:32:53 +00:00
def match_http_string(data):
    """Convert an indented, LF-separated literal into a CRLF-separated string.

    Common leading indentation is removed, surrounding whitespace is stripped,
    and every remaining newline becomes CRLF.
    """
    trimmed = textwrap.dedent(data).strip()
    return '\r\n'.join(trimmed.split('\n'))
def test_stripped_chunked_encoding_no_content():
    """
    Messages with empty content that are flagged as chunked must still be
    assembled with a Content-Length header.

    https://github.com/mitmproxy/mitmproxy/issues/186
    """
    request = tutils.treq(content="")
    request.headers["Transfer-Encoding"] = "chunked"
    request_head = mock_protocol()._assemble_request_headers(request)
    assert "Content-Length" in request_head

    response = tutils.tresp(content="")
    response.headers["Transfer-Encoding"] = "chunked"
    response_head = mock_protocol()._assemble_response_headers(response)
    assert "Content-Length" in response_head
2015-07-16 20:56:34 +00:00
2012-06-18 21:42:32 +00:00
def test_read_chunked():
    """Feed well-formed and broken chunked bodies to read_message_body."""
    req = tutils.treq(None)
    req.headers["Transfer-Encoding"] = "chunked"

    def read(raw, **kwargs):
        # Each call gets a fresh stream so the cases cannot affect each other.
        return read_message_body(BytesIO(raw), req, **kwargs)

    # Last chunk present, but the closing empty line is missing.
    with tutils.raises(HttpSyntaxException):
        read(b"1\r\na\r\n0\r\n")

    # Single chunk, correctly terminated.
    assert read(b"1\r\na\r\n0\r\n\r\n") == b"a"

    # Leading empty lines followed by two chunks.
    assert read(b"\r\n\r\n1\r\na\r\n1\r\nb\r\n0\r\n\r\n") == b"ab"

    # Stream ends before any chunk arrives.
    with tutils.raises("closed prematurely"):
        read(b"\r\n")

    # Chunk data longer than the announced size.
    with tutils.raises("malformed chunked body"):
        read(b"1\r\nfoo")

    # Chunk size is not a number.
    with tutils.raises(HttpSyntaxException):
        read(b"foo\r\nfoo")

    # Body exceeds the caller-supplied limit.
    with tutils.raises("too large"):
        read(b"5\r\naaaaa\r\n0\r\n\r\n", limit=2)
2013-11-19 03:11:24 +00:00
def test_connection_close():
    """Check connection_close against the HTTP version and Connection header.

    With no Connection header, (1, 0) is reported as closing and (1, 1) as
    persistent; an explicit header value on (1, 1) decides the outcome.
    """
    headers = Headers()
    should_close = HTTP1Protocol.connection_close

    assert should_close((1, 0), headers)
    assert not should_close((1, 1), headers)

    headers["connection"] = "keep-alive"
    assert not should_close((1, 1), headers)

    headers["connection"] = "close"
    assert should_close((1, 1), headers)
2012-06-23 03:07:42 +00:00
2012-06-23 03:07:42 +00:00
def test_read_http_body_request():
    """With empty headers and the request flag set, the body is read as empty."""
    protocol = mock_protocol("testing")
    body = protocol.read_http_body(Headers(), None, "GET", None, True)
    assert body == ""
2012-06-23 03:07:42 +00:00
2013-12-15 05:43:54 +00:00
def test_read_http_body_response():
    """With empty headers on a 200 response, the whole stream is the body."""
    protocol = mock_protocol("testing")
    body = protocol.read_http_body(Headers(), None, "GET", 200, False)
    assert body == "testing"
2012-06-18 21:42:32 +00:00
2012-06-18 21:42:32 +00:00
def test_read_http_body():
    """Cover read_http_body for length-delimited, unbounded and chunked bodies."""
    payload = "testing"

    def read(headers, limit, data=payload):
        # Always a 200 response to a GET, read from a fresh protocol instance.
        return mock_protocol(data).read_http_body(headers, limit, "GET", 200, False)

    def expect_http_error(headers, limit):
        tutils.raises(
            http.HttpError,
            mock_protocol(payload).read_http_body,
            headers, limit, "GET", 200, False
        )

    # default case: content-length matches the data
    headers = Headers()
    headers["content-length"] = "7"
    assert read(headers, None) == "testing"

    # content-length is not a number
    headers["content-length"] = "foo"
    expect_http_error(headers, None)

    # content-length is negative
    headers["content-length"] = "-1"
    expect_http_error(headers, None)

    # content-length (5) exceeds the body size limit (4)
    headers["content-length"] = "5"
    expect_http_error(headers, 4)

    # content-length (5) is shorter than the available data (7 bytes)
    assert len(read(headers, None)) == 5

    # no content-length, limit larger than the data
    headers = Headers()
    assert len(read(headers, 100)) == 7

    # no content-length, limit smaller than the data
    expect_http_error(headers, 4)

    # chunked transfer encoding
    headers = Headers()
    headers["transfer-encoding"] = "chunked"
    assert read(headers, 100, "5\r\naaaaa\r\n0\r\n\r\n") == "aaaaa"
2012-06-23 03:07:42 +00:00
def test_expected_http_body_size():
    """Check expected_http_body_size for invalid, explicit and absent lengths.

    The calls expected to raise are written as bare calls: comparing their
    result inside a `raises` block is never evaluated and only obscures
    what is being asserted.
    """
    # gibber in the content-length field
    headers = Headers(content_length="foo")
    with tutils.raises(HttpSyntaxException):
        expected_http_body_size(headers, False, "GET", 200)

    # negative number in the content-length field
    headers = Headers(content_length="-7")
    with tutils.raises(HttpSyntaxException):
        expected_http_body_size(headers, False, "GET", 200)

    # explicit length
    headers = Headers(content_length="5")
    assert expected_http_body_size(headers, False, "GET", 200) == 5

    # no length
    headers = Headers()
    assert expected_http_body_size(headers, False, "GET", 200) == -1

    # no length request
    headers = Headers()
    assert expected_http_body_size(headers, True, "GET", None) == 0

    # expect header: a declared length is ignored while Expect: 100-continue is set
    headers = Headers(content_length="5", expect="100-continue")
    assert expected_http_body_size(headers, True, "GET", None) == 0
2012-06-18 21:42:32 +00:00
def test_parse_init_connect():
    """A valid CONNECT line parses; malformed authority forms raise ValueError."""
    assert _parse_authority_form(b"CONNECT host.com:443 HTTP/1.0")

    malformed = (
        b"\0host.com:443",
        b"host.com:444444",
        b"CONNECT host.com443 HTTP/1.0",
        b"CONNECT host.com:foo HTTP/1.0",
    )
    for line in malformed:
        tutils.raises(ValueError, _parse_authority_form, line)
2012-06-18 21:42:32 +00:00
2013-05-05 01:49:20 +00:00
def test_parse_init_proxy():
    """Parse an absolute-form request line and reject malformed ones."""
    u = b"GET http://foo.com:8888/test HTTP/1.1"
    m, s, h, po, pa, httpversion = HTTP1Protocol._parse_absolute_form(u)
    assert m == "GET"
    assert s == "http"
    assert h == "foo.com"
    assert po == 8888
    assert pa == "/test"
    assert httpversion == (1, 1)

    # Non-ASCII byte in the method: checked for a falsy result, as before.
    u = "G\xfeET http://foo.com:8888/test HTTP/1.1"
    assert not HTTP1Protocol._parse_absolute_form(u)

    # These must raise, so the calls are bare: an `assert not` around a call
    # that raises is never evaluated.
    rejected = (
        "invalid",
        "GET invalid HTTP/1.1",
        "GET http://foo.com:8888/test foo/1.1",
    )
    for line in rejected:
        with tutils.raises(ValueError):
            HTTP1Protocol._parse_absolute_form(line)
2012-06-18 21:42:32 +00:00
def test_parse_init_http():
    """Parse an origin-form request line; malformed lines give a falsy result."""
    method, path, httpversion = HTTP1Protocol._parse_init_http("GET /test HTTP/1.1")
    assert method == "GET"
    assert path == "/test"
    assert httpversion == (1, 1)

    rejected = (
        "G\xfeET /test HTTP/1.1",
        "invalid",
        "GET invalid HTTP/1.1",
        "GET /test foo/1.1",
        "GET /test\xc0 HTTP/1.1",
    )
    for line in rejected:
        assert not HTTP1Protocol._parse_init_http(line)
2012-06-18 21:42:32 +00:00
2012-06-18 21:42:32 +00:00
class TestReadHeaders:
    """Header-block parsing through HTTP1Protocol.read_headers."""

    def _read(self, data, verbatim=False):
        """Run read_headers over `data`.

        Unless `verbatim` is set, the text is dedented and stripped first so
        that tests can use indented triple-quoted literals.
        """
        if verbatim:
            raw = data
        else:
            raw = textwrap.dedent(data).strip()
        return mock_protocol(raw).read_headers()

    def test_read_simple(self):
        parsed = self._read("""
            Header: one
            Header2: two
            \r\n
        """)
        assert parsed.fields == [["Header", "one"], ["Header2", "two"]]

    def test_read_multi(self):
        # Repeated header names are kept as separate fields.
        parsed = self._read("""
            Header: one
            Header: two
            \r\n
        """)
        assert parsed.fields == [["Header", "one"], ["Header", "two"]]

    def test_read_continued(self):
        # A line starting with a tab continues the previous header's value.
        parsed = self._read("""
            Header: one
            \ttwo
            Header2: three
            \r\n
        """)
        assert parsed.fields == [["Header", "one\r\n two"], ["Header2", "three"]]

    def test_read_continued_err(self):
        # A continuation line with no header before it is rejected.
        result = self._read("\tfoo: bar\r\n", True)
        assert result is None

    def test_read_err(self):
        # A line without a colon is rejected.
        result = self._read("""
            foo
        """)
        assert result is None
2012-06-18 21:42:32 +00:00
2015-08-05 19:32:53 +00:00
class TestReadRequest(object):
    """Request parsing for the relative, absolute and authority forms."""

    def tst(self, data, **kwargs):
        """Parse `data` as a request via a fresh mock protocol."""
        protocol = mock_protocol(data)
        return protocol.read_request(**kwargs)

    def test_invalid(self):
        # (expected error, raw input) pairs, checked in order.
        cases = (
            ("bad http request", "xxx"),
            ("bad http request line", "get /\xff HTTP/1.1"),
            ("invalid headers", "get / HTTP/1.1\r\nfoo"),
            (HttpReadDisconnect, "\r\n"),
        )
        for expected, raw in cases:
            tutils.raises(expected, self.tst, raw)

    def test_asterisk_form_in(self):
        request = self.tst("OPTIONS * HTTP/1.1")
        assert request.form_in == "relative"
        assert request.method == "OPTIONS"

    def test_absolute_form_in(self):
        tutils.raises(
            "Bad HTTP request line",
            self.tst,
            "GET oops-no-protocol.com HTTP/1.1"
        )
        request = self.tst("GET http://address:22/ HTTP/1.1")
        assert request.form_in == "absolute"
        assert request.port == 22
        assert request.host == "address"
        assert request.scheme == "http"

    def test_connect(self):
        tutils.raises(
            "Bad HTTP request line",
            self.tst,
            "CONNECT oops-no-port.com HTTP/1.1"
        )
        request = self.tst("CONNECT foo.com:443 HTTP/1.1")
        assert request.form_in == "authority"
        assert request.method == "CONNECT"
        assert request.port == 443
        assert request.host == "foo.com"

    def test_expect(self):
        # With Expect: 100-continue the body must be left unread on the stream.
        raw = b"".join([
            b"GET / HTTP/1.1\r\n",
            b"Content-Length: 3\r\n",
            b"Expect: 100-continue\r\n",
            b"\r\n",
            b"foobar",
        ])
        stream = BytesIO(raw)
        request = read_request(stream)
        assert request.body == b""
        assert stream.read(-1) == b"foobar"
2015-08-05 19:32:53 +00:00
class TestReadResponse(object):
    """Response parsing through HTTP1Protocol.read_response.

    Fixtures that carry headers or a following message include the empty line
    that ends the header section; without it the next line would be read as
    a header line instead of as body or as the next message.
    """

    def tst(self, data, method, body_size_limit, include_body=True):
        """Dedent `data` and parse it as a response to a `method` request."""
        data = textwrap.dedent(data)
        return mock_protocol(data).read_response(
            method, body_size_limit, include_body=include_body
        )

    def test_errors(self):
        tutils.raises("server disconnect", self.tst, "", "GET", None)
        tutils.raises("invalid server response", self.tst, "foo", "GET", None)

    def test_simple(self):
        data = """
            HTTP/1.1 200
        """
        assert self.tst(data, "GET", None) == http.Response(
            (1, 1), 200, '', Headers(), ''
        )

    def test_simple_message(self):
        data = """
            HTTP/1.1 200 OK
        """
        assert self.tst(data, "GET", None) == http.Response(
            (1, 1), 200, 'OK', Headers(), ''
        )

    def test_invalid_http_version(self):
        data = """
            HTTP/x 200 OK
        """
        tutils.raises("invalid http version", self.tst, data, "GET", None)

    def test_invalid_status_code(self):
        data = """
            HTTP/1.1 xx OK
        """
        tutils.raises("invalid server response", self.tst, data, "GET", None)

    def test_valid_with_continue(self):
        # The empty line ends the (empty) header section of the 100 response.
        data = """
            HTTP/1.1 100 CONTINUE

            HTTP/1.1 200 OK
        """
        assert self.tst(data, "GET", None) == http.Response(
            (1, 1), 100, 'CONTINUE', Headers(), ''
        )

    def test_simple_body(self):
        data = """
            HTTP/1.1 200 OK
            Content-Length: 3

            foo
        """
        assert self.tst(data, "GET", None).body == 'foo'
        # The same bytes answering a HEAD request yield an empty body.
        assert self.tst(data, "HEAD", None).body == ''

    def test_invalid_headers(self):
        # The leading tab makes the first header line a continuation with
        # nothing to continue; the empty line keeps "foo" out of the headers
        # so it cannot be the reason for the failure.
        data = """
            HTTP/1.1 200 OK
            \tContent-Length: 3

            foo
        """
        tutils.raises("invalid headers", self.tst, data, "GET", None)

    def test_without_body(self):
        data = """
            HTTP/1.1 200 OK
            Content-Length: 3

            foo
        """
        assert self.tst(data, "GET", None, include_body=False).body is None
class TestReadResponseNoContentLength(tservers.ServerTestBase):
    """Read a response without Content-Length from a live test server."""

    handler = NoContentLengthHTTPHandler

    def test_no_content_length(self):
        client = tcp.TCPClient(("127.0.0.1", self.port))
        client.connect()
        protocol = HTTP1Protocol(client)
        response = protocol.read_response("GET", None)
        # Everything the handler wrote after the header section is the body.
        assert response.body == "bar\r\n\r\n"
class TestAssembleRequest(object):
    """Serialisation of requests through HTTP1Protocol.assemble_request."""

    def test_simple(self):
        req = tutils.treq()
        b = HTTP1Protocol().assemble_request(req)
        # The empty line separates the header section from the body on the wire.
        assert b == match_http_string("""
            GET /path HTTP/1.1
            header: qvalue
            Host: address:22
            Content-Length: 7

            content""")

    def test_body_missing(self):
        # A request whose content is marked missing cannot be assembled.
        req = tutils.treq(content=semantics.CONTENT_MISSING)
        tutils.raises(http.HttpError, HTTP1Protocol().assemble_request, req)

    def test_not_a_request(self):
        # Passing something that is not a request trips an assertion.
        tutils.raises(AssertionError, HTTP1Protocol().assemble_request, 'foo')
class TestAssembleResponse(object):
    """Serialisation of responses through HTTP1Protocol.assemble_response."""

    def test_simple(self):
        resp = tutils.tresp()
        b = HTTP1Protocol().assemble_response(resp)
        # The empty line separates the header section from the body on the wire.
        assert b == match_http_string("""
            HTTP/1.1 200 OK
            header_response: svalue
            Content-Length: 7

            message""")

    def test_body_missing(self):
        # A response whose content is marked missing cannot be assembled.
        resp = tutils.tresp(content=semantics.CONTENT_MISSING)
        tutils.raises(http.HttpError, HTTP1Protocol().assemble_response, resp)

    def test_not_a_request(self):
        # Passing something that is not a response trips an assertion.
        tutils.raises(AssertionError, HTTP1Protocol().assemble_response, 'foo')