2015-09-15 22:04:23 +00:00
|
|
|
from __future__ import absolute_import, print_function, division
|
|
|
|
from io import BytesIO
|
|
|
|
from mock import Mock
|
2015-09-26 18:07:11 +00:00
|
|
|
from netlib.exceptions import HttpException, HttpSyntaxException, HttpReadDisconnect, TcpDisconnect
|
2015-09-15 22:04:23 +00:00
|
|
|
from netlib.http import Headers
|
|
|
|
from netlib.http.http1.read import (
|
|
|
|
read_request, read_response, read_request_head,
|
|
|
|
read_response_head, read_body, connection_close, expected_http_body_size, _get_first_line,
|
|
|
|
_read_request_line, _parse_authority_form, _read_response_line, _check_http_version,
|
2016-05-31 06:54:42 +00:00
|
|
|
_read_headers, _read_chunked, get_header_tokens
|
2015-09-15 22:04:23 +00:00
|
|
|
)
|
|
|
|
from netlib.tutils import treq, tresp, raises
|
|
|
|
|
|
|
|
|
2016-05-31 06:54:42 +00:00
|
|
|
def test_get_header_tokens():
    """get_header_tokens returns the comma-separated tokens of a header."""
    hdrs = Headers()

    # A header that is not present yields an empty token list.
    assert get_header_tokens(hdrs, "foo") == []

    # A single value is a single token.
    hdrs["foo"] = "bar"
    assert get_header_tokens(hdrs, "foo") == ["bar"]

    # A comma-separated value is split into its tokens.
    hdrs["foo"] = "bar, voing"
    assert get_header_tokens(hdrs, "foo") == ["bar", "voing"]

    # Tokens from several values of the same header are concatenated in order.
    hdrs.set_all("foo", ["bar, voing", "oink"])
    assert get_header_tokens(hdrs, "foo") == ["bar", "voing", "oink"]
|
|
|
|
|
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
def test_read_request():
    """read_request parses a body-less GET and leaves trailing bytes unread."""
    stream = BytesIO(b"GET / HTTP/1.1\r\n\r\nskip")
    request = read_request(stream)

    assert request.method == "GET"
    assert request.content == b""
    assert request.timestamp_end

    # Bytes after the header terminator must still be available on the stream.
    leftover = stream.read()
    assert leftover == b"skip"
|
|
|
|
|
|
|
|
|
|
|
|
def test_read_request_head():
    """read_request_head parses the head only and does not consume the body."""
    raw = (
        b"GET / HTTP/1.1\r\n"
        b"Content-Length: 4\r\n"
        b"\r\n"
        b"skip"
    )
    stream = BytesIO(raw)
    # Give the plain BytesIO the timestamp hooks that read_request_head uses.
    stream.reset_timestamps = Mock()
    stream.first_byte_timestamp = 42

    head = read_request_head(stream)

    assert head.method == "GET"
    assert head.headers["Content-Length"] == "4"
    assert head.content is None
    assert stream.reset_timestamps.called
    assert head.timestamp_start == 42

    # The four body bytes are left on the stream.
    assert stream.read() == b"skip"
|
|
|
|
|
|
|
|
|
|
|
|
def test_read_response():
    """read_response parses the status line and reads the response body."""
    request = treq()
    stream = BytesIO(b"HTTP/1.1 418 I'm a teapot\r\n\r\nbody")

    response = read_response(stream, request)

    assert response.status_code == 418
    assert response.content == b"body"
    assert response.timestamp_end
|
|
|
|
|
|
|
|
|
|
|
|
def test_read_response_head():
    """read_response_head parses the head only and does not consume the body."""
    raw = (
        b"HTTP/1.1 418 I'm a teapot\r\n"
        b"Content-Length: 4\r\n"
        b"\r\n"
        b"skip"
    )
    stream = BytesIO(raw)
    # Give the plain BytesIO the timestamp hooks that read_response_head uses.
    stream.reset_timestamps = Mock()
    stream.first_byte_timestamp = 42

    head = read_response_head(stream)

    assert head.status_code == 418
    assert head.headers["Content-Length"] == "4"
    assert head.content is None
    assert stream.reset_timestamps.called
    assert head.timestamp_start == 42

    # The four body bytes are left on the stream.
    assert stream.read() == b"skip"
|
|
|
|
|
|
|
|
|
|
|
|
class TestReadBody(object):
    """Tests for read_body with chunked, fixed-size and unbounded bodies."""

    def test_chunked(self):
        # An expected size of None selects chunked decoding.
        stream = BytesIO(b"3\r\nfoo\r\n0\r\n\r\nbar")
        chunks = read_body(stream, None)
        payload = b"".join(chunks)
        assert payload == b"foo"
        # Data after the terminating chunk is not consumed.
        assert stream.read() == b"bar"

    def test_known_size(self):
        stream = BytesIO(b"foobar")
        chunks = read_body(stream, 3)
        payload = b"".join(chunks)
        assert payload == b"foo"
        # Only the announced three bytes are read.
        assert stream.read() == b"bar"

    def test_known_size_limit(self):
        # Announced size 3 exceeds the limit of 2.
        stream = BytesIO(b"foobar")
        with raises(HttpException):
            b"".join(read_body(stream, 3, 2))

    def test_known_size_too_short(self):
        # The stream holds fewer bytes than the announced size.
        stream = BytesIO(b"foo")
        with raises(HttpException):
            b"".join(read_body(stream, 6))

    def test_unknown_size(self):
        # An expected size of -1 reads everything on the stream.
        stream = BytesIO(b"foobar")
        chunks = read_body(stream, -1)
        payload = b"".join(chunks)
        assert payload == b"foobar"

    def test_unknown_size_limit(self):
        # Six bytes on the stream exceed the limit of 3.
        stream = BytesIO(b"foobar")
        with raises(HttpException):
            b"".join(read_body(stream, -1, 3))

    def test_max_chunk_size(self):
        # With max_chunk_size=None the body arrives as one piece.
        whole = BytesIO(b"123456")
        pieces = list(read_body(whole, -1, max_chunk_size=None))
        assert pieces == [b"123456"]

        # With max_chunk_size=1 every byte is yielded on its own.
        bytewise = BytesIO(b"123456")
        pieces = list(read_body(bytewise, -1, max_chunk_size=1))
        assert pieces == [b"1", b"2", b"3", b"4", b"5", b"6"]
|
2015-09-15 22:04:23 +00:00
|
|
|
|
2016-05-29 09:43:29 +00:00
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
def test_connection_close():
    """Check connection_close for HTTP/1.0 and HTTP/1.1 with various Connection headers."""
    hdrs = Headers()

    # No Connection header: HTTP/1.0 closes, HTTP/1.1 does not.
    closes_http10 = connection_close(b"HTTP/1.0", hdrs)
    assert closes_http10
    closes_http11 = connection_close(b"HTTP/1.1", hdrs)
    assert not closes_http11

    hdrs["connection"] = "keep-alive"
    closes_http11 = connection_close(b"HTTP/1.1", hdrs)
    assert not closes_http11

    hdrs["connection"] = "close"
    closes_http11 = connection_close(b"HTTP/1.1", hdrs)
    assert closes_http11

    # An unrecognised token gives the same answers as no header at all.
    hdrs["connection"] = "foobar"
    closes_http10 = connection_close(b"HTTP/1.0", hdrs)
    assert closes_http10
    closes_http11 = connection_close(b"HTTP/1.1", hdrs)
    assert not closes_http11
|
2015-09-15 22:04:23 +00:00
|
|
|
|
2016-05-29 09:43:29 +00:00
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
def test_expected_http_body_size():
    """Walk expected_http_body_size through each request/response case below."""
    # Expect: 100-continue
    continue_req = treq(headers=Headers(expect="100-continue", content_length="42"))
    assert expected_http_body_size(continue_req) == 0

    # http://tools.ietf.org/html/rfc7230#section-3.3
    head_req = treq(method=b"HEAD")
    sized_resp = tresp(headers=Headers(content_length="42"))
    assert expected_http_body_size(head_req, sized_resp) == 0

    connect_req = treq(method=b"CONNECT")
    plain_resp = tresp()
    assert expected_http_body_size(connect_req, plain_resp) == 0

    for status in (100, 204, 304):
        size = expected_http_body_size(treq(), tresp(status_code=status))
        assert size == 0

    # chunked
    chunked_req = treq(headers=Headers(transfer_encoding="chunked"))
    assert expected_http_body_size(chunked_req) is None

    # explicit length
    for bad_length in (b"foo", b"-7"):
        # The request is built inside the block so raises() covers it too.
        with raises(HttpSyntaxException):
            expected_http_body_size(
                treq(headers=Headers(content_length=bad_length))
            )
    sized_req = treq(headers=Headers(content_length="42"))
    assert expected_http_body_size(sized_req) == 42

    # no length
    bare_req = treq(headers=Headers())
    assert expected_http_body_size(bare_req) == 0
    size = expected_http_body_size(
        treq(headers=Headers()), tresp(headers=Headers())
    )
    assert size == -1
|
|
|
|
|
|
|
|
|
|
|
|
def test_get_first_line():
    """_get_first_line returns the first line and maps disconnects to HttpReadDisconnect."""
    stream = BytesIO(b"foo\r\nbar")
    assert _get_first_line(stream) == b"foo"

    # A leading empty line is skipped.
    stream = BytesIO(b"\r\nfoo\r\nbar")
    assert _get_first_line(stream) == b"foo"

    # An exhausted stream is reported as a disconnect.
    empty_stream = BytesIO(b"")
    with raises(HttpReadDisconnect):
        _get_first_line(empty_stream)

    # A TcpDisconnect raised by readline() surfaces as HttpReadDisconnect.
    broken_stream = Mock()
    broken_stream.readline.side_effect = TcpDisconnect
    with raises(HttpReadDisconnect):
        _get_first_line(broken_stream)
|
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
|
|
|
|
def test_read_request_line():
    """_read_request_line parses relative, authority and absolute request lines."""

    def parse(raw):
        # Wrap the raw bytes in a stream, as _read_request_line expects.
        return _read_request_line(BytesIO(raw))

    # (request line, expected parsed tuple)
    accepted = (
        (b"GET / HTTP/1.1",
         ("relative", b"GET", None, None, None, b"/", b"HTTP/1.1")),
        (b"OPTIONS * HTTP/1.1",
         ("relative", b"OPTIONS", None, None, None, b"*", b"HTTP/1.1")),
        (b"CONNECT foo:42 HTTP/1.1",
         ("authority", b"CONNECT", None, b"foo", 42, None, b"HTTP/1.1")),
        (b"GET http://foo:42/bar HTTP/1.1",
         ("absolute", b"GET", b"http", b"foo", 42, b"/bar", b"HTTP/1.1")),
    )
    for raw, expected in accepted:
        assert parse(raw) == expected

    # Syntactically invalid request lines.
    for rejected in (b"GET / WTF/1.1", b"this is not http"):
        with raises(HttpSyntaxException):
            parse(rejected)

    # Nothing to read at all.
    with raises(HttpReadDisconnect):
        parse(b"")
|
2015-09-15 22:04:23 +00:00
|
|
|
|
2016-05-29 09:43:29 +00:00
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
def test_parse_authority_form():
    """_parse_authority_form splits host:port and rejects malformed input."""
    host, port = _parse_authority_form(b"foo:42")
    assert (host, port) == (b"foo", 42)

    # Each of these must be rejected with HttpSyntaxException.
    malformed = (
        b"foo",
        b"foo:bar",
        b"foo:99999999",
        b"f\x00oo:80",
    )
    for authority in malformed:
        with raises(HttpSyntaxException):
            _parse_authority_form(authority)
|
|
|
|
|
|
|
|
|
|
|
|
def test_read_response_line():
    """_read_response_line parses status lines into (version, code, reason)."""

    def t(b):
        # Wrap the raw bytes in a stream, as _read_response_line expects.
        return _read_response_line(BytesIO(b))

    assert t(b"HTTP/1.1 200 OK") == (b"HTTP/1.1", 200, b"OK")
    # A missing reason phrase is returned as an empty byte string.
    assert t(b"HTTP/1.1 200") == (b"HTTP/1.1", 200, b"")

    # https://github.com/mitmproxy/mitmproxy/issues/784
    # Non-ASCII bytes in the reason phrase are passed through unchanged.
    assert t(b"HTTP/1.1 200 Non-Autoris\xc3\xa9") == (b"HTTP/1.1", 200, b"Non-Autoris\xc3\xa9")

    # The call itself must raise, so no `assert` on a return value here
    # (kept consistent with the other error cases below).
    with raises(HttpSyntaxException):
        t(b"HTTP/1.1")

    with raises(HttpSyntaxException):
        t(b"HTTP/1.1 OK OK")
    with raises(HttpSyntaxException):
        t(b"WTF/1.1 200 OK")
    # Nothing to read at all.
    with raises(HttpReadDisconnect):
        t(b"")
|
2015-09-15 22:04:23 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_check_http_version():
    """_check_http_version accepts well-formed versions and rejects the rest."""
    # These must pass without raising.
    for accepted in (b"HTTP/0.9", b"HTTP/1.0", b"HTTP/1.1", b"HTTP/2.0"):
        _check_http_version(accepted)

    # Each of these must be rejected with HttpSyntaxException.
    for rejected in (b"WTF/1.0", b"HTTP/1.10", b"HTTP/1.b"):
        with raises(HttpSyntaxException):
            _check_http_version(rejected)
|
|
|
|
|
|
|
|
|
|
|
|
class TestReadHeaders(object):
    """Tests for _read_headers on raw header blocks."""

    @staticmethod
    def _read(data):
        """Run _read_headers over ``data`` wrapped in an in-memory stream."""
        stream = BytesIO(data)
        return _read_headers(stream)

    def test_read_simple(self):
        raw = (
            b"Header: one\r\n"
            b"Header2: two\r\n"
            b"\r\n"
        )
        parsed = self._read(raw)
        expected = ((b"Header", b"one"), (b"Header2", b"two"))
        assert parsed.fields == expected

    def test_read_multi(self):
        # A repeated header name is kept as two separate fields.
        raw = (
            b"Header: one\r\n"
            b"Header: two\r\n"
            b"\r\n"
        )
        parsed = self._read(raw)
        expected = ((b"Header", b"one"), (b"Header", b"two"))
        assert parsed.fields == expected

    def test_read_continued(self):
        # A line starting with whitespace continues the previous header value.
        raw = (
            b"Header: one\r\n"
            b"\ttwo\r\n"
            b"Header2: three\r\n"
            b"\r\n"
        )
        parsed = self._read(raw)
        expected = ((b"Header", b"one\r\n two"), (b"Header2", b"three"))
        assert parsed.fields == expected

    def test_read_continued_err(self):
        # A continuation line with no header before it is a syntax error.
        raw = b"\tfoo: bar\r\n"
        with raises(HttpSyntaxException):
            self._read(raw)

    def test_read_err(self):
        # A line without a colon is a syntax error.
        raw = b"foo"
        with raises(HttpSyntaxException):
            self._read(raw)

    def test_read_empty_name(self):
        # An empty header name is a syntax error.
        raw = b":foo"
        with raises(HttpSyntaxException):
            self._read(raw)

    def test_read_empty_value(self):
        # An empty header value is accepted.
        raw = b"bar:"
        parsed = self._read(raw)
        expected = ((b"bar", b""),)
        assert parsed.fields == expected
|
2015-09-21 23:48:35 +00:00
|
|
|
|
2016-05-29 09:43:29 +00:00
|
|
|
|
2015-09-15 22:04:23 +00:00
|
|
|
def test_read_chunked():
    """_read_chunked decodes chunked bodies and rejects malformed ones.

    The request object the original built here was never passed to
    _read_chunked, so it has been dropped as dead code.
    """
    # The terminating zero-size chunk lacks its final CRLF.
    data = b"1\r\na\r\n0\r\n"
    with raises(HttpSyntaxException):
        b"".join(_read_chunked(BytesIO(data)))

    # Same body with the final CRLF present.
    data = b"1\r\na\r\n0\r\n\r\n"
    assert b"".join(_read_chunked(BytesIO(data))) == b"a"

    # Leading empty lines are tolerated; chunks are joined in order.
    data = b"\r\n\r\n1\r\na\r\n1\r\nb\r\n0\r\n\r\n"
    assert b"".join(_read_chunked(BytesIO(data))) == b"ab"

    # The stream ends before any chunk size is seen.
    data = b"\r\n"
    with raises("closed prematurely"):
        b"".join(_read_chunked(BytesIO(data)))

    # Chunk data does not match the announced size / terminator.
    data = b"1\r\nfoo"
    with raises("malformed chunked body"):
        b"".join(_read_chunked(BytesIO(data)))

    # The chunk-size line is not a valid size.
    data = b"foo\r\nfoo"
    with raises(HttpSyntaxException):
        b"".join(_read_chunked(BytesIO(data)))

    # A five-byte chunk exceeds limit=2.
    data = b"5\r\naaaaa\r\n0\r\n\r\n"
    with raises("too large"):
        b"".join(_read_chunked(BytesIO(data), limit=2))
|