mirror of
https://github.com/Grasscutters/mitmproxy.git
synced 2024-11-23 16:17:49 +00:00
6032c4f235
This PR improves our handling of HTTP message body encodings: - The unaltered message body is now accessible as `.raw_content` - The "content-encoding"-decoded content (i.e. gzip removed) content is not `.content`, as this is what we want in 99% of the cases. - `.text` now provides the "content-encoding"-decoded and then "content-type charset"-decoded message body. - The decoded values for `.content` and `.text` are cached, so that repeated access and `x.text = x.text` is cheap. - The `decoded()` decorator is now deprecated, as we can now just use `.content`. Similarly `HTTPMessage.get_decoded_content()` is deprecated.
103 lines
3.0 KiB
Python
103 lines
3.0 KiB
Python
from __future__ import absolute_import, print_function, division
|
|
|
|
import netlib.http.url
|
|
from netlib import exceptions
|
|
|
|
|
|
def assemble_request(request):
|
|
if request.data.content is None:
|
|
raise exceptions.HttpException("Cannot assemble flow with missing content")
|
|
head = assemble_request_head(request)
|
|
body = b"".join(assemble_body(request.data.headers, [request.data.content]))
|
|
return head + body
|
|
|
|
|
|
def assemble_request_head(request):
|
|
first_line = _assemble_request_line(request.data)
|
|
headers = _assemble_request_headers(request.data)
|
|
return b"%s\r\n%s\r\n" % (first_line, headers)
|
|
|
|
|
|
def assemble_response(response):
|
|
if response.data.content is None:
|
|
raise exceptions.HttpException("Cannot assemble flow with missing content")
|
|
head = assemble_response_head(response)
|
|
body = b"".join(assemble_body(response.data.headers, [response.data.content]))
|
|
return head + body
|
|
|
|
|
|
def assemble_response_head(response):
|
|
first_line = _assemble_response_line(response.data)
|
|
headers = _assemble_response_headers(response.data)
|
|
return b"%s\r\n%s\r\n" % (first_line, headers)
|
|
|
|
|
|
def assemble_body(headers, body_chunks):
|
|
if "chunked" in headers.get("transfer-encoding", "").lower():
|
|
for chunk in body_chunks:
|
|
if chunk:
|
|
yield b"%x\r\n%s\r\n" % (len(chunk), chunk)
|
|
yield b"0\r\n\r\n"
|
|
else:
|
|
for chunk in body_chunks:
|
|
yield chunk
|
|
|
|
|
|
def _assemble_request_line(request_data):
|
|
"""
|
|
Args:
|
|
request_data (netlib.http.request.RequestData)
|
|
"""
|
|
form = request_data.first_line_format
|
|
if form == "relative":
|
|
return b"%s %s %s" % (
|
|
request_data.method,
|
|
request_data.path,
|
|
request_data.http_version
|
|
)
|
|
elif form == "authority":
|
|
return b"%s %s:%d %s" % (
|
|
request_data.method,
|
|
request_data.host,
|
|
request_data.port,
|
|
request_data.http_version
|
|
)
|
|
elif form == "absolute":
|
|
return b"%s %s://%s:%d%s %s" % (
|
|
request_data.method,
|
|
request_data.scheme,
|
|
request_data.host,
|
|
request_data.port,
|
|
request_data.path,
|
|
request_data.http_version
|
|
)
|
|
else:
|
|
raise RuntimeError("Invalid request form")
|
|
|
|
|
|
def _assemble_request_headers(request_data):
|
|
"""
|
|
Args:
|
|
request_data (netlib.http.request.RequestData)
|
|
"""
|
|
headers = request_data.headers.copy()
|
|
if "host" not in headers and request_data.scheme and request_data.host and request_data.port:
|
|
headers["host"] = netlib.http.url.hostport(
|
|
request_data.scheme,
|
|
request_data.host,
|
|
request_data.port
|
|
)
|
|
return bytes(headers)
|
|
|
|
|
|
def _assemble_response_line(response_data):
|
|
return b"%s %d %s" % (
|
|
response_data.http_version,
|
|
response_data.status_code,
|
|
response_data.reason,
|
|
)
|
|
|
|
|
|
def _assemble_response_headers(response):
|
|
return bytes(response.headers)
|