mitmproxy/libmproxy/console/contentview.py

import re, cStringIO, traceback, json
import urwid

try: from PIL import Image
except ImportError: import Image

try: from PIL.ExifTags import TAGS
except ImportError: from ExifTags import TAGS

import lxml.html, lxml.etree
import netlib.utils
import common
from .. import utils, encoding, flow
from ..contrib import jsbeautifier, html2text
import subprocess
try:
    import pyamf
    from pyamf import remoting, flex
except ImportError: # pragma nocover
    pyamf = None

VIEW_CUTOFF = 1024*50


def _view_text(content, total, limit):
    """
        Builds the widget list for a chunk of text.

        content is passed through netlib.utils.cleanBin and split into lines;
        each line becomes a urwid.Text that wraps on any character. total and
        limit are handed to trailer(), which may append a notice to the list.
    """
    cleaned = netlib.utils.cleanBin(content)
    body = [
        urwid.Text(("text", line), wrap="any")
        for line in cleaned.splitlines()
    ]
    trailer(total, body, limit)
    return body


def trailer(clen, txt, limit):
    """
        Appends a "data not shown" notice to txt when clen exceeds limit.

        txt is modified in place; nothing is added when clen - limit is not
        positive.
    """
    hidden = clen - limit
    if hidden <= 0:
        return
    # Blank spacer line first, then the notice itself.
    txt.append(urwid.Text(""))
    notice = [
        ("highlight", "... %s of data not shown. Press "%utils.pretty_size(hidden)),
        ("key", "f"),
        ("highlight", " to load all data."),
    ]
    txt.append(urwid.Text(notice))


class ViewAuto:
    """
        Picks a view from the content-type header, falling back to XML
        sniffing and finally to the Raw view.
    """
    name = "Auto"
    prompt = ("auto", "a")
    content_types = []
    def __call__(self, hdrs, content, limit):
        """
            Returns whatever the selected view returns for the same
            (hdrs, content, limit) arguments.
        """
        ctype = hdrs.get_first("content-type")
        if ctype:
            parsed = utils.parse_content_type(ctype)
            # parse_content_type can yield a falsy value for a header it
            # cannot parse (ViewMultipart guards for this too), so only index
            # into the result when there is one.
            if parsed:
                ct = "%s/%s"%(parsed[0], parsed[1])
                if ct in content_types_map:
                    # The first view registered for this type wins.
                    return content_types_map[ct][0](hdrs, content, limit)
            if utils.isXML(content):
                return get("XML")(hdrs, content, limit)
        return get("Raw")(hdrs, content, limit)


class ViewRaw:
    """
        Shows the first limit characters of the body as plain text.
    """
    name = "Raw"
    prompt = ("raw", "r")
    content_types = []
    def __call__(self, hdrs, content, limit):
        visible = content[:limit]
        return "Raw", _view_text(visible, len(content), limit)


class ViewHex:
    """
        Shows the first limit characters of the body as a hex dump.
    """
    name = "Hex"
    prompt = ("hex", "e")
    content_types = []
    def __call__(self, hdrs, content, limit):
        # One urwid.Text per (offset, hex, printable) row from hexdump.
        rows = [
            urwid.Text([
                ("offset", offset),
                " ",
                ("text", hexa),
                "   ",
                ("text", s),
            ])
            for offset, hexa, s in netlib.utils.hexdump(content[:limit])
        ]
        trailer(len(content), rows, limit)
        return "Hex", rows


class ViewXML:
    """
        Pretty-prints XML with lxml, keeping the doctype and any sibling
        nodes that precede the root element.
    """
    name = "XML"
    prompt = ("xml", "x")
    content_types = ["text/xml"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("XML-like data", widgets), or None when lxml raises
            XMLSyntaxError for content.
        """
        parser = lxml.etree.XMLParser(remove_blank_text=True, resolve_entities=False, strip_cdata=False, recover=False)
        try:
            document = lxml.etree.fromstring(content, parser)
        except lxml.etree.XMLSyntaxError:
            return None
        docinfo = document.getroottree().docinfo

        # Serialise the siblings that precede the root element, walking
        # backwards and inserting at the front to keep document order.
        prev = []
        p = document.getroottree().getroot().getprevious()
        while p is not None:
            prev.insert(
                0,
                lxml.etree.tostring(p)
            )
            p = p.getprevious()
        doctype=docinfo.doctype
        if prev:
            doctype += "\n".join(prev).strip()
        doctype = doctype.strip()

        s = lxml.etree.tostring(
                document,
                pretty_print=True,
                xml_declaration=True,
                doctype=doctype or None,
                encoding = docinfo.encoding
            )

        txt = []
        for i in s[:limit].strip().split("\n"):
            txt.append(
                urwid.Text(("text", i)),
            )
        # The text on screen is cut from the pretty-printed string s, whose
        # length differs from the raw content, so the "not shown" notice must
        # be computed from s (as ViewHTML does).
        trailer(len(s), txt, limit)
        return "XML-like data", txt


class ViewJSON:
    """
        Shows the body as pretty-printed JSON lines.
    """
    name = "JSON"
    prompt = ("json", "s")
    content_types = ["application/json"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("JSON", widgets), or None when utils.pretty_json gives
            nothing back for content.
        """
        lines = utils.pretty_json(content)
        if not lines:
            return None
        txt = []
        shown = 0
        for line in lines:
            shown += len(line)
            txt.append(urwid.Text(("text", line)))
            # The line that crosses the limit is still displayed.
            if shown > limit:
                break
        total = sum(len(line) for line in lines)
        trailer(total, txt, limit)
        return "JSON", txt


class ViewHTML:
    """
        Pretty-prints HTML with lxml.
    """
    name = "HTML"
    prompt = ("html", "h")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("HTML", widgets), or None when utils.isXML rejects the
            content.
        """
        if not utils.isXML(content):
            return None
        parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)
        tree = lxml.html.fromstring(content, parser=parser)
        doctype = tree.getroottree().docinfo.doctype
        pretty = lxml.etree.tostring(tree, pretty_print=True, doctype=doctype)
        return "HTML", _view_text(pretty[:limit], len(pretty), limit)


class ViewHTMLOutline:
    """
        Shows an HTML body as a text outline produced by html2text.
    """
    name = "HTML Outline"
    prompt = ("html outline", "o")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        # The body is decoded as UTF-8 before being handed to html2text.
        decoded = content.decode("utf-8")
        converter = html2text.HTML2Text(baseurl="")
        converter.ignore_images = True
        converter.body_width = 0
        outline = converter.handle(decoded)
        return "HTML Outline", _view_text(outline[:limit], len(outline), limit)


class ViewURLEncoded:
    """
        Shows a URL-encoded form body as a key/value table.
    """
    name = "URL-encoded"
    prompt = ("urlencoded", "u")
    content_types = ["application/x-www-form-urlencoded"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("URLEncoded form", widgets), or None when
            utils.urldecode gives nothing back for content.
        """
        pairs = utils.urldecode(content)
        if not pairs:
            return None
        rows = [(field + ":", value) for (field, value) in pairs]
        body = common.format_keyvals(rows, key="header", val="text")
        return "URLEncoded form", body


class ViewMultipart:
    """
        Shows the named fields of a multipart form body as a key/value table.
    """
    name = "Multipart Form"
    prompt = ("multipart", "m")
    content_types = ["multipart/form-data"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("Multipart form", widgets), or None when there is no
            content-type header, it cannot be parsed, or it has no boundary.
        """
        ctype = hdrs.get_first("content-type")
        if not ctype:
            return None
        parsed = utils.parse_content_type(ctype)
        if not parsed:
            return None
        boundary = parsed[2].get("boundary")
        if not boundary:
            return None

        name_rx = re.compile(r'\bname="([^"]+)"')
        fields = []
        for section in content.split("--" + boundary):
            lines = section.splitlines()
            # Skip fragments too short to hold a header line, and the
            # fragment that follows the closing "--boundary--" marker.
            if len(lines) <= 1 or lines[0][0:2] == "--":
                continue
            found = name_rx.search(lines[1])
            if not found:
                continue
            # The value starts after the first empty line at or beyond
            # index 2.
            value_start = 3 + lines[2:].index("")
            fields.append((
                found.group(1) + ":",
                netlib.utils.cleanBin("\n".join(lines[value_start:])),
            ))

        r = [urwid.Text(("highlight", "Form data:\n"))]
        r.extend(common.format_keyvals(fields, key="header", val="text"))
        return "Multipart form", r


if pyamf:
    class DummyObject(dict):
        """
            Dict stand-in handed out by pyamf_class_loader when no other
            registered loader resolves a class alias.
        """
        def __init__(self, alias):
            # The alias argument is accepted but not stored.
            dict.__init__(self)

        def __readamf__(self, input):
            # Keep whatever readObject() yields under the "data" key.
            data = input.readObject()
            self["data"] = data

    def pyamf_class_loader(s):
        """
            Asks every other loader in pyamf.CLASS_LOADERS for s and returns
            the first truthy answer, or DummyObject when none has one.
        """
        for i in pyamf.CLASS_LOADERS:
            # Skip ourselves, since this loader is registered in the same list.
            if i != pyamf_class_loader:
                v = i(s)
                if v:
                    return v
        return DummyObject

    pyamf.register_class_loader(pyamf_class_loader)

    class ViewAMF:
        """
            Decodes an AMF remoting envelope and shows each message as
            indented JSON.
        """
        name = "AMF"
        prompt = ("amf", "f")
        content_types = ["application/x-amf"]

        def unpack(self, b, seen=None):
            """
                Recursively reduces a decoded AMF value to plain containers.

                seen holds the ids of DummyObjects already visited during
                this traversal; a repeat visit yields "<recursion>". Dicts
                are updated in place.
            """
            # A fresh set per top-level call: a shared default would keep ids
            # from earlier, unrelated calls and produce false "<recursion>"
            # markers once ids are reused.
            if seen is None:
                seen = set()
            if hasattr(b, "body"):
                return self.unpack(b.body, seen)
            if isinstance(b, DummyObject):
                if id(b) in seen:
                    return "<recursion>"
                else:
                    seen.add(id(b))
                    for k, v in b.items():
                        b[k] = self.unpack(v, seen)
                    return b
            elif isinstance(b, dict):
                for k, v in b.items():
                    b[k] = self.unpack(v, seen)
                return b
            elif isinstance(b, list):
                # Pass seen along so list members share the traversal state.
                return [self.unpack(i, seen) for i in b]
            elif isinstance(b, flex.ArrayCollection):
                return [self.unpack(i, seen) for i in b]
            else:
                return b

        def __call__(self, hdrs, content, limit):
            """
                Returns ("AMF v<version>", widgets), or None when decoding
                yields a falsy envelope.
            """
            envelope = remoting.decode(content, strict=False)
            if not envelope:
                return None


            txt = []
            for target, message in iter(envelope):
                if isinstance(message, pyamf.remoting.Request):
                    txt.append(urwid.Text([
                        ("header", "Request: "),
                        ("text", str(target)),
                    ]))
                else:
                    txt.append(urwid.Text([
                        ("header", "Response: "),
                        ("text", "%s, code %s"%(target, message.status)),
                    ]))

                s = json.dumps(self.unpack(message), indent=4)
                txt.extend(_view_text(s[:limit], len(s), limit))

            return "AMF v%s"%envelope.amfVersion, txt


class ViewJavaScript:
    """
        Shows the first limit characters of a script, re-indented by
        jsbeautifier.
    """
    name = "JavaScript"
    prompt = ("javascript", "j")
    content_types = [
        "application/x-javascript",
        "application/javascript",
        "text/javascript"
    ]
    def __call__(self, hdrs, content, limit):
        options = jsbeautifier.default_options()
        options.indent_size = 2
        # Only the visible prefix is beautified; the trailer still reports
        # against the full body length.
        pretty = jsbeautifier.beautify(content[:limit], options)
        return "JavaScript", _view_text(pretty, len(content), limit)


class ViewImage:
    """
        Shows image metadata (format, size, mode, info entries and EXIF tags)
        as a key/value table.
    """
    name = "Image"
    prompt = ("image", "i")
    content_types = [
        "image/png",
        "image/jpeg",
        "image/gif",
        "image/vnd.microsoft.icon",
        "image/x-icon",
    ]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("<format> image", widgets), or None when Image.open
            raises IOError for content.
        """
        try:
            img = Image.open(cStringIO.StringIO(content))
        except IOError:
            return None
        parts = [
            ("Format", str(img.format_description)),
            ("Size", "%s x %s px"%img.size),
            ("Mode", str(img.mode)),
        ]
        # Info entries in sorted key order; the "exif" entry is left out
        # here and EXIF tags are listed separately below.
        parts.extend(
            (str(key), str(img.info[key]))
            for key in sorted(img.info.keys())
            if key != "exif"
        )
        exif = img._getexif() if hasattr(img, "_getexif") else None
        if exif:
            # Use the tag name from TAGS when known, else the numeric id.
            parts.extend(
                (str(TAGS.get(tag_id, tag_id)), str(exif[tag_id]))
                for tag_id in sorted(exif.keys())
            )
        clean = [
            [netlib.utils.cleanBin(label), netlib.utils.cleanBin(value)]
            for label, value in parts
        ]
        fmt = common.format_keyvals(clean, key="header", val="text")
        return "%s image"%img.format, fmt

class ViewProtobuf:
    """Human friendly view of protocol buffers
    The view uses the protoc compiler to decode the binary
    """

    name = "Protocol Buffer"
    prompt = ("protobuf", "p")
    content_types = ["application/x-protobuf"]

    @staticmethod
    def is_available():
        """
            Returns True when running "protoc --version" succeeds and its
            output starts with "libprotoc"; False on any error.
        """
        try:
            p = subprocess.Popen(["protoc", "--version"], stdout=subprocess.PIPE)
            out, _ = p.communicate()
            return out.startswith("libprotoc")
        # Best-effort probe: any ordinary failure means "not available", but
        # KeyboardInterrupt/SystemExit must not be swallowed here.
        except Exception:
            return False

    def decode_protobuf(self, content):
        """
            Pipes content through "protoc --decode_raw" and returns what the
            process wrote to stdout.
        """
        # if Popen raises OSError, it will be caught in
        # get_content_view and fall back to Raw
        p = subprocess.Popen(['protoc', '--decode_raw'],
                             stdin=subprocess.PIPE,
                             stdout=subprocess.PIPE,
                             stderr=subprocess.PIPE)
        out, _ = p.communicate(input=content)
        return out

    def __call__(self, hdrs, content, limit):
        """
            Returns ("Protobuf", widgets), or None when protoc produced no
            output for content.
        """
        decoded = self.decode_protobuf(content)
        # No output means protoc could not decode the body; return None so
        # the caller falls back to Raw instead of showing an empty view.
        if not decoded:
            return None
        txt = _view_text(decoded[:limit], len(decoded), limit)
        return "Protobuf", txt

# Registry of view instances. Order matters: ViewAuto dispatches to the
# first view registered for a content type, and the lookups in get() and
# get_by_shortcut() return the first match.
views = [
    ViewAuto(),
    ViewRaw(),
    ViewHex(),
    ViewJSON(),
    ViewXML(),
    ViewHTML(),
    ViewHTMLOutline(),
    ViewJavaScript(),
    ViewURLEncoded(),
    ViewMultipart(),
    ViewImage(),
]
# The AMF view exists only when pyamf could be imported.
if pyamf:
    views.append(ViewAMF())

# The protobuf view is registered only when the protoc probe succeeds;
# the probe runs once, at import time.
if ViewProtobuf.is_available():
    views.append(ViewProtobuf())

# Maps a content type string to the list of views that declare it, in
# registration order.
content_types_map = {}
for i in views:
    for ct in i.content_types:
        l = content_types_map.setdefault(ct, [])
        l.append(i)


# (label, shortcut key) pairs for every registered view.
view_prompts = [i.prompt for i in views]


def get_by_shortcut(c):
    """
        Returns the first registered view whose prompt shortcut equals c,
        or None when there is no such view.
    """
    return next((view for view in views if view.prompt[1] == c), None)


def get(name):
    """
        Returns the first registered view whose name equals name, or None
        when there is no such view.
    """
    return next((view for view in views if view.name == name), None)


def get_content_view(viewmode, hdrItems, content, limit, logfunc):
    """
        Returns a (msg, body) tuple.

        viewmode is called as viewmode(hdrs, content, limit) and is expected
        to return a (description, body) pair or a falsy value. hdrItems is
        an iterable of header pairs, limit is passed through to the view, and
        logfunc receives the formatted traceback if the view raises.

        The body is decoded first when a content-encoding other than
        "identity" is present and decoding succeeds. When the view raises or
        returns nothing, the Raw view is used instead and msg says so.
    """
    if not content:
        return ("No content", "")
    msg = []

    hdrs = flow.ODictCaseless([list(i) for i in hdrItems])

    enc = hdrs.get_first("content-encoding")
    if enc and enc != "identity":
        decoded = encoding.decode(enc, content)
        # A falsy result leaves the original body in place.
        if decoded:
            content = decoded
            msg.append("[decoded %s]"%enc)
    try:
        ret = viewmode(hdrs, content, limit)
    # Third-party viewers can fail in unexpected ways...
    except Exception:
        logfunc("Content viewer failed: \n" + traceback.format_exc())
        ret = None
    if not ret:
        ret = get("Raw")(hdrs, content, limit)
        msg.append("Couldn't parse: falling back to Raw")
    else:
        msg.append(ret[0])
    return " ".join(msg), ret[1]
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`import re, cStringIO, traceback, json`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import urwid`
Workaround for PIL's ambiguious import method and/or easy_install PIL packaging problem. PIL documents two different way to import it's modules: * import Image (http://www.pythonware.com/library/pil/handbook/introduction.htm) * from PIL import Image (http://www.pythonware.com/library/pil/handbook/image.htm) The same problem was noted in Django at https://code.djangoproject.com/ticket/6054 2012-11-23 16:48:24 +00:00
			`try: from PIL import Image`
			`except ImportError: import Image`

			`try: from PIL.ExifTags import TAGS`
			`except ImportError: from ExifTags import TAGS`

Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`import lxml.html, lxml.etree`
Move cleanBin and hexdump into netutils. 2012-09-23 23:21:12 +00:00			`import netlib.utils`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import common`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`from .. import utils, encoding, flow`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`from ..contrib import jsbeautifier, html2text`
Adds a new view for protocol buffers The view uses protoc from the Google protocol buffer tools. If the tool isn't installed, the view isn't shown. Google protobuf repo: https://code.google.com/p/protobuf/ 2013-04-06 18:18:12 +00:00			`import subprocess`
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`try:`
			`import pyamf`
Substantially rewrite AMF decoding. This is tricky, but we should now handle a lot more corner-cases. 2012-11-26 00:25:07 +00:00			`from pyamf import remoting, flex`
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`except ImportError: # pragma nocover`
			`pyamf = None`

Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`VIEW_CUTOFF = 1024*50`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`def _view_text(content, total, limit):`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`"""`
			`Generates a body for a chunk of text.`
			`"""`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt = []`
Move cleanBin and hexdump into netutils. 2012-09-23 23:21:12 +00:00			`for i in netlib.utils.cleanBin(content).splitlines():`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Wrap on any character for body text display. 2012-04-08 03:00:38 +00:00			`urwid.Text(("text", i), wrap="any")`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`trailer(total, txt, limit)`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`return txt`


Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def trailer(clen, txt, limit):`
			`rem = clen - limit`
			`if rem > 0:`
			`txt.append(urwid.Text(""))`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`urwid.Text(`
			`[`
			`("highlight", "... %s of data not shown. Press "%utils.pretty_size(rem)),`
			`("key", "f"),`
			`("highlight", " to load all data.")`
			`]`
			`)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewAuto:`
			`name = "Auto"`
			`prompt = ("auto", "a")`
			`content_types = []`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`def __call__(self, hdrs, content, limit):`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`ctype = hdrs.get_first("content-type")`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`if ctype:`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`ct = utils.parse_content_type(ctype) if ctype else None`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`ct = "%s/%s"%(ct[0], ct[1])`
			`if ct in content_types_map:`
			`return content_types_map[ct][0](hdrs, content, limit)`
			`elif utils.isXML(content):`
			`return get("XML")(hdrs, content, limit)`
			`return get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewRaw:`
			`name = "Raw"`
			`prompt = ("raw", "r")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "Raw", txt`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewHex:`
			`name = "Hex"`
			`prompt = ("hex", "e")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt = []`
Move cleanBin and hexdump into netutils. 2012-09-23 23:21:12 +00:00			`for offset, hexa, s in netlib.utils.hexdump(content[:limit]):`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`txt.append(urwid.Text([`
			`("offset", offset),`
			`" ",`
			`("text", hexa),`
			`" ",`
			`("text", s),`
			`]))`
			`trailer(len(content), txt, limit)`
			`return "Hex", txt`


			`class ViewXML:`
			`name = "XML"`
			`prompt = ("xml", "x")`
			`content_types = ["text/xml"]`
			`def __call__(self, hdrs, content, limit):`
			`parser = lxml.etree.XMLParser(remove_blank_text=True, resolve_entities=False, strip_cdata=False, recover=False)`
			`try:`
			`document = lxml.etree.fromstring(content, parser)`
			`except lxml.etree.XMLSyntaxError:`
			`return None`
			`docinfo = document.getroottree().docinfo`

			`prev = []`
			`p = document.getroottree().getroot().getprevious()`
			`while p is not None:`
			`prev.insert(`
			`0,`
			`lxml.etree.tostring(p)`
			`)`
			`p = p.getprevious()`
			`doctype=docinfo.doctype`
			`if prev:`
			`doctype += "\n".join(prev).strip()`
			`doctype = doctype.strip()`

			`s = lxml.etree.tostring(`
			`document,`
			`pretty_print=True,`
			`xml_declaration=True,`
			`doctype=doctype or None,`
			`encoding = docinfo.encoding`
			`)`

			`txt = []`
			`for i in s[:limit].strip().split("\n"):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`trailer(len(content), txt, limit)`
			`return "XML-like data", txt`


			`class ViewJSON:`
			`name = "JSON"`
Correct display mode highlight keys Add html display mode to the help documentation. Correct html and hex display mode highlight keys (help used 'h' for hex). Correct json display mode highlight keys. 2013-04-16 21:54:34 +00:00			`prompt = ("json", "s")`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`content_types = ["application/json"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.pretty_json(content)`
			`if lines:`
			`txt = []`
			`sofar = 0`
			`for i in lines:`
			`sofar += len(i)`
			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
			`if sofar > limit:`
			`break`
			`trailer(sum(len(i) for i in lines), txt, limit)`
			`return "JSON", txt`


			`class ViewHTML:`
			`name = "HTML"`
			`prompt = ("html", "h")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`if utils.isXML(content):`
			`parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)`
			`d = lxml.html.fromstring(content, parser=parser)`
			`docinfo = d.getroottree().docinfo`
			`s = lxml.etree.tostring(d, pretty_print=True, doctype=docinfo.doctype)`
			`return "HTML", _view_text(s[:limit], len(s), limit)`


			`class ViewHTMLOutline:`
			`name = "HTML Outline"`
			`prompt = ("html outline", "o")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`content = content.decode("utf-8")`
			`h = html2text.HTML2Text(baseurl="")`
			`h.ignore_images = True`
			`h.body_width = 0`
			`content = h.handle(content)`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "HTML Outline", txt`


			`class ViewURLEncoded:`
			`name = "URL-encoded"`
			`prompt = ("urlencoded", "u")`
			`content_types = ["application/x-www-form-urlencoded"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.urldecode(content)`
			`if lines:`
			`body = common.format_keyvals(`
			`[(k+":", v) for (k, v) in lines],`
			`key = "header",`
			`val = "text"`
			`)`
			`return "URLEncoded form", body`


			`class ViewMultipart:`
			`name = "Multipart Form"`
			`prompt = ("multipart", "m")`
			`content_types = ["multipart/form-data"]`
			`def __call__(self, hdrs, content, limit):`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`v = hdrs.get_first("content-type")`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`if v:`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`v = utils.parse_content_type(v)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`if not v:`
			`return`
			`boundary = v[2].get("boundary")`
			`if not boundary:`
			`return`

			`rx = re.compile(r'\bname="([^"]+)"')`
			`keys = []`
			`vals = []`

			`for i in content.split("--" + boundary):`
			`parts = i.splitlines()`
			`if len(parts) > 1 and parts[0][0:2] != "--":`
			`match = rx.search(parts[1])`
			`if match:`
			`keys.append(match.group(1) + ":")`
Move cleanBin and hexdump into netutils. 2012-09-23 23:21:12 +00:00			`vals.append(netlib.utils.cleanBin(`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`"\n".join(parts[3+parts[2:].index(""):])`
			`))`
			`r = [`
			`urwid.Text(("highlight", "Form data:\n")),`
			`]`
			`r.extend(common.format_keyvals(`
			`zip(keys, vals),`
			`key = "header",`
			`val = "text"`
			`))`
			`return "Multipart form", r`


Substantially rewrite AMF decoding. This is tricky, but we should now handle a lot more corner-cases. 2012-11-26 00:25:07 +00:00			`if pyamf:`
			`class DummyObject(dict):`
			`def __init__(self, alias):`
			`dict.__init__(self)`

			`def __readamf__(self, input):`
			`data = input.readObject()`
			`self["data"] = data`

			`def pyamf_class_loader(s):`
			`for i in pyamf.CLASS_LOADERS:`
			`if i != pyamf_class_loader:`
			`v = i(s)`
			`if v:`
			`return v`
			`return DummyObject`

			`pyamf.register_class_loader(pyamf_class_loader)`

			`class ViewAMF:`
			`name = "AMF"`
			`prompt = ("amf", "f")`
			`content_types = ["application/x-amf"]`

			`def unpack(self, b, seen=set([])):`
			`if hasattr(b, "body"):`
			`return self.unpack(b.body, seen)`
			`if isinstance(b, DummyObject):`
			`if id(b) in seen:`
			`return "<recursion>"`
			`else:`
			`seen.add(id(b))`
			`for k, v in b.items():`
			`b[k] = self.unpack(v, seen)`
			`return b`
			`elif isinstance(b, dict):`
			`for k, v in b.items():`
			`b[k] = self.unpack(v, seen)`
			`return b`
			`elif isinstance(b, list):`
			`return [self.unpack(i) for i in b]`
			`elif isinstance(b, flex.ArrayCollection):`
			`return [self.unpack(i, seen) for i in b]`
			`else:`
			`return b`

			`def __call__(self, hdrs, content, limit):`
			`envelope = remoting.decode(content, strict=False)`
			`if not envelope:`
			`return None`
Further content view cleaups. 2012-08-18 05:51:34 +00:00

Substantially rewrite AMF decoding. This is tricky, but we should now handle a lot more corner-cases. 2012-11-26 00:25:07 +00:00			`txt = []`
			`for target, message in iter(envelope):`
			`if isinstance(message, pyamf.remoting.Request):`
			`txt.append(urwid.Text([`
			`("header", "Request: "),`
			`("text", str(target)),`
			`]))`
			`else:`
			`txt.append(urwid.Text([`
			`("header", "Response: "),`
			`("text", "%s, code %s"%(target, message.status)),`
			`]))`

			`s = json.dumps(self.unpack(message), indent=4)`
			`txt.extend(_view_text(s[:limit], len(s), limit))`

			`return "AMF v%s"%envelope.amfVersion, txt`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00

			`class ViewJavaScript:`
			`name = "JavaScript"`
			`prompt = ("javascript", "j")`
			`content_types = [`
			`"application/x-javascript",`
			`"application/javascript",`
			`"text/javascript"`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`opts = jsbeautifier.default_options()`
			`opts.indent_size = 2`
			`res = jsbeautifier.beautify(content[:limit], opts)`
			`return "JavaScript", _view_text(res, len(content), limit)`


			`class ViewImage:`
			`name = "Image"`
			`prompt = ("image", "i")`
			`content_types = [`
			`"image/png",`
			`"image/jpeg",`
			`"image/gif",`
			`"image/vnd.microsoft.icon",`
			`"image/x-icon",`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`try:`
			`img = Image.open(cStringIO.StringIO(content))`
			`except IOError:`
			`return None`
			`parts = [`
			`("Format", str(img.format_description)),`
			`("Size", "%s x %s px"%img.size),`
			`("Mode", str(img.mode)),`
Re-enable simple multipart form parsing and preview. 2012-03-24 21:10:48 +00:00			`]`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`for i in sorted(img.info.keys()):`
			`if i != "exif":`
			`parts.append(`
			`(str(i), str(img.info[i]))`
			`)`
			`if hasattr(img, "_getexif"):`
			`ex = img._getexif()`
			`if ex:`
			`for i in sorted(ex.keys()):`
			`tag = TAGS.get(i, i)`
			`parts.append(`
			`(str(tag), str(ex[i]))`
			`)`
			`clean = []`
			`for i in parts:`
Move cleanBin and hexdump into netutils. 2012-09-23 23:21:12 +00:00			`clean.append([netlib.utils.cleanBin(i[0]), netlib.utils.cleanBin(i[1])])`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`fmt = common.format_keyvals(`
			`clean,`
			`key = "header",`
			`val = "text"`
			`)`
			`return "%s image"%img.format, fmt`

Adds a new view for protocol buffers The view uses protoc from the Google protocol buffer tools. If the tool isn't installed, the view isn't shown. Google protobuf repo: https://code.google.com/p/protobuf/ 2013-04-06 18:18:12 +00:00			`class ViewProtobuf:`
			`"""Human friendly view of protocol buffers`
			`The view uses the protoc compiler to decode the binary`
			`"""`

			`name = "Protocol Buffer"`
			`prompt = ("protobuf", "p")`
			`content_types = ["application/x-protobuf"]`

			`@staticmethod`
			`def is_available():`
			`try:`
			`p = subprocess.Popen(["protoc", "--version"], stdout=subprocess.PIPE)`
			`out, _ = p.communicate()`
			`return out.startswith("libprotoc")`
			`except:`
			`return False`

			`def decode_protobuf(self, content):`
			`# if Popen raises OSError, it will be caught in`
			`# get_content_view and fall back to Raw`
			`p = subprocess.Popen(['protoc', '--decode_raw'],`
			`stdin=subprocess.PIPE,`
			`stdout=subprocess.PIPE,`
			`stderr=subprocess.PIPE)`
			`out, _ = p.communicate(input=content)`
			`return out`

			`def __call__(self, hdrs, content, limit):`
			`decoded = self.decode_protobuf(content)`
			`txt = _view_text(decoded[:limit], len(decoded), limit)`
			`return "Protobuf", txt`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00
			`views = [`
			`ViewAuto(),`
			`ViewRaw(),`
			`ViewHex(),`
			`ViewJSON(),`
			`ViewXML(),`
			`ViewHTML(),`
			`ViewHTMLOutline(),`
			`ViewJavaScript(),`
			`ViewURLEncoded(),`
			`ViewMultipart(),`
			`ViewImage(),`
			`]`
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`if pyamf:`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`views.append(ViewAMF())`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Adds a new view for protocol buffers The view uses protoc from the Google protocol buffer tools. If the tool isn't installed, the view isn't shown. Google protobuf repo: https://code.google.com/p/protobuf/ 2013-04-06 18:18:12 +00:00			`if ViewProtobuf.is_available():`
			`views.append(ViewProtobuf())`

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`content_types_map = {}`
			`for i in views:`
			`for ct in i.content_types:`
			`l = content_types_map.setdefault(ct, [])`
			`l.append(i)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`view_prompts = [i.prompt for i in views]`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def get_by_shortcut(c):`
			`for i in views:`
			`if i.prompt[1] == c:`
			`return i`


			`def get(name):`
			`for i in views:`
			`if i.name == name:`
			`return i`

Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Send tracebacks from content viewers to event log. Also, 100% test coverage for content viewers. 2012-08-18 05:42:40 +00:00			`def get_content_view(viewmode, hdrItems, content, limit, logfunc):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`"""`
			`Returns a (msg, body) tuple.`
			`"""`
Display "No Content" instead of a parse error when there is no content. 2012-08-30 00:51:04 +00:00			`if not content:`
			`return ("No content", "")`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`msg = []`

			`hdrs = flow.ODictCaseless([list(i) for i in hdrItems])`

Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`enc = hdrs.get_first("content-encoding")`
			`if enc and enc != "identity":`
			`decoded = encoding.decode(enc, content)`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`if decoded:`
			`content = decoded`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`msg.append("[decoded %s]"%enc)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`try:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`ret = viewmode(hdrs, content, limit)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`# Third-party viewers can fail in unexpected ways...`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`except Exception, e:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`s = traceback.format_exc()`
Send tracebacks from content viewers to event log. Also, 100% test coverage for content viewers. 2012-08-18 05:42:40 +00:00			`s = "Content viewer failed: \n" + s`
			`logfunc(s)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`ret = None`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`if not ret:`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`ret = get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`msg.append("Couldn't parse: falling back to Raw")`
Make it clearer when we fall back to Raw. 2012-04-01 23:22:01 +00:00			`else:`
			`msg.append(ret[0])`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`return " ".join(msg), ret[1]`