mitmproxy/libmproxy/console/contentview.py

import re, cStringIO, traceback, json
import urwid
from PIL import Image
from PIL.ExifTags import TAGS
import lxml.html, lxml.etree
import common
from .. import utils, encoding, flow
from ..contrib import jsbeautifier, html2text

try:
    import pyamf
    from pyamf import remoting
except ImportError: # pragma nocover
    pyamf = None


VIEW_CUTOFF = 1024*50


def _view_text(content, total, limit):
    """
        Builds the display body for a chunk of text.

        content is the text to show (callers pass it already truncated). It
        is run through utils.cleanBin and split into lines, each of which
        becomes one urwid.Text widget that wraps on any character.

        total and limit are handed to trailer(), which appends a "data not
        shown" notice when total exceeds limit.

        Returns the list of widgets.
    """
    cleaned = utils.cleanBin(content)
    body = [
        urwid.Text(("text", line), wrap="any")
        for line in cleaned.splitlines()
    ]
    trailer(total, body, limit)
    return body


def trailer(clen, txt, limit):
    """
        Appends a "data not shown" notice to txt, in place.

        clen is the full length of the data and limit the amount that was
        displayed. Nothing is appended unless clen exceeds limit; otherwise
        a blank line and a highlighted hint (naming the "f" key) are added.
    """
    remaining = clen - limit
    if remaining <= 0:
        return
    txt.append(urwid.Text(""))
    notice = [
        ("highlight", "... %s of data not shown. Press "%utils.pretty_size(remaining)),
        ("key", "f"),
        ("highlight", " to load all data."),
    ]
    txt.append(urwid.Text(notice))


class ViewAuto:
    """
        Chooses a viewer from the message's content-type header.

        When the header names a type registered in content_types_map, the
        first viewer registered for that type is used. When a header is
        present but does not lead to a registered viewer, content that
        utils.isXML accepts is shown with the XML viewer. Everything else,
        including messages without a content-type header, goes to Raw.
    """
    name = "Auto"
    prompt = ("auto", "a")
    content_types = []
    def __call__(self, hdrs, content, limit):
        """
            hdrs: header container offering get_first(name).
            content: the body to display.
            limit: display limit, passed through to the chosen viewer.

            Returns whatever the chosen viewer returns.
        """
        ctype = hdrs.get_first("content-type")
        if ctype:
            parsed = utils.parse_content_type(ctype)
            # ViewMultipart in this file checks for a false return from
            # parse_content_type, so guard here too rather than indexing
            # into it blindly (presumably this is the malformed-header
            # case - confirm against utils).
            if parsed:
                ct = "%s/%s"%(parsed[0], parsed[1])
                if ct in content_types_map:
                    return content_types_map[ct][0](hdrs, content, limit)
            if utils.isXML(content):
                return get("XML")(hdrs, content, limit)
        return get("Raw")(hdrs, content, limit)


class ViewRaw:
    """
        Shows the content as plain text, cut off at the display limit.
    """
    name = "Raw"
    prompt = ("raw", "r")
    content_types = []
    def __call__(self, hdrs, content, limit):
        """
            Returns ("Raw", widgets) for the first limit items of content.
            hdrs is accepted for interface compatibility and not used.
        """
        visible = content[:limit]
        return "Raw", _view_text(visible, len(content), limit)


class ViewHex:
    """
        Shows the content as a hex dump.
    """
    name = "Hex"
    prompt = ("hex", "e")
    content_types = []
    def __call__(self, hdrs, content, limit):
        """
            Returns ("Hex", widgets). Only content[:limit] is dumped; each
            (offset, hex, text) triple yielded by utils.hexdump becomes one
            widget row, and trailer() notes any data left out.
        """
        rows = [
            urwid.Text([
                ("offset", offset),
                " ",
                ("text", hexa),
                "   ",
                ("text", printable),
            ])
            for offset, hexa, printable in utils.hexdump(content[:limit])
        ]
        trailer(len(content), rows, limit)
        return "Hex", rows


class ViewXML:
    """
        Pretty-prints XML content using lxml.
    """
    name = "XML"
    prompt = ("xml", "x")
    content_types = ["text/xml"]
    def __call__(self, hdrs, content, limit):
        """
            Parses content strictly (no recovery, entities left unresolved)
            and re-serialises it with indentation.

            Returns ("XML-like data", widgets), or None when lxml reports
            a syntax error so the caller can fall back to another view.
        """
        parser = lxml.etree.XMLParser(
            remove_blank_text=True,
            resolve_entities=False,
            strip_cdata=False,
            recover=False
        )
        try:
            document = lxml.etree.fromstring(content, parser)
        except lxml.etree.XMLSyntaxError:
            return None
        docinfo = document.getroottree().docinfo

        # Gather whatever lxml reports as preceding the root element
        # (presumably comments / processing instructions) in document
        # order, so it can be re-emitted together with the doctype.
        prev = []
        p = document.getroottree().getroot().getprevious()
        while p is not None:
            prev.insert(
                0,
                lxml.etree.tostring(p)
            )
            p = p.getprevious()
        doctype = docinfo.doctype
        if prev:
            doctype += "\n".join(prev).strip()
        doctype = doctype.strip()

        s = lxml.etree.tostring(
                document,
                pretty_print=True,
                xml_declaration=True,
                doctype=doctype or None,
                encoding = docinfo.encoding
            )

        txt = []
        for i in s[:limit].strip().split("\n"):
            txt.append(
                urwid.Text(("text", i)),
            )
        # The truncation above is applied to the pretty-printed output, so
        # the "not shown" size must be based on its length, not on the
        # length of the raw input.
        trailer(len(s), txt, limit)
        return "XML-like data", txt


class ViewJSON:
    """
        Shows JSON content as re-indented text.
    """
    name = "JSON"
    prompt = ("json", "j")
    content_types = ["application/json"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("JSON", widgets), or None when utils.pretty_json
            yields nothing for content.

            Lines are emitted until their accumulated length passes limit
            (the line that crosses the limit is still shown). The trailer
            is sized from the summed length of all lines.
        """
        lines = utils.pretty_json(content)
        if not lines:
            return None
        widgets = []
        shown = 0
        for line in lines:
            shown += len(line)
            widgets.append(urwid.Text(("text", line)))
            if shown > limit:
                break
        total = sum(len(line) for line in lines)
        trailer(total, widgets, limit)
        return "JSON", widgets


class ViewHTML:
    """
        Pretty-prints HTML content using lxml.
    """
    name = "HTML"
    prompt = ("html", "h")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("HTML", widgets) for content that utils.isXML accepts,
            and None otherwise. The markup is parsed with lxml's HTML
            parser and serialised again with indentation, keeping the
            document's doctype.
        """
        if not utils.isXML(content):
            return None
        html_parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)
        tree = lxml.html.fromstring(content, parser=html_parser)
        doctype = tree.getroottree().docinfo.doctype
        pretty = lxml.etree.tostring(tree, pretty_print=True, doctype=doctype)
        return "HTML", _view_text(pretty[:limit], len(pretty), limit)


class ViewHTMLOutline:
    """
        Shows an HTML document as a plain-text outline via html2text.
    """
    name = "HTML Outline"
    prompt = ("html outline", "o")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        """
            Decodes content as UTF-8, converts it with html2text (images
            ignored, body_width set to 0) and returns
            ("HTML Outline", widgets) for the first limit characters of
            the converted text.
        """
        decoded = content.decode("utf-8")
        converter = html2text.HTML2Text(baseurl="")
        converter.ignore_images = True
        converter.body_width = 0
        outline = converter.handle(decoded)
        return "HTML Outline", _view_text(outline[:limit], len(outline), limit)


class ViewURLEncoded:
    """
        Shows a URL-encoded form body as a key/value listing.
    """
    name = "URL-encoded"
    prompt = ("urlencoded", "u")
    content_types = ["application/x-www-form-urlencoded"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("URLEncoded form", widgets), or None when
            utils.urldecode yields nothing for content. Each key is shown
            with a trailing colon. limit is not applied by this view.
        """
        pairs = utils.urldecode(content)
        if not pairs:
            return None
        labelled = [(key + ":", value) for (key, value) in pairs]
        return "URLEncoded form", common.format_keyvals(
            labelled,
            key = "header",
            val = "text"
        )


class ViewMultipart:
    """
        Shows the fields of a multipart form body as a key/value listing.
    """
    name = "Multipart Form"
    prompt = ("multipart", "m")
    content_types = ["multipart/form-data"]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("Multipart form", widgets), or None when there is no
            content-type header, it cannot be parsed, or it carries no
            boundary parameter.

            The body is split on "--" + boundary. For each piece, the
            second line is searched for name="..."; the field value is
            everything after the first empty line found from the third
            line onwards. limit is not applied by this view.
        """
        ctype = hdrs.get_first("content-type")
        if not ctype:
            return None
        parsed = utils.parse_content_type(ctype)
        if not parsed:
            return None
        boundary = parsed[2].get("boundary")
        if not boundary:
            return None

        name_rx = re.compile(r'\bname="([^"]+)"')
        fields = []
        delimiter = "--" + boundary
        for chunk in content.split(delimiter):
            parts = chunk.splitlines()
            # Skip pieces that are too short, or whose first line starts
            # with "--".
            if len(parts) <= 1 or parts[0][0:2] == "--":
                continue
            match = name_rx.search(parts[1])
            if not match:
                continue
            # Index of the first empty line, relative to parts[2:].
            blank = parts[2:].index("")
            value = utils.cleanBin("\n".join(parts[3 + blank:]))
            fields.append((match.group(1) + ":", value))

        body = [
            urwid.Text(("highlight", "Form data:\n")),
        ]
        body.extend(common.format_keyvals(
            fields,
            key = "header",
            val = "text"
        ))
        return "Multipart form", body


class ViewAMF:
    """
        Shows an AMF remoting envelope as indented JSON text.
    """
    name = "AMF"
    prompt = ("amf", "f")
    content_types = ["application/x-amf"]
    def __call__(self, hdrs, content, limit):
        """
            Decodes content with pyamf's remoting module and returns
            ("AMF", widgets), or None when the decoded envelope is false.

            The dumped structure holds the envelope's amfVersion plus one
            entry per target, carrying the message body and, where the
            message has them, its status and target attributes.
        """
        envelope = remoting.decode(content)
        if not envelope:
            return None

        data = {'amfVersion': envelope.amfVersion}
        for target, message in envelope:
            entry = {}
            for attr in ('status', 'target'):
                if hasattr(message, attr):
                    entry[attr] = getattr(message, attr)
            entry['body'] = message.body
            data[target] = entry
        dumped = json.dumps(data, indent=4)
        return "AMF", _view_text(dumped[:limit], len(dumped), limit)


class ViewJavaScript:
    """
        Shows JavaScript content re-indented by jsbeautifier.
    """
    name = "JavaScript"
    prompt = ("javascript", "j")
    content_types = [
        "application/x-javascript",
        "application/javascript",
        "text/javascript"
    ]
    def __call__(self, hdrs, content, limit):
        """
            Returns ("JavaScript", widgets). Only content[:limit] is fed
            to the beautifier (indent size 2); the trailer is sized from
            the length of the original content.
        """
        options = jsbeautifier.default_options()
        options.indent_size = 2
        beautified = jsbeautifier.beautify(content[:limit], options)
        return "JavaScript", _view_text(beautified, len(content), limit)


class ViewImage:
    """
        Shows metadata about an image instead of its raw bytes.
    """
    name = "Image"
    prompt = ("image", "i")
    content_types = [
        "image/png",
        "image/jpeg",
        "image/gif",
        "image/vnd.microsoft.icon",
        "image/x-icon",
    ]
    def __call__(self, hdrs, content, limit):
        """
            Opens content with PIL and returns ("<format> image", widgets),
            or None when PIL raises IOError while opening it.

            The listing holds format, size and mode, then every entry of
            img.info except "exif" (sorted by key), then any EXIF tags
            (sorted by tag id, with ids translated through PIL's TAGS
            table where known). All keys and values pass through
            utils.cleanBin. limit is not applied by this view.
        """
        try:
            img = Image.open(cStringIO.StringIO(content))
        except IOError:
            return None
        parts = [
            ("Format", str(img.format_description)),
            ("Size", "%s x %s px"%img.size),
            ("Mode", str(img.mode)),
        ]
        for key in sorted(img.info.keys()):
            if key == "exif":
                continue
            parts.append((str(key), str(img.info[key])))
        # Not every image class provides _getexif.
        exif = img._getexif() if hasattr(img, "_getexif") else None
        if exif:
            for tag_id in sorted(exif.keys()):
                label = TAGS.get(tag_id, tag_id)
                parts.append((str(label), str(exif[tag_id])))
        clean = [
            [utils.cleanBin(pair[0]), utils.cleanBin(pair[1])]
            for pair in parts
        ]
        fmt = common.format_keyvals(
                clean,
                key = "header",
                val = "text"
            )
        return "%s image"%img.format, fmt


# Registry of viewer instances. Order matters: get_by_shortcut() and get()
# return the first match found in this list, and content_types_map records
# the viewers for each content type in this same order.
views = [
    ViewAuto(),
    ViewRaw(),
    ViewHex(),
    ViewJSON(),
    ViewXML(),
    ViewHTML(),
    ViewHTMLOutline(),
    ViewJavaScript(),
    ViewURLEncoded(),
    ViewMultipart(),
    ViewImage(),
]
# pyamf is an optional import (set to None above when it is missing), so
# the AMF viewer is only registered when it is available.
if pyamf:
    views.append(ViewAMF())

# Maps each content-type string declared by a viewer to the list of viewers
# that declared it, in registration order. ViewAuto uses the first entry.
content_types_map = {}
for i in views:
    for ct in i.content_types:
        l = content_types_map.setdefault(ct, [])
        l.append(i)


# The prompt tuple of every registered viewer, in registration order.
view_prompts = [i.prompt for i in views]


def get_by_shortcut(c):
    """
        Returns the first registered view whose prompt shortcut (the second
        item of its prompt tuple) equals c, or None if there is none.

        If several views share a shortcut, the one listed first in views
        wins.
    """
    candidates = (view for view in views if view.prompt[1] == c)
    return next(candidates, None)


def get(name):
    """
        Returns the first registered view whose name attribute equals name,
        or None if no view matches.
    """
    named = [view for view in views if view.name == name]
    if named:
        return named[0]
    return None


def get_content_view(viewmode, hdrItems, content, limit, logfunc):
    """
        Returns a (msg, body) tuple.

        viewmode: the view callable to try, invoked as
        viewmode(hdrs, content, limit).
        hdrItems: iterable of header pairs; wrapped in a flow.ODictCaseless.
        content: the message body. When it is empty, ("No content", "") is
        returned immediately.
        limit: display limit passed on to the view.
        logfunc: called with a traceback string if the view raises.

        If a content-encoding other than "identity" is set and
        encoding.decode produces a result, the decoded body is displayed
        and msg is prefixed with "[decoded <enc>]". If the view raises or
        returns a false value, the Raw view is used instead and msg says
        so; otherwise msg ends with the description the view returned.
    """
    if not content:
        return ("No content", "")
    msg = []

    hdrs = flow.ODictCaseless([list(i) for i in hdrItems])

    enc = hdrs.get_first("content-encoding")
    if enc and enc != "identity":
        decoded = encoding.decode(enc, content)
        if decoded:
            content = decoded
            msg.append("[decoded %s]"%enc)
    try:
        ret = viewmode(hdrs, content, limit)
    # Third-party viewers can fail in unexpected ways, so this boundary
    # deliberately catches everything, reports it, and falls back to Raw.
    except Exception:
        logfunc("Content viewer failed: \n" + traceback.format_exc())
        ret = None
    if not ret:
        ret = get("Raw")(hdrs, content, limit)
        msg.append("Couldn't parse: falling back to Raw")
    else:
        msg.append(ret[0])
    return " ".join(msg), ret[1]
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`import re, cStringIO, traceback, json`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import urwid`
Add a pretty-viewer for images. This shows basic image information like dimensions, plus extracted EXIF tags and other metadata. 2012-03-25 22:26:02 +00:00			`from PIL import Image`
			`from PIL.ExifTags import TAGS`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`import lxml.html, lxml.etree`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import common`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`from .. import utils, encoding, flow`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`from ..contrib import jsbeautifier, html2text`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`try:`
			`import pyamf`
			`from pyamf import remoting`
			`except ImportError: # pragma nocover`
			`pyamf = None`


Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`VIEW_CUTOFF = 1024*50`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`def _view_text(content, total, limit):`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`"""`
			`Generates a body for a chunk of text.`
			`"""`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt = []`
Tune content viewing to maintain responsiveness: - Reduce display cutoff to 20k. - Make sure that we only indent the visible part of a JS body, not the whole thing. 2012-03-31 22:09:25 +00:00			`for i in utils.cleanBin(content).splitlines():`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Wrap on any character for body text display. 2012-04-08 03:00:38 +00:00			`urwid.Text(("text", i), wrap="any")`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`trailer(total, txt, limit)`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`return txt`


Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def trailer(clen, txt, limit):`
			`rem = clen - limit`
			`if rem > 0:`
			`txt.append(urwid.Text(""))`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`urwid.Text(`
			`[`
			`("highlight", "... %s of data not shown. Press "%utils.pretty_size(rem)),`
			`("key", "f"),`
			`("highlight", " to load all data.")`
			`]`
			`)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewAuto:`
			`name = "Auto"`
			`prompt = ("auto", "a")`
			`content_types = []`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`def __call__(self, hdrs, content, limit):`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`ctype = hdrs.get_first("content-type")`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`if ctype:`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`ct = utils.parse_content_type(ctype) if ctype else None`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`ct = "%s/%s"%(ct[0], ct[1])`
			`if ct in content_types_map:`
			`return content_types_map[ct][0](hdrs, content, limit)`
			`elif utils.isXML(content):`
			`return get("XML")(hdrs, content, limit)`
			`return get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewRaw:`
			`name = "Raw"`
			`prompt = ("raw", "r")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "Raw", txt`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewHex:`
			`name = "Hex"`
			`prompt = ("hex", "e")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt = []`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`for offset, hexa, s in utils.hexdump(content[:limit]):`
			`txt.append(urwid.Text([`
			`("offset", offset),`
			`" ",`
			`("text", hexa),`
			`" ",`
			`("text", s),`
			`]))`
			`trailer(len(content), txt, limit)`
			`return "Hex", txt`


			`class ViewXML:`
			`name = "XML"`
			`prompt = ("xml", "x")`
			`content_types = ["text/xml"]`
			`def __call__(self, hdrs, content, limit):`
			`parser = lxml.etree.XMLParser(remove_blank_text=True, resolve_entities=False, strip_cdata=False, recover=False)`
			`try:`
			`document = lxml.etree.fromstring(content, parser)`
			`except lxml.etree.XMLSyntaxError:`
			`return None`
			`docinfo = document.getroottree().docinfo`

			`prev = []`
			`p = document.getroottree().getroot().getprevious()`
			`while p is not None:`
			`prev.insert(`
			`0,`
			`lxml.etree.tostring(p)`
			`)`
			`p = p.getprevious()`
			`doctype=docinfo.doctype`
			`if prev:`
			`doctype += "\n".join(prev).strip()`
			`doctype = doctype.strip()`

			`s = lxml.etree.tostring(`
			`document,`
			`pretty_print=True,`
			`xml_declaration=True,`
			`doctype=doctype or None,`
			`encoding = docinfo.encoding`
			`)`

			`txt = []`
			`for i in s[:limit].strip().split("\n"):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`trailer(len(content), txt, limit)`
			`return "XML-like data", txt`


			`class ViewJSON:`
			`name = "JSON"`
			`prompt = ("json", "j")`
			`content_types = ["application/json"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.pretty_json(content)`
			`if lines:`
			`txt = []`
			`sofar = 0`
			`for i in lines:`
			`sofar += len(i)`
			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
			`if sofar > limit:`
			`break`
			`trailer(sum(len(i) for i in lines), txt, limit)`
			`return "JSON", txt`


			`class ViewHTML:`
			`name = "HTML"`
			`prompt = ("html", "h")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`if utils.isXML(content):`
			`parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)`
			`d = lxml.html.fromstring(content, parser=parser)`
			`docinfo = d.getroottree().docinfo`
			`s = lxml.etree.tostring(d, pretty_print=True, doctype=docinfo.doctype)`
			`return "HTML", _view_text(s[:limit], len(s), limit)`


			`class ViewHTMLOutline:`
			`name = "HTML Outline"`
			`prompt = ("html outline", "o")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`content = content.decode("utf-8")`
			`h = html2text.HTML2Text(baseurl="")`
			`h.ignore_images = True`
			`h.body_width = 0`
			`content = h.handle(content)`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "HTML Outline", txt`


			`class ViewURLEncoded:`
			`name = "URL-encoded"`
			`prompt = ("urlencoded", "u")`
			`content_types = ["application/x-www-form-urlencoded"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.urldecode(content)`
			`if lines:`
			`body = common.format_keyvals(`
			`[(k+":", v) for (k, v) in lines],`
			`key = "header",`
			`val = "text"`
			`)`
			`return "URLEncoded form", body`


			`class ViewMultipart:`
			`name = "Multipart Form"`
			`prompt = ("multipart", "m")`
			`content_types = ["multipart/form-data"]`
			`def __call__(self, hdrs, content, limit):`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`v = hdrs.get_first("content-type")`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`if v:`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`v = utils.parse_content_type(v)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`if not v:`
			`return`
			`boundary = v[2].get("boundary")`
			`if not boundary:`
			`return`

			`rx = re.compile(r'\bname="([^"]+)"')`
			`keys = []`
			`vals = []`

			`for i in content.split("--" + boundary):`
			`parts = i.splitlines()`
			`if len(parts) > 1 and parts[0][0:2] != "--":`
			`match = rx.search(parts[1])`
			`if match:`
			`keys.append(match.group(1) + ":")`
			`vals.append(utils.cleanBin(`
			`"\n".join(parts[3+parts[2:].index(""):])`
			`))`
			`r = [`
			`urwid.Text(("highlight", "Form data:\n")),`
			`]`
			`r.extend(common.format_keyvals(`
			`zip(keys, vals),`
			`key = "header",`
			`val = "text"`
			`))`
			`return "Multipart form", r`


			`class ViewAMF:`
			`name = "AMF"`
			`prompt = ("amf", "f")`
			`content_types = ["application/x-amf"]`
			`def __call__(self, hdrs, content, limit):`
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`envelope = remoting.decode(content)`
			`if not envelope:`
			`return None`

			`data = {}`
			`data['amfVersion'] = envelope.amfVersion`
			`for target, message in iter(envelope):`
			`one_message = {}`

			`if hasattr(message, 'status'):`
			`one_message['status'] = message.status`

			`if hasattr(message, 'target'):`
			`one_message['target'] = message.target`

			`one_message['body'] = message.body`
			`data[target] = one_message`
			`s = json.dumps(data, indent=4)`
			`return "AMF", _view_text(s[:limit], len(s), limit)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00

			`class ViewJavaScript:`
			`name = "JavaScript"`
			`prompt = ("javascript", "j")`
			`content_types = [`
			`"application/x-javascript",`
			`"application/javascript",`
			`"text/javascript"`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`opts = jsbeautifier.default_options()`
			`opts.indent_size = 2`
			`res = jsbeautifier.beautify(content[:limit], opts)`
			`return "JavaScript", _view_text(res, len(content), limit)`


			`class ViewImage:`
			`name = "Image"`
			`prompt = ("image", "i")`
			`content_types = [`
			`"image/png",`
			`"image/jpeg",`
			`"image/gif",`
			`"image/vnd.microsoft.icon",`
			`"image/x-icon",`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`try:`
			`img = Image.open(cStringIO.StringIO(content))`
			`except IOError:`
			`return None`
			`parts = [`
			`("Format", str(img.format_description)),`
			`("Size", "%s x %s px"%img.size),`
			`("Mode", str(img.mode)),`
Re-enable simple multipart form parsing and preview. 2012-03-24 21:10:48 +00:00			`]`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`for i in sorted(img.info.keys()):`
			`if i != "exif":`
			`parts.append(`
			`(str(i), str(img.info[i]))`
			`)`
			`if hasattr(img, "_getexif"):`
			`ex = img._getexif()`
			`if ex:`
			`for i in sorted(ex.keys()):`
			`tag = TAGS.get(i, i)`
			`parts.append(`
			`(str(tag), str(ex[i]))`
			`)`
			`clean = []`
			`for i in parts:`
			`clean.append([utils.cleanBin(i[0]), utils.cleanBin(i[1])])`
			`fmt = common.format_keyvals(`
			`clean,`
			`key = "header",`
			`val = "text"`
			`)`
			`return "%s image"%img.format, fmt`


			`views = [`
			`ViewAuto(),`
			`ViewRaw(),`
			`ViewHex(),`
			`ViewJSON(),`
			`ViewXML(),`
			`ViewHTML(),`
			`ViewHTMLOutline(),`
			`ViewJavaScript(),`
			`ViewURLEncoded(),`
			`ViewMultipart(),`
			`ViewImage(),`
			`]`
Further content view cleaups. 2012-08-18 05:51:34 +00:00			`if pyamf:`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`views.append(ViewAMF())`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`content_types_map = {}`
			`for i in views:`
			`for ct in i.content_types:`
			`l = content_types_map.setdefault(ct, [])`
			`l.append(i)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`view_prompts = [i.prompt for i in views]`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def get_by_shortcut(c):`
			`for i in views:`
			`if i.prompt[1] == c:`
			`return i`


			`def get(name):`
			`for i in views:`
			`if i.name == name:`
			`return i`

Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Send tracebacks from content viewers to event log. Also, 100% test coverage for content viewers. 2012-08-18 05:42:40 +00:00			`def get_content_view(viewmode, hdrItems, content, limit, logfunc):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`"""`
			`Returns a (msg, body) tuple.`
			`"""`
Display "No Content" instead of a parse error when there is no content. 2012-08-30 00:51:04 +00:00			`if not content:`
			`return ("No content", "")`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`msg = []`

			`hdrs = flow.ODictCaseless([list(i) for i in hdrItems])`

Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`enc = hdrs.get_first("content-encoding")`
			`if enc and enc != "identity":`
			`decoded = encoding.decode(enc, content)`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`if decoded:`
			`content = decoded`
Use the new ODict get_first convenience function in a bunch of places. 2012-08-18 06:14:30 +00:00			`msg.append("[decoded %s]"%enc)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`try:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`ret = viewmode(hdrs, content, limit)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`# Third-party viewers can fail in unexpected ways...`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`except Exception, e:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`s = traceback.format_exc()`
Send tracebacks from content viewers to event log. Also, 100% test coverage for content viewers. 2012-08-18 05:42:40 +00:00			`s = "Content viewer failed: \n" + s`
			`logfunc(s)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`ret = None`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`if not ret:`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`ret = get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`msg.append("Couldn't parse: falling back to Raw")`
Make it clearer when we fall back to Raw. 2012-04-01 23:22:01 +00:00			`else:`
			`msg.append(ret[0])`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`return " ".join(msg), ret[1]`