mitmproxy/libmproxy/console/contentview.py

import re, cStringIO, traceback
import urwid
from PIL import Image
from PIL.ExifTags import TAGS
import lxml.html, lxml.etree
import common
from .. import utils, encoding, flow
from ..contrib import jsbeautifier, html2text

VIEW_CUTOFF = 1024*50


def _view_text(content, total, limit):
    """
        Generates a body for a chunk of text.
    """
    txt = []
    for i in utils.cleanBin(content).splitlines():
        txt.append(
            urwid.Text(("text", i), wrap="any")
        )
    trailer(total, txt, limit)
    return txt


def trailer(clen, txt, limit):
    rem = clen - limit
    if rem > 0:
        txt.append(urwid.Text(""))
        txt.append(
            urwid.Text(
                [
                    ("highlight", "... %s of data not shown. Press "%utils.pretty_size(rem)),
                    ("key", "f"),
                    ("highlight", " to load all data.")
                ]
            )
        )


class ViewAuto:
    name = "Auto"
    prompt = ("auto", "a")
    content_types = []
    def __call__(self, hdrs, content, limit):
        ctype = hdrs.get("content-type")
        if ctype:
            ctype = ctype[0]
        ct = utils.parse_content_type(ctype) if ctype else None
        if ct:
            ct = "%s/%s"%(ct[0], ct[1])
            if ct in content_types_map:
                return content_types_map[ct][0](hdrs, content, limit)
            elif utils.isXML(content):
                return get("XML")(hdrs, content, limit)
        return get("Raw")(hdrs, content, limit)


class ViewRaw:
    name = "Raw"
    prompt = ("raw", "r")
    content_types = []
    def __call__(self, hdrs, content, limit):
        txt = _view_text(content[:limit], len(content), limit)
        return "Raw", txt


class ViewHex:
    name = "Hex"
    prompt = ("hex", "e")
    content_types = []
    def __call__(self, hdrs, content, limit):
        txt = []
        for offset, hexa, s in utils.hexdump(content[:limit]):
            txt.append(urwid.Text([
                ("offset", offset),
                " ",
                ("text", hexa),
                "   ",
                ("text", s),
            ]))
        trailer(len(content), txt, limit)
        return "Hex", txt


class ViewXML:
    name = "XML"
    prompt = ("xml", "x")
    content_types = ["text/xml"]
    def __call__(self, hdrs, content, limit):
        parser = lxml.etree.XMLParser(remove_blank_text=True, resolve_entities=False, strip_cdata=False, recover=False)
        try:
            document = lxml.etree.fromstring(content, parser)
        except lxml.etree.XMLSyntaxError:
            return None
        docinfo = document.getroottree().docinfo

        prev = []
        p = document.getroottree().getroot().getprevious()
        while p is not None:
            prev.insert(
                0,
                lxml.etree.tostring(p)
            )
            p = p.getprevious()
        doctype=docinfo.doctype
        if prev:
            doctype += "\n".join(prev).strip()
        doctype = doctype.strip()

        s = lxml.etree.tostring(
                document,
                pretty_print=True,
                xml_declaration=True,
                doctype=doctype or None,
                encoding = docinfo.encoding
            )

        txt = []
        for i in s[:limit].strip().split("\n"):
            txt.append(
                urwid.Text(("text", i)),
            )
        trailer(len(content), txt, limit)
        return "XML-like data", txt


class ViewJSON:
    name = "JSON"
    prompt = ("json", "j")
    content_types = ["application/json"]
    def __call__(self, hdrs, content, limit):
        lines = utils.pretty_json(content)
        if lines:
            txt = []
            sofar = 0
            for i in lines:
                sofar += len(i)
                txt.append(
                    urwid.Text(("text", i)),
                )
                if sofar > limit:
                    break
            trailer(sum(len(i) for i in lines), txt, limit)
            return "JSON", txt


class ViewHTML:
    name = "HTML"
    prompt = ("html", "h")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        if utils.isXML(content):
            parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)
            d = lxml.html.fromstring(content, parser=parser)
            docinfo = d.getroottree().docinfo
            s = lxml.etree.tostring(d, pretty_print=True, doctype=docinfo.doctype)
            return "HTML", _view_text(s[:limit], len(s), limit)


class ViewHTMLOutline:
    name = "HTML Outline"
    prompt = ("html outline", "o")
    content_types = ["text/html"]
    def __call__(self, hdrs, content, limit):
        content = content.decode("utf-8")
        h = html2text.HTML2Text(baseurl="")
        h.ignore_images = True
        h.body_width = 0
        content = h.handle(content)
        txt = _view_text(content[:limit], len(content), limit)
        return "HTML Outline", txt


class ViewURLEncoded:
    name = "URL-encoded"
    prompt = ("urlencoded", "u")
    content_types = ["application/x-www-form-urlencoded"]
    def __call__(self, hdrs, content, limit):
        lines = utils.urldecode(content)
        if lines:
            body = common.format_keyvals(
                        [(k+":", v) for (k, v) in lines],
                        key = "header",
                        val = "text"
                   )
            return "URLEncoded form", body


class ViewMultipart:
    name = "Multipart Form"
    prompt = ("multipart", "m")
    content_types = ["multipart/form-data"]
    def __call__(self, hdrs, content, limit):
        v = hdrs.get("content-type")
        if v:
            v = utils.parse_content_type(v[0])
            if not v:
                return
            boundary = v[2].get("boundary")
            if not boundary:
                return

            rx = re.compile(r'\bname="([^"]+)"')
            keys = []
            vals = []

            for i in content.split("--" + boundary):
                parts = i.splitlines()
                if len(parts) > 1 and parts[0][0:2] != "--":
                    match = rx.search(parts[1])
                    if match:
                        keys.append(match.group(1) + ":")
                        vals.append(utils.cleanBin(
                            "\n".join(parts[3+parts[2:].index(""):])
                        ))
            r = [
                urwid.Text(("highlight", "Form data:\n")),
            ]
            r.extend(common.format_keyvals(
                zip(keys, vals),
                key = "header",
                val = "text"
            ))
            return "Multipart form", r


class ViewAMF:
    name = "AMF"
    prompt = ("amf", "f")
    content_types = ["application/x-amf"]
    def __call__(self, hdrs, content, limit):
        s = utils.pretty_amf(content)
        if s:
            return "AMF", _view_text(s[:limit], len(s), limit)


class ViewJavaScript:
    name = "JavaScript"
    prompt = ("javascript", "j")
    content_types = [
        "application/x-javascript",
        "application/javascript",
        "text/javascript"
    ]
    def __call__(self, hdrs, content, limit):
        opts = jsbeautifier.default_options()
        opts.indent_size = 2
        res = jsbeautifier.beautify(content[:limit], opts)
        return "JavaScript", _view_text(res, len(content), limit)


class ViewImage:
    name = "Image"
    prompt = ("image", "i")
    content_types = [
        "image/png",
        "image/jpeg",
        "image/gif",
        "image/vnd.microsoft.icon",
        "image/x-icon",
    ]
    def __call__(self, hdrs, content, limit):
        try:
            img = Image.open(cStringIO.StringIO(content))
        except IOError:
            return None
        parts = [
            ("Format", str(img.format_description)),
            ("Size", "%s x %s px"%img.size),
            ("Mode", str(img.mode)),
        ]
        for i in sorted(img.info.keys()):
            if i != "exif":
                parts.append(
                    (str(i), str(img.info[i]))
                )
        if hasattr(img, "_getexif"):
            ex = img._getexif()
            if ex:
                for i in sorted(ex.keys()):
                    tag = TAGS.get(i, i)
                    parts.append(
                        (str(tag), str(ex[i]))
                    )
        clean = []
        for i in parts:
            clean.append([utils.cleanBin(i[0]), utils.cleanBin(i[1])])
        fmt = common.format_keyvals(
                clean,
                key = "header",
                val = "text"
            )
        return "%s image"%img.format, fmt


views = [
    ViewAuto(),
    ViewRaw(),
    ViewHex(),
    ViewJSON(),
    ViewXML(),
    ViewHTML(),
    ViewHTMLOutline(),
    ViewJavaScript(),
    ViewURLEncoded(),
    ViewMultipart(),
    ViewImage(),
]
try:
    import pyamf
    views.append(ViewAMF())
except ImportError: # pragma nocover
    pass


content_types_map = {}
for i in views:
    for ct in i.content_types:
        l = content_types_map.setdefault(ct, [])
        l.append(i)


view_prompts = [i.prompt for i in views]


def get_by_shortcut(c):
    for i in views:
        if i.prompt[1] == c:
            return i


def get(name):
    for i in views:
        if i.name == name:
            return i


def get_content_view(viewmode, hdrItems, content, limit):
    """
        Returns a (msg, body) tuple.
    """
    msg = []

    hdrs = flow.ODictCaseless([list(i) for i in hdrItems])

    enc = hdrs.get("content-encoding")
    if enc and enc[0] != "identity":
        decoded = encoding.decode(enc[0], content)
        if decoded:
            content = decoded
            msg.append("[decoded %s]"%enc[0])
    try:
        ret = viewmode(hdrs, content, limit)
    # Third-party viewers can fail in unexpected ways...
    except Exception, e:
        s = traceback.format_exc()
        return "", _view_text(s, len(s), len(s))
        ret = None
    if not ret:
        ret = get("Raw")(hdrs, content, limit)
        msg.append("Couldn't parse: falling back to Raw")
    else:
        msg.append(ret[0])
    return " ".join(msg), ret[1]
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`import re, cStringIO, traceback`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import urwid`
Add a pretty-viewer for images. This shows basic image information like dimensions, plus extracted EXIF tags and other metadata. 2012-03-25 22:26:02 +00:00			`from PIL import Image`
			`from PIL.ExifTags import TAGS`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`import lxml.html, lxml.etree`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`import common`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`from .. import utils, encoding, flow`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`from ..contrib import jsbeautifier, html2text`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`VIEW_CUTOFF = 1024*50`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`def _view_text(content, total, limit):`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`"""`
			`Generates a body for a chunk of text.`
			`"""`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt = []`
Tune content viewing to maintain responsiveness: - Reduce display cutoff to 20k. - Make sure that we only indent the visible part of a JS body, not the whole thing. 2012-03-31 22:09:25 +00:00			`for i in utils.cleanBin(content).splitlines():`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Wrap on any character for body text display. 2012-04-08 03:00:38 +00:00			`urwid.Text(("text", i), wrap="any")`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`trailer(total, txt, limit)`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00			`return txt`


Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def trailer(clen, txt, limit):`
			`rem = clen - limit`
			`if rem > 0:`
			`txt.append(urwid.Text(""))`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`txt.append(`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`urwid.Text(`
			`[`
			`("highlight", "... %s of data not shown. Press "%utils.pretty_size(rem)),`
			`("key", "f"),`
			`("highlight", " to load all data.")`
			`]`
			`)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00			`)`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewAuto:`
			`name = "Auto"`
			`prompt = ("auto", "a")`
			`content_types = []`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`def __call__(self, hdrs, content, limit):`
			`ctype = hdrs.get("content-type")`
			`if ctype:`
			`ctype = ctype[0]`
			`ct = utils.parse_content_type(ctype) if ctype else None`
			`if ct:`
			`ct = "%s/%s"%(ct[0], ct[1])`
			`if ct in content_types_map:`
			`return content_types_map[ct][0](hdrs, content, limit)`
			`elif utils.isXML(content):`
			`return get("XML")(hdrs, content, limit)`
			`return get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewRaw:`
			`name = "Raw"`
			`prompt = ("raw", "r")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "Raw", txt`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`class ViewHex:`
			`name = "Hex"`
			`prompt = ("hex", "e")`
			`content_types = []`
			`def __call__(self, hdrs, content, limit):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt = []`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`for offset, hexa, s in utils.hexdump(content[:limit]):`
			`txt.append(urwid.Text([`
			`("offset", offset),`
			`" ",`
			`("text", hexa),`
			`" ",`
			`("text", s),`
			`]))`
			`trailer(len(content), txt, limit)`
			`return "Hex", txt`


			`class ViewXML:`
			`name = "XML"`
			`prompt = ("xml", "x")`
			`content_types = ["text/xml"]`
			`def __call__(self, hdrs, content, limit):`
			`parser = lxml.etree.XMLParser(remove_blank_text=True, resolve_entities=False, strip_cdata=False, recover=False)`
			`try:`
			`document = lxml.etree.fromstring(content, parser)`
			`except lxml.etree.XMLSyntaxError:`
			`return None`
			`docinfo = document.getroottree().docinfo`

			`prev = []`
			`p = document.getroottree().getroot().getprevious()`
			`while p is not None:`
			`prev.insert(`
			`0,`
			`lxml.etree.tostring(p)`
			`)`
			`p = p.getprevious()`
			`doctype=docinfo.doctype`
			`if prev:`
			`doctype += "\n".join(prev).strip()`
			`doctype = doctype.strip()`

			`s = lxml.etree.tostring(`
			`document,`
			`pretty_print=True,`
			`xml_declaration=True,`
			`doctype=doctype or None,`
			`encoding = docinfo.encoding`
			`)`

			`txt = []`
			`for i in s[:limit].strip().split("\n"):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`trailer(len(content), txt, limit)`
			`return "XML-like data", txt`


			`class ViewJSON:`
			`name = "JSON"`
			`prompt = ("json", "j")`
			`content_types = ["application/json"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.pretty_json(content)`
			`if lines:`
			`txt = []`
			`sofar = 0`
			`for i in lines:`
			`sofar += len(i)`
			`txt.append(`
			`urwid.Text(("text", i)),`
			`)`
			`if sofar > limit:`
			`break`
			`trailer(sum(len(i) for i in lines), txt, limit)`
			`return "JSON", txt`


			`class ViewHTML:`
			`name = "HTML"`
			`prompt = ("html", "h")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`if utils.isXML(content):`
			`parser = lxml.etree.HTMLParser(strip_cdata=True, remove_blank_text=True)`
			`d = lxml.html.fromstring(content, parser=parser)`
			`docinfo = d.getroottree().docinfo`
			`s = lxml.etree.tostring(d, pretty_print=True, doctype=docinfo.doctype)`
			`return "HTML", _view_text(s[:limit], len(s), limit)`


			`class ViewHTMLOutline:`
			`name = "HTML Outline"`
			`prompt = ("html outline", "o")`
			`content_types = ["text/html"]`
			`def __call__(self, hdrs, content, limit):`
			`content = content.decode("utf-8")`
			`h = html2text.HTML2Text(baseurl="")`
			`h.ignore_images = True`
			`h.body_width = 0`
			`content = h.handle(content)`
			`txt = _view_text(content[:limit], len(content), limit)`
			`return "HTML Outline", txt`


			`class ViewURLEncoded:`
			`name = "URL-encoded"`
			`prompt = ("urlencoded", "u")`
			`content_types = ["application/x-www-form-urlencoded"]`
			`def __call__(self, hdrs, content, limit):`
			`lines = utils.urldecode(content)`
			`if lines:`
			`body = common.format_keyvals(`
			`[(k+":", v) for (k, v) in lines],`
			`key = "header",`
			`val = "text"`
			`)`
			`return "URLEncoded form", body`


			`class ViewMultipart:`
			`name = "Multipart Form"`
			`prompt = ("multipart", "m")`
			`content_types = ["multipart/form-data"]`
			`def __call__(self, hdrs, content, limit):`
			`v = hdrs.get("content-type")`
			`if v:`
			`v = utils.parse_content_type(v[0])`
			`if not v:`
			`return`
			`boundary = v[2].get("boundary")`
			`if not boundary:`
			`return`

			`rx = re.compile(r'\bname="([^"]+)"')`
			`keys = []`
			`vals = []`

			`for i in content.split("--" + boundary):`
			`parts = i.splitlines()`
			`if len(parts) > 1 and parts[0][0:2] != "--":`
			`match = rx.search(parts[1])`
			`if match:`
			`keys.append(match.group(1) + ":")`
			`vals.append(utils.cleanBin(`
			`"\n".join(parts[3+parts[2:].index(""):])`
			`))`
			`r = [`
			`urwid.Text(("highlight", "Form data:\n")),`
			`]`
			`r.extend(common.format_keyvals(`
			`zip(keys, vals),`
			`key = "header",`
			`val = "text"`
			`))`
			`return "Multipart form", r`


			`class ViewAMF:`
			`name = "AMF"`
			`prompt = ("amf", "f")`
			`content_types = ["application/x-amf"]`
			`def __call__(self, hdrs, content, limit):`
			`s = utils.pretty_amf(content)`
			`if s:`
			`return "AMF", _view_text(s[:limit], len(s), limit)`


			`class ViewJavaScript:`
			`name = "JavaScript"`
			`prompt = ("javascript", "j")`
			`content_types = [`
			`"application/x-javascript",`
			`"application/javascript",`
			`"text/javascript"`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`opts = jsbeautifier.default_options()`
			`opts.indent_size = 2`
			`res = jsbeautifier.beautify(content[:limit], opts)`
			`return "JavaScript", _view_text(res, len(content), limit)`


			`class ViewImage:`
			`name = "Image"`
			`prompt = ("image", "i")`
			`content_types = [`
			`"image/png",`
			`"image/jpeg",`
			`"image/gif",`
			`"image/vnd.microsoft.icon",`
			`"image/x-icon",`
			`]`
			`def __call__(self, hdrs, content, limit):`
			`try:`
			`img = Image.open(cStringIO.StringIO(content))`
			`except IOError:`
			`return None`
			`parts = [`
			`("Format", str(img.format_description)),`
			`("Size", "%s x %s px"%img.size),`
			`("Mode", str(img.mode)),`
Re-enable simple multipart form parsing and preview. 2012-03-24 21:10:48 +00:00			`]`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`for i in sorted(img.info.keys()):`
			`if i != "exif":`
			`parts.append(`
			`(str(i), str(img.info[i]))`
			`)`
			`if hasattr(img, "_getexif"):`
			`ex = img._getexif()`
			`if ex:`
			`for i in sorted(ex.keys()):`
			`tag = TAGS.get(i, i)`
			`parts.append(`
			`(str(tag), str(ex[i]))`
			`)`
			`clean = []`
			`for i in parts:`
			`clean.append([utils.cleanBin(i[0]), utils.cleanBin(i[1])])`
			`fmt = common.format_keyvals(`
			`clean,`
			`key = "header",`
			`val = "text"`
			`)`
			`return "%s image"%img.format, fmt`


			`views = [`
			`ViewAuto(),`
			`ViewRaw(),`
			`ViewHex(),`
			`ViewJSON(),`
			`ViewXML(),`
			`ViewHTML(),`
			`ViewHTMLOutline(),`
			`ViewJavaScript(),`
			`ViewURLEncoded(),`
			`ViewMultipart(),`
			`ViewImage(),`
			`]`
			`try:`
			`import pyamf`
			`views.append(ViewAMF())`
			`except ImportError: # pragma nocover`
			`pass`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`content_types_map = {}`
			`for i in views:`
			`for ct in i.content_types:`
			`l = content_types_map.setdefault(ct, [])`
			`l.append(i)`
Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`view_prompts = [i.prompt for i in views]`
Pretty view now indents Javascript. Thanks to the JSBeautifier project, which is now included in the contrib directory. 2012-03-24 21:56:45 +00:00

Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`def get_by_shortcut(c):`
			`for i in views:`
			`if i.prompt[1] == c:`
			`return i`


			`def get(name):`
			`for i in views:`
			`if i.name == name:`
			`return i`

Factor out content view apparatus into contentview.py 2012-03-23 22:21:58 +00:00
Add an "f" shortcut key to load full body contents. 2012-04-08 07:23:05 +00:00			`def get_content_view(viewmode, hdrItems, content, limit):`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`"""`
			`Returns a (msg, body) tuple.`
			`"""`
			`msg = []`

			`hdrs = flow.ODictCaseless([list(i) for i in hdrItems])`

			`enc = hdrs.get("content-encoding")`
			`if enc and enc[0] != "identity":`
			`decoded = encoding.decode(enc[0], content)`
			`if decoded:`
			`content = decoded`
			`msg.append("[decoded %s]"%enc[0])`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`try:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`ret = viewmode(hdrs, content, limit)`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`# Third-party viewers can fail in unexpected ways...`
Add an HTML text outline view. Uses html2text, from here: https://github.com/aaronsw/html2text 2012-08-17 13:37:30 +00:00			`except Exception, e:`
Further simplifcation and testing of contentviews. 2012-08-18 05:29:29 +00:00			`s = traceback.format_exc()`
			`return "", _view_text(s, len(s), len(s))`
Protect against exceptions thrown by third-party view libraries. 2012-07-06 03:43:33 +00:00			`ret = None`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`if not ret:`
Huge cleanup of content viewers. 2012-08-18 05:08:17 +00:00			`ret = get("Raw")(hdrs, content, limit)`
Integrate lxml for pretty-printing HTML and XML. Tackling the pretty-printing performance problem head-on, at the cost of a major dependency. 2012-04-07 01:47:03 +00:00			`msg.append("Couldn't parse: falling back to Raw")`
Make it clearer when we fall back to Raw. 2012-04-01 23:22:01 +00:00			`else:`
			`msg.append(ret[0])`
Refactor pretty view mechanism. Also start adding unit tests for this subsystem. 2012-03-24 01:02:41 +00:00			`return " ".join(msg), ret[1]`