Shift a bunch more string-related functions to strutils

2025-01-30 14:58:38 +00:00 · 2016-06-02 13:03:37 +12:00 · 2016-06-02 13:03:37 +12:00 · 09da1febbd
commit 09da1febbd
parent 31012d782f
9 changed files with 82 additions and 87 deletions
--- a/examples/custom_contentviews.py
+++ b/examples/custom_contentviews.py
@ -1,7 +1,8 @@
 import string
 import lxml.html
 import lxml.etree
-from mitmproxy import utils, contentviews
+from mitmproxy import contentviews
+from netlib import strutils


 class ViewPigLatin(contentviews.View):
@ -10,7 +11,7 @@ class ViewPigLatin(contentviews.View):
    content_types = ["text/html"]

    def __call__(self, data, **metadata):
-        if utils.isXML(data):
+        if strutils.isXML(data):
            parser = lxml.etree.HTMLParser(
                strip_cdata=True,
                remove_blank_text=True
--- a/mitmproxy/contentviews.py
+++ b/mitmproxy/contentviews.py
@ -37,7 +37,6 @@ from netlib import http
 from netlib import odict
 from netlib.http import url
 from netlib import strutils
-import netlib.utils

 try:
    import pyamf
@ -130,11 +129,11 @@ class ViewAuto(View):
            ct = "%s/%s" % (ct[0], ct[1])
            if ct in content_types_map:
                return content_types_map[ct][0](data, **metadata)
-            elif mitmproxy.utils.isXML(data):
+            elif strutils.isXML(data):
                return get("XML")(data, **metadata)
        if metadata.get("query"):
            return get("Query")(data, **metadata)
-        if data and mitmproxy.utils.isMostlyBin(data):
+        if data and strutils.isMostlyBin(data):
            return get("Hex")(data)
        if not data:
            return "No content", []
@ -157,7 +156,7 @@ class ViewHex(View):

    @staticmethod
    def _format(data):
-        for offset, hexa, s in netlib.utils.hexdump(data):
+        for offset, hexa, s in strutils.hexdump(data):
            yield [
                ("offset", offset + " "),
                ("text", hexa + "   "),
@ -227,7 +226,7 @@ class ViewHTML(View):
    content_types = ["text/html"]

    def __call__(self, data, **metadata):
-        if mitmproxy.utils.isXML(data):
+        if strutils.isXML(data):
            parser = lxml.etree.HTMLParser(
                strip_cdata=True,
                remove_blank_text=True
--- a/mitmproxy/utils.py
+++ b/mitmproxy/utils.py
@ -25,32 +25,6 @@ def format_timestamp_with_milli(s):
    return d.strftime("%Y-%m-%d %H:%M:%S.%f")[:-3]


-def isBin(s):
-    """
-        Does this string have any non-ASCII characters?
-    """
-    for i in s:
-        i = ord(i)
-        if i < 9 or 13 < i < 32 or 126 < i:
-            return True
-    return False
-
-
-def isMostlyBin(s):
-    s = s[:100]
-    return sum(isBin(ch) for ch in s) / len(s) > 0.3
-
-
-def isXML(s):
-    for i in s:
-        if i in "\n \t":
-            continue
-        elif i == "<":
-            return True
-        else:
-            return False
-
-
 def pretty_json(s):
    try:
        p = json.loads(s)
@ -92,15 +66,3 @@ class LRUCache:
                d = self.cacheList.pop()
                self.cache.pop(d)
            return ret
-
-
-def clean_hanging_newline(t):
-    """
-        Many editors will silently add a newline to the final line of a
-        document (I'm looking at you, Vim). This function fixes this common
-        problem at the risk of removing a hanging newline in the rare cases
-        where the user actually intends it.
-    """
-    if t and t[-1] == "\n":
-        return t[:-1]
-    return t
--- a/netlib/strutils.py
+++ b/netlib/strutils.py
@ -101,3 +101,54 @@ def escaped_str_to_bytes(data):
    # This one is difficult - we use an undocumented Python API here
    # as per http://stackoverflow.com/a/23151714/934719
    return codecs.escape_decode(data)[0]
+
+
+def isBin(s):
+    """
+        Does this string have any non-ASCII characters?
+    """
+    for i in s:
+        i = ord(i)
+        if i < 9 or 13 < i < 32 or 126 < i:
+            return True
+    return False
+
+
+def isMostlyBin(s):
+    s = s[:100]
+    return sum(isBin(ch) for ch in s) / len(s) > 0.3
+
+
+def isXML(s):
+    for i in s:
+        if i in "\n \t":
+            continue
+        elif i == "<":
+            return True
+        else:
+            return False
+
+
+def clean_hanging_newline(t):
+    """
+        Many editors will silently add a newline to the final line of a
+        document (I'm looking at you, Vim). This function fixes this common
+        problem at the risk of removing a hanging newline in the rare cases
+        where the user actually intends it.
+    """
+    if t and t[-1] == "\n":
+        return t[:-1]
+    return t
+
+
+def hexdump(s):
+    """
+        Returns:
+            A generator of (offset, hex, str) tuples
+    """
+    for i in range(0, len(s), 16):
+        offset = "{:0=10x}".format(i).encode()
+        part = s[i:i + 16]
+        x = b" ".join("{:0=2x}".format(i).encode() for i in six.iterbytes(part))
+        x = x.ljust(47)  # 16*2 + 15
+        yield (offset, x, clean_bin(part, False))
--- a/netlib/utils.py
+++ b/netlib/utils.py
@ -6,21 +6,6 @@ import inspect

 import six

-from netlib import strutils
-
-
-def hexdump(s):
-    """
-        Returns:
-            A generator of (offset, hex, str) tuples
-    """
-    for i in range(0, len(s), 16):
-        offset = "{:0=10x}".format(i).encode()
-        part = s[i:i + 16]
-        x = b" ".join("{:0=2x}".format(i).encode() for i in six.iterbytes(part))
-        x = x.ljust(47)  # 16*2 + 15
-        yield (offset, x, strutils.clean_bin(part, False))
-

 def setbit(byte, offset, value):
    """
--- a/pathod/log.py
+++ b/pathod/log.py
@ -2,9 +2,6 @@ import datetime

 import six

-import netlib.utils
-import netlib.tcp
-import netlib.http
 from netlib import strutils

 TIMEFMT = '%d-%m-%y %H:%M:%S'
@ -63,7 +60,7 @@ class LogCtx(object):

    def dump(self, data, hexdump):
        if hexdump:
-            for line in netlib.utils.hexdump(data):
+            for line in strutils.hexdump(data):
                self("\t%s %s %s" % line)
        else:
            for i in strutils.clean_bin(data).split("\n"):
--- a/test/mitmproxy/test_utils.py
+++ b/test/mitmproxy/test_utils.py
@ -13,25 +13,6 @@ def test_format_timestamp_with_milli():
    assert utils.format_timestamp_with_milli(utils.timestamp())


-def test_isBin():
-    assert not utils.isBin("testing\n\r")
-    assert utils.isBin("testing\x01")
-    assert utils.isBin("testing\x0e")
-    assert utils.isBin("testing\x7f")
-
-
-def test_isXml():
-    assert not utils.isXML("foo")
-    assert utils.isXML("<foo")
-    assert utils.isXML("  \n<foo")
-
-
-def test_clean_hanging_newline():
-    s = "foo\n"
-    assert utils.clean_hanging_newline(s) == "foo"
-    assert utils.clean_hanging_newline("foo") == "foo"
-
-
 def test_pkg_data():
    assert utils.pkg_data.path("console")
    tutils.raises("does not exist", utils.pkg_data.path, "nonexistent")
--- a/test/netlib/test_strutils.py
+++ b/test/netlib/test_strutils.py
@ -38,3 +38,26 @@ def test_escaped_str_to_bytes():
    assert strutils.escaped_str_to_bytes(u"\\x08") == b"\b"
    assert strutils.escaped_str_to_bytes(u"&!?=\\\\)") == br"&!?=\)"
    assert strutils.escaped_str_to_bytes(u"ü") == b'\xc3\xbc'
+
+
+def test_isBin():
+    assert not strutils.isBin("testing\n\r")
+    assert strutils.isBin("testing\x01")
+    assert strutils.isBin("testing\x0e")
+    assert strutils.isBin("testing\x7f")
+
+
+def test_isXml():
+    assert not strutils.isXML("foo")
+    assert strutils.isXML("<foo")
+    assert strutils.isXML("  \n<foo")
+
+
+def test_clean_hanging_newline():
+    s = "foo\n"
+    assert strutils.clean_hanging_newline(s) == "foo"
+    assert strutils.clean_hanging_newline("foo") == "foo"
+
+
+def test_hexdump():
+    assert list(strutils.hexdump(b"one\0" * 10))
--- a/test/netlib/test_utils.py
+++ b/test/netlib/test_utils.py
@ -10,7 +10,3 @@ def test_bidi():
    assert b.get_name(5) is None
    tutils.raises(AttributeError, getattr, b, "c")
    tutils.raises(ValueError, utils.BiDi, one=1, two=1)
-
-
-def test_hexdump():
-    assert list(utils.hexdump(b"one\0" * 10))