diff options
author | Maximilian Hils <git@maximilianhils.com> | 2016-05-12 11:03:57 -0600 |
---|---|---|
committer | Maximilian Hils <git@maximilianhils.com> | 2016-05-12 11:03:57 -0600 |
commit | f1c922c652ec90f63cafed7f6b68d17f5229b58d (patch) | |
tree | 1091dc76bb1201dd334612a1d5bfa33f2918ad27 /netlib | |
parent | 518cc78454f9656be37e3153e2b508e56aa7ebf7 (diff) | |
download | mitmproxy-f1c922c652ec90f63cafed7f6b68d17f5229b58d.tar.gz mitmproxy-f1c922c652ec90f63cafed7f6b68d17f5229b58d.tar.bz2 mitmproxy-f1c922c652ec90f63cafed7f6b68d17f5229b58d.zip |
Sanitize Print (#1135)
* sanitize strings with shell control characters
* netlib: add utilities to safe-print bytes
* escaped str: add TODO for multi-byte chars
Diffstat (limited to 'netlib')
-rw-r--r-- | netlib/utils.py | 28 |
1 files changed, 28 insertions, 0 deletions
diff --git a/netlib/utils.py b/netlib/utils.py index ebd192f3..be2701a0 100644 --- a/netlib/utils.py +++ b/netlib/utils.py @@ -431,3 +431,31 @@ def safe_subn(pattern, repl, target, *args, **kwargs): need a better solution that is aware of the actual content ecoding. """ return re.subn(str(pattern), str(repl), target, *args, **kwargs) + + +def bytes_to_escaped_str(data): + """ + Take bytes and return a safe string that can be displayed to the user. + """ + # TODO: We may want to support multi-byte characters without escaping them. + # One way to do would be calling .decode("utf8", "backslashreplace") first + # and then escaping UTF8 control chars (see clean_bin). + + if not isinstance(data, bytes): + raise ValueError("data must be bytes") + return repr(data).lstrip("b")[1:-1] + + +def escaped_str_to_bytes(data): + """ + Take an escaped string and return the unescaped bytes equivalent. + """ + if not isinstance(data, str): + raise ValueError("data must be str") + + if six.PY2: + return data.decode("string-escape") + + # This one is difficult - we use an undocumented Python API here + # as per http://stackoverflow.com/a/23151714/934719 + return codecs.escape_decode(data)[0] |