aboutsummaryrefslogtreecommitdiffstats
path: root/netlib/encoding.py
blob: e3cf5f3065cfacd3335b0ad61acd0d6ec242b524 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
"""
Utility functions for decoding response bodies.
"""
from __future__ import absolute_import

import codecs
from io import BytesIO
import gzip
import zlib

from typing import Union  # noqa


def decode(obj, encoding, errors='strict'):
    # type: (Union[str, bytes], str, str) -> Union[str, bytes]
    """
    Decode the given input object

    Encodings that have an entry in ``custom_decode`` are handled by that
    entry; every other encoding is passed on to ``codecs.decode``.

    Args:
        obj: The value to decode.
        encoding: A key of ``custom_decode`` or a codec name understood by
            ``codecs.decode``.
        errors: Error handling scheme handed to ``codecs.decode``. It is not
            passed to the custom handlers.

    Returns:
        The decoded value

    Raises:
        ValueError, if decoding fails.
    """
    try:
        try:
            # Guard only the table lookup: a KeyError raised *inside* a
            # handler must not be mistaken for "no custom handler" and
            # silently retried through the codecs registry.
            handler = custom_decode[encoding]
        except KeyError:
            return codecs.decode(obj, encoding, errors)
        return handler(obj)
    except Exception as e:
        # Collapse every failure into ValueError so callers have a single
        # exception type to catch; the original type name is kept in the
        # message and the input repr is truncated to keep it short.
        raise ValueError("{} when decoding {} with {}".format(
            type(e).__name__,
            repr(obj)[:10],
            repr(encoding),
        ))


def encode(obj, encoding, errors='strict'):
    # type: (Union[str, bytes], str, str) -> Union[str, bytes]
    """
    Encode the given input object

    Encodings that have an entry in ``custom_encode`` are handled by that
    entry; every other encoding is passed on to ``codecs.encode``.

    Args:
        obj: The value to encode.
        encoding: A key of ``custom_encode`` or a codec name understood by
            ``codecs.encode``.
        errors: Error handling scheme handed to ``codecs.encode``. It is not
            passed to the custom handlers.

    Returns:
        The encoded value

    Raises:
        ValueError, if encoding fails.
    """
    try:
        try:
            # Guard only the table lookup: a KeyError raised *inside* a
            # handler must not be mistaken for "no custom handler" and
            # silently retried through the codecs registry.
            handler = custom_encode[encoding]
        except KeyError:
            return codecs.encode(obj, encoding, errors)
        return handler(obj)
    except Exception as e:
        # Collapse every failure into ValueError so callers have a single
        # exception type to catch; the original type name is kept in the
        # message and the input repr is truncated to keep it short.
        raise ValueError("{} when encoding {} with {}".format(
            type(e).__name__,
            repr(obj)[:10],
            repr(encoding),
        ))


def identity(content):
    """
        No-op codec: hands back exactly the object it was given.

        "identity" is the default value of Accept-Encoding headers, i.e. the
        body is transferred without any transformation.
    """
    unchanged = content
    return unchanged


def decode_gzip(content):
    # type: (bytes) -> bytes
    """
        Returns the decompressed payload of a gzip stream.

        Args:
            content: The complete gzip-compressed data.

        Errors raised by the gzip module for malformed input are not caught
        here and propagate to the caller.
    """
    # The context manager closes the GzipFile deterministically, including
    # when read() fails part-way through on corrupt input.
    with gzip.GzipFile(fileobj=BytesIO(content)) as gfile:
        return gfile.read()


def encode_gzip(content):
    # type: (bytes) -> bytes
    """
        Returns content compressed as a complete gzip stream.

        Args:
            content: The raw data to compress.
    """
    buf = BytesIO()
    # Leaving the with-block closes the GzipFile, which flushes the remaining
    # compressed data and the gzip trailer into buf. It also guarantees the
    # close happens if write() raises. Closing a GzipFile does not close the
    # fileobj it was given, so buf stays readable afterwards.
    with gzip.GzipFile(fileobj=buf, mode='wb') as gf:
        gf.write(content)
    return buf.getvalue()


def decode_deflate(content):
    """
        Inflates DEFLATE-compressed content and returns the result.

        The data is first treated as a regular zlib stream (header plus
        checksum). Some servers send the compressed data without either, so
        on failure the content is decompressed a second time in zlib's
        lenient, undocumented raw mode.

        http://bugs.python.org/issue5784
    """
    try:
        inflated = zlib.decompress(content)
    except zlib.error:
        # A negative window size makes zlib skip the header and checksum.
        inflated = zlib.decompress(content, -15)
    return inflated


def encode_deflate(content):
    """
        Compresses content with zlib and returns the result. The output
        always carries the zlib header and checksum.
    """
    deflated = zlib.compress(content)
    return deflated


# Dispatch tables consulted by decode() and encode() before they fall back to
# the codecs module. Each maps an encoding name to a one-argument callable.
custom_decode = dict(
    identity=identity,
    gzip=decode_gzip,
    deflate=decode_deflate,
)
custom_encode = dict(
    identity=identity,
    gzip=encode_gzip,
    deflate=encode_deflate,
)

# Names exported by a star-import of this module.
__all__ = ["encode", "decode"]