summaryrefslogtreecommitdiff
path: root/test/with_dummyserver/test_chunked_transfer.py
blob: b176e63c993499777ed39b7d33f129d4e3aca72b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
# -*- coding: utf-8 -*-

from urllib3 import HTTPConnectionPool
from dummyserver.testcase import SocketDummyServerTestCase


class TestChunkedTransfer(SocketDummyServerTestCase):
    def start_chunked_handler(self):
        self.buffer = b""

        def socket_handler(listener):
            sock = listener.accept()[0]

            while not self.buffer.endswith(b"\r\n0\r\n\r\n"):
                self.buffer += sock.recv(65536)

            sock.send(
                b"HTTP/1.1 200 OK\r\n"
                b"Content-type: text/plain\r\n"
                b"Content-Length: 0\r\n"
                b"\r\n"
            )
            sock.close()

        self._start_server(socket_handler)

    def test_chunks(self):
        self.start_chunked_handler()
        chunks = ["foo", "bar", "", "bazzzzzzzzzzzzzzzzzzzzzz"]
        pool = HTTPConnectionPool(self.host, self.port, retries=False)
        pool.urlopen("GET", "/", chunks, headers=dict(DNT="1"), chunked=True)
        self.addCleanup(pool.close)

        self.assertIn(b"Transfer-Encoding", self.buffer)
        body = self.buffer.split(b"\r\n\r\n", 1)[1]
        lines = body.split(b"\r\n")
        # Empty chunks should have been skipped, as this could not be distinguished
        # from terminating the transmission
        for i, chunk in enumerate([c for c in chunks if c]):
            self.assertEqual(lines[i * 2], hex(len(chunk))[2:].encode("utf-8"))
            self.assertEqual(lines[i * 2 + 1], chunk.encode("utf-8"))

    def _test_body(self, data):
        self.start_chunked_handler()
        pool = HTTPConnectionPool(self.host, self.port, retries=False)
        self.addCleanup(pool.close)

        pool.urlopen("GET", "/", data, chunked=True)
        header, body = self.buffer.split(b"\r\n\r\n", 1)

        self.assertIn(b"Transfer-Encoding: chunked", header.split(b"\r\n"))
        if data:
            bdata = data if isinstance(data, bytes) else data.encode("utf-8")
            self.assertIn(b"\r\n" + bdata + b"\r\n", body)
            self.assertTrue(body.endswith(b"\r\n0\r\n\r\n"))

            len_str = body.split(b"\r\n", 1)[0]
            stated_len = int(len_str, 16)
            self.assertEqual(stated_len, len(bdata))
        else:
            self.assertEqual(body, b"0\r\n\r\n")

    def test_bytestring_body(self):
        self._test_body(b"thisshouldbeonechunk\r\nasdf")

    def test_unicode_body(self):
        # Define u'thisshouldbeonechunk\r\näöüß' in a way, so that python3.1
        # does not suffer a syntax error
        chunk = b"thisshouldbeonechunk\r\n\xc3\xa4\xc3\xb6\xc3\xbc\xc3\x9f".decode(
            "utf-8"
        )
        self._test_body(chunk)

    def test_empty_body(self):
        self._test_body(None)

    def test_empty_string_body(self):
        self._test_body("")

    def test_empty_iterable_body(self):
        self._test_body([])

    def test_removes_duplicate_host_header(self):
        self.start_chunked_handler()
        chunks = ["foo", "bar", "", "bazzzzzzzzzzzzzzzzzzzzzz"]
        pool = HTTPConnectionPool(self.host, self.port, retries=False)
        self.addCleanup(pool.close)
        pool.urlopen("GET", "/", chunks, headers={"Host": "test.org"}, chunked=True)

        header_block = self.buffer.split(b"\r\n\r\n", 1)[0].lower()
        header_lines = header_block.split(b"\r\n")[1:]

        host_headers = [x for x in header_lines if x.startswith(b"host")]
        self.assertEqual(len(host_headers), 1)

    def test_provides_default_host_header(self):
        self.start_chunked_handler()
        chunks = ["foo", "bar", "", "bazzzzzzzzzzzzzzzzzzzzzz"]
        pool = HTTPConnectionPool(self.host, self.port, retries=False)
        self.addCleanup(pool.close)
        pool.urlopen("GET", "/", chunks, chunked=True)

        header_block = self.buffer.split(b"\r\n\r\n", 1)[0].lower()
        header_lines = header_block.split(b"\r\n")[1:]

        host_headers = [x for x in header_lines if x.startswith(b"host")]
        self.assertEqual(len(host_headers), 1)