Implementing caching of chunked/streamed responses #106

Closed · wants to merge 4 commits
1 change: 1 addition & 0 deletions .travis.yml
@@ -1,4 +1,5 @@
language: python
sudo: false

env:
- TOXENV=py26
9 changes: 9 additions & 0 deletions cachecontrol/adapter.py
@@ -1,3 +1,4 @@
import types
import functools

from requests.adapters import HTTPAdapter
@@ -97,6 +98,14 @@ def build_response(self, request, response, from_cache=False):
                        response,
                    )
                )
                if response.chunked:
                    super_update_chunk_length = response._update_chunk_length

                    def _update_chunk_length(self):
                        super_update_chunk_length()
                        if self.chunk_left == 0:
                            self._fp._close()
                    response._update_chunk_length = types.MethodType(_update_chunk_length, response)

        resp = super(CacheControlAdapter, self).build_response(
            request, response
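For readers unfamiliar with the pattern above: the patch swaps in a wrapper for `_update_chunk_length` on one specific response object via `types.MethodType`, so the final chunk (where `chunk_left == 0`) can trigger the cache callback through `self._fp._close()`. A minimal, self-contained sketch of that instance-level override, using a made-up `FakeResponse` class in place of urllib3's `HTTPResponse`:

```python
import types


class FakeResponse(object):
    """Toy stand-in for urllib3's HTTPResponse, for illustration only."""

    def __init__(self, chunk_sizes):
        self._chunks = list(chunk_sizes)
        self.chunk_left = None

    def _update_chunk_length(self):
        # Pretend to parse the next chunk-size line; 0 means "last chunk".
        self.chunk_left = self._chunks.pop(0) if self._chunks else 0


def watch_for_last_chunk(response, on_last_chunk):
    # Keep a reference to the original bound method ...
    super_update_chunk_length = response._update_chunk_length

    def _update_chunk_length(self):
        super_update_chunk_length()
        if self.chunk_left == 0:
            on_last_chunk()

    # ... and rebind the wrapper onto this one instance only; other
    # responses keep the stock chunk handling.
    response._update_chunk_length = types.MethodType(_update_chunk_length, response)


if __name__ == "__main__":
    resp = FakeResponse([5, 3, 0])
    watch_for_last_chunk(resp, lambda: print("last chunk seen"))
    for _ in range(3):
        resp._update_chunk_length()  # prints once, on the final call
```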
33 changes: 24 additions & 9 deletions cachecontrol/filewrapper.py
@@ -45,19 +45,34 @@ def __is_fp_closed(self):
        # TODO: Add some logging here...
        return False

    def _close(self):
        if self.__callback:
            self.__callback(self.__buf.getvalue())

        # We assign this to None here, because otherwise we can get into
        # really tricky problems where the CPython interpreter dead locks
        # because the callback is holding a reference to something which
        # has a __del__ method. Setting this to None breaks the cycle
        # and allows the garbage collector to do its thing normally.
        self.__callback = None

    def read(self, amt=None):
        data = self.__fp.read(amt)
        self.__buf.write(data)
        if self.__is_fp_closed():
            self._close()

        return data

    def _safe_read(self, amt):
        data = self.__fp._safe_read(amt)
        if amt == 2 and data == b'\r\n':
            # urllib executes this read to toss the CRLF at the end
            # of the chunk.
            return data

        self.__buf.write(data)
        if self.__is_fp_closed():
            if self.__callback:
                self.__callback(self.__buf.getvalue())

            # We assign this to None here, because otherwise we can get into
            # really tricky problems where the CPython interpreter dead locks
            # because the callback is holding a reference to something which
            # has a __del__ method. Setting this to None breaks the cycle
            # and allows the garbage collector to do its thing normally.
            self.__callback = None
            self._close()

        return data
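To make the new `_close()` / `_safe_read()` split easier to follow, here is a rough standalone sketch of a wrapper in the same spirit. It is not CacheControl's actual `CallbackFileWrapper`; the `RecordingWrapper` class, its attribute names, and the end-of-stream check are simplified stand-ins:

```python
import io


class RecordingWrapper(object):
    """Buffers everything read from a file-like object and fires a
    callback with the complete body exactly once, when the stream ends."""

    def __init__(self, fp, callback):
        self._fp = fp
        self._buf = io.BytesIO()
        self._callback = callback
        self._saw_eof = False

    def _is_fp_closed(self):
        # The real wrapper has to poke at urllib3/httplib internals here;
        # for this sketch an empty read is treated as end-of-stream.
        return self._saw_eof

    def _close(self):
        if self._callback:
            self._callback(self._buf.getvalue())
        # Drop the reference so the callback cannot fire twice and any
        # objects it holds onto can be garbage collected.
        self._callback = None

    def read(self, amt=None):
        data = self._fp.read(amt)
        if not data:
            self._saw_eof = True
        self._buf.write(data)
        if self._is_fp_closed():
            self._close()
        return data

    def _safe_read(self, amt):
        # httplib calls _safe_read(2) to discard the CRLF that terminates
        # each chunk; that framing must not end up in the cached body.
        data = self._fp.read(amt)
        if amt == 2 and data == b'\r\n':
            return data
        self._buf.write(data)
        return data


if __name__ == "__main__":
    captured = []
    wrapper = RecordingWrapper(io.BytesIO(b'hello world'), captured.append)
    while wrapper.read(4):
        pass
    assert captured == [b'hello world']
```

The key points mirrored from the diff: the callback fires exactly once, the reference to it is dropped afterwards to break reference cycles, and the per-chunk CRLF read via `_safe_read(2)` is kept out of the buffered body.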
6 changes: 6 additions & 0 deletions cachecontrol/serialize.py
@@ -134,6 +134,12 @@ def prepare_response(self, request, cached):

        body_raw = cached["response"].pop("body")

        headers = CaseInsensitiveDict(data=cached['response']['headers'])
        if headers.get('transfer-encoding', '') == 'chunked':
            headers.pop('transfer-encoding')

        cached['response']['headers'] = headers

Contributor:

Is there a good reason for this? It seems like it doesn't hurt to know the original response was chunked.

Contributor (Author):

I don't really remember this PR. I think that when the initial response is transferred with chunks, one of the first steps is to strip off the chunk markers, so the data that actually enters the cache lacks them. When it's read back out of the cache, it no longer looks like a chunked response.

Contributor:

Ah ok, that is what I suspected. Thanks!

I've finally gotten around to getting this merged with some changes. Thanks for your patience!

        try:
            body = io.BytesIO(body_raw)
        except TypeError:
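As the exchange above explains, the chunk markers are stripped before the body is cached, so a replayed response must not advertise `Transfer-Encoding: chunked` anymore. A small illustrative sketch of that header adjustment, using `CaseInsensitiveDict` from `requests.structures` with made-up header values:

```python
from requests.structures import CaseInsensitiveDict

# Headers as they might have been stored alongside the cached body.
cached_headers = {
    'Transfer-Encoding': 'chunked',
    'Cache-Control': 'max-age=5000',
    'Content-Type': 'text/plain',
}

headers = CaseInsensitiveDict(data=cached_headers)
if headers.get('transfer-encoding', '') == 'chunked':
    # The cached body is a plain byte string with the chunk markers
    # already removed, so the framing header no longer applies.
    headers.pop('transfer-encoding')

assert 'transfer-encoding' not in headers
print(dict(headers))
```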
8 changes: 8 additions & 0 deletions tests/conftest.py
@@ -89,6 +89,14 @@ def multiple_choices(self, env, start_response):
        start_response('300 Multiple Choices', headers)
        return ['See: /permalink'.encode('utf-8')]

    def stream(self, env, start_response):
        headers = [
            ('Cache-Control', 'max-age=5000'),
            ('Content-Type', 'text/plain'),
        ]
        start_response('200 OK', headers)
        return (pformat(env).encode("utf8") for i in range(10))

    def __call__(self, env, start_response):
        func = self.dispatch(env)

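The `stream` fixture above returns a generator and sets no `Content-Length`, which is what pushes a server that supports it to send the body with chunked transfer encoding. A hedged, standalone version of that handler (assuming the fixture's `pformat` comes from the standard `pprint` module, and driving it with a fake `start_response` purely for illustration):

```python
from pprint import pformat


def stream(env, start_response):
    # No Content-Length header: a server that supports it will send
    # this body with Transfer-Encoding: chunked.
    headers = [
        ('Cache-Control', 'max-age=5000'),
        ('Content-Type', 'text/plain'),
    ]
    start_response('200 OK', headers)
    return (pformat(env).encode("utf8") for _ in range(10))


if __name__ == "__main__":
    sent = {}

    def fake_start_response(status, headers):
        sent["status"], sent["headers"] = status, headers

    body = list(stream({"PATH_INFO": "/stream"}, fake_start_response))
    assert sent["status"] == "200 OK"
    assert len(body) == 10
    assert not any(name.lower() == "content-length" for name, _ in sent["headers"])
    print("%d body parts, headers: %r" % (len(body), sent["headers"]))
```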
28 changes: 28 additions & 0 deletions tests/test_stream.py
@@ -0,0 +1,28 @@
"""
Test for supporting streamed responses (Transfer-Encoding: chunked)
"""
import requests

from cachecontrol import CacheControl


class TestStream(object):
    def test_stream_is_cached(self, url):
        sess = CacheControl(requests.Session())

        resp_1 = sess.get(url + 'stream')
        content_1 = resp_1.content

        resp_2 = sess.get(url + 'stream')
        content_2 = resp_2.content

        assert not resp_1.from_cache
        assert resp_2.from_cache
        assert content_1 == content_2

    def test_stream_is_not_cached_when_content_is_not_read(self, url):
        sess = CacheControl(requests.Session())
        sess.get(url + 'stream', stream=True)
        resp = sess.get(url + 'stream', stream=True)

        assert not resp.from_cache
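A usage sketch of the behaviour these tests pin down; the endpoint URL is a placeholder for any server that answers with `Transfer-Encoding: chunked`:

```python
import requests

from cachecontrol import CacheControl

# Placeholder URL: any endpoint that responds with chunked transfer
# encoding will do.
url = "http://localhost:8080/stream"

sess = CacheControl(requests.Session())

# With stream=True the body is only pulled (and therefore only handed
# to the cache) once it is actually consumed.
resp = sess.get(url, stream=True)
_ = resp.content  # consume the stream so the cache callback can fire

resp = sess.get(url)
print(resp.from_cache)  # True once the first body was read in full
```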