Merge pull request #521 from taigaio/fixing-chunk-deserializing

Fixing chunk deserializing
David Barragán Merino 2015-11-11 16:00:36 +01:00
commit e518e25e6a
1 changed file with 11 additions and 10 deletions


@@ -67,17 +67,18 @@ class AttachedFileField(serializers.WritableField):
         if not data:
             return None
 
-        # Each sequence of 3 octets is represented by 4 characters in base64.
-        # The file was encoded in chunks of 8190 (multiple of three) so the proper way of decoding it is:
-        #   - split the encoded data in multiple of four chars blocks
-        #   - decode each block
         decoded_data = b''
-        pending_data = data['data']
-        chunk_size = 8192
-        while pending_data:
-            decoding_data = pending_data[0:chunk_size]
-            decoded_data += base64.b64decode(decoding_data)
-            pending_data = pending_data[chunk_size:]
+        # The original file was encoded by chunks, but we don't really know its
+        # length or whether it was a multiple of 3, so we must iterate over all
+        # those chunks, decoding them one by one
+        for decoding_chunk in data['data'].split("="):
+            # When encoding to base64, 3 bytes are transformed into 4 bytes and
+            # the extra space of the block is filled with '='.
+            # We must ensure that the decoding chunk has a length multiple of 4,
+            # so we restore the stripped '='s, appending them until the chunk
+            # has a length multiple of 4.
+            decoding_chunk += "=" * (-len(decoding_chunk) % 4)
+            decoded_data += base64.b64decode(decoding_chunk+"=")
 
         return ContentFile(decoded_data, name=data['name'])
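
For context, the previous decoder assumed the file had been encoded in chunks whose size was a multiple of 3, so no '=' padding would appear until the very end of the string; the new code also handles encoders that pad every block. Below is a rough, standalone sketch of that decoding strategy, not taken from the Taiga codebase: the names encode_in_chunks and decode_chunked_base64 are hypothetical, and the single-pass comparison at the end reflects CPython's usual non-strict decoder behavior.

    import base64

    def encode_in_chunks(raw: bytes, chunk_size: int) -> str:
        # Hypothetical client-side encoder: base64-encode the file chunk by
        # chunk and concatenate the results. When chunk_size is not a multiple
        # of 3, every block ends with '=' padding, so padding appears in the
        # middle of the concatenated string.
        return "".join(
            base64.b64encode(raw[i:i + chunk_size]).decode("ascii")
            for i in range(0, len(raw), chunk_size)
        )

    def decode_chunked_base64(data: str) -> bytes:
        # Splitting on '=' separates the blocks at their padding boundaries;
        # each non-empty piece is re-padded to a length multiple of 4 and
        # decoded independently, mirroring the approach of the patch above.
        decoded = b""
        for piece in data.split("="):
            if not piece:
                continue  # consecutive '=' signs yield empty pieces
            piece += "=" * (-len(piece) % 4)
            decoded += base64.b64decode(piece)
        return decoded

    if __name__ == "__main__":
        original = b"attachment payload " * 1000
        encoded = encode_in_chunks(original, 5)  # 5 is not a multiple of 3
        assert decode_chunked_base64(encoded) == original
        # A single-pass decode is lossy here: the default (non-strict) decoder
        # typically stops at the first complete '=' padding sequence.
        print(len(original), "bytes originally,",
              len(base64.b64decode(encoded)), "bytes from a single-pass decode")

In this sketch, decoding piece by piece recovers the full payload, while decoding the whole concatenated string at once silently truncates it at the first inner padding, which is the failure mode the patch guards against.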