Fixing chunk deserializing

2015-11-11 10:31:05 +01:00 · 2015-11-11 10:31:05 +01:00 · c8ae1b84dc
parent 1c384949ae
commit c8ae1b84dc
1 changed files with 11 additions and 10 deletions
--- a/taiga/export_import/serializers.py
+++ b/taiga/export_import/serializers.py
@ -67,17 +67,18 @@ class AttachedFileField(serializers.WritableField):
        if not data:
            return None

-        # Each sequence of 3 octets is represented by 4 characters in base64.
-        # The file was encoded in chunks of 8190 (multiple of three) so the proper way of decoding it is:
-        # - split the encoded data in multiple of four chars blocks
-        # - decode each block
        decoded_data = b''
-        pending_data = data['data']
-        chunk_size = 8192
-        while pending_data:
-            decoding_data = pending_data[0:chunk_size]
-            decoded_data += base64.b64decode(decoding_data)
-            pending_data = pending_data[chunk_size:]
+        # The original file was encoded by chunks but we don't really know its
+        # length or if it was multiple of 3 so we must iterate over all those chunks
+        # decoding them one by one
+        for decoding_chunk in data['data'].split("="):
+            # When encoding to base64 3 bytes are transformed into 4 bytes and
+            # the extra space of the block is filled with =
+            # We must ensure that the decoding chunk has a length multiple of 4 so
+            # we restore the stripped '='s adding appending them until the chunk has
+            # a length multiple of 4
+            decoding_chunk += "=" * (-len(decoding_chunk) % 4)
+            decoded_data += base64.b64decode(decoding_chunk+"=")

        return ContentFile(decoded_data, name=data['name'])