Merge pull request #2920 from coreos-inc/joseph.schorr/QS-69/swift-chunk-test

Additional testing and a fix for Swift segmenting
commit a918339c90
josephschorr, 2017-11-28 18:14:23 +02:00, committed by GitHub
2 changed files with 33 additions and 14 deletions

storage/swift.py

@@ -266,8 +266,8 @@ class SwiftStorage(BaseStorage):
     if length == 0:
       return 0, storage_metadata, None
 
-    # Note: Swift limits segments to a maximum of 5GB, so we keep writing segments until we
-    # are finished hitting the data limit.
+    # Note: Swift limits segments in size, so we need to sub-divide chunks into segments
+    # based on the configured maximum.
     total_bytes_written = 0
     upload_error = None
     read_until_end = length == filelike.READ_UNTIL_END
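The rewritten comment captures the strategy: each incoming chunk is sub-divided into segments no larger than a configured ceiling before being written to Swift. A minimal sketch of that loop, using hypothetical names (the real driver uses _MAXIMUM_SEGMENT_SIZE and _stream_upload_segment):

import io

MAX_SEGMENT_SIZE = 1024 * 1024  # hypothetical stand-in for the configured maximum

def split_into_segments(in_fp, length, write_segment):
  # Sub-divide `length` bytes from in_fp (length < 0 means read until EOF)
  # into segments of at most MAX_SEGMENT_SIZE bytes each.
  read_until_end = length < 0
  total_written = 0
  while True:
    to_read = MAX_SEGMENT_SIZE if read_until_end else min(length, MAX_SEGMENT_SIZE)
    data = in_fp.read(to_read)
    if not data:
      return total_written
    write_segment(io.BytesIO(data))  # one Swift segment per iteration
    total_written += len(data)
    if not read_until_end:
      length -= len(data)
      if length <= 0:
        return total_written

For example, split_into_segments(io.BytesIO(b'x' * 3000000), 3000000, upload) would call upload three times: two full 1 MiB segments and one final segment with the remaining bytes.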
@@ -289,6 +289,7 @@ class SwiftStorage(BaseStorage):
 
       offset = offset + bytes_written
       total_bytes_written = total_bytes_written + bytes_written
+
       if bytes_written == 0 or (not read_until_end and length <= 0):
         return total_bytes_written, storage_metadata, upload_error
@@ -297,7 +298,7 @@ class SwiftStorage(BaseStorage):
   def _stream_upload_segment(self, uuid, offset, length, in_fp, storage_metadata, content_type):
     updated_metadata = copy.deepcopy(storage_metadata)
     segment_count = len(updated_metadata[_SEGMENTS_KEY])
-    segment_path = '%s/%s/%s' % (_SEGMENT_DIRECTORY, uuid, segment_count)
+    segment_path = '%s/%s/%s' % (_SEGMENT_DIRECTORY, uuid, '%09d' % segment_count)
 
     # Track the number of bytes read and if an explicit length is specified, limit the
     # file stream to that length.
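The '%09d' padding is the segmenting fix itself: Swift lists objects in lexicographic name order, so an unpadded index would place segment 10 before segment 2 once an upload crosses ten segments. A quick illustration:

# Unpadded indices sort as strings, not as numbers:
sorted(str(i) for i in [0, 1, 2, 10])      # ['0', '1', '10', '2']

# Zero-padded indices preserve upload order:
sorted('%09d' % i for i in [0, 1, 2, 10])
# ['000000000', '000000001', '000000002', '000000010']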

storage/test/test_swift.py

@@ -4,7 +4,7 @@ import hashlib
 import copy
 
 from collections import defaultdict
-from mock import MagicMock
+from mock import MagicMock, patch
 
 from storage import StorageContext
 from storage.swift import SwiftStorage
@@ -204,21 +204,39 @@ def test_checksum():
   swift.put_content('somepath', 'hello world!')
   assert swift.get_checksum('somepath') is not None
 
-def test_chunked_upload():
+@pytest.mark.parametrize('read_until_end', [
+  (True,),
+  (False,),
+])
+@pytest.mark.parametrize('max_chunk_size', [
+  (10000000),
+  (10),
+  (5),
+  (2),
+  (1),
+])
+@pytest.mark.parametrize('chunks', [
+  (['this', 'is', 'some', 'chunked', 'data', '']),
+  (['this is a very large chunk of data', '']),
+  (['h', 'e', 'l', 'l', 'o', '']),
+])
+def test_chunked_upload(chunks, max_chunk_size, read_until_end):
   swift = FakeSwiftStorage(**base_args)
   uuid, metadata = swift.initiate_chunked_upload()
-  chunks = ['this', 'is', 'some', 'chunked', 'data', '']
   offset = 0
-  for chunk in chunks:
-    bytes_written, metadata, error = swift.stream_upload_chunk(uuid, offset, len(chunk),
-                                                               io.BytesIO(chunk), metadata)
-    assert error is None
-    assert len(chunk) == bytes_written
-    offset += len(chunk)
+
+  with patch('storage.swift._MAXIMUM_SEGMENT_SIZE', max_chunk_size):
+    for chunk in chunks:
+      chunk_length = len(chunk) if not read_until_end else -1
+      bytes_written, metadata, error = swift.stream_upload_chunk(uuid, offset, chunk_length,
+                                                                 io.BytesIO(chunk), metadata)
+      assert error is None
+      assert len(chunk) == bytes_written
+      offset += len(chunk)
 
   swift.complete_chunked_upload(uuid, 'somepath', metadata)
   assert swift.get_content('somepath') == ''.join(chunks)
 
 def test_cancel_chunked_upload():
   swift = FakeSwiftStorage(**base_args)
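The patch call in the new test temporarily overrides the module-level _MAXIMUM_SEGMENT_SIZE, forcing even the tiny parametrized chunks through the segment sub-division path: with max_chunk_size=1, the 34-byte chunk produces 34 segments, enough for an unpadded segment '10' to sort before '9'. The same patching pattern in isolation, assuming the repo's storage package is importable:

from mock import patch  # the same backport the test file imports

import storage.swift

# Temporarily lower the module-level ceiling; the original value is
# restored when the block exits, even if an assertion fails inside.
with patch('storage.swift._MAXIMUM_SEGMENT_SIZE', 1):
  assert storage.swift._MAXIMUM_SEGMENT_SIZE == 1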