# test_object_store_service.py
  1. import filecmp
  2. import os
  3. import tempfile
  4. from datetime import datetime
  5. from io import BytesIO
  6. from unittest import mock
  7. from unittest import skip
  8. import requests
  9. from cloudbridge.base import helpers as cb_helpers
  10. from cloudbridge.base.resources import BaseBucketObject
  11. from cloudbridge.interfaces.exceptions import DuplicateResourceException
  12. from cloudbridge.interfaces.exceptions import InvalidValueException
  13. from cloudbridge.interfaces.provider import TestMockHelperMixin
  14. from cloudbridge.interfaces.resources import Bucket
  15. from cloudbridge.interfaces.resources import BucketObject
  16. from tests import helpers
  17. from tests.helpers import ProviderTestBase
  18. from tests.helpers import standard_interface_tests as sit
  # Multipart parts other than the final one must be at least 5 MiB on S3
  # (and Swift). The tests stick to this size so that they stay valid against
  # real cloud providers and not only against moto.
  MIN_PART_SIZE = 5 * 1024 ** 2
  22. class CloudObjectStoreServiceTestCase(ProviderTestBase):
  23. _multiprocess_can_split_ = True
  @helpers.skipIfNoService(['storage._bucket_objects', 'storage.buckets'])
  def test_storage_services_event_pattern(self):
      """Verify the event pattern advertised by each storage service.

      Both the ``buckets`` service and the private ``_bucket_objects``
      service must report the expected ``_service_event_pattern`` string.
      """
      failure_template = ("Event pattern for {} service should be '{}', "
                          "but found '{}'.")
      # (label used in the failure message, attribute on provider.storage,
      #  expected event pattern)
      expectations = (
          ("buckets", "buckets", "provider.storage.buckets"),
          ("bucket_objects", "_bucket_objects",
           "provider.storage._bucket_objects"),
      )
      for label, attribute, expected_pattern in expectations:
          service = getattr(self.provider.storage, attribute)
          # pylint:disable=protected-access
          found_pattern = service._service_event_pattern
          self.assertEqual(
              found_pattern,
              expected_pattern,
              failure_template.format(label, expected_pattern,
                                      found_pattern))
  @helpers.skipIfNoService(['storage.buckets'])
  def test_crud_bucket(self):
      """Run the standard CRUD checks against the bucket service.

      In addition to the generic checks, creating a bucket whose name is
      already taken must raise ``DuplicateResourceException``.
      """
      bucket_service = self.provider.storage.buckets

      def make_bucket(name):
          return bucket_service.create(name)

      def remove_bucket(bucket):
          # Nothing to clean up when creation never produced a bucket.
          if not bucket:
              return
          bucket.delete()

      def assert_duplicate_is_rejected(bucket):
          # Recreating an existing bucket should raise an exception
          with self.assertRaises(DuplicateResourceException):
              bucket_service.create(name=bucket.name)

      sit.check_crud(
          self, bucket_service, Bucket, "cb-crudbucket",
          make_bucket, remove_bucket,
          extra_test_func=assert_duplicate_is_rejected)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_crud_bucket_object(self):
      """Run the standard CRUD checks against objects inside a bucket.

      A fresh bucket is created for the duration of the test and removed
      through the surrounding cleanup action.
      """
      # Assigned inside the cleanup block below; the nested helpers read it
      # lazily, so they always see the bucket once it has been created.
      bucket = None

      def delete_bucket():
          bucket.delete()

      def make_object(name):
          created = bucket.objects.create(name)
          # TODO: This is wrong. We shouldn't need a separate upload call
          # before the object can be deleted. Maybe the create method
          # should accept the content as a parameter.
          created.upload("dummy content")
          return created

      def remove_object(bucket_obj):
          if not bucket_obj:
              return
          bucket_obj.delete()

      with cb_helpers.cleanup_action(delete_bucket):
          bucket_name = "cb-crudbucketobj-{0}".format(helpers.get_uuid())
          bucket = self.provider.storage.buckets.create(bucket_name)

          sit.check_crud(
              self, bucket.objects, BucketObject, "cb-bucketobj",
              make_object, remove_object, skip_name_check=True)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_crud_bucket_object_properties(self):
      """Check listing, lookup and basic properties of a bucket object.

      Creates a new bucket, uploads some content into it and checks that
      ``list`` detects the new object. The ``size`` property is verified
      on both the LIST and the GET result, followed by ``last_modified``,
      iteration, lookup by name and prefix-filtered listing. Everything
      is deleted afterwards.
      """
      name = "cbtestbucketobjs-{0}".format(helpers.get_uuid())
      test_bucket = self.provider.storage.buckets.create(name)

      with cb_helpers.cleanup_action(lambda: test_bucket.delete()):
          # Ensure that the bucket is empty. The check runs inside the
          # cleanup block so the bucket cleanup is already registered
          # if the assertion fails.
          objects = test_bucket.objects.list()
          self.assertEqual([], objects)

          obj_name_prefix = "hello"
          obj_name = obj_name_prefix + "_world.txt"
          obj = test_bucket.objects.create(obj_name)

          with cb_helpers.cleanup_action(lambda: obj.delete()):
              # TODO: This is wrong. We shouldn't have to have a separate
              # call to upload some content before being able to delete
              # the content. Maybe the create_object method should accept
              # the file content as a parameter.
              obj.upload("dummy content")
              objs = test_bucket.objects.list()

              self.assertTrue(
                  isinstance(objs[0].size, int),
                  "Object size property needs to be a int, not {0}".format(
                      type(objs[0].size)))
              # GET an object as the size property implementation differs
              # for objects returned by LIST and GET. The assertion must
              # therefore inspect the GET result, not the LIST entry.
              obj = test_bucket.objects.get(objs[0].id)
              self.assertTrue(
                  isinstance(obj.size, int),
                  "Object size property needs to be an int, not {0}".format(
                      type(obj.size)))
              # strptime raises ValueError when the format does not match.
              self.assertTrue(
                  datetime.strptime(objs[0].last_modified[:23],
                                    "%Y-%m-%dT%H:%M:%S.%f"),
                  "Object's last_modified field format {0} not matching."
                  .format(objs[0].last_modified))

              # check iteration
              iter_objs = list(test_bucket.objects)
              self.assertListEqual(iter_objs, objs)

              obj_too = test_bucket.objects.get(obj_name)
              self.assertTrue(
                  isinstance(obj_too, BucketObject),
                  "Did not get object {0} of expected type.".format(obj_too))

              prefix_filtered_list = test_bucket.objects.list(
                  prefix=obj_name_prefix)
              self.assertTrue(
                  len(objs) == len(prefix_filtered_list) == 1,
                  'The number of objects returned by list function, '
                  'with and without a prefix, are expected to be equal, '
                  'but its detected otherwise.')

              sit.check_delete(self, test_bucket.objects, obj)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_upload_download_bucket_content(self):
      """Upload bytes and read them back in one shot and in chunks."""
      bucket_name = "cbtestbucketobjs-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          bucket_obj = bucket.objects.create("hello_upload_download.txt")

          with cb_helpers.cleanup_action(bucket_obj.delete):
              payload = b"Hello World. Here's some content."
              # TODO: Upload and download methods accept different
              # parameter types. This should be made consistent, possibly
              # by providing several methods such as upload_from_file,
              # from_stream etc.
              bucket_obj.upload(payload)

              # Whole-object download into a stream.
              saved = BytesIO()
              bucket_obj.save_content(saved)
              self.assertEqual(saved.getvalue(), payload)

              # Chunked download through the content iterator.
              streamed = b"".join(bucket_obj.iter_content())
              self.assertEqual(streamed, payload)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_generate_url(self):
      """Generate a URL for an uploaded object and fetch it over HTTP.

      The URL is always generated, so ``generate_url`` is exercised on
      every provider. The HTTP fetch is skipped for mock providers, which
      cannot serve the generated URL.
      """
      name = "cbtestbucketobjs-{0}".format(helpers.get_uuid())
      test_bucket = self.provider.storage.buckets.create(name)

      with cb_helpers.cleanup_action(lambda: test_bucket.delete()):
          obj_name = "hello_upload_download.txt"
          obj = test_bucket.objects.create(obj_name)

          with cb_helpers.cleanup_action(lambda: obj.delete()):
              content = b"Hello World. Generate a url."
              obj.upload(content)
              target_stream = BytesIO()
              obj.save_content(target_stream)

              url = obj.generate_url(100)
              if isinstance(self.provider, TestMockHelperMixin):
                  # skipTest() raises SkipTest itself; no ``raise`` needed.
                  self.skipTest(
                      "Skipping rest of test - mock providers can't"
                      " access generated url")
              # Bound the request so an unreachable endpoint fails the
              # test instead of hanging the whole run.
              response = requests.get(url, timeout=30)
              self.assertEqual(response.content, content)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_generate_url_write_permissions(self):
      """Upload content through a writable generated URL and read it back.

      The URL is always generated. The HTTP upload and the follow-up
      download are skipped for mock providers, which cannot serve the
      generated URL.
      """
      name = "cbtestbucketobjs-{0}".format(helpers.get_uuid())
      test_bucket = self.provider.storage.buckets.create(name)

      with cb_helpers.cleanup_action(lambda: test_bucket.delete()):
          obj_name = "hello_upload_download.txt"
          obj = test_bucket.objects.create(obj_name)

          # The lambda looks up ``obj`` when it runs, so after the rebind
          # below it deletes the re-fetched object.
          with cb_helpers.cleanup_action(lambda: obj.delete()):
              content = b"Hello World. Generate a url."
              url = obj.generate_url(100, writable=True)
              if isinstance(self.provider, TestMockHelperMixin):
                  # skipTest() raises SkipTest itself; no ``raise`` needed.
                  self.skipTest(
                      "Skipping rest of test - mock providers can't"
                      " access generated url")
              # Only Azure requires the x-ms-blob-type header to be
              # present, but there's no harm in sending this in for all
              # providers.
              headers = {'x-ms-blob-type': 'BlockBlob'}
              # Bound the request so an unreachable endpoint fails the
              # test instead of hanging the whole run.
              response = requests.put(url, headers=headers, data=content,
                                      timeout=30)
              response.raise_for_status()

              obj = test_bucket.objects.get(obj_name)
              target_stream = BytesIO()
              obj.save_content(target_stream)
              self.assertEqual(target_stream.getvalue(), content)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_upload_download_bucket_content_from_file(self):
      """Upload a fixture file and verify the downloaded bytes match it."""
      bucket_name = "cbtestbucketobjs-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          bucket_obj = bucket.objects.create("hello_upload_download.txt")

          with cb_helpers.cleanup_action(bucket_obj.delete):
              fixture_path = os.path.join(
                  helpers.get_test_fixtures_folder(), 'logo.jpg')
              bucket_obj.upload_from_file(fixture_path)

              downloaded = BytesIO()
              bucket_obj.save_content(downloaded)

              with open(fixture_path, 'rb') as fixture:
                  expected_bytes = fixture.read()
              self.assertEqual(downloaded.getvalue(), expected_bytes)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_explicit_multipart_upload_roundtrip(self):
      """Upload three parts explicitly and verify the assembled object.

      Parts are uploaded in ascending order, the upload is completed, and
      the stored object's size and content are compared with the
      concatenation of the parts.
      """
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          key = "mpu-roundtrip.bin"
          bucket_obj = bucket.objects.create(key)

          with cb_helpers.cleanup_action(bucket_obj.delete):
              chunks = (
                  b"a" * MIN_PART_SIZE,
                  b"b" * MIN_PART_SIZE,
                  b"c" * 1024,  # final part may be smaller than the min
              )
              expected = b"".join(chunks)

              upload = bucket_obj.create_multipart_upload()
              # Part numbers start at 1.
              parts = [upload.upload_part(number, chunk)
                       for number, chunk in enumerate(chunks, start=1)]
              upload.complete(parts)

              stored = bucket.objects.get(key)
              self.assertIsNotNone(
                  stored, "Object should exist after multipart completion")
              self.assertEqual(stored.size, len(expected))

              downloaded = BytesIO()
              stored.save_content(downloaded)
              self.assertEqual(downloaded.getvalue(), expected)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_multipart_upload_out_of_order_parts(self):
      """Parts uploaded and listed out of order still assemble in order."""
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          key = "mpu-ooo.bin"
          bucket_obj = bucket.objects.create(key)

          with cb_helpers.cleanup_action(bucket_obj.delete):
              payload_by_number = {
                  1: b"1" * MIN_PART_SIZE,
                  2: b"2" * MIN_PART_SIZE,
                  3: b"3" * 1024,
              }
              expected = (payload_by_number[1] + payload_by_number[2]
                          + payload_by_number[3])

              upload = bucket_obj.create_multipart_upload()
              # Upload and collect parts out of order; complete must
              # assemble them in ascending part-number order regardless.
              shuffled_parts = [
                  upload.upload_part(number, payload_by_number[number])
                  for number in (3, 1, 2)
              ]
              upload.complete(shuffled_parts)

              stored = bucket.objects.get(key)
              downloaded = BytesIO()
              stored.save_content(downloaded)
              self.assertEqual(downloaded.getvalue(), expected)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_multipart_upload_abort(self):
      """An aborted multipart upload must leave no object behind."""
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          key = "mpu-abort.bin"
          pending = bucket.objects.create(key).create_multipart_upload()
          pending.upload_part(1, b"a" * MIN_PART_SIZE)
          pending.abort()

          # Aborting must not materialise the target object.
          lookup = bucket.objects.get(key)
          self.assertIsNone(
              lookup,
              "Object should not exist after a multipart upload is aborted")
  @helpers.skipIfNoService(['storage.buckets'])
  def test_transparent_upload_large_stream_uses_multipart(self):
      """A stream above the threshold must go through multipart upload.

      The multipart threshold and part size are patched down to
      ``MIN_PART_SIZE`` and ``create_multipart_upload`` is wrapped with a
      spy, so the test can assert that the multipart path was taken
      exactly once and that the stored content is intact.
      """
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          key = "transparent.bin"
          bucket_obj = bucket.objects.create(key)

          with cb_helpers.cleanup_action(bucket_obj.delete):
              payload = b"x" * (MIN_PART_SIZE * 2 + 1024)

              # Lower the threshold/part size so a modest stream triggers
              # the multipart path, and assert it is actually taken.
              service = self.provider.storage._bucket_objects
              lowered_threshold = mock.patch.object(
                  BaseBucketObject, 'CB_MULTIPART_THRESHOLD',
                  MIN_PART_SIZE)
              lowered_part_size = mock.patch.object(
                  BaseBucketObject, 'CB_MULTIPART_PART_SIZE',
                  MIN_PART_SIZE)
              spy_patch = mock.patch.object(
                  service, 'create_multipart_upload',
                  wraps=service.create_multipart_upload)

              with lowered_threshold, lowered_part_size, spy_patch as spy:
                  bucket_obj.upload(BytesIO(payload))
              spy.assert_called_once()

              stored = bucket.objects.get(key)
              self.assertEqual(stored.size, len(payload))

              downloaded = BytesIO()
              stored.save_content(downloaded)
              self.assertEqual(downloaded.getvalue(), payload)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_small_upload_stays_single_shot(self):
      """A payload below the threshold must not use multipart upload."""
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          bucket_obj = bucket.objects.create("small.txt")

          with cb_helpers.cleanup_action(bucket_obj.delete):
              payload = b"a small payload below the multipart threshold"

              # Spy on the service so any multipart attempt is recorded.
              service = self.provider.storage._bucket_objects
              spy_patch = mock.patch.object(
                  service, 'create_multipart_upload',
                  wraps=service.create_multipart_upload)
              with spy_patch as spy:
                  bucket_obj.upload(payload)
              # A payload below the threshold must not trigger multipart.
              spy.assert_not_called()

              downloaded = BytesIO()
              bucket_obj.save_content(downloaded)
              self.assertEqual(downloaded.getvalue(), payload)
  @helpers.skipIfNoService(['storage.buckets'])
  def test_multipart_part_size_below_minimum_raises(self):
      """Uploading with a too-small multipart part size must be rejected.

      With the threshold and part size both patched to 1024 bytes, the
      upload of a 4096-byte stream is expected to raise
      ``InvalidValueException``.
      """
      bucket_name = "cbtest-mpu-{0}".format(helpers.get_uuid())
      bucket = self.provider.storage.buckets.create(bucket_name)

      with cb_helpers.cleanup_action(bucket.delete):
          bucket_obj = bucket.objects.create("badpartsize.bin")

          with cb_helpers.cleanup_action(bucket_obj.delete):
              payload = b"x" * 4096

              # A part size below the 5 MiB portable minimum is invalid.
              tiny_threshold = mock.patch.object(
                  BaseBucketObject, 'CB_MULTIPART_THRESHOLD', 1024)
              tiny_part_size = mock.patch.object(
                  BaseBucketObject, 'CB_MULTIPART_PART_SIZE', 1024)
              with tiny_threshold, tiny_part_size, \
                      self.assertRaises(InvalidValueException):
                  bucket_obj.upload(BytesIO(payload))
  @skip("Skip unless you want to test objects bigger than 5GB")
  @helpers.skipIfNoService(['storage.buckets'])
  def test_upload_download_bucket_content_with_large_file(self):
      """Round-trip a 6 GiB file through the provider's object store.

      Creates a 6 Gig file in the temp directory and uploads it. The
      object is then downloaded to a second file in the temp directory
      and the two files are compared to see if they match. Both local
      files, the object and the bucket are removed by the cleanup actions.
      """
      temp_dir = tempfile.gettempdir()
      file_name = '6GigTest.tmp'
      six_gig_file = os.path.join(temp_dir, file_name)
      with open(six_gig_file, "wb") as out:
          # truncate() extends the empty file to the requested size
          # without writing the payload byte by byte.
          out.truncate(6 * 1024 * 1024 * 1024)  # 6 Gig...

      with cb_helpers.cleanup_action(lambda: os.remove(six_gig_file)):
          # Build the path with os.path.join, like six_gig_file above,
          # instead of hard-coding a "/" separator.
          download_file = os.path.join(
              temp_dir, "cbtestfile-{0}".format(file_name))
          bucket_name = "cbtestbucketlargeobjs-{0}".format(
              helpers.get_uuid())
          test_bucket = self.provider.storage.buckets.create(bucket_name)

          with cb_helpers.cleanup_action(lambda: test_bucket.delete()):
              test_obj = test_bucket.objects.create(file_name)

              with cb_helpers.cleanup_action(lambda: test_obj.delete()):
                  file_uploaded = test_obj.upload_from_file(six_gig_file)
                  self.assertTrue(file_uploaded, "Could not upload object?")

                  with cb_helpers.cleanup_action(
                          lambda: os.remove(download_file)):
                      with open(download_file, 'wb') as f:
                          test_obj.save_content(f)
                      self.assertTrue(
                          filecmp.cmp(six_gig_file, download_file),
                          "Uploaded file != downloaded")