summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorwhoami-rajat <rajatdhasmana@gmail.com>2022-01-25 19:24:30 +0530
committerRajat Dhasmana <rajatdhasmana@gmail.com>2022-02-17 15:06:27 +0000
commitea5139be9a76ca8c2e60d12d8dd776bff39c4579 (patch)
treebf8b7c754004cc71ca6ce4b0417867c8bec7302a
parent83d9c5dc2e4ca4edb29970d0543f7e9c574c0911 (diff)
downloadglance_store-ea5139be9a76ca8c2e60d12d8dd776bff39c4579.tar.gz
Cinder store: Wait for device resize
When we have an image with size > 1 GB, we take the following steps to accommodate the image: 1) Detach the volume; 2) Extend the volume; 3) Attach the volume; 4) Open the volume device as a file and resume writing the image. Sometimes, for various reasons (mostly network related), the size of the device file may not match the actual volume size (or the backend LUN size). This can happen if the extend was performed (i.e. the control path) but it takes time for the new size to be reflected in the mapped device (i.e. the data path). This mismatch can cause the error "IOError: [Errno 28] No space left on device". To avoid this scenario, we check the device size and, if it is less than the volume size, wait for the extended LUN to show up in the mapped device before continuing the image writing operation. Closes-Bug: #1959913 Change-Id: I206580f6be615ebc5e15b546b9c23728d4116a5d (cherry picked from commit f3433ed1a5176bff85b3fe04dba2d4c76618a299)
-rw-r--r--glance_store/_drivers/cinder.py35
-rw-r--r--glance_store/tests/unit/test_cinder_store.py50
-rw-r--r--glance_store/tests/unit/test_multistore_cinder.py50
-rw-r--r--releasenotes/notes/fix-wait-device-resize-c282940b71a3748e.yaml7
4 files changed, 138 insertions, 4 deletions
diff --git a/glance_store/_drivers/cinder.py b/glance_store/_drivers/cinder.py
index 96f9b2a..5296dc2 100644
--- a/glance_store/_drivers/cinder.py
+++ b/glance_store/_drivers/cinder.py
@@ -641,6 +641,37 @@ class Store(glance_store.driver.Store):
raise exceptions.BadStoreConfiguration(store_name="cinder",
reason=reason)
+ @staticmethod
+ def _get_device_size(device_file):
+ # The seek position is corrected after every extend operation
+ # with the bytes written (which is after this wait call) so we
+ # don't need to worry about setting it back to original position
+ device_file.seek(0, os.SEEK_END)
+ # There are other ways to determine the file size like os.stat
+ # or os.path.getsize but it requires file name attribute which
+ # we don't have for the RBD file wrapper RBDVolumeIOWrapper
+ device_size = device_file.tell()
+ device_size = int(math.ceil(float(device_size) / units.Gi))
+ return device_size
+
+ @staticmethod
+ def _wait_resize_device(volume, device_file):
+ timeout = 20
+ max_recheck_wait = 10
+ tries = 0
+ elapsed = 0
+ while Store._get_device_size(device_file) < volume.size:
+ wait = min(0.5 * 2 ** tries, max_recheck_wait)
+ time.sleep(wait)
+ tries += 1
+ elapsed += wait
+ if elapsed >= timeout:
+ msg = (_('Timeout while waiting while volume %(volume_id)s '
+ 'to resize the device in %(tries)s tries.')
+ % {'volume_id': volume.id, 'tries': tries})
+ LOG.error(msg)
+ raise exceptions.BackendException(msg)
+
def _wait_volume_status(self, volume, status_transition, status_expected):
max_recheck_wait = 15
timeout = self.store_conf.cinder_state_transition_timeout
@@ -949,6 +980,10 @@ class Store(glance_store.driver.Store):
try:
while need_extend:
with self._open_cinder_volume(client, volume, 'wb') as f:
+ # Sometimes the extended LUN on storage side takes time
+ # to reflect in the device so we wait until the device
+ # size is equal to the extended volume size.
+ Store._wait_resize_device(volume, f)
f.seek(bytes_written)
if buf:
f.write(buf)
diff --git a/glance_store/tests/unit/test_cinder_store.py b/glance_store/tests/unit/test_cinder_store.py
index c281766..eca8a9f 100644
--- a/glance_store/tests/unit/test_cinder_store.py
+++ b/glance_store/tests/unit/test_cinder_store.py
@@ -16,6 +16,8 @@
import contextlib
import errno
import hashlib
+import io
+import math
import os
from unittest import mock
@@ -406,7 +408,7 @@ class TestCinderStore(base.StoreBaseTest,
self.assertEqual(expected_image_size, image_size)
def _test_cinder_add(self, fake_volume, volume_file, size_kb=5,
- verifier=None):
+ verifier=None, fail_resize=False):
expected_image_id = str(uuid.uuid4())
expected_size = size_kb * units.Ki
expected_file_contents = b"*" * expected_size
@@ -427,7 +429,11 @@ class TestCinderStore(base.StoreBaseTest,
with mock.patch.object(cinder.Store, 'get_cinderclient') as mock_cc, \
mock.patch.object(self.store, '_open_cinder_volume',
- side_effect=fake_open):
+ side_effect=fake_open), \
+ mock.patch.object(
+ cinder.Store, '_wait_resize_device') as mock_wait_resize:
+ if fail_resize:
+ mock_wait_resize.side_effect = exceptions.BackendException()
mock_cc.return_value = FakeObject(client=fake_client,
volumes=fake_volumes)
loc, size, checksum, multihash, _ = self.store.add(
@@ -509,3 +515,43 @@ class TestCinderStore(base.StoreBaseTest,
self.store.configure_add()
mock_log.warning.assert_called_with(
"Invalid `cinder_volume_type some_random_type`")
+
+ def test__get_device_size(self):
+ fake_data = b"fake binary data"
+ fake_len = int(math.ceil(float(len(fake_data)) / units.Gi))
+ fake_file = io.BytesIO(fake_data)
+ dev_size = cinder.Store._get_device_size(fake_file)
+ self.assertEqual(fake_len, dev_size)
+
+ @mock.patch.object(time, 'sleep')
+ def test__wait_resize_device_resized(self, mock_sleep):
+ fake_vol = mock.MagicMock()
+ fake_vol.size = 2
+ fake_file = io.BytesIO(b"fake binary data")
+ with mock.patch.object(
+ cinder.Store, '_get_device_size') as mock_get_dev_size:
+ mock_get_dev_size.side_effect = [1, 2]
+ cinder.Store._wait_resize_device(fake_vol, fake_file)
+
+ @mock.patch.object(time, 'sleep')
+ def test__wait_resize_device_fails(self, mock_sleep):
+ fake_vol = mock.MagicMock()
+ fake_vol.size = 2
+ fake_file = io.BytesIO(b"fake binary data")
+ with mock.patch.object(
+ cinder.Store, '_get_device_size',
+ return_value=1):
+ self.assertRaises(
+ exceptions.BackendException,
+ cinder.Store._wait_resize_device,
+ fake_vol, fake_file)
+
+ def test_cinder_add_fail_resize(self):
+ volume_file = io.BytesIO()
+ fake_volume = mock.MagicMock(id=str(uuid.uuid4()),
+ status='available',
+ size=1)
+ self.assertRaises(exceptions.BackendException,
+ self._test_cinder_add, fake_volume, volume_file,
+ fail_resize=True)
+ fake_volume.delete.assert_called_once()
diff --git a/glance_store/tests/unit/test_multistore_cinder.py b/glance_store/tests/unit/test_multistore_cinder.py
index 220952f..4046dcd 100644
--- a/glance_store/tests/unit/test_multistore_cinder.py
+++ b/glance_store/tests/unit/test_multistore_cinder.py
@@ -15,6 +15,8 @@
import contextlib
import errno
+import io
+import math
import os
from unittest import mock
@@ -525,7 +527,7 @@ class TestMultiCinderStore(base.MultiStoreBaseTest,
self.assertEqual(expected_image_size, image_size)
def _test_cinder_add(self, fake_volume, volume_file, size_kb=5,
- verifier=None, backend="cinder1"):
+ verifier=None, backend="cinder1", fail_resize=False):
expected_image_id = str(uuid.uuid4())
expected_size = size_kb * units.Ki
expected_file_contents = b"*" * expected_size
@@ -545,7 +547,11 @@ class TestMultiCinderStore(base.MultiStoreBaseTest,
with mock.patch.object(cinder.Store, 'get_cinderclient') as mock_cc, \
mock.patch.object(self.store, '_open_cinder_volume',
- side_effect=fake_open):
+ side_effect=fake_open), \
+ mock.patch.object(
+ cinder.Store, '_wait_resize_device') as mock_wait_resize:
+ if fail_resize:
+ mock_wait_resize.side_effect = exceptions.BackendException()
mock_cc.return_value = FakeObject(client=fake_client,
volumes=fake_volumes)
loc, size, checksum, metadata = self.store.add(expected_image_id,
@@ -619,3 +625,43 @@ class TestMultiCinderStore(base.MultiStoreBaseTest,
size=1)
volume_file = six.BytesIO()
self._test_cinder_add(fake_volume, volume_file, backend="cinder2")
+
+ def test__get_device_size(self):
+ fake_data = b"fake binary data"
+ fake_len = int(math.ceil(float(len(fake_data)) / units.Gi))
+ fake_file = io.BytesIO(fake_data)
+ dev_size = cinder.Store._get_device_size(fake_file)
+ self.assertEqual(fake_len, dev_size)
+
+ @mock.patch.object(time, 'sleep')
+ def test__wait_resize_device_resized(self, mock_sleep):
+ fake_vol = mock.MagicMock()
+ fake_vol.size = 2
+ fake_file = io.BytesIO(b"fake binary data")
+ with mock.patch.object(
+ cinder.Store, '_get_device_size') as mock_get_dev_size:
+ mock_get_dev_size.side_effect = [1, 2]
+ cinder.Store._wait_resize_device(fake_vol, fake_file)
+
+ @mock.patch.object(time, 'sleep')
+ def test__wait_resize_device_fails(self, mock_sleep):
+ fake_vol = mock.MagicMock()
+ fake_vol.size = 2
+ fake_file = io.BytesIO(b"fake binary data")
+ with mock.patch.object(
+ cinder.Store, '_get_device_size',
+ return_value=1):
+ self.assertRaises(
+ exceptions.BackendException,
+ cinder.Store._wait_resize_device,
+ fake_vol, fake_file)
+
+ def test_cinder_add_fail_resize(self):
+ volume_file = io.BytesIO()
+ fake_volume = mock.MagicMock(id=str(uuid.uuid4()),
+ status='available',
+ size=1)
+ self.assertRaises(exceptions.BackendException,
+ self._test_cinder_add, fake_volume, volume_file,
+ fail_resize=True)
+ fake_volume.delete.assert_called_once()
diff --git a/releasenotes/notes/fix-wait-device-resize-c282940b71a3748e.yaml b/releasenotes/notes/fix-wait-device-resize-c282940b71a3748e.yaml
new file mode 100644
index 0000000..27b3974
--- /dev/null
+++ b/releasenotes/notes/fix-wait-device-resize-c282940b71a3748e.yaml
@@ -0,0 +1,7 @@
+---
+fixes:
+ - |
+ `Bug #1959913 <https://bugs.launchpad.net/glance-store/+bug/1959913>`_:
+ Added a wait between the volume being extended and
+ the new size being detected when opening the
+ volume device.