XIV\A9000: Added replication group support
This patch adds group replication capabilities for the IBM driver for the A-line system. implements: * Enable replication on group * Disable replication on group * Fail over replication * Get replication error status Implements: blueprint replication-cg-ibm-storage Change-Id: Ic59c568502258096e24ca5ab81dc5b8cd1779995 Depends-On: Ia4af4dd011d569a3ac84387b37dcf2606da48fba
This commit is contained in:
parent
695c1f9272
commit
bb9a4e1a90
@ -25,6 +25,7 @@ pyxcli_client.errors = fake_pyxcli_exceptions
|
||||
pyxcli_client.events = mock.Mock()
|
||||
pyxcli_client.mirroring = mock.Mock()
|
||||
pyxcli_client.transports = fake_pyxcli_exceptions
|
||||
pyxcli_client.mirroring.cg_recovery_manager = mock.Mock()
|
||||
|
||||
sys.modules['pyxcli'] = pyxcli_client
|
||||
sys.modules['pyxcli.events'] = pyxcli_client.events
|
||||
|
@ -20,6 +20,7 @@ from xml.etree import ElementTree
|
||||
from cinder import context
|
||||
from cinder import exception
|
||||
from cinder import objects
|
||||
from cinder.objects import fields
|
||||
from cinder import test
|
||||
from cinder.tests.unit import fake_constants as fake
|
||||
from cinder.tests.unit import utils as testutils
|
||||
@ -27,9 +28,11 @@ from cinder.tests.unit.volume.drivers.ibm import fake_pyxcli
|
||||
import cinder.volume.drivers.ibm.ibm_storage as storage
|
||||
from cinder.volume.drivers.ibm.ibm_storage import cryptish
|
||||
from cinder.volume.drivers.ibm.ibm_storage.xiv_proxy import XIVProxy
|
||||
from cinder.volume.drivers.ibm.ibm_storage import xiv_replication
|
||||
from cinder.volume import group_types
|
||||
|
||||
errors = fake_pyxcli.pyxcli_client.errors
|
||||
mirroring = fake_pyxcli.pyxcli_client.mirroring
|
||||
|
||||
test_mock = mock.MagicMock()
|
||||
module_patcher = mock.MagicMock()
|
||||
@ -45,6 +48,11 @@ TEST_VOLUME = {
|
||||
'group_id': fake.CONSISTENCY_GROUP_ID,
|
||||
}
|
||||
|
||||
TEST_GROUP_SPECS = {
|
||||
'group_replication_enabled': '<is> True',
|
||||
'replication_type': 'sync',
|
||||
}
|
||||
|
||||
TEST_EXTRA_SPECS = {
|
||||
'replication_enabled': '<is> False',
|
||||
}
|
||||
@ -356,7 +364,174 @@ class XIVProxyTest(test.TestCase):
|
||||
ex = getattr(p, "_get_exception")()
|
||||
self.assertRaises(ex, p.create_volume, volume)
|
||||
|
||||
@mock.patch("cinder.volume.utils.group_get_by_id", mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_replication.VolumeReplication.create_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_replication.GroupReplication.create_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy.get_group_specs_by_group_resource",
|
||||
mock.MagicMock(return_value=(TEST_GROUP_SPECS, '')))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_target_params",
|
||||
mock.MagicMock(return_value=REPLICA_PARAMS))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_target",
|
||||
mock.MagicMock(return_value="BLABLA"))
|
||||
def test_enable_replication(self):
|
||||
"""Test enable_replication"""
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
p.ibm_storage_cli = mock.MagicMock()
|
||||
p._call_remote_xiv_xcli = mock.MagicMock()
|
||||
p._update_consistencygroup = mock.MagicMock()
|
||||
p.targets = {'tgt1': 'info1'}
|
||||
|
||||
group = self._create_test_group('WTF')
|
||||
vol = testutils.create_volume(self.ctxt)
|
||||
ret = p.enable_replication(self.ctxt, group, [vol])
|
||||
|
||||
self.assertEqual((
|
||||
{'replication_status': fields.ReplicationStatus.ENABLED},
|
||||
[{'id': vol['id'],
|
||||
'replication_status': fields.ReplicationStatus.ENABLED}]), ret)
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_replication.VolumeReplication.delete_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.group_types.get_group_type_specs",
|
||||
mock.MagicMock(return_value=TEST_GROUP_SPECS))
|
||||
def test_disable_replication(self):
|
||||
"""Test disable_replication"""
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
p.ibm_storage_cli = mock.MagicMock()
|
||||
p._call_remote_xiv_xcli = mock.MagicMock()
|
||||
p._update_consistencygroup = mock.MagicMock()
|
||||
|
||||
group = self._create_test_group('WTF')
|
||||
ret = p.disable_replication(self.ctxt, group, [])
|
||||
|
||||
self.assertEqual((
|
||||
{'replication_status': fields.ReplicationStatus.DISABLED}, []),
|
||||
ret)
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._using_default_backend",
|
||||
mock.MagicMock(return_value=False))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_target_params",
|
||||
mock.MagicMock(return_value={'san_clustername': "master"}))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._init_xcli",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._init_xcli",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy.get_group_specs_by_group_resource",
|
||||
mock.MagicMock(return_value=(TEST_GROUP_SPECS, '')))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_replication.GroupReplication.failover",
|
||||
mock.MagicMock(return_value=(True, 'good')))
|
||||
def test_failover_replication_with_default(self):
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
group = self._create_test_group('WTF')
|
||||
group.replication_status = fields.ReplicationStatus.FAILED_OVER
|
||||
vol = testutils.create_volume(self.ctxt)
|
||||
group_update, vol_update = p.failover_replication(self.ctxt, group,
|
||||
[vol], 'default')
|
||||
updates = {'status': 'available'}
|
||||
self.assertEqual(({'replication_status': 'available'},
|
||||
[{'volume_id': vol['id'],
|
||||
'updates': updates}]), (group_update, vol_update))
|
||||
|
||||
def test_failover_resource_no_mirror(self):
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
|
||||
recovery_mgr = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active.return_value = False
|
||||
|
||||
group = self._create_test_group('WTF')
|
||||
ret = xiv_replication.Replication(p)._failover_resource(
|
||||
group, recovery_mgr, mock.MagicMock, 'cg', True)
|
||||
msg = ("%(rep_type)s %(res)s: no active mirroring and can not "
|
||||
"failback" % {'rep_type': 'cg',
|
||||
'res': group['name']})
|
||||
self.assertEqual((False, msg), ret)
|
||||
|
||||
def test_failover_resource_mirror(self):
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
recovery_mgr = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active.return_value = True
|
||||
|
||||
group = self._create_test_group('WTF')
|
||||
ret = xiv_replication.Replication(p)._failover_resource(
|
||||
group, recovery_mgr, mock.MagicMock, 'cg', True)
|
||||
|
||||
self.assertEqual((True, None), ret)
|
||||
|
||||
def test_failover_resource_change_role(self):
|
||||
driver = mock.MagicMock()
|
||||
driver.VERSION = "VERSION"
|
||||
|
||||
p = self.proxy(
|
||||
self.default_storage_info,
|
||||
mock.MagicMock(),
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
recovery_mgr = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active = mock.MagicMock()
|
||||
recovery_mgr.is_mirror_active.return_value = True
|
||||
recovery_mgr.switch_roles.side_effect = (
|
||||
errors.XCLIError(''))
|
||||
failover_rep_mgr = mock.MagicMock()
|
||||
failover_rep_mgr.change_role = mock.MagicMock()
|
||||
group = self._create_test_group('WTF')
|
||||
|
||||
xiv_replication.Replication(p)._failover_resource(
|
||||
group, recovery_mgr, failover_rep_mgr, 'cg', True)
|
||||
|
||||
failover_rep_mgr.change_role.assert_called_once_with(
|
||||
resource_id=group['name'],
|
||||
new_role='Slave')
|
||||
|
||||
@mock.patch("cinder.volume.utils.is_group_a_cg_snapshot_type",
|
||||
mock.MagicMock(return_value=True))
|
||||
def test_create_volume_with_consistency_group(self):
|
||||
@ -376,8 +551,8 @@ class XIVProxyTest(test.TestCase):
|
||||
vol_type = testutils.create_volume_type(self.ctxt, name='WTF')
|
||||
volume = testutils.create_volume(
|
||||
self.ctxt, size=16, volume_type_id=vol_type.id)
|
||||
grp = testutils.create_group(self.ctxt, name='bla', group_type_id='1',
|
||||
volume_type_ids=[vol_type.id])
|
||||
|
||||
grp = self._create_test_group('WTF')
|
||||
volume.group = grp
|
||||
p.create_volume(volume)
|
||||
|
||||
@ -390,7 +565,7 @@ class XIVProxyTest(test.TestCase):
|
||||
cg='cg')
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._replication_create",
|
||||
"xiv_replication.VolumeReplication.create_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_qos_specs",
|
||||
@ -417,7 +592,7 @@ class XIVProxyTest(test.TestCase):
|
||||
p.create_volume(volume)
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._replication_create",
|
||||
"xiv_replication.VolumeReplication.create_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_qos_specs",
|
||||
@ -446,10 +621,6 @@ class XIVProxyTest(test.TestCase):
|
||||
ex = getattr(p, "_get_exception")()
|
||||
self.assertRaises(ex, p.create_volume, volume)
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_targets",
|
||||
mock.MagicMock(
|
||||
return_value={'tgt1': 'info1', 'tgt2': 'info2'}))
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_qos_specs",
|
||||
mock.MagicMock(return_value=None))
|
||||
@ -495,7 +666,7 @@ class XIVProxyTest(test.TestCase):
|
||||
p.ibm_storage_cli.cmd.vol_delete.assert_called_once_with(vol='WTF32')
|
||||
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._replication_delete",
|
||||
"xiv_replication.VolumeReplication.delete_replication",
|
||||
mock.MagicMock())
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage."
|
||||
"xiv_proxy.XIVProxy._get_extra_specs",
|
||||
@ -1406,7 +1577,9 @@ class XIVProxyTest(test.TestCase):
|
||||
ex = getattr(p, "_get_exception")()
|
||||
self.assertRaises(ex, p.create_group, {}, self._create_test_group())
|
||||
|
||||
def test_create_consistencygroup_with_replication(self):
|
||||
@mock.patch("cinder.volume.drivers.ibm.ibm_storage.xiv_proxy."
|
||||
"client.XCLIClient")
|
||||
def test_create_consistencygroup_with_replication(self, mock_xcli):
|
||||
"""test create_consistenygroup when replication is set"""
|
||||
|
||||
p = self.proxy(
|
||||
@ -1426,8 +1599,8 @@ class XIVProxyTest(test.TestCase):
|
||||
group_obj.volume_types = objects.VolumeTypeList(context=self.ctxt,
|
||||
objects=[vol_type])
|
||||
|
||||
ex = getattr(p, "_get_exception")()
|
||||
self.assertRaises(ex, p.create_group, {}, group_obj)
|
||||
model_update = p.create_group({}, group_obj)
|
||||
self.assertEqual('available', model_update['status'])
|
||||
|
||||
def test_create_consistencygroup_from_src_cgsnapshot(self):
|
||||
"""test a successful cg create from cgsnapshot"""
|
||||
@ -2113,7 +2286,7 @@ class XIVProxyTest(test.TestCase):
|
||||
test_mock.cinder.exception,
|
||||
driver)
|
||||
|
||||
p._replication_create = test_mock.MagicMock(return_value=None)
|
||||
xiv_replication.VolumeReplication = mock.MagicMock()
|
||||
grp = testutils.create_group(self.ctxt, name='bla', group_type_id='1')
|
||||
volume = testutils.create_volume(self.ctxt, display_name='bla')
|
||||
volume.group = grp
|
||||
|
@ -365,14 +365,6 @@ class IBMStorageProxy(object):
|
||||
except Exception:
|
||||
return None
|
||||
|
||||
def _get_targets(self):
|
||||
return self.targets
|
||||
|
||||
def _is_replication_supported(self):
|
||||
if self.targets:
|
||||
return True
|
||||
return False
|
||||
|
||||
@_trace_time
|
||||
def _read_replication_devices(self):
|
||||
"""Read replication devices from configuration
|
||||
|
@ -27,8 +27,7 @@ if pyxcli:
|
||||
from pyxcli import client
|
||||
from pyxcli import errors
|
||||
from pyxcli.events import events
|
||||
from pyxcli.mirroring import errors as m_errors
|
||||
from pyxcli.mirroring import volume_recovery_manager
|
||||
from pyxcli.mirroring import mirrored_entities
|
||||
from pyxcli import transports
|
||||
|
||||
from cinder import context
|
||||
@ -40,6 +39,8 @@ from cinder.volume.drivers.ibm.ibm_storage import certificate
|
||||
from cinder.volume.drivers.ibm.ibm_storage import cryptish
|
||||
from cinder.volume.drivers.ibm.ibm_storage import proxy
|
||||
from cinder.volume.drivers.ibm.ibm_storage import strings
|
||||
from cinder.volume.drivers.ibm.ibm_storage import xiv_replication as repl
|
||||
from cinder.volume import group_types
|
||||
from cinder.volume import qos_specs
|
||||
from cinder.volume import utils
|
||||
from cinder.volume import volume_types
|
||||
@ -95,38 +96,19 @@ MANAGE_VOLUME_BASE_ERROR = _("Unable to manage the volume '%(volume)s': "
|
||||
"%(error)s.")
|
||||
|
||||
|
||||
class Rate(object):
|
||||
|
||||
def __init__(self, rpo, schedule):
|
||||
self.rpo = rpo
|
||||
self.schedule = schedule
|
||||
self.schedule_name = self._schedule_name_from_schedule(self.schedule)
|
||||
|
||||
def _schedule_name_from_schedule(self, schedule):
|
||||
if schedule == '00:00:20':
|
||||
return 'min_interval'
|
||||
return ("cinder_%(sched)s" %
|
||||
{'sched': schedule.replace(':', '_')})
|
||||
|
||||
|
||||
class XIVProxy(proxy.IBMStorageProxy):
|
||||
"""Proxy between the Cinder Volume and Spectrum Accelerate Storage.
|
||||
|
||||
Supports IBM XIV, Spectrum Accelerate, A9000, A9000R
|
||||
Version: 2.1.0
|
||||
Required pyxcli version: 1.1.2
|
||||
Required pyxcli version: 1.1.4
|
||||
|
||||
2.0 - First open source driver version
|
||||
2.1.0 - Support Consistency groups through Generic volume groups
|
||||
- Support XIV/A9000 Volume independent QoS
|
||||
- Support groups replication
|
||||
|
||||
"""
|
||||
async_rates = (
|
||||
Rate(rpo=120, schedule='00:01:00'),
|
||||
Rate(rpo=300, schedule='00:02:00'),
|
||||
Rate(rpo=600, schedule='00:05:00'),
|
||||
Rate(rpo=1200, schedule='00:10:00'),
|
||||
)
|
||||
|
||||
def __init__(self, storage_info, logger, exception,
|
||||
driver=None, active_backend_id=None):
|
||||
@ -192,13 +174,6 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
LOG.info("Connection to the IBM storage "
|
||||
"system established successfully.")
|
||||
|
||||
def _get_schedule_from_rpo(self, rpo):
|
||||
return [rate for rate in self.async_rates
|
||||
if rate.rpo == rpo][0].schedule_name
|
||||
|
||||
def _get_supported_rpo(self):
|
||||
return [rate.rpo for rate in self.async_rates]
|
||||
|
||||
@proxy._trace_time
|
||||
def _update_active_schedule_objects(self):
|
||||
"""Set schedule objects on active backend.
|
||||
@ -207,7 +182,7 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
min_interval.
|
||||
"""
|
||||
schedules = self._call_xiv_xcli("schedule_list").as_dict('name')
|
||||
for rate in self.async_rates:
|
||||
for rate in repl.Replication.async_rates:
|
||||
if rate.schedule == '00:00:20':
|
||||
continue
|
||||
name = rate.schedule_name
|
||||
@ -245,7 +220,7 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
min_interval.
|
||||
"""
|
||||
schedules = self._call_remote_xiv_xcli("schedule_list").as_dict('name')
|
||||
for rate in self.async_rates:
|
||||
for rate in repl.Replication.async_rates:
|
||||
if rate.schedule == '00:00:20':
|
||||
continue
|
||||
name = rate.schedule_name
|
||||
@ -438,30 +413,12 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
return self._get_qos_specs(type_id)
|
||||
|
||||
def _get_replication_info(self, specs):
|
||||
info = {'enabled': False, 'mode': None, 'rpo': 0}
|
||||
if specs:
|
||||
LOG.debug('_get_replication_info: specs %(specs)s',
|
||||
{'specs': specs})
|
||||
info['enabled'] = (
|
||||
specs.get('replication_enabled', '').upper() in
|
||||
(u'TRUE', strings.METADATA_IS_TRUE))
|
||||
replication_type = specs.get('replication_type', SYNC).lower()
|
||||
if replication_type in (u'sync', u'<is> sync'):
|
||||
info['mode'] = SYNC
|
||||
elif replication_type in (u'async', u'<is> async'):
|
||||
info['mode'] = ASYNC
|
||||
else:
|
||||
msg = (_("Unsupported replication mode %(mode)s")
|
||||
% {'mode': replication_type})
|
||||
|
||||
info, msg = repl.Replication.extract_replication_info_from_specs(specs)
|
||||
if not info:
|
||||
LOG.error(msg)
|
||||
raise self._get_exception()(message=msg)
|
||||
info['rpo'] = int(specs.get('rpo', u'<is> 0')[5:])
|
||||
if info['rpo'] and info['rpo'] not in self._get_supported_rpo():
|
||||
msg = (_("Unsupported replication RPO %(rpo)s")
|
||||
% {'rpo': info['rpo']})
|
||||
LOG.error(msg)
|
||||
raise self._get_exception()(message=msg)
|
||||
LOG.debug('_get_replication_info: info %(info)s', {'info': info})
|
||||
|
||||
return info
|
||||
|
||||
@proxy._trace_time
|
||||
@ -491,26 +448,74 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
@proxy._trace_time
|
||||
def create_volume(self, volume):
|
||||
"""Creates a volume."""
|
||||
|
||||
# read replication information
|
||||
specs = self._get_extra_specs(volume.get('volume_type_id', None))
|
||||
replication_info = self._get_replication_info(specs)
|
||||
|
||||
if volume.group and replication_info['enabled']:
|
||||
# An unsupported illegal configuration
|
||||
msg = _("Unable to create volume: "
|
||||
"Replication of consistency group is not supported")
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
self._create_volume(volume)
|
||||
return self.handle_created_vol_properties(replication_info,
|
||||
volume)
|
||||
|
||||
def handle_created_vol_properties(self, replication_info, volume):
|
||||
volume_update = {}
|
||||
|
||||
LOG.debug('checking replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
volume_update['replication_status'] = 'disabled'
|
||||
cg = volume.group and utils.is_group_a_cg_snapshot_type(volume.group)
|
||||
if replication_info['enabled']:
|
||||
try:
|
||||
repl.VolumeReplication(self).create_replication(
|
||||
volume.name, replication_info)
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = ('Failed create_replication for '
|
||||
'volume %(vol)s: %(err)s',
|
||||
{'vol': volume['name'], 'err': details})
|
||||
LOG.error(msg)
|
||||
if cg:
|
||||
cg_name = self._cg_name_from_volume(volume)
|
||||
self._silent_delete_volume_from_cg(volume, cg_name)
|
||||
self._silent_delete_volume(volume=volume)
|
||||
raise
|
||||
volume_update['replication_status'] = 'enabled'
|
||||
|
||||
if cg:
|
||||
if volume.group.is_replicated:
|
||||
# for replicated Consistency Group:
|
||||
# The Volume must be mirrored, and its mirroring settings must
|
||||
# be identical to those of the Consistency Group:
|
||||
# mirroring type (e.g., synchronous),
|
||||
# mirroring status, mirroring target(backend)
|
||||
group_specs = group_types.get_group_type_specs(
|
||||
volume.group.group_type_id)
|
||||
group_rep_info = self._get_replication_info(group_specs)
|
||||
|
||||
msg = None
|
||||
if volume_update['replication_status'] != 'enabled':
|
||||
msg = ('Cannot add non-replicated volume into'
|
||||
' replicated group')
|
||||
elif replication_info['mode'] != group_rep_info['mode']:
|
||||
msg = ('Volume replication type and Group replication type'
|
||||
' should be the same')
|
||||
elif volume.host != volume.group.host:
|
||||
msg = 'Cannot add volume to Group on different host'
|
||||
else:
|
||||
group_name = self._cg_name_from_group(volume.group)
|
||||
me = mirrored_entities.MirroredEntities(
|
||||
self.ibm_storage_cli)
|
||||
me_objs = me.get_mirror_resources_by_name_map()
|
||||
vol_sync_state = me_objs['volumes'][volume.name].sync_state
|
||||
cg_sync_state = me_objs['cgs'][group_name].sync_state
|
||||
|
||||
if (vol_sync_state != 'Synchronized' or
|
||||
cg_sync_state != 'Synchronized'):
|
||||
msg = ('Cannot add volume to Group. Both volume and '
|
||||
'group should have sync_state = Synchronized')
|
||||
if msg:
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
try:
|
||||
cg_name = self._cg_name_from_volume(volume)
|
||||
self._call_xiv_xcli(
|
||||
@ -543,35 +548,234 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
LOG.debug('checking replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
volume_update['replication_status'] = 'disabled'
|
||||
if replication_info['enabled']:
|
||||
try:
|
||||
self._replication_create(volume, replication_info)
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = ('Failed _replication_create for '
|
||||
'volume %(vol)s: %(err)s',
|
||||
{'vol': volume['name'], 'err': details})
|
||||
LOG.error(msg)
|
||||
if cg:
|
||||
cg_name = self._cg_name_from_volume(volume)
|
||||
self._silent_delete_volume_from_cg(volume, cg_name)
|
||||
self._silent_delete_volume(volume=volume)
|
||||
raise
|
||||
volume_update['replication_status'] = 'enabled'
|
||||
|
||||
return volume_update
|
||||
|
||||
def get_group_specs_by_group_resource(self, context, group):
|
||||
group_type = group.get('group_type_id', None)
|
||||
if group_type is None:
|
||||
msg = ('No group specs inside group type.')
|
||||
return None, msg
|
||||
group_specs = group_types.get_group_type_specs(group_type)
|
||||
keyword = 'consistent_group_replication_enabled'
|
||||
if not group_specs.get(keyword) == '<is> True':
|
||||
msg = ('No cg replication field in group specs.')
|
||||
return None, msg
|
||||
return group_specs, ''
|
||||
|
||||
@proxy._trace_time
|
||||
def enable_replication(self, context, group, volumes):
|
||||
"""Enable cg replication"""
|
||||
# fetch replication info
|
||||
group_specs = group_types.get_group_type_specs(group.group_type_id)
|
||||
if not group_specs:
|
||||
msg = 'No group specs inside group type'
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
# Add this field to adjust it to generic replication (for volumes)
|
||||
replication_info = self._get_replication_info(group_specs)
|
||||
if utils.is_group_a_cg_snapshot_type(group):
|
||||
# take every vol out of cg - we can't mirror the cg otherwise.
|
||||
if volumes:
|
||||
self._update_consistencygroup(context, group,
|
||||
remove_volumes=volumes)
|
||||
for volume in volumes:
|
||||
repl.VolumeReplication(self).create_replication(
|
||||
volume.name, replication_info)
|
||||
|
||||
# mirror entire group
|
||||
group_name = self._cg_name_from_group(group)
|
||||
self._create_consistencygroup_on_remote(context, group_name)
|
||||
repl.GroupReplication(self).create_replication(group_name,
|
||||
replication_info)
|
||||
|
||||
updated_volumes = []
|
||||
if volumes:
|
||||
# add volumes back to cg
|
||||
self._update_consistencygroup(context, group,
|
||||
add_volumes=volumes)
|
||||
for volume in volumes:
|
||||
updated_volumes.append(
|
||||
{'id': volume['id'],
|
||||
'replication_status':
|
||||
fields.ReplicationStatus.ENABLED})
|
||||
return ({'replication_status': fields.ReplicationStatus.ENABLED},
|
||||
updated_volumes)
|
||||
else:
|
||||
# For generic groups we replicate all the volumes
|
||||
updated_volumes = []
|
||||
for volume in volumes:
|
||||
repl.VolumeReplication(self).create_replication(
|
||||
volume.name, replication_info)
|
||||
|
||||
# update status
|
||||
for volume in volumes:
|
||||
updated_volumes.append(
|
||||
{'id': volume['id'],
|
||||
'replication_status': fields.ReplicationStatus.ENABLED})
|
||||
return ({'replication_status': fields.ReplicationStatus.ENABLED},
|
||||
updated_volumes)
|
||||
|
||||
@proxy._trace_time
|
||||
def disable_replication(self, context, group, volumes):
|
||||
"""disables CG replication"""
|
||||
group_specs = group_types.get_group_type_specs(group.group_type_id)
|
||||
if not group_specs:
|
||||
msg = 'No group specs inside group type'
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
replication_info = self._get_replication_info(group_specs)
|
||||
updated_volumes = []
|
||||
if utils.is_group_a_cg_snapshot_type(group):
|
||||
# one call deletes replication for cgs and volumes together.
|
||||
repl.GroupReplication(self).delete_replication(group,
|
||||
replication_info)
|
||||
for volume in volumes:
|
||||
# xiv locks volumes after deletion of replication.
|
||||
# we need to unlock it for further use.
|
||||
try:
|
||||
self.ibm_storage_cli.cmd.vol_unlock(vol=volume.name)
|
||||
except errors.XCLIError as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = ('Failed to unlock volumes %(details)s' %
|
||||
{'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
updated_volumes.append(
|
||||
{'id': volume.id,
|
||||
'replication_status': fields.ReplicationStatus.DISABLED})
|
||||
else:
|
||||
# For generic groups we replicate all the volumes
|
||||
updated_volumes = []
|
||||
for volume in volumes:
|
||||
repl.VolumeReplication(self).delete_replication(
|
||||
volume.name, replication_info)
|
||||
|
||||
# update status
|
||||
for volume in volumes:
|
||||
updated_volumes.append(
|
||||
{'id': volume['id'],
|
||||
'replication_status': fields.ReplicationStatus.DISABLED})
|
||||
return ({'replication_status': fields.ReplicationStatus.DISABLED},
|
||||
updated_volumes)
|
||||
|
||||
def get_secondary_backend_id(self, secondary_backend_id):
|
||||
if secondary_backend_id is None:
|
||||
secondary_backend_id = self._get_target()
|
||||
if secondary_backend_id is None:
|
||||
msg = _("No targets defined. Can't perform failover.")
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
return secondary_backend_id
|
||||
|
||||
def check_for_splitbrain(self, volumes, pool_master, pool_slave):
|
||||
if volumes:
|
||||
# check for split brain situations
|
||||
# check for files that are available on both volumes
|
||||
# and are not in an active mirroring relation
|
||||
split_brain = self._potential_split_brain(
|
||||
self.ibm_storage_cli,
|
||||
self.ibm_storage_remote_cli,
|
||||
volumes, pool_master,
|
||||
pool_slave)
|
||||
if split_brain:
|
||||
# if such a situation exists stop and raise an exception!
|
||||
msg = (_("A potential split brain condition has been found "
|
||||
"with the following volumes: \n'%(volumes)s.'") %
|
||||
{'volumes': split_brain})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
def failover_replication(self, context, group, volumes,
|
||||
secondary_backend_id):
|
||||
"""Failover a cg with all it's volumes.
|
||||
|
||||
if secondery_id is default, cg needs to be failed back.
|
||||
|
||||
"""
|
||||
volumes_updated = []
|
||||
goal_status = ''
|
||||
pool_master = None
|
||||
group_updated = {'replication_status': group.replication_status}
|
||||
LOG.info("failover_replication: of cg %(cg)s "
|
||||
"from %(active)s to %(id)s",
|
||||
{'cg': group.get('name'),
|
||||
'active': self.active_backend_id,
|
||||
'id': secondary_backend_id})
|
||||
if secondary_backend_id == strings.PRIMARY_BACKEND_ID:
|
||||
# default as active backend id
|
||||
if self._using_default_backend():
|
||||
LOG.info("CG has been failed back. "
|
||||
"No need to fail back again.")
|
||||
return group_updated, volumes_updated
|
||||
# get the master pool, not using default id.
|
||||
pool_master = self._get_target_params(
|
||||
self.active_backend_id)['san_clustername']
|
||||
pool_slave = self.storage_info[storage.FLAG_KEYS['storage_pool']]
|
||||
goal_status = 'available'
|
||||
else:
|
||||
if self._using_default_backend():
|
||||
LOG.info("cg already failed over.")
|
||||
return group_updated, volumes_updated
|
||||
# using same api as Cheesecake, we need
|
||||
# replciation_device entry. so we use get_targets.
|
||||
secondary_backend_id = self.get_secondary_backend_id(
|
||||
secondary_backend_id)
|
||||
pool_master = self.storage_info[storage.FLAG_KEYS['storage_pool']]
|
||||
pool_slave = self._get_target_params(
|
||||
secondary_backend_id)['san_clustername']
|
||||
goal_status = fields.ReplicationStatus.FAILED_OVER
|
||||
# we should have secondary_backend_id by here.
|
||||
self.ibm_storage_remote_cli = self._init_xcli(secondary_backend_id)
|
||||
|
||||
# check for split brain in mirrored volumes
|
||||
self.check_for_splitbrain(volumes, pool_master, pool_slave)
|
||||
group_specs, msg = self.get_group_specs_by_group_resource(context,
|
||||
group)
|
||||
if group_specs is None:
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
failback = (secondary_backend_id == strings.PRIMARY_BACKEND_ID)
|
||||
|
||||
result, details = repl.GroupReplication.failover(group, failback)
|
||||
|
||||
if result:
|
||||
status = goal_status
|
||||
group_updated['replication_status'] = status
|
||||
else:
|
||||
status = 'error'
|
||||
updates = {'status': status}
|
||||
if status == 'error':
|
||||
group_updated['replication_extended_status'] = details
|
||||
# if replication on cg was successful, then all of the volumes
|
||||
# have been successfully replicated as well.
|
||||
for volume in volumes:
|
||||
volumes_updated.append({
|
||||
'volume_id': volume.id,
|
||||
'updates': updates
|
||||
})
|
||||
# replace between active and secondary xcli
|
||||
self._replace_xcli_to_remote_xcli()
|
||||
|
||||
return group_updated, volumes_updated
|
||||
|
||||
def _replace_xcli_to_remote_xcli(self):
|
||||
temp_ibm_storage_cli = self.ibm_storage_cli
|
||||
self.ibm_storage_cli = self.ibm_storage_remote_cli
|
||||
self.ibm_storage_remote_cli = temp_ibm_storage_cli
|
||||
|
||||
def _get_replication_target_params(self):
|
||||
LOG.debug('_get_replication_target_params.')
|
||||
targets = self._get_targets()
|
||||
if not targets:
|
||||
if not self.targets:
|
||||
msg = _("No targets available for replication")
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
no_of_targets = len(targets)
|
||||
no_of_targets = len(self.targets)
|
||||
if no_of_targets > 1:
|
||||
msg = _("Too many targets configured. Only one is supported")
|
||||
LOG.error(msg)
|
||||
@ -591,89 +795,6 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
return target, params
|
||||
|
||||
def _replication_create(self, volume, replication_info):
|
||||
LOG.debug('_replication_create replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
|
||||
target, params = self._get_replication_target_params()
|
||||
LOG.info('Target %(target)s: %(params)s',
|
||||
{'target': target, 'params': six.text_type(params)})
|
||||
|
||||
try:
|
||||
pool = params['san_clustername']
|
||||
except Exception:
|
||||
msg = (_("Missing pool information for target '%(target)s'"),
|
||||
{'target': target})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
|
||||
False, self.ibm_storage_cli)
|
||||
|
||||
self._replication_create_mirror(volume, replication_info,
|
||||
target, pool, volume_replication_mgr)
|
||||
|
||||
def _replication_create_mirror(self, volume, replication_info,
|
||||
target, pool, volume_replication_mgr):
|
||||
LOG.debug('_replication_create_mirror')
|
||||
schedule = None
|
||||
if replication_info['rpo']:
|
||||
schedule = self._get_schedule_from_rpo(replication_info['rpo'])
|
||||
if schedule:
|
||||
LOG.debug('schedule %(sched)s: for rpo %(rpo)s',
|
||||
{'sched': schedule, 'rpo': replication_info['rpo']})
|
||||
else:
|
||||
LOG.error('Failed to find schedule for rpo %(rpo)s',
|
||||
{'rpo': replication_info['rpo']})
|
||||
# will fail in the next step
|
||||
try:
|
||||
volume_replication_mgr.create_mirror(
|
||||
resource_name=volume['name'],
|
||||
target_name=target,
|
||||
mirror_type=replication_info['mode'],
|
||||
slave_resource_name=volume['name'],
|
||||
create_slave='yes',
|
||||
remote_pool=pool,
|
||||
rpo=replication_info['rpo'],
|
||||
schedule=schedule,
|
||||
activate_mirror='yes')
|
||||
# TBD - what exceptions will we get here?
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed replication for %(vol)s: '%(details)s'"),
|
||||
{'vol': volume['name'], 'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
def _replication_delete(self, volume, replication_info):
|
||||
LOG.debug('_replication_delete replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
targets = self._get_targets()
|
||||
if not targets:
|
||||
LOG.debug('No targets defined for replication')
|
||||
|
||||
volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
|
||||
False, self.ibm_storage_cli)
|
||||
try:
|
||||
volume_replication_mgr.deactivate_mirror(
|
||||
resource_id=volume['name'])
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed ending replication for %(vol)s: '%(details)s'"),
|
||||
{'vol': volume['name'], 'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
try:
|
||||
volume_replication_mgr.delete_mirror(
|
||||
resource_id=volume['name'])
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed deleting replica for %(vol)s: '%(details)s'"),
|
||||
{'vol': volume['name'], 'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(data=msg)
|
||||
|
||||
def _delete_volume(self, vol_name):
|
||||
"""Deletes a volume on the Storage."""
|
||||
LOG.debug("_delete_volume: %(volume)s",
|
||||
@ -727,7 +848,8 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
replication_info = self._get_replication_info(specs)
|
||||
if replication_info['enabled']:
|
||||
try:
|
||||
self._replication_delete(volume, replication_info)
|
||||
repl.VolumeReplication(self).delete_replication(
|
||||
volume.name, replication_info)
|
||||
except Exception as e:
|
||||
error = self._get_code_and_status_or_message(e)
|
||||
LOG.error(DELETE_VOLUME_BASE_ERROR,
|
||||
@ -1221,70 +1343,6 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
potential_split_brain.append(name)
|
||||
return potential_split_brain
|
||||
|
||||
def _failover_vol(self, volume, volume_replication_mgr,
|
||||
failover_volume_replication_mgr,
|
||||
replication_info, failback):
|
||||
"""Failover a single volume.
|
||||
|
||||
Attempts to failover a single volume
|
||||
Sequence:
|
||||
1. attempt to switch roles from master
|
||||
2. attempt to change role to master on slave
|
||||
|
||||
returns (success, failure_reason)
|
||||
"""
|
||||
LOG.debug("_failover_vol %(vol)s", {'vol': volume['name']})
|
||||
|
||||
# check if mirror is defined and active
|
||||
try:
|
||||
LOG.debug('Check if mirroring is active on %(vol)s.',
|
||||
{'vol': volume['name']})
|
||||
active = volume_replication_mgr.is_mirror_active(
|
||||
resource_id=volume['name'])
|
||||
except Exception:
|
||||
active = False
|
||||
state = 'active' if active else 'inactive'
|
||||
LOG.debug('Mirroring is %(state)s', {'state': state})
|
||||
|
||||
# In case of failback, mirroring must be active
|
||||
# In case of failover we attempt to move in any condition
|
||||
if failback and not active:
|
||||
msg = ("Volume %(vol)s: no active mirroring and can not "
|
||||
"failback",
|
||||
{'vol': volume['name']})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
|
||||
try:
|
||||
volume_replication_mgr.switch_roles(resource_id=volume['name'])
|
||||
return True, None
|
||||
except Exception as e:
|
||||
# failed attempt to switch_roles from the master
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
LOG.warning('Failed to perform switch_roles on'
|
||||
' %(vol)s: %(err)s. '
|
||||
'Continue to change_role',
|
||||
{'vol': volume['name'], 'err': details})
|
||||
|
||||
try:
|
||||
# this is the ugly stage we come to brute force
|
||||
LOG.warning('Attempt to change_role to master')
|
||||
failover_volume_replication_mgr.failover_by_id(
|
||||
resource_id=volume['name'])
|
||||
return True, None
|
||||
except m_errors.NoMirrorDefinedError as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = ("Volume %(vol)s no replication defined: %(err)s" %
|
||||
{'vol': volume['name'], 'err': details})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
except Exception as e:
|
||||
details = self._get_code_and_status_or_message(e)
|
||||
msg = ('Volume %(vol)s change_role failed: %(err)s' %
|
||||
{'vol': volume['name'], 'err': details})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
|
||||
@proxy._trace_time
|
||||
def failover_host(self, context, volumes, secondary_id, groups=None):
|
||||
"""Failover a full backend.
|
||||
@ -1316,14 +1374,7 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
LOG.info("Already failed over. No need to failover again.")
|
||||
return self.active_backend_id, volume_update_list, []
|
||||
# case: need to select a target
|
||||
if secondary_id is None:
|
||||
secondary_id = self._get_target()
|
||||
# still no targets..
|
||||
if secondary_id is None:
|
||||
msg = _("No targets defined. Can't perform failover")
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
secondary_id = self.get_secondary_backend_id(secondary_id)
|
||||
pool_master = self.storage_info[storage.FLAG_KEYS['storage_pool']]
|
||||
try:
|
||||
pool_slave = self._get_target_params(
|
||||
@ -1340,45 +1391,21 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
# calling _init_xcli with secondary_id
|
||||
self.ibm_storage_remote_cli = self._init_xcli(secondary_id)
|
||||
|
||||
# Create volume manager for both master and remote
|
||||
volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
|
||||
False, self.ibm_storage_cli)
|
||||
failover_volume_replication_mgr = (
|
||||
volume_recovery_manager.VolumeRecoveryManager(
|
||||
True, self.ibm_storage_remote_cli))
|
||||
|
||||
# get replication_info for all volumes at once
|
||||
if len(volumes):
|
||||
# check for split brain situations
|
||||
# check for files that are available on both volumes
|
||||
# and are not in an active mirroring relation
|
||||
split_brain = self._potential_split_brain(
|
||||
self.ibm_storage_cli,
|
||||
self.ibm_storage_remote_cli,
|
||||
volumes, pool_master,
|
||||
pool_slave)
|
||||
if len(split_brain):
|
||||
# if such a situation exists stop and raise an exception!
|
||||
msg = (_("A potential split brain condition has been found "
|
||||
"with the following volumes: \n'%(volumes)s.'"),
|
||||
{'volumes': split_brain})
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
specs = self._get_extra_specs(
|
||||
volumes[0].get('volume_type_id', None))
|
||||
replication_info = self._get_replication_info(specs)
|
||||
self.check_for_splitbrain(volumes, pool_master, pool_slave)
|
||||
|
||||
# loop over volumes and attempt failover
|
||||
for volume in volumes:
|
||||
LOG.debug("Attempting to failover '%(vol)s'",
|
||||
{'vol': volume['name']})
|
||||
result, details = self._failover_vol(
|
||||
volume,
|
||||
volume_replication_mgr,
|
||||
failover_volume_replication_mgr,
|
||||
replication_info,
|
||||
failback=(secondary_id == strings.PRIMARY_BACKEND_ID))
|
||||
|
||||
result, details = repl.VolumeReplication(self).failover(
|
||||
volume, failback=(secondary_id == strings.PRIMARY_BACKEND_ID))
|
||||
|
||||
if result:
|
||||
status = goal_status
|
||||
else:
|
||||
@ -1393,9 +1420,7 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
})
|
||||
|
||||
# set active xcli to secondary xcli
|
||||
temp_ibm_storage_cli = self.ibm_storage_cli
|
||||
self.ibm_storage_cli = self.ibm_storage_remote_cli
|
||||
self.ibm_storage_remote_cli = temp_ibm_storage_cli
|
||||
self._replace_xcli_to_remote_xcli()
|
||||
# set active backend id to secondary id
|
||||
self.active_backend_id = secondary_id
|
||||
|
||||
@ -1500,6 +1525,8 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
self.meta['stat']["driver_version"] = self.full_version
|
||||
self.meta['stat']["storage_protocol"] = connection_type
|
||||
self.meta['stat']['multiattach'] = False
|
||||
self.meta['stat']['group_replication_enabled'] = True
|
||||
self.meta['stat']['consistent_group_replication_enabled'] = True
|
||||
self.meta['stat']['QoS_support'] = (
|
||||
self._check_storage_version_for_qos_support())
|
||||
|
||||
@ -1538,15 +1565,14 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
self.meta['stat']['thin_provision'] = ('True' if soft_size > hard_size
|
||||
else 'False')
|
||||
|
||||
targets = self._get_targets()
|
||||
if targets:
|
||||
if self.targets:
|
||||
self.meta['stat']['replication_enabled'] = True
|
||||
# TBD - replication_type should be according to type
|
||||
self.meta['stat']['replication_type'] = [SYNC, ASYNC]
|
||||
self.meta['stat']['rpo'] = self._get_supported_rpo()
|
||||
self.meta['stat']['replication_count'] = len(targets)
|
||||
self.meta['stat']['rpo'] = repl.Replication.get_supported_rpo()
|
||||
self.meta['stat']['replication_count'] = len(self.targets)
|
||||
self.meta['stat']['replication_targets'] = [target for target in
|
||||
six.iterkeys(targets)]
|
||||
six.iterkeys(
|
||||
self.targets)]
|
||||
|
||||
self.meta['stat']['timestamp'] = datetime.datetime.utcnow()
|
||||
|
||||
@ -1679,18 +1705,6 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
def create_group(self, context, group):
|
||||
"""Creates a group."""
|
||||
|
||||
for volume_type in group.volume_types:
|
||||
replication_info = self._get_replication_info(
|
||||
volume_type.extra_specs)
|
||||
|
||||
if replication_info.get('enabled'):
|
||||
# An unsupported illegal configuration
|
||||
msg = _("Unable to create group: create group with "
|
||||
"replication volume type is not supported")
|
||||
LOG.error(msg)
|
||||
raise self.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
if utils.is_group_a_cg_snapshot_type(group):
|
||||
cgname = self._cg_name_from_group(group)
|
||||
return self._create_consistencygroup(context, cgname)
|
||||
@ -1726,6 +1740,35 @@ class XIVProxy(proxy.IBMStorageProxy):
|
||||
model_update = {'status': fields.GroupStatus.AVAILABLE}
|
||||
return model_update
|
||||
|
||||
def _create_consistencygroup_on_remote(self, context, cgname):
|
||||
"""Creates a consistency group on secondary machine.
|
||||
|
||||
Return group available even if it already exists (for replication)
|
||||
"""
|
||||
|
||||
LOG.info("Creating consistency group %(name)s on secondary.",
|
||||
{'name': cgname})
|
||||
|
||||
# call remote XCLI
|
||||
try:
|
||||
self._call_remote_xiv_xcli(
|
||||
"cg_create", cg=cgname,
|
||||
pool=self.storage_info[
|
||||
storage.FLAG_KEYS['storage_pool']]).as_list
|
||||
except errors.CgNameExistsError:
|
||||
model_update = {'status': fields.GroupStatus.AVAILABLE}
|
||||
except errors.CgLimitReachedError:
|
||||
error = _("Maximum number of consistency groups reached")
|
||||
LOG.error(error)
|
||||
raise self._get_exception()(error)
|
||||
except errors.XCLIError as e:
|
||||
error = (_("Fatal error in cg_create on remote: %(details)s") %
|
||||
{'details': self._get_code_and_status_or_message(e)})
|
||||
LOG.error(error)
|
||||
raise self._get_exception()(error)
|
||||
model_update = {'status': fields.GroupStatus.AVAILABLE}
|
||||
return model_update
|
||||
|
||||
def _silent_cleanup_consistencygroup_from_src(self, context, group,
|
||||
volumes, cgname):
|
||||
"""Silent cleanup of volumes from CG.
|
||||
|
342
cinder/volume/drivers/ibm/ibm_storage/xiv_replication.py
Normal file
342
cinder/volume/drivers/ibm/ibm_storage/xiv_replication.py
Normal file
@ -0,0 +1,342 @@
|
||||
# Copyright (c) 2017 IBM Corporation
|
||||
# All Rights Reserved.
|
||||
#
|
||||
# Licensed under the Apache License, Version 2.0 (the "License"); you may
|
||||
# not use this file except in compliance with the License. You may obtain
|
||||
# a copy of the License at
|
||||
#
|
||||
# http://www.apache.org/licenses/LICENSE-2.0
|
||||
#
|
||||
# Unless required by applicable law or agreed to in writing, software
|
||||
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
||||
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
||||
# License for the specific language governing permissions and limitations
|
||||
# under the License.
|
||||
#
|
||||
import six
|
||||
|
||||
from oslo_log import log as logging
|
||||
from oslo_utils import importutils
|
||||
|
||||
pyxcli = importutils.try_import("pyxcli")
|
||||
if pyxcli:
|
||||
from pyxcli import errors
|
||||
from pyxcli.mirroring import cg_recovery_manager
|
||||
from pyxcli.mirroring import errors as m_errors
|
||||
from pyxcli.mirroring import volume_recovery_manager
|
||||
|
||||
from cinder.i18n import _
|
||||
from cinder.volume.drivers.ibm.ibm_storage import strings
|
||||
|
||||
SYNC = 'sync'
|
||||
ASYNC = 'async'
|
||||
|
||||
LOG = logging.getLogger(__name__)
|
||||
|
||||
|
||||
class Rate(object):
|
||||
|
||||
def __init__(self, rpo, schedule):
|
||||
self.rpo = rpo
|
||||
self.schedule = schedule
|
||||
self.schedule_name = self._schedule_name_from_schedule(self.schedule)
|
||||
|
||||
def _schedule_name_from_schedule(self, schedule):
|
||||
if schedule == '00:00:20':
|
||||
return 'min_interval'
|
||||
return ("cinder_%(sched)s" %
|
||||
{'sched': schedule.replace(':', '_')})
|
||||
|
||||
|
||||
class Replication(object):
|
||||
|
||||
async_rates = (
|
||||
Rate(rpo=120, schedule='00:01:00'),
|
||||
Rate(rpo=300, schedule='00:02:00'),
|
||||
Rate(rpo=600, schedule='00:05:00'),
|
||||
Rate(rpo=1200, schedule='00:10:00'),
|
||||
)
|
||||
|
||||
def __init__(self, proxy):
|
||||
self.proxy = proxy
|
||||
|
||||
@staticmethod
|
||||
def get_schedule_from_rpo(rpo):
|
||||
schedule = [rate for rate in Replication.async_rates
|
||||
if rate.rpo == rpo][0].schedule_name
|
||||
if schedule:
|
||||
LOG.debug('schedule %(sched)s: for rpo %(rpo)s',
|
||||
{'sched': schedule, 'rpo': rpo})
|
||||
else:
|
||||
LOG.error('Failed to find schedule for rpo %(rpo)s',
|
||||
{'rpo': rpo})
|
||||
return schedule
|
||||
|
||||
@staticmethod
|
||||
def get_supported_rpo():
|
||||
return [rate.rpo for rate in Replication.async_rates]
|
||||
|
||||
def get_recovery_mgr(self):
|
||||
# Recovery manager is set in derived classes
|
||||
raise NotImplementedError
|
||||
|
||||
def get_remote_recovery_mgr(self):
|
||||
# Recovery manager is set in derived classes
|
||||
raise NotImplementedError
|
||||
|
||||
def replication_create_mirror(self, resource, replication_info,
|
||||
target, pool):
|
||||
raise NotImplementedError
|
||||
|
||||
@staticmethod
|
||||
def extract_replication_info_from_specs(specs):
|
||||
info = {'enabled': False, 'mode': None, 'rpo': 0}
|
||||
msg = ""
|
||||
if specs:
|
||||
LOG.debug('extract_replication_info_from_specs: specs %(specs)s',
|
||||
{'specs': specs})
|
||||
|
||||
info['enabled'] = (
|
||||
specs.get('replication_enabled', '').upper() in
|
||||
(u'TRUE', strings.METADATA_IS_TRUE) or
|
||||
specs.get('group_replication_enabled', '').upper() in
|
||||
(u'TRUE', strings.METADATA_IS_TRUE))
|
||||
|
||||
replication_type = specs.get('replication_type', SYNC).lower()
|
||||
if replication_type in (u'sync', u'<is> sync'):
|
||||
info['mode'] = SYNC
|
||||
elif replication_type in (u'async', u'<is> async'):
|
||||
info['mode'] = ASYNC
|
||||
else:
|
||||
msg = (_("Unsupported replication mode %(mode)s")
|
||||
% {'mode': replication_type})
|
||||
return None, msg
|
||||
info['rpo'] = int(specs.get('rpo', u'<is> 0')[5:])
|
||||
supported_rpos = Replication.get_supported_rpo()
|
||||
if info['rpo'] and info['rpo'] not in supported_rpos:
|
||||
msg = (_("Unsupported replication RPO %(rpo)s"),
|
||||
{'rpo': info['rpo']})
|
||||
return None, msg
|
||||
|
||||
LOG.debug('extract_replication_info_from_specs: info %(info)s',
|
||||
{'info': info})
|
||||
return info, msg
|
||||
|
||||
def failover(self, resource, failback):
|
||||
raise NotImplementedError
|
||||
|
||||
def create_replication(self, resource_name, replication_info):
|
||||
LOG.debug('Replication::create_replication replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
|
||||
target, params = self.proxy._get_replication_target_params()
|
||||
LOG.info('Target %(target)s: %(params)s',
|
||||
{'target': target, 'params': six.text_type(params)})
|
||||
|
||||
try:
|
||||
pool = params['san_clustername']
|
||||
except Exception:
|
||||
msg = (_("Missing pool information for target '%(target)s'") %
|
||||
{'target': target})
|
||||
LOG.error(msg)
|
||||
raise self.proxy.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
self.replication_create_mirror(resource_name, replication_info,
|
||||
target, pool)
|
||||
|
||||
def delete_replication(self, resource_name, replication_info):
|
||||
LOG.debug('Replication::delete_replication replication_info %(rep)s',
|
||||
{'rep': replication_info})
|
||||
|
||||
recovery_mgr = self.get_recovery_mgr()
|
||||
|
||||
try:
|
||||
recovery_mgr.deactivate_mirror(resource_id=resource_name)
|
||||
except Exception as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed ending replication for %(resource)s: "
|
||||
"'%(details)s'") % {'resource': resource_name,
|
||||
'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.proxy.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
try:
|
||||
recovery_mgr.delete_mirror(resource_id=resource_name)
|
||||
except Exception as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed deleting replica for %(resource)s: "
|
||||
"'%(details)s'") % {'resource': resource_name,
|
||||
'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.proxy.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
def _failover_resource(self, resource, recovery_mgr, failover_rep_mgr,
|
||||
rep_type, failback):
|
||||
# check if mirror is defined and active
|
||||
LOG.debug('Check if mirroring is active on %(res)s',
|
||||
{'res': resource['name']})
|
||||
try:
|
||||
active = recovery_mgr.is_mirror_active(
|
||||
resource_id=resource['name'])
|
||||
except Exception:
|
||||
active = False
|
||||
state = 'active' if active else 'inactive'
|
||||
LOG.debug('Mirroring is %(state)s', {'state': state})
|
||||
|
||||
# In case of failback, mirroring must be active
|
||||
# In case of failover we attempt to move in any condition
|
||||
if failback and not active:
|
||||
msg = ("%(rep_type)s %(res)s: no active mirroring and can not "
|
||||
"failback" % {'rep_type': rep_type,
|
||||
'res': resource['name']})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
|
||||
try:
|
||||
recovery_mgr.switch_roles(resource_id=resource['name'])
|
||||
return True, None
|
||||
except Exception as e:
|
||||
# failed attempt to switch_roles from the master
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
LOG.warning('Failed to perform switch_roles on'
|
||||
' %(res)s: %(err)s. '
|
||||
'Continue to change_role',
|
||||
{'res': resource['name'], 'err': details})
|
||||
try:
|
||||
# this is the ugly stage we come to brute force
|
||||
if failback:
|
||||
role = 'Slave'
|
||||
else:
|
||||
role = 'Master'
|
||||
LOG.warning('Attempt to change_role to %(role)s', {'role': role})
|
||||
failover_rep_mgr.change_role(resource_id=resource['name'],
|
||||
new_role=role)
|
||||
return True, None
|
||||
except m_errors.NoMirrorDefinedError as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = ("%(rep_type)s %(res)s no replication defined: %(err)s" %
|
||||
{'rep_type': rep_type, 'res': resource['name'],
|
||||
'err': details})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
except Exception as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = ('%(rep_type)s %(res)s change_role failed: %(err)s' %
|
||||
{'rep_type': rep_type, 'res': resource['name'],
|
||||
'err': details})
|
||||
LOG.error(msg)
|
||||
return False, msg
|
||||
|
||||
|
||||
class VolumeReplication(Replication):
|
||||
|
||||
def __init__(self, proxy):
|
||||
super(VolumeReplication, self).__init__(proxy)
|
||||
|
||||
def get_recovery_mgr(self):
|
||||
return volume_recovery_manager.VolumeRecoveryManager(
|
||||
False, self.proxy.ibm_storage_cli)
|
||||
|
||||
def get_remote_recovery_mgr(self):
|
||||
return volume_recovery_manager.VolumeRecoveryManager(
|
||||
True, self.proxy.ibm_storage_remote_cli)
|
||||
|
||||
def replication_create_mirror(self, resource_name, replication_info,
|
||||
target, pool):
|
||||
LOG.debug('VolumeReplication::replication_create_mirror')
|
||||
|
||||
schedule = None
|
||||
if replication_info['rpo']:
|
||||
schedule = Replication.get_schedule_from_rpo(
|
||||
replication_info['rpo'])
|
||||
try:
|
||||
recovery_mgr = self.get_recovery_mgr()
|
||||
recovery_mgr.create_mirror(
|
||||
resource_name=resource_name,
|
||||
target_name=target,
|
||||
mirror_type=replication_info['mode'],
|
||||
slave_resource_name=resource_name,
|
||||
create_slave='yes',
|
||||
remote_pool=pool,
|
||||
rpo=replication_info['rpo'],
|
||||
schedule=schedule,
|
||||
activate_mirror='yes')
|
||||
except errors.VolumeMasterError:
|
||||
LOG.debug('Volume %(vol)s has been already mirrored',
|
||||
{'vol': resource_name})
|
||||
except Exception as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed replication for %(resource)s: '%(details)s'") %
|
||||
{'resource': resource_name, 'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.proxy.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
def failover(self, resource, failback):
|
||||
"""Failover a single volume.
|
||||
|
||||
Attempts to failover a single volume
|
||||
Sequence:
|
||||
1. attempt to switch roles from master
|
||||
2. attempt to change role to master on secondary
|
||||
|
||||
returns (success, failure_reason)
|
||||
"""
|
||||
LOG.debug("VolumeReplication::failover %(vol)s",
|
||||
{'vol': resource['name']})
|
||||
|
||||
recovery_mgr = self.get_recovery_mgr()
|
||||
remote_recovery_mgr = self.get_remote_recovery_mgr()
|
||||
return self._failover_resource(resource, recovery_mgr,
|
||||
remote_recovery_mgr, 'vol', failback)
|
||||
|
||||
|
||||
class GroupReplication(Replication):
|
||||
|
||||
def __init__(self, proxy):
|
||||
super(GroupReplication, self).__init__(proxy)
|
||||
|
||||
def get_recovery_mgr(self):
|
||||
return cg_recovery_manager.CGRecoveryManager(
|
||||
False, self.proxy.ibm_storage_cli)
|
||||
|
||||
def get_remote_recovery_mgr(self):
|
||||
return volume_recovery_manager.CGRecoveryManager(
|
||||
True, self.proxy.ibm_storage_remote_cli)
|
||||
|
||||
def replication_create_mirror(self, resource_name, replication_info,
|
||||
target, pool):
|
||||
LOG.debug('GroupReplication::replication_create_mirror')
|
||||
schedule = None
|
||||
if replication_info['rpo']:
|
||||
schedule = Replication.get_schedule_from_rpo(
|
||||
replication_info['rpo'])
|
||||
try:
|
||||
recovery_mgr = self.get_recovery_mgr()
|
||||
recovery_mgr.create_mirror(
|
||||
resource_name=resource_name,
|
||||
target_name=target,
|
||||
mirror_type=replication_info['mode'],
|
||||
slave_resource_name=resource_name,
|
||||
rpo=replication_info['rpo'],
|
||||
schedule=schedule,
|
||||
activate_mirror='yes')
|
||||
except Exception as e:
|
||||
details = self.proxy._get_code_and_status_or_message(e)
|
||||
msg = (_("Failed replication for %(resource)s: '%(details)s'"),
|
||||
{'resource': resource_name, 'details': details})
|
||||
LOG.error(msg)
|
||||
raise self.proxy.meta['exception'].VolumeBackendAPIException(
|
||||
data=msg)
|
||||
|
||||
def failover(self, resource, failback):
|
||||
LOG.debug("GroupReplication::failover %(cg)s",
|
||||
{'cg': resource['name']})
|
||||
|
||||
recovery_mgr = self.get_recovery_mgr()
|
||||
remote_recovery_mgr = self.get_remote_recovery_mgr()
|
||||
|
||||
return self._failover_resource(resource, recovery_mgr,
|
||||
remote_recovery_mgr, 'cg', failback)
|
@ -0,0 +1,4 @@
|
||||
---
|
||||
features:
|
||||
- |
|
||||
Add consistency group replication support in XIV\A9000 Cinder driver.
|
Loading…
x
Reference in New Issue
Block a user