XIV/A9000: Add group replication support

This patch adds group replication capabilities to the IBM
XIV/A9000 (A-line) storage driver.

It implements:
* Enable replication on a group
* Disable replication on a group
* Fail over replication
* Get replication error status

Implements: blueprint replication-cg-ibm-storage
Change-Id: Ic59c568502258096e24ca5ab81dc5b8cd1779995
Depends-On: Ia4af4dd011d569a3ac84387b37dcf2606da48fba
Tzur Eliyahu 2017-05-28 18:54:37 +03:00 committed by Isaac Beckman
parent 695c1f9272
commit bb9a4e1a90
6 changed files with 869 additions and 314 deletions
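
For reference, the feature is driven through group types. Below is a rough
sketch of how an operator might exercise it from the cinder CLI; the type and
group names are illustrative, and the group-replication subcommands assume a
python-cinderclient new enough to expose them:

    $ cinder group-type-create xiv_rep_group_type
    $ cinder group-type-key xiv_rep_group_type set \
          consistent_group_replication_enabled='<is> True'
    $ cinder group-create xiv_rep_group_type <volume_type> --name xiv_rep_group
    $ cinder group-enable-replication xiv_rep_group
    $ cinder group-failover-replication xiv_rep_group
    $ cinder group-disable-replication xiv_rep_group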

File: cinder/tests/unit/volume/drivers/ibm/fake_pyxcli.py

@@ -25,6 +25,7 @@ pyxcli_client.errors = fake_pyxcli_exceptions
 pyxcli_client.events = mock.Mock()
 pyxcli_client.mirroring = mock.Mock()
 pyxcli_client.transports = fake_pyxcli_exceptions
+pyxcli_client.mirroring.cg_recovery_manager = mock.Mock()
 sys.modules['pyxcli'] = pyxcli_client
 sys.modules['pyxcli.events'] = pyxcli_client.events

File: cinder/tests/unit/volume/drivers/ibm/test_xiv_proxy.py

@@ -20,6 +20,7 @@ from xml.etree import ElementTree
 from cinder import context
 from cinder import exception
 from cinder import objects
+from cinder.objects import fields
 from cinder import test
 from cinder.tests.unit import fake_constants as fake
 from cinder.tests.unit import utils as testutils
@@ -27,9 +28,11 @@ from cinder.tests.unit.volume.drivers.ibm import fake_pyxcli
 import cinder.volume.drivers.ibm.ibm_storage as storage
 from cinder.volume.drivers.ibm.ibm_storage import cryptish
 from cinder.volume.drivers.ibm.ibm_storage.xiv_proxy import XIVProxy
+from cinder.volume.drivers.ibm.ibm_storage import xiv_replication
 from cinder.volume import group_types

 errors = fake_pyxcli.pyxcli_client.errors
+mirroring = fake_pyxcli.pyxcli_client.mirroring
 test_mock = mock.MagicMock()
 module_patcher = mock.MagicMock()
@@ -45,6 +48,11 @@ TEST_VOLUME = {
     'group_id': fake.CONSISTENCY_GROUP_ID,
 }

+TEST_GROUP_SPECS = {
+    'group_replication_enabled': '<is> True',
+    'replication_type': 'sync',
+}
+
 TEST_EXTRA_SPECS = {
     'replication_enabled': '<is> False',
 }
@@ -356,7 +364,174 @@ class XIVProxyTest(test.TestCase):
         ex = getattr(p, "_get_exception")()
         self.assertRaises(ex, p.create_volume, volume)

-    @mock.patch("cinder.volume.utils.group_get_by_id", mock.MagicMock())
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_replication.VolumeReplication.create_replication",
+                mock.MagicMock())
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_replication.GroupReplication.create_replication",
+                mock.MagicMock())
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy.get_group_specs_by_group_resource",
+                mock.MagicMock(return_value=(TEST_GROUP_SPECS, '')))
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._get_target_params",
+                mock.MagicMock(return_value=REPLICA_PARAMS))
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._get_target",
+                mock.MagicMock(return_value="BLABLA"))
+    def test_enable_replication(self):
+        """Test enable_replication"""
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        p.ibm_storage_cli = mock.MagicMock()
+        p._call_remote_xiv_xcli = mock.MagicMock()
+        p._update_consistencygroup = mock.MagicMock()
+        p.targets = {'tgt1': 'info1'}
+
+        group = self._create_test_group('WTF')
+        vol = testutils.create_volume(self.ctxt)
+        ret = p.enable_replication(self.ctxt, group, [vol])
+        self.assertEqual((
+            {'replication_status': fields.ReplicationStatus.ENABLED},
+            [{'id': vol['id'],
+              'replication_status': fields.ReplicationStatus.ENABLED}]), ret)
+
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_replication.VolumeReplication.delete_replication",
+                mock.MagicMock())
+    @mock.patch("cinder.volume.group_types.get_group_type_specs",
+                mock.MagicMock(return_value=TEST_GROUP_SPECS))
+    def test_disable_replication(self):
+        """Test disable_replication"""
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        p.ibm_storage_cli = mock.MagicMock()
+        p._call_remote_xiv_xcli = mock.MagicMock()
+        p._update_consistencygroup = mock.MagicMock()
+
+        group = self._create_test_group('WTF')
+        ret = p.disable_replication(self.ctxt, group, [])
+        self.assertEqual((
+            {'replication_status': fields.ReplicationStatus.DISABLED}, []),
+            ret)
+
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._using_default_backend",
+                mock.MagicMock(return_value=False))
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._get_target_params",
+                mock.MagicMock(return_value={'san_clustername': "master"}))
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._init_xcli",
+                mock.MagicMock())
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy._init_xcli",
+                mock.MagicMock())
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_proxy.XIVProxy.get_group_specs_by_group_resource",
+                mock.MagicMock(return_value=(TEST_GROUP_SPECS, '')))
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
+                "xiv_replication.GroupReplication.failover",
+                mock.MagicMock(return_value=(True, 'good')))
+    def test_failover_replication_with_default(self):
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        group = self._create_test_group('WTF')
+        group.replication_status = fields.ReplicationStatus.FAILED_OVER
+        vol = testutils.create_volume(self.ctxt)
+        group_update, vol_update = p.failover_replication(self.ctxt, group,
+                                                          [vol], 'default')
+        updates = {'status': 'available'}
+        self.assertEqual(({'replication_status': 'available'},
+                          [{'volume_id': vol['id'],
+                            'updates': updates}]), (group_update, vol_update))
+
+    def test_failover_resource_no_mirror(self):
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        recovery_mgr = mock.MagicMock()
+        recovery_mgr.is_mirror_active = mock.MagicMock()
+        recovery_mgr.is_mirror_active.return_value = False
+        group = self._create_test_group('WTF')
+        ret = xiv_replication.Replication(p)._failover_resource(
+            group, recovery_mgr, mock.MagicMock, 'cg', True)
+        msg = ("%(rep_type)s %(res)s: no active mirroring and can not "
+               "failback" % {'rep_type': 'cg',
+                             'res': group['name']})
+        self.assertEqual((False, msg), ret)
+
+    def test_failover_resource_mirror(self):
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        recovery_mgr = mock.MagicMock()
+        recovery_mgr.is_mirror_active = mock.MagicMock()
+        recovery_mgr.is_mirror_active.return_value = True
+        group = self._create_test_group('WTF')
+        ret = xiv_replication.Replication(p)._failover_resource(
+            group, recovery_mgr, mock.MagicMock, 'cg', True)
+        self.assertEqual((True, None), ret)
+
+    def test_failover_resource_change_role(self):
+        driver = mock.MagicMock()
+        driver.VERSION = "VERSION"
+        p = self.proxy(
+            self.default_storage_info,
+            mock.MagicMock(),
+            test_mock.cinder.exception,
+            driver)
+        recovery_mgr = mock.MagicMock()
+        recovery_mgr.is_mirror_active = mock.MagicMock()
+        recovery_mgr.is_mirror_active.return_value = True
+        recovery_mgr.switch_roles.side_effect = (
+            errors.XCLIError(''))
+        failover_rep_mgr = mock.MagicMock()
+        failover_rep_mgr.change_role = mock.MagicMock()
+        group = self._create_test_group('WTF')
+        xiv_replication.Replication(p)._failover_resource(
+            group, recovery_mgr, failover_rep_mgr, 'cg', True)
+        failover_rep_mgr.change_role.assert_called_once_with(
+            resource_id=group['name'],
+            new_role='Slave')
+
     @mock.patch("cinder.volume.utils.is_group_a_cg_snapshot_type",
                 mock.MagicMock(return_value=True))
     def test_create_volume_with_consistency_group(self):
@@ -376,8 +551,8 @@ class XIVProxyTest(test.TestCase):
         vol_type = testutils.create_volume_type(self.ctxt, name='WTF')
         volume = testutils.create_volume(
             self.ctxt, size=16, volume_type_id=vol_type.id)
-        grp = testutils.create_group(self.ctxt, name='bla', group_type_id='1',
-                                     volume_type_ids=[vol_type.id])
+        grp = self._create_test_group('WTF')
         volume.group = grp
         p.create_volume(volume)
@@ -390,7 +565,7 @@ class XIVProxyTest(test.TestCase):
             cg='cg')

     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
-                "xiv_proxy.XIVProxy._replication_create",
+                "xiv_replication.VolumeReplication.create_replication",
                 mock.MagicMock())
     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
                 "xiv_proxy.XIVProxy._get_qos_specs",
@@ -417,7 +592,7 @@ class XIVProxyTest(test.TestCase):
         p.create_volume(volume)

     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
-                "xiv_proxy.XIVProxy._replication_create",
+                "xiv_replication.VolumeReplication.create_replication",
                 mock.MagicMock())
     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
                 "xiv_proxy.XIVProxy._get_qos_specs",
@@ -446,10 +621,6 @@ class XIVProxyTest(test.TestCase):
         ex = getattr(p, "_get_exception")()
         self.assertRaises(ex, p.create_volume, volume)

-    @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
-                "xiv_proxy.XIVProxy._get_targets",
-                mock.MagicMock(
-                    return_value={'tgt1': 'info1', 'tgt2': 'info2'}))
     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
                 "xiv_proxy.XIVProxy._get_qos_specs",
                 mock.MagicMock(return_value=None))
@@ -495,7 +666,7 @@ class XIVProxyTest(test.TestCase):
         p.ibm_storage_cli.cmd.vol_delete.assert_called_once_with(vol='WTF32')

     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
-                "xiv_proxy.XIVProxy._replication_delete",
+                "xiv_replication.VolumeReplication.delete_replication",
                 mock.MagicMock())
     @mock.patch("cinder.volume.drivers.ibm.ibm_storage."
                 "xiv_proxy.XIVProxy._get_extra_specs",
@@ -1406,7 +1577,9 @@ class XIVProxyTest(test.TestCase):
         ex = getattr(p, "_get_exception")()
         self.assertRaises(ex, p.create_group, {}, self._create_test_group())

-    def test_create_consistencygroup_with_replication(self):
+    @mock.patch("cinder.volume.drivers.ibm.ibm_storage.xiv_proxy."
+                "client.XCLIClient")
+    def test_create_consistencygroup_with_replication(self, mock_xcli):
         """test create_consistenygroup when replication is set"""

         p = self.proxy(
@@ -1426,8 +1599,8 @@ class XIVProxyTest(test.TestCase):
         group_obj.volume_types = objects.VolumeTypeList(context=self.ctxt,
                                                         objects=[vol_type])

-        ex = getattr(p, "_get_exception")()
-        self.assertRaises(ex, p.create_group, {}, group_obj)
+        model_update = p.create_group({}, group_obj)
+        self.assertEqual('available', model_update['status'])

     def test_create_consistencygroup_from_src_cgsnapshot(self):
         """test a successful cg create from cgsnapshot"""
@@ -2113,7 +2286,7 @@ class XIVProxyTest(test.TestCase):
             test_mock.cinder.exception,
             driver)

-        p._replication_create = test_mock.MagicMock(return_value=None)
+        xiv_replication.VolumeReplication = mock.MagicMock()
         grp = testutils.create_group(self.ctxt, name='bla', group_type_id='1')
         volume = testutils.create_volume(self.ctxt, display_name='bla')
         volume.group = grp

File: cinder/volume/drivers/ibm/ibm_storage/proxy.py

@@ -365,14 +365,6 @@ class IBMStorageProxy(object):
         except Exception:
             return None

-    def _get_targets(self):
-        return self.targets
-
-    def _is_replication_supported(self):
-        if self.targets:
-            return True
-        return False
-
     @_trace_time
     def _read_replication_devices(self):
         """Read replication devices from configuration

File: cinder/volume/drivers/ibm/ibm_storage/xiv_proxy.py

@@ -27,8 +27,7 @@ if pyxcli:
     from pyxcli import client
     from pyxcli import errors
     from pyxcli.events import events
-    from pyxcli.mirroring import errors as m_errors
-    from pyxcli.mirroring import volume_recovery_manager
+    from pyxcli.mirroring import mirrored_entities
     from pyxcli import transports

 from cinder import context
@@ -40,6 +39,8 @@ from cinder.volume.drivers.ibm.ibm_storage import certificate
 from cinder.volume.drivers.ibm.ibm_storage import cryptish
 from cinder.volume.drivers.ibm.ibm_storage import proxy
 from cinder.volume.drivers.ibm.ibm_storage import strings
+from cinder.volume.drivers.ibm.ibm_storage import xiv_replication as repl
+from cinder.volume import group_types
 from cinder.volume import qos_specs
 from cinder.volume import utils
 from cinder.volume import volume_types
@@ -95,38 +96,19 @@ MANAGE_VOLUME_BASE_ERROR = _("Unable to manage the volume '%(volume)s': "
                              "%(error)s.")


-class Rate(object):
-
-    def __init__(self, rpo, schedule):
-        self.rpo = rpo
-        self.schedule = schedule
-        self.schedule_name = self._schedule_name_from_schedule(self.schedule)
-
-    def _schedule_name_from_schedule(self, schedule):
-        if schedule == '00:00:20':
-            return 'min_interval'
-        return ("cinder_%(sched)s" %
-                {'sched': schedule.replace(':', '_')})
-
-
 class XIVProxy(proxy.IBMStorageProxy):
     """Proxy between the Cinder Volume and Spectrum Accelerate Storage.

     Supports IBM XIV, Spectrum Accelerate, A9000, A9000R
     Version: 2.1.0
-    Required pyxcli version: 1.1.2
+    Required pyxcli version: 1.1.4

     2.0 - First open source driver version
     2.1.0 - Support Consistency groups through Generic volume groups
           - Support XIV/A9000 Volume independent QoS
+          - Support groups replication
     """
-    async_rates = (
-        Rate(rpo=120, schedule='00:01:00'),
-        Rate(rpo=300, schedule='00:02:00'),
-        Rate(rpo=600, schedule='00:05:00'),
-        Rate(rpo=1200, schedule='00:10:00'),
-    )

     def __init__(self, storage_info, logger, exception,
                  driver=None, active_backend_id=None):
@@ -192,13 +174,6 @@ class XIVProxy(proxy.IBMStorageProxy):
         LOG.info("Connection to the IBM storage "
                  "system established successfully.")

-    def _get_schedule_from_rpo(self, rpo):
-        return [rate for rate in self.async_rates
-                if rate.rpo == rpo][0].schedule_name
-
-    def _get_supported_rpo(self):
-        return [rate.rpo for rate in self.async_rates]
-
     @proxy._trace_time
     def _update_active_schedule_objects(self):
         """Set schedule objects on active backend.
@@ -207,7 +182,7 @@ class XIVProxy(proxy.IBMStorageProxy):
         min_interval.
         """
         schedules = self._call_xiv_xcli("schedule_list").as_dict('name')
-        for rate in self.async_rates:
+        for rate in repl.Replication.async_rates:
             if rate.schedule == '00:00:20':
                 continue
             name = rate.schedule_name
@@ -245,7 +220,7 @@ class XIVProxy(proxy.IBMStorageProxy):
         min_interval.
         """
         schedules = self._call_remote_xiv_xcli("schedule_list").as_dict('name')
-        for rate in self.async_rates:
+        for rate in repl.Replication.async_rates:
             if rate.schedule == '00:00:20':
                 continue
             name = rate.schedule_name
@@ -438,30 +413,12 @@ class XIVProxy(proxy.IBMStorageProxy):
         return self._get_qos_specs(type_id)

     def _get_replication_info(self, specs):
-        info = {'enabled': False, 'mode': None, 'rpo': 0}
-        if specs:
-            LOG.debug('_get_replication_info: specs %(specs)s',
-                      {'specs': specs})
-            info['enabled'] = (
-                specs.get('replication_enabled', '').upper() in
-                (u'TRUE', strings.METADATA_IS_TRUE))
-            replication_type = specs.get('replication_type', SYNC).lower()
-            if replication_type in (u'sync', u'<is> sync'):
-                info['mode'] = SYNC
-            elif replication_type in (u'async', u'<is> async'):
-                info['mode'] = ASYNC
-            else:
-                msg = (_("Unsupported replication mode %(mode)s")
-                       % {'mode': replication_type})
-                LOG.error(msg)
-                raise self._get_exception()(message=msg)
-            info['rpo'] = int(specs.get('rpo', u'<is> 0')[5:])
-            if info['rpo'] and info['rpo'] not in self._get_supported_rpo():
-                msg = (_("Unsupported replication RPO %(rpo)s")
-                       % {'rpo': info['rpo']})
-                LOG.error(msg)
-                raise self._get_exception()(message=msg)
-        LOG.debug('_get_replication_info: info %(info)s', {'info': info})
+        info, msg = repl.Replication.extract_replication_info_from_specs(specs)
+        if not info:
+            LOG.error(msg)
+            raise self._get_exception()(message=msg)

         return info

     @proxy._trace_time
@@ -491,26 +448,74 @@ class XIVProxy(proxy.IBMStorageProxy):
     @proxy._trace_time
     def create_volume(self, volume):
         """Creates a volume."""
         # read replication information
         specs = self._get_extra_specs(volume.get('volume_type_id', None))
         replication_info = self._get_replication_info(specs)

-        if volume.group and replication_info['enabled']:
-            # An unsupported illegal configuration
-            msg = _("Unable to create volume: "
-                    "Replication of consistency group is not supported")
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-
         self._create_volume(volume)
         return self.handle_created_vol_properties(replication_info,
                                                   volume)

     def handle_created_vol_properties(self, replication_info, volume):
         volume_update = {}
+        LOG.debug('checking replication_info %(rep)s',
+                  {'rep': replication_info})
+        volume_update['replication_status'] = 'disabled'
         cg = volume.group and utils.is_group_a_cg_snapshot_type(volume.group)
+        if replication_info['enabled']:
+            try:
+                repl.VolumeReplication(self).create_replication(
+                    volume.name, replication_info)
+            except Exception as e:
+                details = self._get_code_and_status_or_message(e)
+                msg = ('Failed create_replication for '
+                       'volume %(vol)s: %(err)s',
+                       {'vol': volume['name'], 'err': details})
+                LOG.error(msg)
+                if cg:
+                    cg_name = self._cg_name_from_volume(volume)
+                    self._silent_delete_volume_from_cg(volume, cg_name)
+                self._silent_delete_volume(volume=volume)
+                raise
+            volume_update['replication_status'] = 'enabled'

         if cg:
+            if volume.group.is_replicated:
+                # for replicated Consistency Group:
+                # The Volume must be mirrored, and its mirroring settings must
+                # be identical to those of the Consistency Group:
+                # mirroring type (e.g., synchronous),
+                # mirroring status, mirroring target(backend)
+                group_specs = group_types.get_group_type_specs(
+                    volume.group.group_type_id)
+                group_rep_info = self._get_replication_info(group_specs)
+
+                msg = None
+                if volume_update['replication_status'] != 'enabled':
+                    msg = ('Cannot add non-replicated volume into'
+                           ' replicated group')
+                elif replication_info['mode'] != group_rep_info['mode']:
+                    msg = ('Volume replication type and Group replication type'
+                           ' should be the same')
+                elif volume.host != volume.group.host:
+                    msg = 'Cannot add volume to Group on different host'
+                else:
+                    group_name = self._cg_name_from_group(volume.group)
+                    me = mirrored_entities.MirroredEntities(
+                        self.ibm_storage_cli)
+                    me_objs = me.get_mirror_resources_by_name_map()
+                    vol_sync_state = me_objs['volumes'][volume.name].sync_state
+                    cg_sync_state = me_objs['cgs'][group_name].sync_state
+
+                    if (vol_sync_state != 'Synchronized' or
+                            cg_sync_state != 'Synchronized'):
+                        msg = ('Cannot add volume to Group. Both volume and '
+                               'group should have sync_state = Synchronized')
+                if msg:
+                    LOG.error(msg)
+                    raise self.meta['exception'].VolumeBackendAPIException(
+                        data=msg)
             try:
                 cg_name = self._cg_name_from_volume(volume)
                 self._call_xiv_xcli(
@@ -543,35 +548,234 @@ class XIVProxy(proxy.IBMStorageProxy):
                 raise self.meta['exception'].VolumeBackendAPIException(
                     data=msg)

-        LOG.debug('checking replication_info %(rep)s',
-                  {'rep': replication_info})
-        volume_update['replication_status'] = 'disabled'
-        if replication_info['enabled']:
-            try:
-                self._replication_create(volume, replication_info)
-            except Exception as e:
-                details = self._get_code_and_status_or_message(e)
-                msg = ('Failed _replication_create for '
-                       'volume %(vol)s: %(err)s',
-                       {'vol': volume['name'], 'err': details})
-                LOG.error(msg)
-                if cg:
-                    cg_name = self._cg_name_from_volume(volume)
-                    self._silent_delete_volume_from_cg(volume, cg_name)
-                self._silent_delete_volume(volume=volume)
-                raise
-            volume_update['replication_status'] = 'enabled'
-
         return volume_update

+    def get_group_specs_by_group_resource(self, context, group):
+        group_type = group.get('group_type_id', None)
+        if group_type is None:
+            msg = ('No group specs inside group type.')
+            return None, msg
+        group_specs = group_types.get_group_type_specs(group_type)
+        keyword = 'consistent_group_replication_enabled'
+        if not group_specs.get(keyword) == '<is> True':
+            msg = ('No cg replication field in group specs.')
+            return None, msg
+        return group_specs, ''
+
+    @proxy._trace_time
+    def enable_replication(self, context, group, volumes):
+        """Enable cg replication"""
+        # fetch replication info
+        group_specs = group_types.get_group_type_specs(group.group_type_id)
+        if not group_specs:
+            msg = 'No group specs inside group type'
+            LOG.error(msg)
+            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
+
+        # Add this field to adjust it to generic replication (for volumes)
+        replication_info = self._get_replication_info(group_specs)
+        if utils.is_group_a_cg_snapshot_type(group):
+            # take every vol out of cg - we can't mirror the cg otherwise.
+            if volumes:
+                self._update_consistencygroup(context, group,
+                                              remove_volumes=volumes)
+                for volume in volumes:
+                    repl.VolumeReplication(self).create_replication(
+                        volume.name, replication_info)
+
+            # mirror entire group
+            group_name = self._cg_name_from_group(group)
+            self._create_consistencygroup_on_remote(context, group_name)
+            repl.GroupReplication(self).create_replication(group_name,
+                                                           replication_info)
+
+            updated_volumes = []
+            if volumes:
+                # add volumes back to cg
+                self._update_consistencygroup(context, group,
+                                              add_volumes=volumes)
+                for volume in volumes:
+                    updated_volumes.append(
+                        {'id': volume['id'],
+                         'replication_status':
+                             fields.ReplicationStatus.ENABLED})
+            return ({'replication_status': fields.ReplicationStatus.ENABLED},
+                    updated_volumes)
+        else:
+            # For generic groups we replicate all the volumes
+            updated_volumes = []
+            for volume in volumes:
+                repl.VolumeReplication(self).create_replication(
+                    volume.name, replication_info)
+
+            # update status
+            for volume in volumes:
+                updated_volumes.append(
+                    {'id': volume['id'],
+                     'replication_status': fields.ReplicationStatus.ENABLED})
+            return ({'replication_status': fields.ReplicationStatus.ENABLED},
+                    updated_volumes)
+
+    @proxy._trace_time
+    def disable_replication(self, context, group, volumes):
+        """disables CG replication"""
+        group_specs = group_types.get_group_type_specs(group.group_type_id)
+        if not group_specs:
+            msg = 'No group specs inside group type'
+            LOG.error(msg)
+            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
+
+        replication_info = self._get_replication_info(group_specs)
+        updated_volumes = []
+        if utils.is_group_a_cg_snapshot_type(group):
+            # one call deletes replication for cgs and volumes together.
+            repl.GroupReplication(self).delete_replication(group,
+                                                           replication_info)
+            for volume in volumes:
+                # xiv locks volumes after deletion of replication.
+                # we need to unlock it for further use.
+                try:
+                    self.ibm_storage_cli.cmd.vol_unlock(vol=volume.name)
+                except errors.XCLIError as e:
+                    details = self._get_code_and_status_or_message(e)
+                    msg = ('Failed to unlock volumes %(details)s' %
+                           {'details': details})
+                    LOG.error(msg)
+                    raise self.meta['exception'].VolumeBackendAPIException(
+                        data=msg)
+                updated_volumes.append(
+                    {'id': volume.id,
+                     'replication_status': fields.ReplicationStatus.DISABLED})
+        else:
+            # For generic groups we replicate all the volumes
+            updated_volumes = []
+            for volume in volumes:
+                repl.VolumeReplication(self).delete_replication(
+                    volume.name, replication_info)
+
+            # update status
+            for volume in volumes:
+                updated_volumes.append(
+                    {'id': volume['id'],
+                     'replication_status': fields.ReplicationStatus.DISABLED})
+        return ({'replication_status': fields.ReplicationStatus.DISABLED},
+                updated_volumes)
+
+    def get_secondary_backend_id(self, secondary_backend_id):
+        if secondary_backend_id is None:
+            secondary_backend_id = self._get_target()
+            if secondary_backend_id is None:
+                msg = _("No targets defined. Can't perform failover.")
+                LOG.error(msg)
+                raise self.meta['exception'].VolumeBackendAPIException(
+                    data=msg)
+        return secondary_backend_id
+
+    def check_for_splitbrain(self, volumes, pool_master, pool_slave):
+        if volumes:
+            # check for split brain situations
+            # check for files that are available on both volumes
+            # and are not in an active mirroring relation
+            split_brain = self._potential_split_brain(
+                self.ibm_storage_cli,
+                self.ibm_storage_remote_cli,
+                volumes, pool_master,
+                pool_slave)
+            if split_brain:
+                # if such a situation exists stop and raise an exception!
+                msg = (_("A potential split brain condition has been found "
+                         "with the following volumes: \n'%(volumes)s.'") %
+                       {'volumes': split_brain})
+                LOG.error(msg)
+                raise self.meta['exception'].VolumeBackendAPIException(
+                    data=msg)
+
+    def failover_replication(self, context, group, volumes,
+                             secondary_backend_id):
+        """Failover a cg with all its volumes.
+
+        If secondary_backend_id is 'default', the cg needs to be failed back.
+        """
+        volumes_updated = []
+        goal_status = ''
+        pool_master = None
+        group_updated = {'replication_status': group.replication_status}
+        LOG.info("failover_replication: of cg %(cg)s "
+                 "from %(active)s to %(id)s",
+                 {'cg': group.get('name'),
+                  'active': self.active_backend_id,
+                  'id': secondary_backend_id})
+        if secondary_backend_id == strings.PRIMARY_BACKEND_ID:
+            # default as active backend id
+            if self._using_default_backend():
+                LOG.info("CG has been failed back. "
+                         "No need to fail back again.")
+                return group_updated, volumes_updated
+            # get the master pool, not using default id.
+            pool_master = self._get_target_params(
+                self.active_backend_id)['san_clustername']
+            pool_slave = self.storage_info[storage.FLAG_KEYS['storage_pool']]
+            goal_status = 'available'
+        else:
+            if self._using_default_backend():
+                LOG.info("cg already failed over.")
+                return group_updated, volumes_updated
+            # using same api as Cheesecake, we need
+            # replication_device entry. so we use get_targets.
+            secondary_backend_id = self.get_secondary_backend_id(
+                secondary_backend_id)
+            pool_master = self.storage_info[storage.FLAG_KEYS['storage_pool']]
+            pool_slave = self._get_target_params(
+                secondary_backend_id)['san_clustername']
+            goal_status = fields.ReplicationStatus.FAILED_OVER
+
+        # we should have secondary_backend_id by here.
+        self.ibm_storage_remote_cli = self._init_xcli(secondary_backend_id)
+
+        # check for split brain in mirrored volumes
+        self.check_for_splitbrain(volumes, pool_master, pool_slave)
+        group_specs, msg = self.get_group_specs_by_group_resource(context,
+                                                                  group)
+        if group_specs is None:
+            LOG.error(msg)
+            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
+
+        failback = (secondary_backend_id == strings.PRIMARY_BACKEND_ID)
+        result, details = repl.GroupReplication(self).failover(group, failback)
+
+        if result:
+            status = goal_status
+            group_updated['replication_status'] = status
+        else:
+            status = 'error'
+        updates = {'status': status}
+        if status == 'error':
+            group_updated['replication_extended_status'] = details
+        # if replication on cg was successful, then all of the volumes
+        # have been successfully replicated as well.
+        for volume in volumes:
+            volumes_updated.append({
+                'volume_id': volume.id,
+                'updates': updates
+            })
+        # replace between active and secondary xcli
+        self._replace_xcli_to_remote_xcli()
+
+        return group_updated, volumes_updated
+
+    def _replace_xcli_to_remote_xcli(self):
+        temp_ibm_storage_cli = self.ibm_storage_cli
+        self.ibm_storage_cli = self.ibm_storage_remote_cli
+        self.ibm_storage_remote_cli = temp_ibm_storage_cli
+
     def _get_replication_target_params(self):
         LOG.debug('_get_replication_target_params.')
-        targets = self._get_targets()
-        if not targets:
+        if not self.targets:
             msg = _("No targets available for replication")
             LOG.error(msg)
             raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-        no_of_targets = len(targets)
+        no_of_targets = len(self.targets)
         if no_of_targets > 1:
             msg = _("Too many targets configured. Only one is supported")
             LOG.error(msg)
@@ -591,89 +795,6 @@ class XIVProxy(proxy.IBMStorageProxy):
             raise self.meta['exception'].VolumeBackendAPIException(data=msg)
         return target, params

-    def _replication_create(self, volume, replication_info):
-        LOG.debug('_replication_create replication_info %(rep)s',
-                  {'rep': replication_info})
-        target, params = self._get_replication_target_params()
-        LOG.info('Target %(target)s: %(params)s',
-                 {'target': target, 'params': six.text_type(params)})
-        try:
-            pool = params['san_clustername']
-        except Exception:
-            msg = (_("Missing pool information for target '%(target)s'"),
-                   {'target': target})
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-        volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
-            False, self.ibm_storage_cli)
-        self._replication_create_mirror(volume, replication_info,
-                                        target, pool, volume_replication_mgr)
-
-    def _replication_create_mirror(self, volume, replication_info,
-                                   target, pool, volume_replication_mgr):
-        LOG.debug('_replication_create_mirror')
-        schedule = None
-        if replication_info['rpo']:
-            schedule = self._get_schedule_from_rpo(replication_info['rpo'])
-            if schedule:
-                LOG.debug('schedule %(sched)s: for rpo %(rpo)s',
-                          {'sched': schedule, 'rpo': replication_info['rpo']})
-            else:
-                LOG.error('Failed to find schedule for rpo %(rpo)s',
-                          {'rpo': replication_info['rpo']})
-                # will fail in the next step
-        try:
-            volume_replication_mgr.create_mirror(
-                resource_name=volume['name'],
-                target_name=target,
-                mirror_type=replication_info['mode'],
-                slave_resource_name=volume['name'],
-                create_slave='yes',
-                remote_pool=pool,
-                rpo=replication_info['rpo'],
-                schedule=schedule,
-                activate_mirror='yes')
-        # TBD - what exceptions will we get here?
-        except Exception as e:
-            details = self._get_code_and_status_or_message(e)
-            msg = (_("Failed replication for %(vol)s: '%(details)s'"),
-                   {'vol': volume['name'], 'details': details})
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-
-    def _replication_delete(self, volume, replication_info):
-        LOG.debug('_replication_delete replication_info %(rep)s',
-                  {'rep': replication_info})
-        targets = self._get_targets()
-        if not targets:
-            LOG.debug('No targets defined for replication')
-
-        volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
-            False, self.ibm_storage_cli)
-        try:
-            volume_replication_mgr.deactivate_mirror(
-                resource_id=volume['name'])
-        except Exception as e:
-            details = self._get_code_and_status_or_message(e)
-            msg = (_("Failed ending replication for %(vol)s: '%(details)s'"),
-                   {'vol': volume['name'], 'details': details})
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-
-        try:
-            volume_replication_mgr.delete_mirror(
-                resource_id=volume['name'])
-        except Exception as e:
-            details = self._get_code_and_status_or_message(e)
-            msg = (_("Failed deleting replica for %(vol)s: '%(details)s'"),
-                   {'vol': volume['name'], 'details': details})
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(data=msg)
-
     def _delete_volume(self, vol_name):
         """Deletes a volume on the Storage."""
         LOG.debug("_delete_volume: %(volume)s",
@@ -727,7 +848,8 @@ class XIVProxy(proxy.IBMStorageProxy):
         replication_info = self._get_replication_info(specs)
         if replication_info['enabled']:
             try:
-                self._replication_delete(volume, replication_info)
+                repl.VolumeReplication(self).delete_replication(
+                    volume.name, replication_info)
             except Exception as e:
                 error = self._get_code_and_status_or_message(e)
                 LOG.error(DELETE_VOLUME_BASE_ERROR,
@@ -1221,70 +1343,6 @@ class XIVProxy(proxy.IBMStorageProxy):
                     potential_split_brain.append(name)
         return potential_split_brain

-    def _failover_vol(self, volume, volume_replication_mgr,
-                      failover_volume_replication_mgr,
-                      replication_info, failback):
-        """Failover a single volume.
-
-        Attempts to failover a single volume
-        Sequence:
-        1. attempt to switch roles from master
-        2. attempt to change role to master on slave
-
-        returns (success, failure_reason)
-        """
-        LOG.debug("_failover_vol %(vol)s", {'vol': volume['name']})
-
-        # check if mirror is defined and active
-        try:
-            LOG.debug('Check if mirroring is active on %(vol)s.',
-                      {'vol': volume['name']})
-            active = volume_replication_mgr.is_mirror_active(
-                resource_id=volume['name'])
-        except Exception:
-            active = False
-        state = 'active' if active else 'inactive'
-        LOG.debug('Mirroring is %(state)s', {'state': state})
-
-        # In case of failback, mirroring must be active
-        # In case of failover we attempt to move in any condition
-        if failback and not active:
-            msg = ("Volume %(vol)s: no active mirroring and can not "
-                   "failback",
-                   {'vol': volume['name']})
-            LOG.error(msg)
-            return False, msg
-
-        try:
-            volume_replication_mgr.switch_roles(resource_id=volume['name'])
-            return True, None
-        except Exception as e:
-            # failed attempt to switch_roles from the master
-            details = self._get_code_and_status_or_message(e)
-            LOG.warning('Failed to perform switch_roles on'
-                        ' %(vol)s: %(err)s. '
-                        'Continue to change_role',
-                        {'vol': volume['name'], 'err': details})
-
-        try:
-            # this is the ugly stage we come to brute force
-            LOG.warning('Attempt to change_role to master')
-            failover_volume_replication_mgr.failover_by_id(
-                resource_id=volume['name'])
-            return True, None
-        except m_errors.NoMirrorDefinedError as e:
-            details = self._get_code_and_status_or_message(e)
-            msg = ("Volume %(vol)s no replication defined: %(err)s" %
-                   {'vol': volume['name'], 'err': details})
-            LOG.error(msg)
-            return False, msg
-        except Exception as e:
-            details = self._get_code_and_status_or_message(e)
-            msg = ('Volume %(vol)s change_role failed: %(err)s' %
-                   {'vol': volume['name'], 'err': details})
-            LOG.error(msg)
-            return False, msg
-
     @proxy._trace_time
     def failover_host(self, context, volumes, secondary_id, groups=None):
         """Failover a full backend.
@@ -1316,14 +1374,7 @@ class XIVProxy(proxy.IBMStorageProxy):
             LOG.info("Already failed over. No need to failover again.")
             return self.active_backend_id, volume_update_list, []
         # case: need to select a target
-        if secondary_id is None:
-            secondary_id = self._get_target()
-        # still no targets..
-        if secondary_id is None:
-            msg = _("No targets defined. Can't perform failover")
-            LOG.error(msg)
-            raise self.meta['exception'].VolumeBackendAPIException(
-                data=msg)
+        secondary_id = self.get_secondary_backend_id(secondary_id)
         pool_master = self.storage_info[storage.FLAG_KEYS['storage_pool']]
         try:
             pool_slave = self._get_target_params(
@@ -1340,45 +1391,21 @@ class XIVProxy(proxy.IBMStorageProxy):
         # calling _init_xcli with secondary_id
         self.ibm_storage_remote_cli = self._init_xcli(secondary_id)

-        # Create volume manager for both master and remote
-        volume_replication_mgr = volume_recovery_manager.VolumeRecoveryManager(
-            False, self.ibm_storage_cli)
-        failover_volume_replication_mgr = (
-            volume_recovery_manager.VolumeRecoveryManager(
-                True, self.ibm_storage_remote_cli))
-
         # get replication_info for all volumes at once
         if len(volumes):
             # check for split brain situations
             # check for files that are available on both volumes
             # and are not in an active mirroring relation
-            split_brain = self._potential_split_brain(
-                self.ibm_storage_cli,
-                self.ibm_storage_remote_cli,
-                volumes, pool_master,
-                pool_slave)
-            if len(split_brain):
-                # if such a situation exists stop and raise an exception!
-                msg = (_("A potential split brain condition has been found "
-                         "with the following volumes: \n'%(volumes)s.'"),
-                       {'volumes': split_brain})
-                LOG.error(msg)
-                raise self.meta['exception'].VolumeBackendAPIException(
-                    data=msg)
-            specs = self._get_extra_specs(
-                volumes[0].get('volume_type_id', None))
-            replication_info = self._get_replication_info(specs)
+            self.check_for_splitbrain(volumes, pool_master, pool_slave)

         # loop over volumes and attempt failover
         for volume in volumes:
             LOG.debug("Attempting to failover '%(vol)s'",
                       {'vol': volume['name']})
-            result, details = self._failover_vol(
-                volume,
-                volume_replication_mgr,
-                failover_volume_replication_mgr,
-                replication_info,
-                failback=(secondary_id == strings.PRIMARY_BACKEND_ID))
+            result, details = repl.VolumeReplication(self).failover(
+                volume, failback=(secondary_id == strings.PRIMARY_BACKEND_ID))
             if result:
                 status = goal_status
             else:
@@ -1393,9 +1420,7 @@ class XIVProxy(proxy.IBMStorageProxy):
             })

         # set active xcli to secondary xcli
-        temp_ibm_storage_cli = self.ibm_storage_cli
-        self.ibm_storage_cli = self.ibm_storage_remote_cli
-        self.ibm_storage_remote_cli = temp_ibm_storage_cli
+        self._replace_xcli_to_remote_xcli()
         # set active backend id to secondary id
         self.active_backend_id = secondary_id
@@ -1500,6 +1525,8 @@ class XIVProxy(proxy.IBMStorageProxy):
         self.meta['stat']["driver_version"] = self.full_version
         self.meta['stat']["storage_protocol"] = connection_type
         self.meta['stat']['multiattach'] = False
+        self.meta['stat']['group_replication_enabled'] = True
+        self.meta['stat']['consistent_group_replication_enabled'] = True
         self.meta['stat']['QoS_support'] = (
             self._check_storage_version_for_qos_support())
@@ -1538,15 +1565,14 @@ class XIVProxy(proxy.IBMStorageProxy):
         self.meta['stat']['thin_provision'] = ('True' if soft_size > hard_size
                                                else 'False')

-        targets = self._get_targets()
-        if targets:
+        if self.targets:
             self.meta['stat']['replication_enabled'] = True
-            # TBD - replication_type should be according to type
             self.meta['stat']['replication_type'] = [SYNC, ASYNC]
-            self.meta['stat']['rpo'] = self._get_supported_rpo()
-            self.meta['stat']['replication_count'] = len(targets)
+            self.meta['stat']['rpo'] = repl.Replication.get_supported_rpo()
+            self.meta['stat']['replication_count'] = len(self.targets)
             self.meta['stat']['replication_targets'] = [target for target in
-                                                        six.iterkeys(targets)]
+                                                        six.iterkeys(
+                                                            self.targets)]

         self.meta['stat']['timestamp'] = datetime.datetime.utcnow()
@@ -1679,18 +1705,6 @@ class XIVProxy(proxy.IBMStorageProxy):
     def create_group(self, context, group):
         """Creates a group."""

-        for volume_type in group.volume_types:
-            replication_info = self._get_replication_info(
-                volume_type.extra_specs)
-
-            if replication_info.get('enabled'):
-                # An unsupported illegal configuration
-                msg = _("Unable to create group: create group with "
-                        "replication volume type is not supported")
-                LOG.error(msg)
-                raise self.meta['exception'].VolumeBackendAPIException(
-                    data=msg)
-
         if utils.is_group_a_cg_snapshot_type(group):
             cgname = self._cg_name_from_group(group)
             return self._create_consistencygroup(context, cgname)
@@ -1726,6 +1740,35 @@ class XIVProxy(proxy.IBMStorageProxy):
         model_update = {'status': fields.GroupStatus.AVAILABLE}
         return model_update

+    def _create_consistencygroup_on_remote(self, context, cgname):
+        """Creates a consistency group on the secondary machine.
+
+        Return group available even if it already exists (for replication)
+        """
+        LOG.info("Creating consistency group %(name)s on secondary.",
+                 {'name': cgname})
+
+        # call remote XCLI
+        try:
+            self._call_remote_xiv_xcli(
+                "cg_create", cg=cgname,
+                pool=self.storage_info[
+                    storage.FLAG_KEYS['storage_pool']]).as_list
+        except errors.CgNameExistsError:
+            model_update = {'status': fields.GroupStatus.AVAILABLE}
+        except errors.CgLimitReachedError:
+            error = _("Maximum number of consistency groups reached")
+            LOG.error(error)
+            raise self._get_exception()(error)
+        except errors.XCLIError as e:
+            error = (_("Fatal error in cg_create on remote: %(details)s") %
+                     {'details': self._get_code_and_status_or_message(e)})
+            LOG.error(error)
+            raise self._get_exception()(error)
+        model_update = {'status': fields.GroupStatus.AVAILABLE}
+        return model_update
+
     def _silent_cleanup_consistencygroup_from_src(self, context, group,
                                                   volumes, cgname):
         """Silent cleanup of volumes from CG.

File: cinder/volume/drivers/ibm/ibm_storage/xiv_replication.py (new file)

@@ -0,0 +1,342 @@
+# Copyright (c) 2017 IBM Corporation
+# All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License"); you may
+# not use this file except in compliance with the License. You may obtain
+# a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
+# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
+# License for the specific language governing permissions and limitations
+# under the License.
+#
+import six
+
+from oslo_log import log as logging
+from oslo_utils import importutils
+
+pyxcli = importutils.try_import("pyxcli")
+if pyxcli:
+    from pyxcli import errors
+    from pyxcli.mirroring import cg_recovery_manager
+    from pyxcli.mirroring import errors as m_errors
+    from pyxcli.mirroring import volume_recovery_manager
+
+from cinder.i18n import _
+from cinder.volume.drivers.ibm.ibm_storage import strings
+
+SYNC = 'sync'
+ASYNC = 'async'
+
+LOG = logging.getLogger(__name__)
+
+
+class Rate(object):
+
+    def __init__(self, rpo, schedule):
+        self.rpo = rpo
+        self.schedule = schedule
+        self.schedule_name = self._schedule_name_from_schedule(self.schedule)
+
+    def _schedule_name_from_schedule(self, schedule):
+        if schedule == '00:00:20':
+            return 'min_interval'
+        return ("cinder_%(sched)s" %
+                {'sched': schedule.replace(':', '_')})
+
+
+class Replication(object):
+
+    async_rates = (
+        Rate(rpo=120, schedule='00:01:00'),
+        Rate(rpo=300, schedule='00:02:00'),
+        Rate(rpo=600, schedule='00:05:00'),
+        Rate(rpo=1200, schedule='00:10:00'),
+    )
+
+    def __init__(self, proxy):
+        self.proxy = proxy
+
+    @staticmethod
+    def get_schedule_from_rpo(rpo):
+        schedule = [rate for rate in Replication.async_rates
+                    if rate.rpo == rpo][0].schedule_name
+        if schedule:
+            LOG.debug('schedule %(sched)s: for rpo %(rpo)s',
+                      {'sched': schedule, 'rpo': rpo})
+        else:
+            LOG.error('Failed to find schedule for rpo %(rpo)s',
+                      {'rpo': rpo})
+        return schedule
+
+    @staticmethod
+    def get_supported_rpo():
+        return [rate.rpo for rate in Replication.async_rates]
+
+    def get_recovery_mgr(self):
+        # Recovery manager is set in derived classes
+        raise NotImplementedError
+
+    def get_remote_recovery_mgr(self):
+        # Recovery manager is set in derived classes
+        raise NotImplementedError
+
+    def replication_create_mirror(self, resource, replication_info,
+                                  target, pool):
+        raise NotImplementedError
+
+    @staticmethod
+    def extract_replication_info_from_specs(specs):
+        info = {'enabled': False, 'mode': None, 'rpo': 0}
+        msg = ""
+        if specs:
+            LOG.debug('extract_replication_info_from_specs: specs %(specs)s',
+                      {'specs': specs})
+            info['enabled'] = (
+                specs.get('replication_enabled', '').upper() in
+                (u'TRUE', strings.METADATA_IS_TRUE) or
+                specs.get('group_replication_enabled', '').upper() in
+                (u'TRUE', strings.METADATA_IS_TRUE))
+            replication_type = specs.get('replication_type', SYNC).lower()
+            if replication_type in (u'sync', u'<is> sync'):
+                info['mode'] = SYNC
+            elif replication_type in (u'async', u'<is> async'):
+                info['mode'] = ASYNC
+            else:
+                msg = (_("Unsupported replication mode %(mode)s")
+                       % {'mode': replication_type})
+                return None, msg
+            info['rpo'] = int(specs.get('rpo', u'<is> 0')[5:])
+            supported_rpos = Replication.get_supported_rpo()
+            if info['rpo'] and info['rpo'] not in supported_rpos:
+                msg = (_("Unsupported replication RPO %(rpo)s")
+                       % {'rpo': info['rpo']})
+                return None, msg
+
+            LOG.debug('extract_replication_info_from_specs: info %(info)s',
+                      {'info': info})
+        return info, msg
+
+    def failover(self, resource, failback):
+        raise NotImplementedError
+
+    def create_replication(self, resource_name, replication_info):
+        LOG.debug('Replication::create_replication replication_info %(rep)s',
+                  {'rep': replication_info})
+
+        target, params = self.proxy._get_replication_target_params()
+        LOG.info('Target %(target)s: %(params)s',
+                 {'target': target, 'params': six.text_type(params)})
+
+        try:
+            pool = params['san_clustername']
+        except Exception:
+            msg = (_("Missing pool information for target '%(target)s'") %
+                   {'target': target})
+            LOG.error(msg)
+            raise self.proxy.meta['exception'].VolumeBackendAPIException(
+                data=msg)
+
+        self.replication_create_mirror(resource_name, replication_info,
+                                       target, pool)
+
+    def delete_replication(self, resource_name, replication_info):
+        LOG.debug('Replication::delete_replication replication_info %(rep)s',
+                  {'rep': replication_info})
+
+        recovery_mgr = self.get_recovery_mgr()
+        try:
+            recovery_mgr.deactivate_mirror(resource_id=resource_name)
+        except Exception as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = (_("Failed ending replication for %(resource)s: "
+                     "'%(details)s'") % {'resource': resource_name,
+                                         'details': details})
+            LOG.error(msg)
+            raise self.proxy.meta['exception'].VolumeBackendAPIException(
+                data=msg)
+
+        try:
+            recovery_mgr.delete_mirror(resource_id=resource_name)
+        except Exception as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = (_("Failed deleting replica for %(resource)s: "
+                     "'%(details)s'") % {'resource': resource_name,
+                                         'details': details})
+            LOG.error(msg)
+            raise self.proxy.meta['exception'].VolumeBackendAPIException(
+                data=msg)
+
+    def _failover_resource(self, resource, recovery_mgr, failover_rep_mgr,
+                           rep_type, failback):
+        # check if mirror is defined and active
+        LOG.debug('Check if mirroring is active on %(res)s',
+                  {'res': resource['name']})
+        try:
+            active = recovery_mgr.is_mirror_active(
+                resource_id=resource['name'])
+        except Exception:
+            active = False
+        state = 'active' if active else 'inactive'
+        LOG.debug('Mirroring is %(state)s', {'state': state})
+
+        # In case of failback, mirroring must be active
+        # In case of failover we attempt to move in any condition
+        if failback and not active:
+            msg = ("%(rep_type)s %(res)s: no active mirroring and can not "
+                   "failback" % {'rep_type': rep_type,
+                                 'res': resource['name']})
+            LOG.error(msg)
+            return False, msg
+
+        try:
+            recovery_mgr.switch_roles(resource_id=resource['name'])
+            return True, None
+        except Exception as e:
+            # failed attempt to switch_roles from the master
+            details = self.proxy._get_code_and_status_or_message(e)
+            LOG.warning('Failed to perform switch_roles on'
+                        ' %(res)s: %(err)s. '
+                        'Continue to change_role',
+                        {'res': resource['name'], 'err': details})
+
+        try:
+            # this is the ugly stage we come to brute force
+            if failback:
+                role = 'Slave'
+            else:
+                role = 'Master'
+            LOG.warning('Attempt to change_role to %(role)s', {'role': role})
+            failover_rep_mgr.change_role(resource_id=resource['name'],
+                                         new_role=role)
+            return True, None
+        except m_errors.NoMirrorDefinedError as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = ("%(rep_type)s %(res)s no replication defined: %(err)s" %
+                   {'rep_type': rep_type, 'res': resource['name'],
+                    'err': details})
+            LOG.error(msg)
+            return False, msg
+        except Exception as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = ('%(rep_type)s %(res)s change_role failed: %(err)s' %
+                   {'rep_type': rep_type, 'res': resource['name'],
+                    'err': details})
+            LOG.error(msg)
+            return False, msg
+
+
+class VolumeReplication(Replication):
+
+    def __init__(self, proxy):
+        super(VolumeReplication, self).__init__(proxy)
+
+    def get_recovery_mgr(self):
+        return volume_recovery_manager.VolumeRecoveryManager(
+            False, self.proxy.ibm_storage_cli)
+
+    def get_remote_recovery_mgr(self):
+        return volume_recovery_manager.VolumeRecoveryManager(
+            True, self.proxy.ibm_storage_remote_cli)
+
+    def replication_create_mirror(self, resource_name, replication_info,
+                                  target, pool):
+        LOG.debug('VolumeReplication::replication_create_mirror')
+
+        schedule = None
+        if replication_info['rpo']:
+            schedule = Replication.get_schedule_from_rpo(
+                replication_info['rpo'])
+        try:
+            recovery_mgr = self.get_recovery_mgr()
+            recovery_mgr.create_mirror(
+                resource_name=resource_name,
+                target_name=target,
+                mirror_type=replication_info['mode'],
+                slave_resource_name=resource_name,
+                create_slave='yes',
+                remote_pool=pool,
+                rpo=replication_info['rpo'],
+                schedule=schedule,
+                activate_mirror='yes')
+        except errors.VolumeMasterError:
+            LOG.debug('Volume %(vol)s has been already mirrored',
+                      {'vol': resource_name})
+        except Exception as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = (_("Failed replication for %(resource)s: '%(details)s'") %
+                   {'resource': resource_name, 'details': details})
+            LOG.error(msg)
+            raise self.proxy.meta['exception'].VolumeBackendAPIException(
+                data=msg)
+
+    def failover(self, resource, failback):
+        """Failover a single volume.
+
+        Attempts to failover a single volume.
+        Sequence:
+        1. attempt to switch roles from master
+        2. attempt to change role to master on secondary
+
+        returns (success, failure_reason)
+        """
+        LOG.debug("VolumeReplication::failover %(vol)s",
+                  {'vol': resource['name']})
+
+        recovery_mgr = self.get_recovery_mgr()
+        remote_recovery_mgr = self.get_remote_recovery_mgr()
+        return self._failover_resource(resource, recovery_mgr,
+                                       remote_recovery_mgr, 'vol', failback)
+
+
+class GroupReplication(Replication):
+
+    def __init__(self, proxy):
+        super(GroupReplication, self).__init__(proxy)
+
+    def get_recovery_mgr(self):
+        return cg_recovery_manager.CGRecoveryManager(
+            False, self.proxy.ibm_storage_cli)
+
+    def get_remote_recovery_mgr(self):
+        return cg_recovery_manager.CGRecoveryManager(
+            True, self.proxy.ibm_storage_remote_cli)
+
+    def replication_create_mirror(self, resource_name, replication_info,
+                                  target, pool):
+        LOG.debug('GroupReplication::replication_create_mirror')
+
+        schedule = None
+        if replication_info['rpo']:
+            schedule = Replication.get_schedule_from_rpo(
+                replication_info['rpo'])
+        try:
+            recovery_mgr = self.get_recovery_mgr()
+            recovery_mgr.create_mirror(
+                resource_name=resource_name,
+                target_name=target,
+                mirror_type=replication_info['mode'],
+                slave_resource_name=resource_name,
+                rpo=replication_info['rpo'],
+                schedule=schedule,
+                activate_mirror='yes')
+        except Exception as e:
+            details = self.proxy._get_code_and_status_or_message(e)
+            msg = (_("Failed replication for %(resource)s: '%(details)s'") %
+                   {'resource': resource_name, 'details': details})
+            LOG.error(msg)
+            raise self.proxy.meta['exception'].VolumeBackendAPIException(
+                data=msg)
+
+    def failover(self, resource, failback):
+        LOG.debug("GroupReplication::failover %(cg)s",
+                  {'cg': resource['name']})
+
+        recovery_mgr = self.get_recovery_mgr()
+        remote_recovery_mgr = self.get_remote_recovery_mgr()
+        return self._failover_resource(resource, recovery_mgr,
+                                       remote_recovery_mgr, 'cg', failback)
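
As a quick illustration of the Rate table above, the supported async RPO
values map one-to-one onto XCLI schedule names. A sketch, assuming a cinder
tree where the new module is importable:

    from cinder.volume.drivers.ibm.ibm_storage import xiv_replication as repl

    print(repl.Replication.get_supported_rpo())
    # [120, 300, 600, 1200]
    print(repl.Replication.get_schedule_from_rpo(300))
    # cinder_00_02_00  (derived from schedule '00:02:00')
    # An RPO outside the table would raise IndexError in the list lookup,
    # which is why extract_replication_info_from_specs validates against
    # get_supported_rpo() first.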

File: releasenotes/notes/ (new release note)

@@ -0,0 +1,4 @@
+---
+features:
+  - |
+    Add consistency group replication support in XIV/A9000 Cinder driver.