Fix several issues in the lock/release database code

Major:
- Result's first() does not raise NoResultFound, it returns None.
- Avoid opening a read transaction while a write transaction is active.

Minor:
- Do not handle NoResultFound where it cannot happen (or is already
  handled).
- Only load the fields we use when fetching intermediate results.
- Do not load the node the 2nd time when releasing: the detection of
  the exact error is racy anyway.

Change-Id: I099c7b782e0a633908383958e7aed2b17c8c3864
This commit is contained in:
Dmitry Tantsur 2023-07-06 15:06:39 +02:00
parent 76a920aed2
commit c6610c2f7f

View File

@ -639,85 +639,62 @@ class Connection(api.Connection):
@synchronized(RESERVATION_SEMAPHORE, fair=True) @synchronized(RESERVATION_SEMAPHORE, fair=True)
def _reserve_node_place_lock(self, tag, node_id, node): def _reserve_node_place_lock(self, tag, node_id, node):
try: # NOTE(TheJulia): We explicitly do *not* synch the session
# NOTE(TheJulia): We explicitly do *not* synch the session # so the other actions in the conductor do not become aware
# so the other actions in the conductor do not become aware # that the lock is in place and believe they hold the lock.
# that the lock is in place and believe they hold the lock. # This necessitates an overall lock in the code side, so
# This necessitates an overall lock in the code side, so # we avoid conditions where two separate threads can believe
# we avoid conditions where two separate threads can believe # they hold locks at the same time.
# they hold locks at the same time. with _session_for_write() as session:
with _session_for_write() as session: res = session.execute(
res = session.execute( sa.update(models.Node).
sa.update(models.Node). where(models.Node.id == node.id).
where(models.Node.id == node.id). where(models.Node.reservation == None). # noqa
where(models.Node.reservation == None). # noqa values(reservation=tag).
values(reservation=tag). execution_options(synchronize_session=False))
execution_options(synchronize_session=False)) session.flush()
session.flush() node = self._get_node_reservation(node.id)
node = self._get_node_by_id_no_joins(node.id) # NOTE(TheJulia): In SQLAlchemy 2.0 style, we don't
# NOTE(TheJulia): In SQLAlchemy 2.0 style, we don't # magically get a changed node as they moved from the
# magically get a changed node as they moved from the # many ways to do things to singular ways to do things.
# many ways to do things to singular ways to do things. if res.rowcount != 1:
if res.rowcount != 1: # Nothing updated and node exists. Must already be
# Nothing updated and node exists. Must already be # locked.
# locked. raise exception.NodeLocked(node=node.uuid, host=node.reservation)
raise exception.NodeLocked(node=node.uuid,
host=node.reservation)
except NoResultFound:
# In the event that someone has deleted the node on
# another thread.
raise exception.NodeNotFound(node=node_id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def reserve_node(self, tag, node_id): def reserve_node(self, tag, node_id):
with _session_for_read() as session: # Check existence and convert UUID to ID
try: node = self._get_node_reservation(node_id)
# TODO(TheJulia): Figure out a good way to query if node.reservation:
# this so that we do it as light as possible without # Fail fast, instead of attempt the update.
# the full object invocation, which will speed lock raise exception.NodeLocked(node=node.uuid, host=node.reservation)
# activities. Granted, this is all at the DB level
# so maybe that is okay in the grand scheme of things.
query = session.query(models.Node)
query = add_identity_filter(query, node_id)
node = query.one()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
if node.reservation:
# Fail fast, instead of attempt the update.
raise exception.NodeLocked(node=node.uuid,
host=node.reservation)
self._reserve_node_place_lock(tag, node_id, node) self._reserve_node_place_lock(tag, node_id, node)
# Return a node object as that is the contract for this method. # Return a node object as that is the contract for this method.
return self.get_node_by_id(node.id) return self.get_node_by_id(node.id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def release_node(self, tag, node_id): def release_node(self, tag, node_id):
with _session_for_read() as session: # Check existence and convert UUID to ID
try: node = self._get_node_reservation(node_id)
query = session.query(models.Node)
query = add_identity_filter(query, node_id)
node = query.one()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
with _session_for_write() as session: with _session_for_write() as session:
try: res = session.execute(
res = session.execute( sa.update(models.Node).
sa.update(models.Node). where(models.Node.id == node.id).
where(models.Node.id == node.id). where(models.Node.reservation == tag).
where(models.Node.reservation == tag). values(reservation=None).
values(reservation=None). execution_options(synchronize_session=False)
execution_options(synchronize_session=False) )
) session.flush()
node = self.get_node_by_id(node.id)
if res.rowcount != 1: if res.rowcount != 1:
if node.reservation is None: if node.reservation is None:
raise exception.NodeNotLocked(node=node.uuid) raise exception.NodeNotLocked(node=node.uuid)
else: else:
raise exception.NodeLocked(node=node.uuid, raise exception.NodeLocked(node=node.uuid,
host=node['reservation']) host=node.reservation)
session.flush()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def create_node(self, values): def create_node(self, values):
@ -762,20 +739,24 @@ class Connection(api.Connection):
raise exception.NodeAlreadyExists(uuid=values['uuid']) raise exception.NodeAlreadyExists(uuid=values['uuid'])
return node return node
def _get_node_by_id_no_joins(self, node_id): def _get_node_reservation(self, node_id):
# TODO(TheJulia): Maybe replace with this with a minimal with _session_for_read() as session:
# "get these three fields" thing. # Explicitly load NodeBase as the invocation of the
try: # primary model object results in the join query
with _session_for_read() as session: # triggering.
# Explicitly load NodeBase as the invocation of the res = session.execute(
# priamary model object reesults in the join query add_identity_filter(
# triggering. sa.select(models.NodeBase.id,
res = session.execute( models.NodeBase.uuid,
sa.select(models.NodeBase).filter_by(id=node_id).limit(1) models.NodeBase.reservation),
).scalars().first() node_id
except NoResultFound: ).limit(1)
).first()
if res is None:
raise exception.NodeNotFound(node=node_id) raise exception.NodeNotFound(node=node_id)
return res else:
return res
def get_node_by_id(self, node_id): def get_node_by_id(self, node_id):
try: try: