Fix several issues in the lock/release database code

Major:
- Result's first() does not raise NoResultFound, it returns None.
- Avoid opening a read transaction while a write transaction is active.

Minor:
- Do not handle NoResultFound where it cannot happen (or is already
  handled).
- Only load the fields we use when fetching intermediate results.
- Do not load the node the 2nd time when releasing: the detection of
  the exact error is racy anyway.

Change-Id: I099c7b782e0a633908383958e7aed2b17c8c3864
This commit is contained in:
Dmitry Tantsur 2023-07-06 15:06:39 +02:00
parent 76a920aed2
commit c6610c2f7f

View File

@ -639,7 +639,6 @@ class Connection(api.Connection):
@synchronized(RESERVATION_SEMAPHORE, fair=True) @synchronized(RESERVATION_SEMAPHORE, fair=True)
def _reserve_node_place_lock(self, tag, node_id, node): def _reserve_node_place_lock(self, tag, node_id, node):
try:
# NOTE(TheJulia): We explicitly do *not* synch the session # NOTE(TheJulia): We explicitly do *not* synch the session
# so the other actions in the conductor do not become aware # so the other actions in the conductor do not become aware
# that the lock is in place and believe they hold the lock. # that the lock is in place and believe they hold the lock.
@ -654,53 +653,33 @@ class Connection(api.Connection):
values(reservation=tag). values(reservation=tag).
execution_options(synchronize_session=False)) execution_options(synchronize_session=False))
session.flush() session.flush()
node = self._get_node_by_id_no_joins(node.id) node = self._get_node_reservation(node.id)
# NOTE(TheJulia): In SQLAlchemy 2.0 style, we don't # NOTE(TheJulia): In SQLAlchemy 2.0 style, we don't
# magically get a changed node as they moved from the # magically get a changed node as they moved from the
# many ways to do things to singular ways to do things. # many ways to do things to singular ways to do things.
if res.rowcount != 1: if res.rowcount != 1:
# Nothing updated and node exists. Must already be # Nothing updated and node exists. Must already be
# locked. # locked.
raise exception.NodeLocked(node=node.uuid, raise exception.NodeLocked(node=node.uuid, host=node.reservation)
host=node.reservation)
except NoResultFound:
# In the event that someone has deleted the node on
# another thread.
raise exception.NodeNotFound(node=node_id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def reserve_node(self, tag, node_id): def reserve_node(self, tag, node_id):
with _session_for_read() as session: # Check existence and convert UUID to ID
try: node = self._get_node_reservation(node_id)
# TODO(TheJulia): Figure out a good way to query
# this so that we do it as light as possible without
# the full object invocation, which will speed lock
# activities. Granted, this is all at the DB level
# so maybe that is okay in the grand scheme of things.
query = session.query(models.Node)
query = add_identity_filter(query, node_id)
node = query.one()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
if node.reservation: if node.reservation:
# Fail fast, instead of attempt the update. # Fail fast, instead of attempt the update.
raise exception.NodeLocked(node=node.uuid, raise exception.NodeLocked(node=node.uuid, host=node.reservation)
host=node.reservation)
self._reserve_node_place_lock(tag, node_id, node) self._reserve_node_place_lock(tag, node_id, node)
# Return a node object as that is the contract for this method. # Return a node object as that is the contract for this method.
return self.get_node_by_id(node.id) return self.get_node_by_id(node.id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def release_node(self, tag, node_id): def release_node(self, tag, node_id):
with _session_for_read() as session: # Check existence and convert UUID to ID
try: node = self._get_node_reservation(node_id)
query = session.query(models.Node)
query = add_identity_filter(query, node_id)
node = query.one()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
with _session_for_write() as session: with _session_for_write() as session:
try:
res = session.execute( res = session.execute(
sa.update(models.Node). sa.update(models.Node).
where(models.Node.id == node.id). where(models.Node.id == node.id).
@ -708,16 +687,14 @@ class Connection(api.Connection):
values(reservation=None). values(reservation=None).
execution_options(synchronize_session=False) execution_options(synchronize_session=False)
) )
node = self.get_node_by_id(node.id) session.flush()
if res.rowcount != 1: if res.rowcount != 1:
if node.reservation is None: if node.reservation is None:
raise exception.NodeNotLocked(node=node.uuid) raise exception.NodeNotLocked(node=node.uuid)
else: else:
raise exception.NodeLocked(node=node.uuid, raise exception.NodeLocked(node=node.uuid,
host=node['reservation']) host=node.reservation)
session.flush()
except NoResultFound:
raise exception.NodeNotFound(node=node_id)
@oslo_db_api.retry_on_deadlock @oslo_db_api.retry_on_deadlock
def create_node(self, values): def create_node(self, values):
@ -762,19 +739,23 @@ class Connection(api.Connection):
raise exception.NodeAlreadyExists(uuid=values['uuid']) raise exception.NodeAlreadyExists(uuid=values['uuid'])
return node return node
def _get_node_by_id_no_joins(self, node_id): def _get_node_reservation(self, node_id):
# TODO(TheJulia): Maybe replace with this with a minimal
# "get these three fields" thing.
try:
with _session_for_read() as session: with _session_for_read() as session:
# Explicitly load NodeBase as the invocation of the # Explicitly load NodeBase as the invocation of the
# priamary model object reesults in the join query # primary model object results in the join query
# triggering. # triggering.
res = session.execute( res = session.execute(
sa.select(models.NodeBase).filter_by(id=node_id).limit(1) add_identity_filter(
).scalars().first() sa.select(models.NodeBase.id,
except NoResultFound: models.NodeBase.uuid,
models.NodeBase.reservation),
node_id
).limit(1)
).first()
if res is None:
raise exception.NodeNotFound(node=node_id) raise exception.NodeNotFound(node=node_id)
else:
return res return res
def get_node_by_id(self, node_id): def get_node_by_id(self, node_id):