Remove logging from ProducerConnection._produce_message

In impl_kafka, _produce_message is run in a tpool.execute
context but it was also calling logging functions.
This could cause subsequent calls to logging functions to
deadlock.

This patch moves the logging calls out of the tpool.execute scope.

Change-Id: I81167eea0a6b1a43a88baa3bc383af684f4b1345
Closes-bug: #1981093
This commit is contained in:
Guillaume Espanel 2022-07-11 10:58:32 +02:00
parent 4186386748
commit 43f2224aac
3 changed files with 67 additions and 15 deletions

View File

@ -265,18 +265,17 @@ class ProducerConnection(Connection):
self.producer = None self.producer = None
self.producer_lock = threading.Lock() self.producer_lock = threading.Lock()
def _produce_message(self, topic, message): def _produce_message(self, topic, message, poll):
while True: if poll:
self.producer.poll(poll)
try: try:
self.producer.produce(topic, message) self.producer.produce(topic, message)
except KafkaException as e: except KafkaException as e:
LOG.error("Produce message failed: %s" % str(e)) self.producer.poll(0)
except BufferError: raise e
LOG.debug("Produce message queue full, waiting for deliveries") except BufferError as e:
self.producer.poll(0.5) # We'll have to poll next time
continue raise e
break
self.producer.poll(0) self.producer.poll(0)
def notify_send(self, topic, ctxt, msg, retry): def notify_send(self, topic, ctxt, msg, retry):
@ -293,9 +292,22 @@ class ProducerConnection(Connection):
try: try:
self._ensure_producer() self._ensure_producer()
poll = 0
while True:
try:
if eventletutils.is_monkey_patched('thread'): if eventletutils.is_monkey_patched('thread'):
return tpool.execute(self._produce_message, topic, message) return tpool.execute(self._produce_message, topic,
return self._produce_message(topic, message) message, poll)
return self._produce_message(topic, message, poll)
except KafkaException as e:
LOG.error("Produce message failed: %s" % str(e))
break
except BufferError:
LOG.debug("Produce message queue full, "
"waiting for deliveries")
# We'll retry with .5s polling
poll = 0.5
except Exception: except Exception:
# NOTE(sileht): if something goes wrong close the producer # NOTE(sileht): if something goes wrong close the producer
# connection # connection

View File

@ -15,6 +15,8 @@
import testscenarios import testscenarios
from unittest import mock from unittest import mock
from confluent_kafka import KafkaException
import oslo_messaging import oslo_messaging
from oslo_messaging._drivers import impl_kafka as kafka_driver from oslo_messaging._drivers import impl_kafka as kafka_driver
from oslo_messaging.tests import utils as test_utils from oslo_messaging.tests import utils as test_utils
@ -120,6 +122,36 @@ class TestKafkaDriver(test_utils.BaseTestCase):
'ssl.key.password': '', 'ssl.key.password': '',
}) })
def test_send_notification_retries_on_buffer_error(self):
target = oslo_messaging.Target(topic="topic_test")
with mock.patch("confluent_kafka.Producer") as producer:
fake_producer = mock.MagicMock()
fake_producer.produce = mock.Mock(
side_effect=[BufferError, BufferError, None])
producer.return_value = fake_producer
self.driver.send_notification(
target, {}, {"payload": ["test_1"]},
None, retry=3)
assert fake_producer.produce.call_count == 3
def test_send_notification_stops_on_kafka_error(self):
target = oslo_messaging.Target(topic="topic_test")
with mock.patch("confluent_kafka.Producer") as producer:
fake_producer = mock.MagicMock()
fake_producer.produce = mock.Mock(
side_effect=[KafkaException, None])
producer.return_value = fake_producer
self.driver.send_notification(
target, {}, {"payload": ["test_1"]},
None, retry=3)
assert fake_producer.produce.call_count == 1
def test_listen(self): def test_listen(self):
target = oslo_messaging.Target(topic="topic_test") target = oslo_messaging.Target(topic="topic_test")
self.assertRaises(NotImplementedError, self.driver.listen, target, self.assertRaises(NotImplementedError, self.driver.listen, target,

View File

@ -0,0 +1,8 @@
---
fixes:
- |
[`bug 1981093 <https://bugs.launchpad.net/oslo.messaging/+bug/1981093>`_]
Pulls calls to logging functions out of ``impl_kafka._produce_message``.
Since ``_produce_message`` is called through tpool.execute, calling logging
functions inside ``_produce_message`` could cause subsequent calls to
logging functions to deadlock.