2021-03-06 14:50:29 +00:00
|
|
|
import asyncio
|
|
|
|
import logging
|
|
|
|
import typing
|
|
|
|
|
|
|
|
|
2021-03-08 12:27:40 +00:00
|
|
|
class Connector:
    """Sends metrics to a statsd server.

    :param host: statsd server to send metrics to
    :param port: TCP port that the server is listening on
    :param kwargs: additional keyword parameters are passed
        to the :class:`.Processor` initializer

    This class maintains a TCP connection to a statsd server and
    sends metric lines to it asynchronously. You must call the
    :meth:`start` method when your application is starting. It
    creates a :class:`~asyncio.Task` that manages the connection
    to the statsd server. You must also call :meth:`.stop` before
    terminating to ensure that all metrics are flushed to the
    statsd server.

    When the connector is *running*, metric payloads are sent by
    calling the :meth:`.inject_metric` method. The payloads are
    stored in an internal queue that is consumed whenever the
    connection to the server is active.

    .. attribute:: processor
       :type: Processor

       The statsd processor that maintains the connection and
       sends the metric payloads.

    """

    def __init__(self, host: str, port: int = 8125, **kwargs):
        self.processor = Processor(host=host, port=port, **kwargs)
        # Keep a reference to the background task created by start().
        self._processor_task = None

    async def start(self):
        """Start the processor in the background.

        This is a *blocking* method and does not return until the
        processor task is actually running.

        """
        self._processor_task = asyncio.create_task(self.processor.run())
        await self.processor.running.wait()

    async def stop(self):
        """Stop the background processor.

        Items that are currently in the queue will be flushed to
        the statsd server if possible. This is a *blocking* method
        and does not return until the background processor has
        stopped.

        """
        await self.processor.stop()

    def inject_metric(self, path: str, value, type_code: str):
        """Send a metric to the statsd server.

        :param path: formatted metric name
        :param value: metric value as a number or a string. The
            string form is required for relative gauges.
        :param type_code: type of the metric to send

        This method formats the payload and inserts it on the
        internal queue for future processing.

        """
        payload = f'{path}:{value}|{type_code}\n'
        self.processor.queue.put_nowait(payload.encode('utf-8'))
|
|
|
|
|
|
|
|
|
2021-03-06 14:50:29 +00:00
|
|
|
class Processor(asyncio.Protocol):
    """Maintains the statsd connection and sends metric payloads.

    :param host: statsd server to send metrics to
    :param port: TCP port that the server is listening on
    :param reconnect_sleep: number of seconds to sleep after socket
        error occurs when connecting
    :param wait_timeout: number of seconds to wait for a message to
        arrive on the queue

    This class implements :class:`~asyncio.Protocol` for the statsd
    TCP connection. The :meth:`.run` method is run as a background
    :class:`~asyncio.Task` that consumes payloads from an internal
    queue, connects to the TCP server as required, and sends the
    already formatted payloads.

    .. attribute:: host
       :type: str

       IP address or DNS name for the statsd server to send metrics to

    .. attribute:: port
       :type: int

       TCP port number that the statsd server is listening on

    .. attribute:: should_terminate
       :type: bool

       Flag that controls whether the background task is active or
       not. This flag is set to :data:`False` when the task is started.
       Setting it to :data:`True` will cause the task to shutdown in
       an orderly fashion.

    .. attribute:: queue
       :type: asyncio.Queue

       Formatted metric payloads to send to the statsd server. Enqueue
       payloads to send them to the server.

    .. attribute:: connected
       :type: asyncio.Event

       Is the TCP connection currently connected?

    .. attribute:: running
       :type: asyncio.Event

       Is the background task currently running? This is the event that
       :meth:`.run` sets when it starts and it remains set until the task
       exits.

    .. attribute:: stopped
       :type: asyncio.Event

       Is the background task currently stopped? This is the event that
       :meth:`.run` sets when it exits and that :meth:`.stop` blocks on
       until the task stops.

    """

    def __init__(self,
                 *,
                 host,
                 port: int = 8125,
                 reconnect_sleep: float = 1.0,
                 wait_timeout: float = 0.1):
        super().__init__()
        if not host:
            raise RuntimeError('host must be set')
        if not port or port < 1:
            raise RuntimeError('port must be a positive integer')

        self.host = host
        self.port = port
        self._reconnect_sleep = reconnect_sleep
        self._wait_timeout = wait_timeout

        self.running = asyncio.Event()
        self.stopped = asyncio.Event()
        # Not running yet, so stop() must return immediately.
        self.stopped.set()
        self.connected = asyncio.Event()
        self.logger = logging.getLogger(__package__).getChild('Processor')
        self.should_terminate = False
        self.transport = None
        self.queue = asyncio.Queue()

        # Payloads taken off the queue that could not be written; they
        # are retried (oldest first) before new queue items are read.
        self._failed_sends = []

    async def run(self):
        """Maintains the connection and processes metric payloads."""
        self.running.set()
        self.stopped.clear()
        self.should_terminate = False
        while not self.should_terminate:
            try:
                await self._connect_if_necessary()
                if self.connected.is_set():
                    await self._process_metric()
            except asyncio.CancelledError:
                self.logger.info('task cancelled, exiting')
                break

        self.should_terminate = True
        self.logger.info('loop finished with %d metrics in the queue',
                         self.queue.qsize())
        if self.connected.is_set():
            # Each _process_metric() call handles a single payload and
            # serves pending retries before the queue, so both sources
            # must be counted or queued payloads would be left behind.
            num_ready = self.queue.qsize() + len(self._failed_sends)
            self.logger.info('draining %d metrics', num_ready)
            for _ in range(num_ready):
                await self._process_metric()
            self.logger.debug('closing transport')
            self.transport.close()

        # connection_lost() clears the event once the close completes.
        while self.connected.is_set():
            self.logger.debug('waiting on transport to close')
            await asyncio.sleep(0.1)

        self.logger.info('processor is exiting')
        self.running.clear()
        self.stopped.set()

    async def stop(self):
        """Stop the processor.

        This is an asynchronous but blocking method. It does not
        return until enqueued metrics are flushed and the processor
        connection is closed.

        """
        self.should_terminate = True
        await self.stopped.wait()

    def eof_received(self):
        """Mark the connection as down when the server sends EOF."""
        self.logger.warning('received EOF from statsd server')
        self.connected.clear()

    def connection_made(self, transport: asyncio.Transport):
        """Remember the new transport and flag the connection as up.

        :param transport: transport for the established connection

        """
        peername = transport.get_extra_info('peername')
        if isinstance(peername, (tuple, list)) and len(peername) >= 2:
            # IPv6 peers are reported as a 4-tuple
            # (host, port, flowinfo, scope_id); only the first two
            # items are needed for the log message.
            server, port = peername[:2]
        else:
            # The peer name is unavailable; fall back to what we dialed.
            server, port = self.host, self.port
        self.logger.info('connected to statsd %s:%s', server, port)
        self.transport = transport
        self.connected.set()

    def connection_lost(self, exc: typing.Optional[Exception]):
        """Flag the connection as down.

        :param exc: reason supplied by the transport; it is not used

        """
        self.logger.warning('statsd server connection lost')
        self.connected.clear()

    async def _connect_if_necessary(self):
        """Open a connection unless one appears within the wait timeout.

        A failed connection attempt is logged and followed by a sleep
        of ``reconnect_sleep`` seconds; the caller is expected to
        check :attr:`connected` afterwards.

        """
        try:
            await asyncio.wait_for(self.connected.wait(), self._wait_timeout)
        except asyncio.TimeoutError:
            try:
                self.logger.debug('starting connection to %s:%s', self.host,
                                  self.port)
                await asyncio.get_running_loop().create_connection(
                    protocol_factory=lambda: self,
                    host=self.host,
                    port=self.port)
            except IOError as error:
                self.logger.warning('connection to %s:%s failed: %s',
                                    self.host, self.port, error)
                await asyncio.sleep(self._reconnect_sleep)

    async def _process_metric(self):
        """Send a single payload to the server.

        A previously failed payload is retried first. Otherwise a
        payload is taken from the queue, waiting at most
        ``wait_timeout`` seconds for one to arrive. A payload that
        cannot be written is kept in ``_failed_sends`` so that it is
        retried by a later call.

        """
        processing_failed_send = False
        if self._failed_sends:
            self.logger.debug('using previous send attempt')
            metric = self._failed_sends[0]
            processing_failed_send = True
        else:
            try:
                metric = await asyncio.wait_for(self.queue.get(),
                                                self._wait_timeout)
            except asyncio.TimeoutError:
                return
            self.logger.debug('received %r from queue', metric)
            self.queue.task_done()
            # Since we `await`d the state of the transport may have
            # changed. Sending on the closed transport won't return
            # an error since the send is async. We can catch the
            # problem here though.
            if self.transport.is_closing():
                self.logger.debug('preventing send on closed transport')
                self._failed_sends.append(metric)
                return

        self.transport.write(metric)
        if self.transport.is_closing():
            # Writing to a transport does not raise exceptions, it
            # will close the transport if a low-level error occurs.
            self.logger.debug('transport closed by writing')
            if not processing_failed_send:
                # The payload already left the queue; keep it for a
                # retry instead of silently dropping it.
                self._failed_sends.append(metric)
        else:
            self.logger.debug('sent %r to statsd', metric)
            if processing_failed_send:
                self._failed_sends.pop(0)