cnn-classification-service/cnn_classification_service/main.py

132 lines
4.3 KiB
Python
Raw Normal View History

2020-07-27 17:58:48 +02:00
#!/usr/bin/env python3
2021-07-30 17:09:57 +02:00
import time
2021-07-30 12:17:18 +02:00
import jaeger_client
import opentracing
2021-08-04 16:17:06 +02:00
from opentracing.ext import tags
from opentracing.propagation import Format
2021-07-30 12:17:18 +02:00
2020-07-27 17:58:48 +02:00
import logging
import sys
import pika
import json
from sentry_sdk.integrations.logging import LoggingIntegration
import sentry_sdk
2021-07-30 11:43:38 +02:00
from config import Config
2020-10-06 00:41:54 +02:00
from magic_doer import MagicDoer
2021-12-05 01:15:06 +01:00
from classifier_cache import ClassifierCache
2020-07-27 17:58:48 +02:00
2020-10-05 22:19:25 +02:00
def message_callback(channel, method, properties, body):
    """Handle a single delivery from the input queue.

    The body is decoded as UTF-8 JSON and handed to
    ``MagicDoer.run_everything`` inside a tracing span. A truthy result gets
    the current span context injected into it and is published to
    ``Config.PIKA_OUTPUT_EXCHANGE`` with routing key ``classification-result``.

    Acknowledgement policy:
      * undecodable, non-JSON or non-object payloads are acked (dropped) so
        they are not requeued;
      * an exception from ``MagicDoer.run_everything`` nacks the delivery with
        ``requeue=True``;
      * otherwise the delivery is acked after the optional publish.

    Args:
        channel: Channel the delivery arrived on; used to ack/nack/publish.
        method: Delivery metadata; only ``delivery_tag`` is read.
        properties: Message properties (unused).
        body: Raw message payload as bytes.
    """
    try:
        msg = json.loads(body.decode('utf-8'))
    except (UnicodeDecodeError, json.JSONDecodeError) as e:
        logging.warning(f"Invalid message recieved: {e}")
        channel.basic_ack(delivery_tag=method.delivery_tag)  # We don't want this to be requeue
        return

    if not isinstance(msg, dict):
        # Valid JSON that is not an object (list, number, string, null) can
        # neither serve as the TEXT_MAP carrier below nor carry a 'tag', so it
        # is dropped the same way as an unparsable payload.
        logging.warning(f"Dropping message: expected a JSON object, got {type(msg).__name__}")
        channel.basic_ack(delivery_tag=method.delivery_tag)
        return

    logging.debug(f"Handling message: {msg}")
    # Continue the trace carried in the message, if there is one.
    span_ctx = opentracing.tracer.extract(Format.TEXT_MAP, msg)
    span_tags = {tags.SPAN_KIND: tags.SPAN_KIND_CONSUMER}
    with opentracing.tracer.start_active_span(
        'main.handleMessage', finish_on_close=True, child_of=span_ctx, tags=span_tags
    ) as scope:

        with opentracing.tracer.start_active_span('magicDoer.runEverything'):
            try:
                results = MagicDoer.run_everything(msg)  # <- This is where the magic happens
            except Exception as e:
                # Use .get(): a missing 'tag' must not raise from inside the
                # error handler, otherwise the nack below would be skipped and
                # the exception would escape the consumer callback.
                logging.error(
                    f"Something went wrong during handling sample {msg.get('tag')} run: {e}; msg: {msg}"
                )
                logging.exception(e)
                channel.basic_nack(delivery_tag=method.delivery_tag, requeue=True)
                return

        if results:
            # Propagate the handling span's context to downstream consumers.
            opentracing.tracer.inject(scope.span.context, Format.TEXT_MAP, results)
            logging.debug(f"Publishing message: {results}")

            channel.basic_publish(
                exchange=Config.PIKA_OUTPUT_EXCHANGE,
                routing_key='classification-result',
                body=json.dumps(results).encode("utf-8")
            )

        channel.basic_ack(delivery_tag=method.delivery_tag)
2020-07-27 17:58:48 +02:00
def main():
    """Set up observability, connect to the message queue and consume messages.

    Initialises Sentry (only when ``Config.SENTRY_DSN`` is set) and the Jaeger
    tracer, declares the input exchange and the ``cnnqueue`` queue, binds the
    queue with routing key ``sample`` and blocks in the consume loop until a
    ``KeyboardInterrupt`` arrives. The connection and the tracer are released
    on every exit path.

    Raises:
        KeyError: If ``Config.PIKA_URL`` or ``Config.PIKA_OUTPUT_EXCHANGE`` is
            unset.
    """
    # setup observability stuffs
    if (not Config.PIKA_URL) or (not Config.PIKA_OUTPUT_EXCHANGE):
        logging.error("Mandatory config parameters unset: PIKA_URL or PIKA_OUTPUT_EXCHANGE")
        raise KeyError("PIKA_URL or PIKA_OUTPUT_EXCHANGE")

    if Config.SENTRY_DSN:
        sentry_logging = LoggingIntegration(
            level=logging.DEBUG,  # Capture debug and above as breadcrumbs
            event_level=logging.ERROR  # Send errors as events
        )
        sentry_sdk.init(
            dsn=Config.SENTRY_DSN,
            integrations=[sentry_logging],
            traces_sample_rate=1.0,
            send_default_pii=True,
            release=Config.RELEASE_ID,
            environment=Config.RELEASEMODE,
            _experiments={"auto_enabling_integrations": True}
        )

    jaeger_client.Config(config={}, service_name='cnn-classification-service', validate=True).initialize_tracer()

    # Start the memes
    connection = None
    try:
        logging.info("Connecting to MQ service...")
        connection = pika.BlockingConnection(pika.connection.URLParameters(Config.PIKA_URL))
        channel = connection.channel()
        channel.exchange_declare(exchange=Config.PIKA_INPUT_EXCHANGE, exchange_type='direct')

        queue_declare_result = channel.queue_declare(queue='cnnqueue', exclusive=False)
        queue_name = queue_declare_result.method.queue
        channel.queue_bind(exchange=Config.PIKA_INPUT_EXCHANGE, routing_key='sample', queue=queue_name)

        # One unacked message at a time; acks are sent by message_callback.
        channel.basic_qos(prefetch_count=1)
        channel.basic_consume(queue=queue_name, on_message_callback=message_callback, auto_ack=False)

        logging.info("Connection complete! Listening to messages...")
        try:
            channel.start_consuming()
        except KeyboardInterrupt:
            logging.info("SIGINT Received! Stopping stuff...")
            channel.stop_consuming()
    finally:
        try:
            # Release the broker connection instead of leaking it; it may
            # already be closed if the broker dropped us.
            if connection is not None and connection.is_open:
                connection.close()
        finally:
            # Short pause before closing the tracer so buffered spans get a
            # chance to be reported (presumably the reason for the original
            # sleep — confirm against the jaeger-client README).
            time.sleep(2)  # lol
            opentracing.tracer.close()
2020-07-27 17:58:48 +02:00
2021-12-05 01:15:06 +01:00
def test_loader():
    """Smoke-check model loading.

    Builds a ``ClassifierCache`` from ``Config.MODEL_INFO_URL``, asks it for
    the default classifier and logs both the classifier and its details.
    """
    logging.info("Testing if model loading works...")
    details, classifier = ClassifierCache(Config.MODEL_INFO_URL).get_default_classifier()
    logging.info(f"Loaded classifier: {classifier}")
    logging.info(f"Details: {details}")
2020-07-27 17:58:48 +02:00
if __name__ == '__main__':
    # Route all log records to stdout at the configured level before anything
    # else runs.
    logging.basicConfig(
        level=Config.LOG_LEVEL,
        format="%(asctime)s - %(name)s [%(levelname)s]: %(message)s",
        stream=sys.stdout
    )
    # `--test-loader` anywhere on the command line runs the model-loading
    # check instead of starting the consumer.
    entry_point = test_loader if '--test-loader' in sys.argv else main
    entry_point()