| tierno | 87858ca | 2018-10-08 16:30:15 +0200 | [diff] [blame] | 1 | # -*- coding: utf-8 -*- |
| 2 | |
| 3 | # Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | # you may not use this file except in compliance with the License. |
| 5 | # You may obtain a copy of the License at |
| 6 | # |
| 7 | # http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | # |
| 9 | # Unless required by applicable law or agreed to in writing, software |
| 10 | # distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or |
| 12 | # implied. |
| 13 | # See the License for the specific language governing permissions and |
| 14 | # limitations under the License. |
| 15 | |
| tierno | 5c01261 | 2018-04-19 16:01:59 +0200 | [diff] [blame] | 16 | import logging |
| 17 | import asyncio |
| 18 | import yaml |
| 19 | from aiokafka import AIOKafkaConsumer |
| 20 | from aiokafka import AIOKafkaProducer |
| 21 | from aiokafka.errors import KafkaError |
| tierno | 3054f78 | 2018-04-25 16:59:53 +0200 | [diff] [blame] | 22 | from osm_common.msgbase import MsgBase, MsgException |
| tierno | 5c01261 | 2018-04-19 16:01:59 +0200 | [diff] [blame] | 23 | |
| garciadeblas | 2644b76 | 2021-03-24 09:21:01 +0100 | [diff] [blame] | 24 | __author__ = ( |
| 25 | "Alfonso Tierno <alfonso.tiernosepulveda@telefonica.com>, " |
| 26 | "Guillermo Calvino <guillermo.calvinosanchez@altran.com>" |
| 27 | ) |
| tierno | 3054f78 | 2018-04-25 16:59:53 +0200 | [diff] [blame] | 28 | |
| 29 | |
class MsgKafka(MsgBase):
    """
    Kafka implementation of the MsgBase message bus, built on top of aiokafka.

    The synchronous methods (write, read) run the asyncio methods (aiowrite, aioread) to
    completion on the event loop stored at connect. Every aiowrite/aioread call creates its
    own kafka producer/consumer and stops it before returning.
    """

    def __init__(self, logger_name="msg", lock=False):
        """
        :param logger_name: forwarded unchanged to MsgBase.__init__
        :param lock: forwarded unchanged to MsgBase.__init__
        """
        super().__init__(logger_name, lock)
        # Connection parameters; all of them are filled in by connect()
        self.host = None
        self.port = None
        # Most recently created aiokafka clients (kept as attributes for backward compatibility)
        self.consumer = None
        self.producer = None
        self.loop = None
        self.broker = None  # "host:port" string handed to aiokafka as bootstrap_servers
        self.group_id = None  # default consumer group used by aioread

    def connect(self, config):
        """
        Store the connection parameters. No connection to kafka is opened here; producers and
        consumers are created by aiowrite/aioread.
        :param config: dictionary with the mandatory keys "host" and "port" and the optional keys
            "logger_name" (name of the logger to use), "loop" (asyncio loop; when missing or
            empty asyncio.get_event_loop() is used) and "group_id" (default kafka group_id)
        :return: None or raises MsgException on failing (e.g. a mandatory key is missing)
        """
        try:
            if "logger_name" in config:
                self.logger = logging.getLogger(config["logger_name"])
            self.host = config["host"]
            self.port = config["port"]
            self.loop = config.get("loop") or asyncio.get_event_loop()
            self.broker = "{}:{}".format(self.host, self.port)
            self.group_id = config.get("group_id")
        except Exception as e:  # TODO refine
            raise MsgException(str(e)) from e

    def disconnect(self):
        """
        Do nothing. Producers and consumers are already stopped by aiowrite/aioread.
        :return: None
        """
        # The loop is intentionally left open: closing it (self.loop.close()) was disabled in
        # the original code. Presumably the loop can be shared with the caller -- TODO confirm.

    def write(self, topic, key, msg):
        """
        Write a message at kafka bus
        :param topic: message topic, must be string
        :param key: message key, must be string
        :param msg: message content, can be string or dictionary
        :return: None or raises MsgException on failing
        """
        attempts = 2  # Try two times
        for attempt in range(1, attempts + 1):
            try:
                self.loop.run_until_complete(
                    self.aiowrite(topic=topic, key=key, msg=msg)
                )
                return
            except Exception as e:
                # Only the failure of the last attempt is reported to the caller
                if attempt == attempts:
                    raise MsgException(
                        "Error writing {} topic: {}".format(topic, str(e))
                    ) from e

    def read(self, topic):
        """
        Read from one or several topics.
        :param topic: can be str: single topic; or str list: several topics
        :return: topic, key, message; or None
        """
        try:
            return self.loop.run_until_complete(self.aioread(topic, self.loop))
        except MsgException:
            raise
        except Exception as e:
            raise MsgException(
                "Error reading {} topic: {}".format(topic, str(e))
            ) from e

    async def aiowrite(self, topic, key, msg, loop=None):
        """
        Asyncio write. A new producer is started for this call and stopped before returning.
        :param topic: str kafka topic
        :param key: str kafka key
        :param msg: str or dictionary kafka message. It is sent serialized as yaml
        :param loop: asyncio loop. To be DEPRECATED in the near future! The loop must be provided
            inside config at connect
        :return: None or raises MsgException on failing
        """
        if not loop:
            loop = self.loop
        # A local reference is used for the cleanup, so that this call never stops the producer
        # created by another concurrent aiowrite, and a failing constructor does not end up in
        # an AttributeError that would hide the real error
        producer = None
        try:
            # NOTE(review): the "loop" argument looks deprecated in recent aiokafka releases --
            # confirm against the aiokafka version pinned by the project
            producer = AIOKafkaProducer(
                loop=loop,
                key_serializer=str.encode,
                value_serializer=str.encode,
                bootstrap_servers=self.broker,
            )
            self.producer = producer
            await producer.start()
            await producer.send(
                topic=topic,
                key=key,
                value=yaml.safe_dump(msg, default_flow_style=True),
            )
        except Exception as e:
            raise MsgException(
                "Error publishing topic '{}', key '{}': {}".format(topic, key, e)
            ) from e
        finally:
            if producer is not None:
                await producer.stop()

    async def aioread(
        self,
        topic,
        loop=None,
        callback=None,
        aiocallback=None,
        group_id=None,
        from_beginning=None,
        **kwargs
    ):
        """
        Asyncio read from one or several topics. A new consumer is started for this call and
        stopped before returning.
        :param topic: can be str: single topic; or str list: several topics
        :param loop: asyncio loop. To be DEPRECATED in the near future! The loop must be provided
            inside config at connect
        :param callback: synchronous callback function that will handle the message in kafka bus.
            It takes precedence over aiocallback when both are supplied
        :param aiocallback: async callback function that will handle the message in kafka bus
        :param group_id: kafka group_id to use. Can be False (set group_id to None), None (use the
            general group_id provided at connect inside config), or a group_id string
        :param from_beginning: if True, messages will be obtained from the beginning instead of
            only new ones.
            If group_id is supplied, only the messages not processed by other workers are obtained.
            If group_id is None, all messages stored at kafka are obtained.
        :param kwargs: optional keyword arguments for the callback function
        :return: If no callback is defined, it returns (topic, key, message) for the first message
            received. With a callback, messages are handled one by one and None is returned
            only when the consumer iteration ends. Raises MsgException on kafka errors
        """
        if not loop:
            loop = self.loop
        if group_id is False:
            group_id = None
        elif group_id is None:
            group_id = self.group_id
        topic_list = topic if isinstance(topic, (list, tuple)) else (topic,)

        # A local reference is used for the cleanup, so that this call never stops the consumer
        # created by another concurrent aioread, and a failing constructor does not end up in
        # an AttributeError that would hide the real error
        consumer = None
        try:
            # NOTE(review): the "loop" argument looks deprecated in recent aiokafka releases --
            # confirm against the aiokafka version pinned by the project
            consumer = AIOKafkaConsumer(
                loop=loop,
                bootstrap_servers=self.broker,
                group_id=group_id,
                auto_offset_reset="earliest" if from_beginning else "latest",
            )
            self.consumer = consumer
            await consumer.start()
            consumer.subscribe(topic_list)

            async for message in consumer:
                content = (
                    message.topic,
                    self._load(message.key),
                    self._load(message.value),
                )
                if callback:
                    callback(*content, **kwargs)
                elif aiocallback:
                    await aiocallback(*content, **kwargs)
                else:
                    return content
        except KafkaError as e:
            raise MsgException(str(e)) from e
        finally:
            if consumer is not None:
                await consumer.stop()

    @staticmethod
    def _load(data):
        """
        Decode the yaml content of a kafka message key or value.
        :param data: raw key or value of the kafka message, or None when the message has none
        :return: the decoded python object; None if data is None
        """
        # yaml.safe_load needs a string, bytes or file-like object, so None is passed through
        if data is None:
            return None
        return yaml.safe_load(data)