blob: ebfca7e957a927e17acc3259896bf3ea9b6c3054 [file] [log] [blame]
tiernoc0e42e22018-05-11 11:36:10 +02001#!/usr/bin/python3
2# -*- coding: utf-8 -*-
3
tierno2e215512018-11-28 09:37:52 +00004##
5# Copyright 2018 Telefonica S.A.
6#
7# Licensed under the Apache License, Version 2.0 (the "License"); you may
8# not use this file except in compliance with the License. You may obtain
9# a copy of the License at
10#
11# http://www.apache.org/licenses/LICENSE-2.0
12#
13# Unless required by applicable law or agreed to in writing, software
14# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
15# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
16# License for the specific language governing permissions and limitations
17# under the License.
18##
19
quilesj7e13aeb2019-10-08 13:34:55 +020020
21# DEBUG WITH PDB
22import os
23import pdb
24
tiernoc0e42e22018-05-11 11:36:10 +020025import asyncio
26import yaml
tierno275411e2018-05-16 14:33:32 +020027import logging
28import logging.handlers
29import getopt
tierno275411e2018-05-16 14:33:32 +020030import sys
tierno59d22d22018-09-25 18:10:19 +020031
tiernob996d942020-07-03 14:52:28 +000032from osm_lcm import ns, prometheus, vim_sdn, netslice
tierno69f0d382020-05-07 13:08:09 +000033from osm_lcm.ng_ro import NgRoException, NgRoClient
34from osm_lcm.ROclient import ROClient, ROClientException
quilesj7e13aeb2019-10-08 13:34:55 +020035
tierno94f06112020-02-11 12:38:19 +000036from time import time
tierno8069ce52019-08-28 15:34:33 +000037from osm_lcm.lcm_utils import versiontuple, LcmException, TaskRegistry, LcmExceptionExit
tiernoa4dea5a2020-01-05 16:29:30 +000038from osm_lcm import version as lcm_version, version_date as lcm_version_date
tierno8069ce52019-08-28 15:34:33 +000039
bravof922c4172020-11-24 21:21:43 -030040from osm_common import msglocal, msgkafka
tierno98768132018-09-11 12:07:21 +020041from osm_common import version as common_version
tierno59d22d22018-09-25 18:10:19 +020042from osm_common.dbbase import DbException
tiernoc0e42e22018-05-11 11:36:10 +020043from osm_common.fsbase import FsException
44from osm_common.msgbase import MsgException
bravof922c4172020-11-24 21:21:43 -030045from osm_lcm.data_utils.database.database import Database
46from osm_lcm.data_utils.filesystem.filesystem import Filesystem
tierno275411e2018-05-16 14:33:32 +020047from os import environ, path
tierno16427352019-04-22 11:37:36 +000048from random import choice as random_choice
tierno59d22d22018-09-25 18:10:19 +020049from n2vc import version as n2vc_version
bravof922c4172020-11-24 21:21:43 -030050import traceback
tiernoc0e42e22018-05-11 11:36:10 +020051
# DEBUG WITH PDB: defining OSMLCM_PDB_DEBUG (with any value) stops at the debugger as soon as this module is loaded
if 'OSMLCM_PDB_DEBUG' in os.environ:
    pdb.set_trace()


__author__ = "Alfonso Tierno"

# minimum versions accepted for the components LCM works with
min_RO_version = "6.0.2"
min_n2vc_version = "0.0.2"
min_common_version = "0.1.19"

# file where the time of the last received ping is written
health_check_file = "{}/time_last_ping".format(path.expanduser("~"))  # TODO find better location for this file
tierno275411e2018-05-16 14:33:32 +020062
63
tiernoc0e42e22018-05-11 11:36:10 +020064class Lcm:
65
    ping_interval_pace = 120  # seconds between pings once it is confirmed that pings are being received back
    ping_interval_boot = 5  # seconds between pings while booting, until a ping is received back
    cfg_logger_name = {"message": "lcm.msg", "database": "lcm.db", "storage": "lcm.fs", "tsdb": "lcm.prometheus"}
    # ^ contains, for each section of lcm.cfg, the name of the logger that section uses
tiernoa9843d82018-10-24 10:44:20 +020070
tierno59d22d22018-09-25 18:10:19 +020071 def __init__(self, config_file, loop=None):
tiernoc0e42e22018-05-11 11:36:10 +020072 """
73 Init, Connect to database, filesystem storage, and messaging
74 :param config: two level dictionary with configuration. Top level should contain 'database', 'storage',
75 :return: None
76 """
tiernoc0e42e22018-05-11 11:36:10 +020077 self.db = None
78 self.msg = None
tierno16427352019-04-22 11:37:36 +000079 self.msg_admin = None
tiernoc0e42e22018-05-11 11:36:10 +020080 self.fs = None
81 self.pings_not_received = 1
tiernoc2564fe2019-01-28 16:18:56 +000082 self.consecutive_errors = 0
83 self.first_start = False
tiernoc0e42e22018-05-11 11:36:10 +020084
tiernoc0e42e22018-05-11 11:36:10 +020085 # logging
86 self.logger = logging.getLogger('lcm')
tierno16427352019-04-22 11:37:36 +000087 # get id
88 self.worker_id = self.get_process_id()
tiernoc0e42e22018-05-11 11:36:10 +020089 # load configuration
90 config = self.read_config_file(config_file)
91 self.config = config
tierno744303e2020-01-13 16:46:31 +000092 self.config["ro_config"] = {
tierno69f0d382020-05-07 13:08:09 +000093 "ng": config["RO"].get("ng", False),
94 "uri": config["RO"].get("uri"),
tierno750b2452018-05-17 16:39:29 +020095 "tenant": config.get("tenant", "osm"),
tierno69f0d382020-05-07 13:08:09 +000096 "logger_name": "lcm.roclient",
97 "loglevel": config["RO"].get("loglevel", "ERROR"),
tiernoc0e42e22018-05-11 11:36:10 +020098 }
tierno69f0d382020-05-07 13:08:09 +000099 if not self.config["ro_config"]["uri"]:
tierno2357f4e2020-10-19 16:38:59 +0000100 self.config["ro_config"]["uri"] = "http://{}:{}/".format(config["RO"]["host"], config["RO"]["port"])
101 elif "/ro" in self.config["ro_config"]["uri"][-4:] or "/openmano" in self.config["ro_config"]["uri"][-10:]:
102 # uri ends with '/ro', '/ro/', '/openmano', '/openmano/'
103 index = self.config["ro_config"]["uri"][-1].rfind("/")
104 self.config["ro_config"]["uri"] = self.config["ro_config"]["uri"][index+1]
tiernoc0e42e22018-05-11 11:36:10 +0200105
tierno59d22d22018-09-25 18:10:19 +0200106 self.loop = loop or asyncio.get_event_loop()
David Garciac1fe90a2021-03-31 19:12:02 +0200107 self.ns = self.netslice = self.vim = self.wim = self.sdn = self.k8scluster = self.vca = self.k8srepo = None
tiernoc0e42e22018-05-11 11:36:10 +0200108
109 # logging
110 log_format_simple = "%(asctime)s %(levelname)s %(name)s %(filename)s:%(lineno)s %(message)s"
111 log_formatter_simple = logging.Formatter(log_format_simple, datefmt='%Y-%m-%dT%H:%M:%S')
112 config["database"]["logger_name"] = "lcm.db"
113 config["storage"]["logger_name"] = "lcm.fs"
114 config["message"]["logger_name"] = "lcm.msg"
tierno86aa62f2018-08-20 11:57:04 +0000115 if config["global"].get("logfile"):
tiernoc0e42e22018-05-11 11:36:10 +0200116 file_handler = logging.handlers.RotatingFileHandler(config["global"]["logfile"],
117 maxBytes=100e6, backupCount=9, delay=0)
118 file_handler.setFormatter(log_formatter_simple)
119 self.logger.addHandler(file_handler)
tierno86aa62f2018-08-20 11:57:04 +0000120 if not config["global"].get("nologging"):
tiernoc0e42e22018-05-11 11:36:10 +0200121 str_handler = logging.StreamHandler()
122 str_handler.setFormatter(log_formatter_simple)
123 self.logger.addHandler(str_handler)
124
125 if config["global"].get("loglevel"):
126 self.logger.setLevel(config["global"]["loglevel"])
127
128 # logging other modules
tierno991e95d2020-07-21 12:41:25 +0000129 for k1, logname in self.cfg_logger_name.items():
tiernoc0e42e22018-05-11 11:36:10 +0200130 config[k1]["logger_name"] = logname
131 logger_module = logging.getLogger(logname)
tierno86aa62f2018-08-20 11:57:04 +0000132 if config[k1].get("logfile"):
tiernoc0e42e22018-05-11 11:36:10 +0200133 file_handler = logging.handlers.RotatingFileHandler(config[k1]["logfile"],
134 maxBytes=100e6, backupCount=9, delay=0)
135 file_handler.setFormatter(log_formatter_simple)
136 logger_module.addHandler(file_handler)
tierno86aa62f2018-08-20 11:57:04 +0000137 if config[k1].get("loglevel"):
tiernoc0e42e22018-05-11 11:36:10 +0200138 logger_module.setLevel(config[k1]["loglevel"])
tierno86aa62f2018-08-20 11:57:04 +0000139 self.logger.critical("starting osm/lcm version {} {}".format(lcm_version, lcm_version_date))
tierno59d22d22018-09-25 18:10:19 +0200140
tiernoc0e42e22018-05-11 11:36:10 +0200141 # check version of N2VC
142 # TODO enhance with int conversion or from distutils.version import LooseVersion
143 # or with list(map(int, version.split(".")))
tierno59d22d22018-09-25 18:10:19 +0200144 if versiontuple(n2vc_version) < versiontuple(min_n2vc_version):
tierno6e9d2eb2018-09-12 17:47:18 +0200145 raise LcmException("Not compatible osm/N2VC version '{}'. Needed '{}' or higher".format(
tierno59d22d22018-09-25 18:10:19 +0200146 n2vc_version, min_n2vc_version))
147 # check version of common
tierno27246d82018-09-27 15:59:09 +0200148 if versiontuple(common_version) < versiontuple(min_common_version):
tierno6e9d2eb2018-09-12 17:47:18 +0200149 raise LcmException("Not compatible osm/common version '{}'. Needed '{}' or higher".format(
150 common_version, min_common_version))
tierno22f4f9c2018-06-11 18:53:39 +0200151
tiernoc0e42e22018-05-11 11:36:10 +0200152 try:
bravof922c4172020-11-24 21:21:43 -0300153 self.db = Database(config).instance.db
tiernoc0e42e22018-05-11 11:36:10 +0200154
bravof922c4172020-11-24 21:21:43 -0300155 self.fs = Filesystem(config).instance.fs
tiernoc0e42e22018-05-11 11:36:10 +0200156
quilesj7e13aeb2019-10-08 13:34:55 +0200157 # copy message configuration in order to remove 'group_id' for msg_admin
tiernoc2564fe2019-01-28 16:18:56 +0000158 config_message = config["message"].copy()
159 config_message["loop"] = self.loop
160 if config_message["driver"] == "local":
tiernoc0e42e22018-05-11 11:36:10 +0200161 self.msg = msglocal.MsgLocal()
tiernoc2564fe2019-01-28 16:18:56 +0000162 self.msg.connect(config_message)
tierno16427352019-04-22 11:37:36 +0000163 self.msg_admin = msglocal.MsgLocal()
164 config_message.pop("group_id", None)
165 self.msg_admin.connect(config_message)
tiernoc2564fe2019-01-28 16:18:56 +0000166 elif config_message["driver"] == "kafka":
tiernoc0e42e22018-05-11 11:36:10 +0200167 self.msg = msgkafka.MsgKafka()
tiernoc2564fe2019-01-28 16:18:56 +0000168 self.msg.connect(config_message)
tierno16427352019-04-22 11:37:36 +0000169 self.msg_admin = msgkafka.MsgKafka()
170 config_message.pop("group_id", None)
171 self.msg_admin.connect(config_message)
tiernoc0e42e22018-05-11 11:36:10 +0200172 else:
173 raise LcmException("Invalid configuration param '{}' at '[message]':'driver'".format(
tiernoc2564fe2019-01-28 16:18:56 +0000174 config["message"]["driver"]))
tiernoc0e42e22018-05-11 11:36:10 +0200175 except (DbException, FsException, MsgException) as e:
176 self.logger.critical(str(e), exc_info=True)
177 raise LcmException(str(e))
178
kuused124bfe2019-06-18 12:09:24 +0200179 # contains created tasks/futures to be able to cancel
bravof922c4172020-11-24 21:21:43 -0300180 self.lcm_tasks = TaskRegistry(self.worker_id, self.logger)
kuused124bfe2019-06-18 12:09:24 +0200181
tierno991e95d2020-07-21 12:41:25 +0000182 if self.config.get("tsdb") and self.config["tsdb"].get("driver"):
183 if self.config["tsdb"]["driver"] == "prometheus":
bravof922c4172020-11-24 21:21:43 -0300184 self.prometheus = prometheus.Prometheus(self.config["tsdb"], self.worker_id, self.loop)
tierno991e95d2020-07-21 12:41:25 +0000185 else:
186 raise LcmException("Invalid configuration param '{}' at '[tsdb]':'driver'".format(
187 config["tsdb"]["driver"]))
tiernob996d942020-07-03 14:52:28 +0000188 else:
189 self.prometheus = None
tierno59d22d22018-09-25 18:10:19 +0200190
tierno22f4f9c2018-06-11 18:53:39 +0200191 async def check_RO_version(self):
tiernoe64f7fb2019-09-11 08:55:52 +0000192 tries = 14
193 last_error = None
194 while True:
tierno2357f4e2020-10-19 16:38:59 +0000195 ro_uri = self.config["ro_config"]["uri"]
tiernoe64f7fb2019-09-11 08:55:52 +0000196 try:
tierno2357f4e2020-10-19 16:38:59 +0000197 # try new RO, if fail old RO
198 try:
199 self.config["ro_config"]["uri"] = ro_uri + "ro"
tierno69f0d382020-05-07 13:08:09 +0000200 ro_server = NgRoClient(self.loop, **self.config["ro_config"])
tierno2357f4e2020-10-19 16:38:59 +0000201 ro_version = await ro_server.get_version()
202 self.config["ro_config"]["ng"] = True
203 except Exception:
204 self.config["ro_config"]["uri"] = ro_uri + "openmano"
tierno69f0d382020-05-07 13:08:09 +0000205 ro_server = ROClient(self.loop, **self.config["ro_config"])
tierno2357f4e2020-10-19 16:38:59 +0000206 ro_version = await ro_server.get_version()
207 self.config["ro_config"]["ng"] = False
tiernoe64f7fb2019-09-11 08:55:52 +0000208 if versiontuple(ro_version) < versiontuple(min_RO_version):
209 raise LcmException("Not compatible osm/RO version '{}'. Needed '{}' or higher".format(
210 ro_version, min_RO_version))
tierno2357f4e2020-10-19 16:38:59 +0000211 self.logger.info("Connected to RO version {} new-generation version {}".
212 format(ro_version, self.config["ro_config"]["ng"]))
tiernoe64f7fb2019-09-11 08:55:52 +0000213 return
tierno69f0d382020-05-07 13:08:09 +0000214 except (ROClientException, NgRoException) as e:
tierno2357f4e2020-10-19 16:38:59 +0000215 self.config["ro_config"]["uri"] = ro_uri
tiernoe64f7fb2019-09-11 08:55:52 +0000216 tries -= 1
bravof922c4172020-11-24 21:21:43 -0300217 traceback.print_tb(e.__traceback__)
tierno69f0d382020-05-07 13:08:09 +0000218 error_text = "Error while connecting to RO on {}: {}".format(self.config["ro_config"]["uri"], e)
tiernoe64f7fb2019-09-11 08:55:52 +0000219 if tries <= 0:
220 self.logger.critical(error_text)
221 raise LcmException(error_text)
222 if last_error != error_text:
223 last_error = error_text
224 self.logger.error(error_text + ". Waiting until {} seconds".format(5*tries))
225 await asyncio.sleep(5)
tierno22f4f9c2018-06-11 18:53:39 +0200226
tiernoc0e42e22018-05-11 11:36:10 +0200227 async def test(self, param=None):
228 self.logger.debug("Starting/Ending test task: {}".format(param))
229
tiernoc0e42e22018-05-11 11:36:10 +0200230 async def kafka_ping(self):
231 self.logger.debug("Task kafka_ping Enter")
232 consecutive_errors = 0
233 first_start = True
234 kafka_has_received = False
235 self.pings_not_received = 1
236 while True:
237 try:
tierno16427352019-04-22 11:37:36 +0000238 await self.msg_admin.aiowrite(
239 "admin", "ping",
240 {"from": "lcm", "to": "lcm", "worker_id": self.worker_id, "version": lcm_version},
241 self.loop)
tiernoc0e42e22018-05-11 11:36:10 +0200242 # time between pings are low when it is not received and at starting
tiernoa9843d82018-10-24 10:44:20 +0200243 wait_time = self.ping_interval_boot if not kafka_has_received else self.ping_interval_pace
tiernoc0e42e22018-05-11 11:36:10 +0200244 if not self.pings_not_received:
245 kafka_has_received = True
246 self.pings_not_received += 1
247 await asyncio.sleep(wait_time, loop=self.loop)
248 if self.pings_not_received > 10:
249 raise LcmException("It is not receiving pings from Kafka bus")
250 consecutive_errors = 0
251 first_start = False
252 except LcmException:
253 raise
254 except Exception as e:
255 # if not first_start is the first time after starting. So leave more time and wait
256 # to allow kafka starts
257 if consecutive_errors == 8 if not first_start else 30:
258 self.logger.error("Task kafka_read task exit error too many errors. Exception: {}".format(e))
259 raise
260 consecutive_errors += 1
261 self.logger.error("Task kafka_read retrying after Exception {}".format(e))
tierno16427352019-04-22 11:37:36 +0000262 wait_time = 2 if not first_start else 5
tiernoc0e42e22018-05-11 11:36:10 +0200263 await asyncio.sleep(wait_time, loop=self.loop)
264
    def kafka_read_callback(self, topic, command, params):
        """
        Process one message read from the bus. It is the callback that kafka_read() passes to aioread.
        Depending on topic and command it launches the proper task of ns, netslice, vim, wim, sdn, k8scluster,
        vca or k8srepo and registers it at self.lcm_tasks. A topic/command that is not handled is logged as
        critical.
        As a side effect self.consecutive_errors is set to 0 and self.first_start to False at every message.
        :param topic: topic of the message
        :param command: command (key) of the message
        :param params: content of the message. It is indexed as a dictionary for most commands; for the 'show'
            command of 'ns' and 'nsi' it is used directly as the _id to look for
        :return: None
        :raises LcmExceptionExit: when command is 'exit'
        """
        # order_id is a local variable incremented once below, so its value is 2 wherever it is used
        order_id = 1

        # NOTE(review): the message is logged only if topic is not 'admin' AND command is not 'ping'; maybe the
        # intention was to skip only the admin pings - confirm
        if topic != "admin" and command != "ping":
            self.logger.debug("Task kafka_read receives {} {}: {}".format(topic, command, params))
        self.consecutive_errors = 0
        self.first_start = False
        order_id += 1
        if command == "exit":
            raise LcmExceptionExit
        elif command.startswith("#"):
            return
        elif command == "echo":
            # just for test
            print(params)
            sys.stdout.flush()
            return
        elif command == "test":
            asyncio.Task(self.test(params), loop=self.loop)
            return

        if topic == "admin":
            if command == "ping" and params["to"] == "lcm" and params["from"] == "lcm":
                # pings written by other workers are ignored
                if params.get("worker_id") != self.worker_id:
                    return
                # own ping received: reset the counter that kafka_ping() increments at every ping sent
                self.pings_not_received = 0
                try:
                    with open(health_check_file, "w") as f:
                        f.write(str(time()))
                except Exception as e:
                    self.logger.error("Cannot write into '{}' for healthcheck: {}".format(health_check_file, e))
            return
        elif topic == "pla":
            if command == "placement":
                self.ns.update_nsrs_with_pla_result(params)
            return
        elif topic == "k8scluster":
            if command == "create" or command == "created":
                k8scluster_id = params.get("_id")
                task = asyncio.ensure_future(self.k8scluster.create(params, order_id))
                self.lcm_tasks.register("k8scluster", k8scluster_id, order_id, "k8scluster_create", task)
                return
            elif command == "delete" or command == "deleted":
                k8scluster_id = params.get("_id")
                task = asyncio.ensure_future(self.k8scluster.delete(params, order_id))
                self.lcm_tasks.register("k8scluster", k8scluster_id, order_id, "k8scluster_delete", task)
                return
        elif topic == "vca":
            if command == "create" or command == "created":
                vca_id = params.get("_id")
                task = asyncio.ensure_future(self.vca.create(params, order_id))
                self.lcm_tasks.register("vca", vca_id, order_id, "vca_create", task)
                return
            elif command == "delete" or command == "deleted":
                vca_id = params.get("_id")
                task = asyncio.ensure_future(self.vca.delete(params, order_id))
                self.lcm_tasks.register("vca", vca_id, order_id, "vca_delete", task)
                return
        elif topic == "k8srepo":
            if command == "create" or command == "created":
                k8srepo_id = params.get("_id")
                self.logger.debug("k8srepo_id = {}".format(k8srepo_id))
                task = asyncio.ensure_future(self.k8srepo.create(params, order_id))
                self.lcm_tasks.register("k8srepo", k8srepo_id, order_id, "k8srepo_create", task)
                return
            elif command == "delete" or command == "deleted":
                k8srepo_id = params.get("_id")
                task = asyncio.ensure_future(self.k8srepo.delete(params, order_id))
                self.lcm_tasks.register("k8srepo", k8srepo_id, order_id, "k8srepo_delete", task)
                return
        elif topic == "ns":
            if command == "instantiate":
                # self.logger.debug("Deploying NS {}".format(nsr_id))
                nslcmop = params
                nslcmop_id = nslcmop["_id"]
                nsr_id = nslcmop["nsInstanceId"]
                task = asyncio.ensure_future(self.ns.instantiate(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_instantiate", task)
                return
            elif command == "terminate":
                # self.logger.debug("Deleting NS {}".format(nsr_id))
                nslcmop = params
                nslcmop_id = nslcmop["_id"]
                nsr_id = nslcmop["nsInstanceId"]
                # cancel what is registered for this ns before launching the termination
                self.lcm_tasks.cancel(topic, nsr_id)
                task = asyncio.ensure_future(self.ns.terminate(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_terminate", task)
                return
            elif command == "vca_status_refresh":
                nslcmop = params
                nslcmop_id = nslcmop["_id"]
                nsr_id = nslcmop["nsInstanceId"]
                task = asyncio.ensure_future(self.ns.vca_status_refresh(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_vca_status_refresh", task)
                return
            elif command == "action":
                # self.logger.debug("Update NS {}".format(nsr_id))
                nslcmop = params
                nslcmop_id = nslcmop["_id"]
                nsr_id = nslcmop["nsInstanceId"]
                task = asyncio.ensure_future(self.ns.action(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_action", task)
                return
            elif command == "scale":
                # self.logger.debug("Update NS {}".format(nsr_id))
                nslcmop = params
                nslcmop_id = nslcmop["_id"]
                nsr_id = nslcmop["nsInstanceId"]
                task = asyncio.ensure_future(self.ns.scale(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_scale", task)
                return
            elif command == "show":
                nsr_id = params
                try:
                    db_nsr = self.db.get_one("nsrs", {"_id": nsr_id})
                    # NOTE(review): self.lcm_ns_tasks is not assigned anywhere in the visible code (__init__
                    # creates self.lcm_tasks). If it does not exist, the AttributeError is caught below and
                    # "not found" is printed even when the nsr exists - confirm
                    print("nsr:\n _id={}\n operational-status: {}\n config-status: {}"
                          "\n detailed-status: {}\n deploy: {}\n tasks: {}"
                          "".format(nsr_id, db_nsr["operational-status"], db_nsr["config-status"],
                                    db_nsr["detailed-status"],
                                    db_nsr["_admin"]["deployed"], self.lcm_ns_tasks.get(nsr_id)))
                except Exception as e:
                    print("nsr {} not found: {}".format(nsr_id, e))
                sys.stdout.flush()
                return
            elif command == "deleted":
                return  # TODO cleaning of task just in case should be done
            elif command in ("terminated", "instantiated", "scaled", "actioned"):  # "scaled-cooldown-time"
                return
        elif topic == "nsi":  # netslice LCM processes (instantiate, terminate, etc)
            if command == "instantiate":
                # self.logger.debug("Instantiating Network Slice {}".format(nsilcmop["netsliceInstanceId"]))
                nsilcmop = params
                nsilcmop_id = nsilcmop["_id"]  # slice operation id
                nsir_id = nsilcmop["netsliceInstanceId"]  # slice record id
                task = asyncio.ensure_future(self.netslice.instantiate(nsir_id, nsilcmop_id))
                self.lcm_tasks.register("nsi", nsir_id, nsilcmop_id, "nsi_instantiate", task)
                return
            elif command == "terminate":
                # self.logger.debug("Terminating Network Slice NS {}".format(nsilcmop["netsliceInstanceId"]))
                nsilcmop = params
                nsilcmop_id = nsilcmop["_id"]  # slice operation id
                nsir_id = nsilcmop["netsliceInstanceId"]  # slice record id
                # cancel what is registered for this slice before launching the termination
                self.lcm_tasks.cancel(topic, nsir_id)
                task = asyncio.ensure_future(self.netslice.terminate(nsir_id, nsilcmop_id))
                self.lcm_tasks.register("nsi", nsir_id, nsilcmop_id, "nsi_terminate", task)
                return
            elif command == "show":
                nsir_id = params
                try:
                    db_nsir = self.db.get_one("nsirs", {"_id": nsir_id})
                    # NOTE(review): self.lcm_netslice_tasks is not assigned anywhere in the visible code; same
                    # concern as with self.lcm_ns_tasks at the 'ns' 'show' command - confirm
                    print("nsir:\n _id={}\n operational-status: {}\n config-status: {}"
                          "\n detailed-status: {}\n deploy: {}\n tasks: {}"
                          "".format(nsir_id, db_nsir["operational-status"], db_nsir["config-status"],
                                    db_nsir["detailed-status"],
                                    db_nsir["_admin"]["deployed"], self.lcm_netslice_tasks.get(nsir_id)))
                except Exception as e:
                    print("nsir {} not found: {}".format(nsir_id, e))
                sys.stdout.flush()
                return
            elif command == "deleted":
                return  # TODO cleaning of task just in case should be done
            elif command in ("terminated", "instantiated", "scaled", "actioned"):  # "scaled-cooldown-time"
                return
        elif topic == "vim_account":
            vim_id = params["_id"]
            if command in ("create", "created"):
                # nothing is launched when RO is new generation ("ng")
                if not self.config["ro_config"].get("ng"):
                    task = asyncio.ensure_future(self.vim.create(params, order_id))
                    self.lcm_tasks.register("vim_account", vim_id, order_id, "vim_create", task)
                return
            elif command == "delete" or command == "deleted":
                self.lcm_tasks.cancel(topic, vim_id)
                task = asyncio.ensure_future(self.vim.delete(params, order_id))
                self.lcm_tasks.register("vim_account", vim_id, order_id, "vim_delete", task)
                return
            elif command == "show":
                print("not implemented show with vim_account")
                sys.stdout.flush()
                return
            elif command in ("edit", "edited"):
                # nothing is launched when RO is new generation ("ng")
                if not self.config["ro_config"].get("ng"):
                    task = asyncio.ensure_future(self.vim.edit(params, order_id))
                    self.lcm_tasks.register("vim_account", vim_id, order_id, "vim_edit", task)
                return
            # NOTE(review): unreachable, "deleted" is already handled by the 'delete' branch above
            elif command == "deleted":
                return  # TODO cleaning of task just in case should be done
        elif topic == "wim_account":
            wim_id = params["_id"]
            if command in ("create", "created"):
                # nothing is launched when RO is new generation ("ng")
                if not self.config["ro_config"].get("ng"):
                    task = asyncio.ensure_future(self.wim.create(params, order_id))
                    self.lcm_tasks.register("wim_account", wim_id, order_id, "wim_create", task)
                return
            elif command == "delete" or command == "deleted":
                self.lcm_tasks.cancel(topic, wim_id)
                task = asyncio.ensure_future(self.wim.delete(params, order_id))
                self.lcm_tasks.register("wim_account", wim_id, order_id, "wim_delete", task)
                return
            elif command == "show":
                print("not implemented show with wim_account")
                sys.stdout.flush()
                return
            elif command in ("edit", "edited"):
                task = asyncio.ensure_future(self.wim.edit(params, order_id))
                self.lcm_tasks.register("wim_account", wim_id, order_id, "wim_edit", task)
                return
            # NOTE(review): unreachable, "deleted" is already handled by the 'delete' branch above
            elif command == "deleted":
                return  # TODO cleaning of task just in case should be done
        elif topic == "sdn":
            _sdn_id = params["_id"]
            if command in ("create", "created"):
                # nothing is launched when RO is new generation ("ng")
                if not self.config["ro_config"].get("ng"):
                    task = asyncio.ensure_future(self.sdn.create(params, order_id))
                    self.lcm_tasks.register("sdn", _sdn_id, order_id, "sdn_create", task)
                return
            elif command == "delete" or command == "deleted":
                self.lcm_tasks.cancel(topic, _sdn_id)
                task = asyncio.ensure_future(self.sdn.delete(params, order_id))
                self.lcm_tasks.register("sdn", _sdn_id, order_id, "sdn_delete", task)
                return
            elif command in ("edit", "edited"):
                task = asyncio.ensure_future(self.sdn.edit(params, order_id))
                self.lcm_tasks.register("sdn", _sdn_id, order_id, "sdn_edit", task)
                return
            # NOTE(review): unreachable, "deleted" is already handled by the 'delete' branch above
            elif command == "deleted":
                return  # TODO cleaning of task just in case should be done
        # reached when no branch above has returned
        self.logger.critical("unknown topic {} and command '{}'".format(topic, command))
492
tiernoc0e42e22018-05-11 11:36:10 +0200493 async def kafka_read(self):
tierno16427352019-04-22 11:37:36 +0000494 self.logger.debug("Task kafka_read Enter with worker_id={}".format(self.worker_id))
tiernoc0e42e22018-05-11 11:36:10 +0200495 # future = asyncio.Future()
gcalvinoed7f6d42018-12-14 14:44:56 +0100496 self.consecutive_errors = 0
497 self.first_start = True
498 while self.consecutive_errors < 10:
tiernoc0e42e22018-05-11 11:36:10 +0200499 try:
David Garciac1fe90a2021-03-31 19:12:02 +0200500 topics = ("ns", "vim_account", "wim_account", "sdn", "nsi", "k8scluster", "vca", "k8srepo", "pla")
tierno16427352019-04-22 11:37:36 +0000501 topics_admin = ("admin", )
502 await asyncio.gather(
tierno247439e2020-07-16 11:26:02 +0000503 self.msg.aioread(topics, self.loop, self.kafka_read_callback, from_beginning=True),
tierno16427352019-04-22 11:37:36 +0000504 self.msg_admin.aioread(topics_admin, self.loop, self.kafka_read_callback, group_id=False)
505 )
tiernoc0e42e22018-05-11 11:36:10 +0200506
gcalvinoed7f6d42018-12-14 14:44:56 +0100507 except LcmExceptionExit:
508 self.logger.debug("Bye!")
509 break
tiernoc0e42e22018-05-11 11:36:10 +0200510 except Exception as e:
511 # if not first_start is the first time after starting. So leave more time and wait
512 # to allow kafka starts
gcalvinoed7f6d42018-12-14 14:44:56 +0100513 if self.consecutive_errors == 8 if not self.first_start else 30:
tiernoc0e42e22018-05-11 11:36:10 +0200514 self.logger.error("Task kafka_read task exit error too many errors. Exception: {}".format(e))
515 raise
gcalvinoed7f6d42018-12-14 14:44:56 +0100516 self.consecutive_errors += 1
tiernoc0e42e22018-05-11 11:36:10 +0200517 self.logger.error("Task kafka_read retrying after Exception {}".format(e))
gcalvinoed7f6d42018-12-14 14:44:56 +0100518 wait_time = 2 if not self.first_start else 5
tiernoc0e42e22018-05-11 11:36:10 +0200519 await asyncio.sleep(wait_time, loop=self.loop)
520
521 # self.logger.debug("Task kafka_read terminating")
522 self.logger.debug("Task kafka_read exit")
523
524 def start(self):
tierno22f4f9c2018-06-11 18:53:39 +0200525
526 # check RO version
527 self.loop.run_until_complete(self.check_RO_version())
528
bravof922c4172020-11-24 21:21:43 -0300529 self.ns = ns.NsLcm(self.msg, self.lcm_tasks, self.config, self.loop, self.prometheus)
530 self.netslice = netslice.NetsliceLcm(self.msg, self.lcm_tasks, self.config, self.loop,
tierno2357f4e2020-10-19 16:38:59 +0000531 self.ns)
bravof922c4172020-11-24 21:21:43 -0300532 self.vim = vim_sdn.VimLcm(self.msg, self.lcm_tasks, self.config, self.loop)
533 self.wim = vim_sdn.WimLcm(self.msg, self.lcm_tasks, self.config, self.loop)
534 self.sdn = vim_sdn.SdnLcm(self.msg, self.lcm_tasks, self.config, self.loop)
535 self.k8scluster = vim_sdn.K8sClusterLcm(self.msg, self.lcm_tasks, self.config, self.loop)
David Garciac1fe90a2021-03-31 19:12:02 +0200536 self.vca = vim_sdn.VcaLcm(self.msg, self.lcm_tasks, self.config, self.loop)
bravof922c4172020-11-24 21:21:43 -0300537 self.k8srepo = vim_sdn.K8sRepoLcm(self.msg, self.lcm_tasks, self.config, self.loop)
tierno2357f4e2020-10-19 16:38:59 +0000538
tierno991e95d2020-07-21 12:41:25 +0000539 # configure tsdb prometheus
tiernob996d942020-07-03 14:52:28 +0000540 if self.prometheus:
541 self.loop.run_until_complete(self.prometheus.start())
542
tiernoc0e42e22018-05-11 11:36:10 +0200543 self.loop.run_until_complete(asyncio.gather(
544 self.kafka_read(),
545 self.kafka_ping()
546 ))
547 # TODO
548 # self.logger.debug("Terminating cancelling creation tasks")
tiernoca2e16a2018-06-29 15:25:24 +0200549 # self.lcm_tasks.cancel("ALL", "create")
tiernoc0e42e22018-05-11 11:36:10 +0200550 # timeout = 200
551 # while self.is_pending_tasks():
552 # self.logger.debug("Task kafka_read terminating. Waiting for tasks termination")
553 # await asyncio.sleep(2, loop=self.loop)
554 # timeout -= 2
555 # if not timeout:
tiernoca2e16a2018-06-29 15:25:24 +0200556 # self.lcm_tasks.cancel("ALL", "ALL")
tiernoc0e42e22018-05-11 11:36:10 +0200557 self.loop.close()
558 self.loop = None
559 if self.db:
560 self.db.db_disconnect()
561 if self.msg:
562 self.msg.disconnect()
tierno16427352019-04-22 11:37:36 +0000563 if self.msg_admin:
564 self.msg_admin.disconnect()
tiernoc0e42e22018-05-11 11:36:10 +0200565 if self.fs:
566 self.fs.fs_disconnect()
567
def read_config_file(self, config_file):
    """
    Load the configuration from a yaml file and overlay the OSMLCM_* environment variables on top of it.

    The sections "global", "timeout", "RO", "VCA", "database", "storage" and "message" are always present in
    the result; a section that is missing or empty in the file becomes an empty dictionary.
    An environment variable OSMLCM_<SUBJECT>_<ITEM> is stored at conf[subject][item]. Subject and item are
    lower-cased, except the subjects "ro" and "vca", which are upper-cased. The value is cast to int when the
    item is "port" or the subject is "timeout"; otherwise it is kept as a string.
    Legacy VCA keys written without underscores are renamed to their current names.

    On any error reading or processing the file a critical message is logged and the process exits with
    status 1.

    :param config_file: path of the yaml configuration file
    :return: dictionary with the resulting configuration
    """
    # TODO make a [ini] + yaml inside parser
    # the configparser library is not suitable, because it does not admit comments at the end of line,
    # and not parse integer or boolean
    try:
        # read file as yaml format
        with open(config_file) as f:
            # NOTE(review): yaml.Loader is able to build arbitrary python objects. It is kept to not change
            # which files are accepted; consider yaml.safe_load if the file can be written by untrusted users
            conf = yaml.load(f, Loader=yaml.Loader)
        # An empty file is loaded as None; report that (or any other non mapping content) explicitly
        # instead of failing later with an AttributeError
        if not isinstance(conf, dict):
            raise ValueError("content is empty or not a yaml mapping (got '{}')".format(type(conf).__name__))

        # Ensure all sections are not empty
        for k in ("global", "timeout", "RO", "VCA", "database", "storage", "message"):
            if not conf.get(k):
                conf[k] = {}

        # read all environ that starts with OSMLCM_
        for k, v in environ.items():
            if not k.startswith("OSMLCM_"):
                continue
            subject, _, item = k[7:].lower().partition("_")
            if not item:
                continue
            if subject in ("ro", "vca"):
                # put in capital letter
                subject = subject.upper()
            try:
                if item == "port" or subject == "timeout":
                    conf[subject][item] = int(v)
                else:
                    conf[subject][item] = v
            except Exception as e:
                # e.g. unknown section or a value that cannot be cast to int: ignore only this variable
                self.logger.warning("skipping environ '{}' on exception '{}'".format(k, e))

        # backward compatibility of VCA parameters: (legacy name, current name)
        vca_conf = conf["VCA"]
        for old_key, new_key in (
            ("pubkey", "public_key"),
            ("cacert", "ca_cert"),
            ("apiproxy", "api_proxy"),
            ("enableosupgrade", "enable_os_upgrade"),
            ("aptmirror", "apt_mirror"),
        ):
            if old_key in vca_conf:
                vca_conf[new_key] = vca_conf.pop(old_key)

        # 'enable_os_upgrade' arrives as text when it is provided by environ; convert it to boolean.
        # Any text different from 'true'/'false' is left untouched
        os_upgrade = vca_conf.get("enable_os_upgrade")
        if isinstance(os_upgrade, str):
            if os_upgrade.lower() == "false":
                vca_conf["enable_os_upgrade"] = False
            elif os_upgrade.lower() == "true":
                vca_conf["enable_os_upgrade"] = True

        return conf
    except Exception as e:
        self.logger.critical("At config file '{}': {}".format(config_file, e))
        # sys.exit instead of the 'exit' helper, which is only injected by the 'site' module
        sys.exit(1)
623
@staticmethod
def get_process_id():
    """
    Provide an identifier for this process.

    The first line of /proc/self/cgroup is read and the text after its last "/" (without the line feed,
    at most 12 characters) is used when it is not empty; when running inside docker this is expected to be
    the docker ID. If the file cannot be read, or that text is empty, 12 random hexadecimal digits are
    returned instead.
    :return: Obtained ID
    """
    try:
        with open("/proc/self/cgroup", "r") as cgroup_file:
            first_line = cgroup_file.readline()
        candidate = first_line.rpartition("/")[2].replace('\n', '')[:12]
        if candidate:
            return candidate
    except Exception:
        # best effort: any problem here just means that a random id is generated below
        pass
    # No usable id obtained from cgroup: build a random one
    hex_digits = [random_choice("0123456789abcdef") for _ in range(12)]
    return ''.join(hex_digits)
643
tiernoc0e42e22018-05-11 11:36:10 +0200644
def usage():
    """Print the command line help, using sys.argv[0] as the program name."""
    help_text = """Usage: {} [options]
        -c|--config [configuration_file]: loads the configuration file (default: ./lcm.cfg)
        --health-check: do not run lcm, but inspect kafka bus to determine if lcm is healthy
        -h|--help: shows this help
        """.format(sys.argv[0])
    print(help_text)
    # Options that are not available yet:
    # --log-socket-host HOST: send logs to this host")
    # --log-socket-port PORT: send logs using this port (default: 9022)")
tierno275411e2018-05-16 14:33:32 +0200653
654
if __name__ == '__main__':
    # Entry point: parse the command line, locate the configuration file and run the LCM.
    # Command line and LCM errors are printed to stderr and the process exits with status 1.

    try:
        # print("SYS.PATH='{}'".format(sys.path))
        # load parameters and configuration
        # -h
        # -c value
        # --config value
        # --help
        # --health-check
        opts, args = getopt.getopt(sys.argv[1:], "hc:", ["config=", "help", "health-check"])
        # TODO add "log-socket-host=", "log-socket-port=", "log-file="
        config_file = None
        for o, a in opts:
            if o in ("-h", "--help"):
                usage()
                sys.exit()
            elif o in ("-c", "--config"):
                config_file = a
            elif o == "--health-check":
                from osm_lcm.lcm_hc import health_check
                health_check(health_check_file, Lcm.ping_interval_pace)
            # elif o == "--log-socket-port":
            #     log_socket_port = a
            # elif o == "--log-socket-host":
            #     log_socket_host = a
            # elif o == "--log-file":
            #     log_file = a
            else:
                # An option accepted by getopt but not handled above. An exception is raised instead of
                # using 'assert', which is removed when python runs with -O; it is reported by the
                # handler at the end of this block
                raise getopt.GetoptError("Unhandled option '{}'".format(o), o)

        if config_file:
            if not path.isfile(config_file):
                print("configuration file '{}' does not exist".format(config_file), file=sys.stderr)
                sys.exit(1)
        else:
            # Look for the default locations: a '.cfg' file next to this script (same name), the current
            # folder and /etc/osm. splitext only removes a real extension of the file name
            for config_file in (path.splitext(__file__)[0] + ".cfg", "./lcm.cfg", "/etc/osm/lcm.cfg"):
                if path.isfile(config_file):
                    break
            else:
                print("No configuration file 'lcm.cfg' found neither at local folder nor at /etc/osm/", file=sys.stderr)
                sys.exit(1)
        lcm = Lcm(config_file)
        lcm.start()
    except (LcmException, getopt.GetoptError) as e:
        print(str(e), file=sys.stderr)
        # usage()
        sys.exit(1)