blob: b4e6887d4e14518d3ad476d326d1b1877fa1c526 [file] [log] [blame]
# -*- coding: utf-8 -*-

##
# Copyright 2018 Telefonica S.A.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
#         http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
##
tierno59d22d22018-09-25 18:10:19 +020018
kuused124bfe2019-06-18 12:09:24 +020019import asyncio
tierno59d22d22018-09-25 18:10:19 +020020from collections import OrderedDict
tierno79cd8ad2019-10-18 13:03:10 +000021from time import time
tiernobaa51102018-12-14 13:16:18 +000022# from osm_common.dbbase import DbException
tierno59d22d22018-09-25 18:10:19 +020023
24__author__ = "Alfonso Tierno"
25
26
class LcmException(Exception):
    """Root of the exception classes declared in this module; adds nothing to Exception."""
29
30
class LcmExceptionNoMgmtIP(LcmException):
    """
    LcmException subclass with no extra behaviour.
    NOTE(review): by its name it presumably reports a missing management IP; it is not raised in this module.
    """
33
34
class LcmExceptionExit(LcmException):
    """
    LcmException subclass with no extra behaviour.
    NOTE(review): by its name it presumably requests the LCM to exit; it is not raised in this module.
    """
37
38
def versiontuple(v):
    """
    Utility to compare dot separated versions. Every dot separated field is left-filled with zeros so that
    comparing the resulting tuples orders numeric fields properly.
    A package version looks like 4.0.1.post11+gb3f024d.dirty-1, where 4.0.1 is the git tag, postXX is the
    number of commits from this tag, and +XXXXXXX is the git commit short id. Within each field, anything
    from the first "+" or "-" onwards is discarded before padding.
    :param v: version string
    :return: tuple of strings, one per dot separated field, each zero-filled to a width of 20
    """
    def _normalize(field):
        # keep only what precedes the first "+", and from that what precedes the first "-"
        head = field.split("+", 1)[0]
        head = head.split("-", 1)[0]
        return head.zfill(20)

    return tuple(_normalize(field) for field in v.split("."))
50
51
# LcmBase must be defined before TaskRegistry, because TaskRegistry inherits from it.
class LcmBase:
    """Holds the db, msg, fs and logger handlers and offers a helper to update a database entry."""

    def __init__(self, db, msg, fs, logger):
        """
        Store the handlers received as attributes of the same name.
        :param db: database connection
        :param msg: stored as self.msg; not used by this class
        :param fs: stored as self.fs; not used by this class
        :param logger: stored as self.logger; not used by this class
        """
        self.logger = logger
        self.fs = fs
        self.msg = msg
        self.db = db

    def update_db_2(self, item, _id, _desc):
        """
        Updates database with _desc information. If success _desc is cleared
        :param item: first argument handed to self.db.set_one (the collection/table to update)
        :param _id: identifier of the entry; the query filter used is {"_id": _id}
        :param _desc: dictionary with the content to update. The key "_admin.modified" is added to it with
            the current time before writing. Nothing is done if it is empty or None
        :return: None. Exception is raised on error
        """
        if _desc:
            _desc["_admin.modified"] = time()
            # errors raised by set_one are not caught here, so _desc is only cleared on success
            self.db.set_one(item, {"_id": _id}, _desc)
            _desc.clear()
81
82
class TaskRegistry(LcmBase):
    """
    Implements a registry of tasks, needed for later cancellation, for looking up related tasks that must be
    completed before, etc. It stores a four level dict
        First level is the topic: ns, nsi, vim_account, wim_account, sdn, k8scluster, k8srepo
        Second level is the _id
        Third level is the operation id
        Fourth level is a descriptive name, the value is the task class

    The HA (High-Availability) methods are used when more than one LCM instance is running.
    To register the current task in the external DB, use LcmBase as base class, to be able
    to reuse LcmBase.update_db_2()
    The DB registry uses the following fields to distinguish a task:
    - op_type: operation type ("nslcmops" or "nsilcmops")
    - op_id:   operation ID
    - worker:  the worker ID for this process
    """

    # NS/NSI: "services"    VIM/WIM/SDN/K8S: "accounts"
    topic_service_list = ['ns', 'nsi']
    topic_account_list = ['vim', 'wim', 'sdn', 'k8scluster', 'k8srepo']

    # Map topic to InstanceID
    topic2instid_dict = {
        'ns': 'nsInstanceId',
        'nsi': 'netsliceInstanceId'}

    # Map topic to DB table name
    topic2dbtable_dict = {
        'ns': 'nslcmops',
        'nsi': 'nsilcmops',
        'vim': 'vim_accounts',
        'wim': 'wim_accounts',
        'sdn': 'sdns',
        'k8scluster': 'k8sclusters',
        'k8srepo': 'k8srepos'}

    def __init__(self, worker_id=None, db=None, logger=None):
        """
        Create an empty in-memory registry.
        LcmBase.__init__ is not invoked, so only self.db and self.logger (not self.msg nor self.fs) are set.
        :param worker_id: identifier written to the DB by lock_HA to mark an operation as owned by this process
        :param db: database connection used by the *_HA methods
        :param logger: logger used by the *_HA methods
        """
        self.task_registry = {
            "ns": {},
            "nsi": {},
            "vim_account": {},
            "wim_account": {},
            "sdn": {},
            "k8scluster": {},
            "k8srepo": {},
        }
        self.worker_id = worker_id
        self.db = db
        self.logger = logger

    def register(self, topic, _id, op_id, task_name, task):
        """
        Register a new task
        :param topic: Can be "ns", "nsi", "vim_account", "wim_account", "sdn", "k8scluster", "k8srepo"
        :param _id: _id of the related item
        :param op_id: id of the operation of the related item
        :param task_name: Task descriptive name, as create, instantiate, terminate. Must be unique in this op_id
        :param task: Task class
        :return: none
        """
        # operations are kept in an OrderedDict so that they can be walked from newest to oldest
        operations = self.task_registry[topic].setdefault(_id, OrderedDict())
        operations.setdefault(op_id, {})[task_name] = task

    def remove(self, topic, _id, op_id, task_name=None):
        """
        When task is ended, it should be removed. It ignores missing tasks. It also removes tasks done with this _id
        :param topic: Can be "ns", "nsi", "vim_account", "wim_account", "sdn", "k8scluster", "k8srepo"
        :param _id: _id of the related item
        :param op_id: id of the operation of the related item
        :param task_name: Task descriptive name. If none it deletes all tasks with same _id and op_id
        :return: None
        """
        operations = self.task_registry[topic].get(_id)
        if not operations:
            return
        if not task_name:
            operations.pop(op_id, None)
        elif operations.get(op_id):
            operations[op_id].pop(task_name, None)

        # delete every operation of this _id whose tasks are all done (this includes operations left empty)
        for op_id_ in list(operations):
            if all(task.done() for task in operations[op_id_].values()):
                del operations[op_id_]
        if not operations:
            del self.task_registry[topic][_id]

    def lookfor_related(self, topic, _id, my_op_id=None):
        """
        Look for the not finished tasks of the most recent operation registered for this _id.
        :param topic: Can be "ns", "nsi", "vim_account", "wim_account", "sdn", "k8scluster", "k8srepo"
        :param _id: _id of the related item
        :param my_op_id: if supplied, operations are skipped (newest first) until this one is found, and the
            operation registered just before it is the one inspected
        :return: tuple (comma separated task names, list of tasks). ("", []) if there is nothing pending
        """
        task_list = []
        task_name_list = []
        if _id not in self.task_registry[topic]:
            return "", task_list
        operations = self.task_registry[topic][_id]
        for op_id in reversed(operations):
            if my_op_id:
                if my_op_id == op_id:
                    my_op_id = None  # so that the next task is taken
                continue

            for task_name, task in operations[op_id].items():
                if not task.done():
                    task_list.append(task)
                    task_name_list.append(task_name)
            # only the closest previous operation is inspected
            break
        return ", ".join(task_name_list), task_list

    def cancel(self, topic, _id, target_op_id=None, target_task_name=None):
        """
        Cancel all active tasks of a concrete ns, nsi, vim_account, sdn identified for _id. If op_id is supplied only
        this is cancelled, and the same with task_name
        :param topic: Can be "ns", "nsi", "vim_account", "wim_account", "sdn", "k8scluster", "k8srepo"
        :param _id: _id of the related item
        :param target_op_id: if supplied, only tasks of this operation are cancelled
        :param target_task_name: if supplied, only tasks with this name are cancelled
        :return: None
        """
        operations = self.task_registry[topic].get(_id)
        if not operations:
            return
        for op_id in reversed(operations):
            if target_op_id and target_op_id != op_id:
                continue
            for task_name, task in operations[op_id].items():
                if target_task_name and target_task_name != task_name:
                    continue
                task.cancel()

    # Is topic NS/NSI?
    def _is_service_type_HA(self, topic):
        return topic in self.topic_service_list

    # Is topic VIM/WIM/SDN/K8SCLUSTER/K8SREPO?
    def _is_account_type_HA(self, topic):
        return topic in self.topic_account_list

    # Input: op_id, example: 'abc123def:3'   Output: account_id='abc123def', op_index='3' (kept as a string)
    # Returns (None, None) if op_id is empty, has no account part before the last ':' or the index is not digits
    def _get_account_and_op_HA(self, op_id):
        if not op_id:
            return (None, None)
        account_id, _, op_index = op_id.rpartition(':')
        if not account_id or not op_index.isdigit():
            return (None, None)
        return account_id, op_index

    # Get '_id' for any topic and operation. Returns None for an unknown topic
    def _get_instance_id_HA(self, topic, op_type, op_id):
        # Special operation 'ANY', for SDN account associated to a VIM account: op_id as '_id'
        # NS/NSI: Use op_id as '_id'
        if op_type == 'ANY' or self._is_service_type_HA(topic):
            return op_id
        # VIM/SDN/WIM/K8SCLUSTER: Split op_id to get Account ID and Operation Index, use Account ID as '_id'
        if self._is_account_type_HA(topic):
            account_id, _ = self._get_account_and_op_HA(op_id)
            return account_id
        return None

    # Set DB _filter for querying any related process state. Returns {} for an unknown topic
    def _get_waitfor_filter_HA(self, db_lcmop, topic, op_type, op_id):
        # Special operation 'ANY', for SDN account associated to a VIM account: op_id as '_id'
        # In this special case, the timestamp is ignored
        if op_type == 'ANY':
            return {'operationState': 'PROCESSING'}

        # Otherwise, get 'startTime' timestamp for this operation
        # NS/NSI
        if self._is_service_type_HA(topic):
            now = time()
            starttime_this_op = db_lcmop.get("startTime")
            instance_id_label = self.topic2instid_dict.get(topic)
            instance_id = db_lcmop.get(instance_id_label)
            return {instance_id_label: instance_id,
                    'operationState': 'PROCESSING',
                    'startTime.lt': starttime_this_op,
                    "_admin.modified.gt": now - 2*3600,  # ignore if two hours of inactivity
                    }
        # VIM/WIM/SDN/K8scluster
        if self._is_account_type_HA(topic):
            _, op_index = self._get_account_and_op_HA(op_id)
            _ops = db_lcmop['_admin']['operations']
            _this_op = _ops[int(op_index)]
            starttime_this_op = _this_op.get('startTime', None)
            return {'operationState': 'PROCESSING',
                    'startTime.lt': starttime_this_op}
        return {}

    # Get DB params (q_filter, update_dict) for any topic and operation.
    # Returns (None, None) for an account topic whose op_id cannot be split, and ({}, {}) for an unknown topic
    def _get_dbparams_for_lock_HA(self, topic, op_type, op_id):
        q_filter = {}
        update_dict = {}
        # NS/NSI
        if self._is_service_type_HA(topic):
            q_filter = {'_id': op_id, '_admin.worker': None}
            update_dict = {'_admin.worker': self.worker_id}
        # VIM/WIM/SDN
        elif self._is_account_type_HA(topic):
            account_id, op_index = self._get_account_and_op_HA(op_id)
            if not account_id:
                return None, None
            if op_type == 'create':
                # Creating a VIM/WIM/SDN account implies setting '_admin.current_operation' = 0
                op_index = 0
            q_filter = {'_id': account_id, "_admin.operations.{}.worker".format(op_index): None}
            update_dict = {'_admin.operations.{}.worker'.format(op_index): self.worker_id,
                           '_admin.current_operation': op_index}
        return q_filter, update_dict

    def lock_HA(self, topic, op_type, op_id):
        """
        Lock a task, if possible, to indicate to the HA system that
        the task will be executed in this LCM instance.
        :param topic: Can be "ns", "nsi", "vim", "wim", "sdn", "k8scluster" or "k8srepo"
        :param op_type: Operation type, can be "nslcmops", "nsilcmops", "create", "edit", "delete"
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return:
            True=lock was successful => execute the task (not registered by any other LCM instance)
            False=lock failed => do NOT execute the task (already registered by another LCM instance)

        HA tasks and backward compatibility:
        If topic is "account type" (VIM/WIM/SDN) and op_id is None, 'op_id' was not provided by NBI.
        This means that the running NBI instance does not support HA.
        In such a case this method should always return True, to always execute
        the task in this instance of LCM, without querying the DB.
        """

        # Backward compatibility for VIM/WIM/SDN/k8scluster without op_id
        if self._is_account_type_HA(topic) and op_id is None:
            return True

        # Try to lock this task: the update only applies while no worker is set for the operation
        db_table_name = self.topic2dbtable_dict.get(topic)
        q_filter, update_dict = self._get_dbparams_for_lock_HA(topic, op_type, op_id)
        # NOTE(review): for an account topic with a malformed op_id both values are None here and are handed
        # to set_one unchanged; confirm how the DB driver treats that case
        db_lock_task = self.db.set_one(db_table_name,
                                       q_filter=q_filter,
                                       update_dict=update_dict,
                                       fail_on_empty=False)
        # a None result is taken as "nothing matched the filter", i.e. a worker is already set
        if db_lock_task is None:
            self.logger.debug("Task {} operation={} already locked by another worker".format(topic, op_id))
            return False

        # Set 'detailed-status' to 'In progress' for VIM/WIM/SDN operations
        if self._is_account_type_HA(topic):
            detailed_status = 'In progress'
            account_id, op_index = self._get_account_and_op_HA(op_id)
            q_filter = {'_id': account_id}
            update_dict = {'_admin.operations.{}.detailed-status'.format(op_index): detailed_status}
            self.db.set_one(db_table_name,
                            q_filter=q_filter,
                            update_dict=update_dict,
                            fail_on_empty=False)
        return True

    def register_HA(self, topic, op_type, op_id, operationState, detailed_status):
        """
        Register a task, done when finished a VIM/WIM/SDN 'create' operation.
        :param topic: Can be "vim", "wim", "sdn", "k8scluster" or "k8srepo". Other topics are ignored
        :param op_type: Operation type, can be "create", "edit", "delete". Not used by this method
        :param op_id: Account ID + ':' + Operation Index. Nothing is done if it is None
        :param operationState: value stored at '_admin.operations.<index>.operationState'
        :param detailed_status: value stored at '_admin.operations.<index>.detailed-status'
        :return: nothing
        """

        # Backward compatibility
        if not self._is_account_type_HA(topic) or op_id is None:
            return

        # Get Account ID and Operation Index
        account_id, op_index = self._get_account_and_op_HA(op_id)
        db_table_name = self.topic2dbtable_dict.get(topic)

        # If this is a 'delete' operation, the account may have been deleted (SUCCESS) or may still exist (FAILED)
        # If the account exist, register the HA task (fail_on_empty=False is passed for the deleted case).
        # Update DB for HA tasks
        q_filter = {'_id': account_id}
        update_dict = {'_admin.operations.{}.operationState'.format(op_index): operationState,
                       '_admin.operations.{}.detailed-status'.format(op_index): detailed_status}
        self.db.set_one(db_table_name,
                        q_filter=q_filter,
                        update_dict=update_dict,
                        fail_on_empty=False)

    async def waitfor_related_HA(self, topic, op_type, op_id=None):
        """
        Wait for any pending related HA tasks
        Polls the DB every 10 seconds until no related operation is in 'PROCESSING' state.
        :param topic: Can be "ns", "nsi", "vim", "wim", "sdn", "k8scluster" or "k8srepo"
        :param op_type: Operation type; 'ANY' waits for every 'PROCESSING' operation, ignoring timestamps
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return: None. LcmException is raised if related tasks are still pending after about one hour
        """

        # Backward compatibility: nothing can be looked up without an op_id or for a topic with no DB table.
        # With op_id None the lookup below would use '_id': None, so returning here just saves that query.
        known_topic = self._is_service_type_HA(topic) or self._is_account_type_HA(topic)
        if not known_topic or op_id is None:
            return

        # Get DB table name
        db_table_name = self.topic2dbtable_dict.get(topic)

        # Get instance ID
        _id = self._get_instance_id_HA(topic, op_type, op_id)
        _filter = {"_id": _id}
        db_lcmop = self.db.get_one(db_table_name,
                                   _filter,
                                   fail_on_empty=False)
        if not db_lcmop:
            return

        # Set DB _filter for querying any related process state
        _filter = self._get_waitfor_filter_HA(db_lcmop, topic, op_type, op_id)

        # For HA, get list of tasks from DB instead of from dictionary (in-memory) variable.
        timeout_wait_for_task = 3600   # Max time (seconds) to wait for a related task to finish
        # A too long polling interval (e.g. 30) slows things down considerably
        interval_wait_for_task = 10    # Interval in seconds for polling related tasks
        time_left = timeout_wait_for_task
        old_num_related_tasks = 0
        while True:
            # Get related tasks (operations within the same instance as this) which are
            # still running (operationState='PROCESSING') and which were started before this task.
            # In the case of op_type='ANY', get any related tasks with operationState='PROCESSING', ignore timestamps.
            db_waitfor_related_task = self.db.get_list(db_table_name,
                                                       q_filter=_filter)
            new_num_related_tasks = len(db_waitfor_related_task)
            # If there are no related tasks, there is nothing to wait for, so return.
            if not new_num_related_tasks:
                return
            # If number of pending related tasks have changed,
            # update the 'detailed-status' field and log the change.
            # Do NOT update the 'detailed-status' for SDNC-associated-to-VIM operations ('ANY').
            if (op_type != 'ANY') and (new_num_related_tasks != old_num_related_tasks):
                step = "Waiting for {} related tasks to be completed.".format(new_num_related_tasks)
                update_dict = {}
                q_filter = {'_id': _id}
                # NS/NSI
                if self._is_service_type_HA(topic):
                    update_dict = {'detailed-status': step}
                # VIM/WIM/SDN
                elif self._is_account_type_HA(topic):
                    _, op_index = self._get_account_and_op_HA(op_id)
                    update_dict = {'_admin.operations.{}.detailed-status'.format(op_index): step}
                self.logger.debug("Task {} operation={} {}".format(topic, _id, step))
                self.db.set_one(db_table_name,
                                q_filter=q_filter,
                                update_dict=update_dict,
                                fail_on_empty=False)
                old_num_related_tasks = new_num_related_tasks
            time_left -= interval_wait_for_task
            if time_left < 0:
                raise LcmException(
                    "Timeout ({}) when waiting for related tasks to be completed".format(
                        timeout_wait_for_task))
            await asyncio.sleep(interval_wait_for_task)
439 return