# -*- coding: utf-8 -*-

##
# Copyright 2018 Telefonica S.A.
#
# Licensed under the Apache License, Version 2.0 (the "License"); you may
# not use this file except in compliance with the License. You may obtain
# a copy of the License at
#
#         http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
# WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
# License for the specific language governing permissions and limitations
# under the License.
##
import asyncio
from collections import OrderedDict
# from osm_common.dbbase import DbException
# Module author metadata.
__author__ = "Alfonso Tierno"
class LcmException(Exception):
    """Base class for the exceptions raised by the LCM module."""
class LcmExceptionNoMgmtIP(LcmException):
    """LcmException subclass; by its name, signals that no management IP is available."""
class LcmExceptionExit(LcmException):
    """LcmException subclass; by its name, used to request that LCM exits."""
# NOTE(review): the 'def' line of this helper was missing from the reviewed text; the name
# 'versiontuple' and the final 'return' are reconstructed -- confirm against the callers.
def versiontuple(v):
    """Utility to compare dot-separated versions. Fills with zeros for a proper number comparison.

    Package version will be something like 4.0.1.post11+gb3f024d.dirty-1, where 4.0.1 is the git tag,
    postXX is the number of commits from this tag, and +XXXXXXX is the git commit short id.

    Each dot-separated field is cut at the first "+" and then at the first "-", and the remainder is
    left-padded with zeros to 20 characters, so that comparing the resulting tuples orders numeric
    fields numerically.

    :param v: version string
    :return: tuple with one zero-padded string per dot-separated field
    """
    filled = []
    for point in v.split("."):
        # Drop the "+<commit id>" and "-<build>" suffixes before padding
        point, _, _ = point.partition("+")
        point, _, _ = point.partition("-")
        filled.append(point.zfill(20))
    return tuple(filled)
# LcmBase must be listed before TaskRegistry, as it is a dependency.
class LcmBase:
    """Base class that keeps the common handlers (database, message bus, file storage, logger)."""

    def __init__(self, db, msg, fs, logger):
        """
        Stores the handlers received as instance attributes.

        :param db: database connection
        :param msg: message handler (stored as-is)
        :param fs: file storage handler (stored as-is)
        :param logger: logger used by this object
        """
        self.db = db
        self.msg = msg
        self.fs = fs
        self.logger = logger

    def update_db_2(self, item, _id, _desc):
        """
        Updates database with _desc information. If success _desc is cleared

        :param item: name of the database table/collection to update
        :param _id: value of the "_id" field of the entry to update
        :param _desc: dictionary with the content to update. Keys are dot separated keys for
        :return: None. Exception is raised on error
        """
        # Nothing to write: avoid a useless database access
        if not _desc:
            return
        self.db.set_one(item, {"_id": _id}, _desc)
        # Only reached when set_one did not raise, so pending changes are not lost on error
        _desc.clear()
        # except DbException as e:
        #     self.logger.error("Updating {} _id={} with '{}'. Error: {}".format(item, _id, _desc, e))
class TaskRegistry(LcmBase):
    """
    Implements a registry of tasks needed for later cancellation, to look for related tasks that must be
    completed before, etc. It stores a four level dict
    First level is the topic, ns, vim_account, sdn
    Second level is the _id
    Third level is the operation id
    Fourth level is a descriptive name, the value is the task class

    The HA (High-Availability) methods are used when more than one LCM instance is running.
    To register the current task in the external DB, use LcmBase as base class, to be able
    to reuse LcmBase.update_db_2()
    The DB registry uses the following fields to distinguish a task:
    - op_type: operation type ("nslcmops" or "nsilcmops")
    - op_id:   operation ID
    - worker:  the worker ID for this process

    NOTE(review): several statements of this class (dictionary entries, 'return'/'continue' lines and
    the keyword arguments of the database calls) were missing from the reviewed text and have been
    reconstructed from the surrounding comments and docstrings -- confirm against the repository.
    """

    # NS/NSI: "services" VIM/WIM/SDN: "accounts"
    topic_service_list = ['ns', 'nsi']
    topic_account_list = ['vim', 'wim', 'sdn', 'k8scluster', 'k8srepo']

    # Map topic to InstanceID
    topic2instid_dict = {
        'ns': 'nsInstanceId',
        'nsi': 'netsliceInstanceId'}

    # Map topic to DB table name
    topic2dbtable_dict = {
        'ns': 'nslcmops',
        'nsi': 'nsilcmops',
        'vim': 'vim_accounts',
        'wim': 'wim_accounts',
        'sdn': 'sdns',
        'k8scluster': 'k8sclusters',
        'k8srepo': 'k8srepos'}

    def __init__(self, worker_id=None, db=None, logger=None):
        """
        :param worker_id: identifier of this LCM worker, written to the DB when locking HA tasks
        :param db: database connection
        :param logger: logger used by this object
        """
        # In-memory registry: topic -> _id -> op_id -> task_name -> task
        self.task_registry = {
            "ns": {},
            "nsi": {},
            "vim_account": {},
            "wim_account": {},
            "sdn": {},
            "k8scluster": {},
            "k8srepo": {},
        }
        self.worker_id = worker_id
        self.db = db
        self.logger = logger

    def register(self, topic, _id, op_id, task_name, task):
        """
        Register a new task
        :param topic: Can be "ns", "nsi", "vim_account", "sdn"
        :param _id: _id of the related item
        :param op_id: id of the operation of the related item
        :param task_name: Task descriptive name, as create, instantiate, terminate. Must be unique in this op_id
        :param task: Task class
        :return: none
        """
        # OrderedDict keeps the registration order of the operations, needed by lookfor_related/cancel
        operations = self.task_registry[topic].setdefault(_id, OrderedDict())
        operations.setdefault(op_id, {})[task_name] = task
        # print("registering task", topic, _id, op_id, task_name, task)

    def remove(self, topic, _id, op_id, task_name=None):
        """
        When task is ended, it should be removed. It ignores missing tasks. It also removes tasks done with this _id
        :param topic: Can be "ns", "nsi", "vim_account", "sdn"
        :param _id: _id of the related item
        :param op_id: id of the operation of the related item
        :param task_name: Task descriptive name. If none it deletes all tasks with same _id and op_id
        :return: None
        """
        operations = self.task_registry[topic].get(_id)
        if not operations:
            return
        if not task_name:
            operations.pop(op_id, None)
        elif operations.get(op_id):
            operations[op_id].pop(task_name, None)

        # delete done tasks: an operation is dropped once every one of its tasks is done
        for op_id_ in list(operations):
            if all(task.done() for task in operations[op_id_].values()):
                del operations[op_id_]
        if not operations:
            del self.task_registry[topic][_id]

    def lookfor_related(self, topic, _id, my_op_id=None):
        """
        Look for the pending tasks of the most recent operation registered for this _id. If my_op_id is
        provided, the operations registered after it, and my_op_id itself, are skipped, so that the
        operation registered just before it is the one taken.
        :param topic: Can be "ns", "nsi", "vim_account", "sdn"
        :param _id: _id of the related item
        :param my_op_id: id of the calling operation, or None
        :return: tuple (comma separated names of the pending tasks, list of the pending tasks)
        """
        task_list = []
        task_name_list = []
        if _id not in self.task_registry[topic]:
            return "", task_list
        for op_id in reversed(self.task_registry[topic][_id]):
            if my_op_id:
                if my_op_id == op_id:
                    my_op_id = None  # so that the next task is taken
                continue

            for task_name, task in self.task_registry[topic][_id][op_id].items():
                if not task.done():
                    task_list.append(task)
                    task_name_list.append(task_name)
            # Only the first operation that is not skipped is inspected
            break
        return ", ".join(task_name_list), task_list

    def cancel(self, topic, _id, target_op_id=None, target_task_name=None):
        """
        Cancel all active tasks of a concrete ns, nsi, vim_account, sdn identified for _id. If op_id is supplied only
        this is cancelled, and the same with task_name
        :param topic: Can be "ns", "nsi", "vim_account", "sdn"
        :param _id: _id of the related item
        :param target_op_id: if provided, only the tasks of this operation are cancelled
        :param target_task_name: if provided, only the tasks with this name are cancelled
        :return: None
        """
        if not self.task_registry[topic].get(_id):
            return
        for op_id in reversed(self.task_registry[topic][_id]):
            if target_op_id and target_op_id != op_id:
                continue
            for task_name, task in self.task_registry[topic][_id][op_id].items():
                if target_task_name and target_task_name != task_name:
                    continue
                # result =
                task.cancel()
                # if result:
                #     self.logger.debug("{} _id={} order_id={} task={} cancelled".format(topic, _id, op_id, task_name))

    # Is topic NS/NSI?
    def _is_service_type_HA(self, topic):
        """Return True if topic is one of the "service" topics (topic_service_list)."""
        return topic in self.topic_service_list

    # Is topic VIM/WIM/SDN?
    def _is_account_type_HA(self, topic):
        """Return True if topic is one of the "account" topics (topic_account_list)."""
        return topic in self.topic_account_list

    # Input: op_id, example: 'abc123def:3' Output: account_id='abc123def', op_index=3
    def _get_account_and_op_HA(self, op_id):
        """
        Split an account operation id into its account id and operation index.
        :param op_id: Account ID + ':' + Operation Index
        :return: tuple (account_id, op_index), both strings; (None, None) if op_id is empty, has no
            account part or its index is not a number
        """
        if not op_id:
            return (None, None)
        # Split at the last ':' so that an account id containing ':' is preserved
        account_id, _, op_index = op_id.rpartition(':')
        if not account_id:
            return (None, None)
        if not op_index.isdigit():
            return (None, None)
        return account_id, op_index

    # Get '_id' for any topic and operation
    def _get_instance_id_HA(self, topic, op_type, op_id):
        """
        :param topic: Can be "ns", "nsi", "vim", "wim", or "sdn"
        :param op_type: Operation type, or the special value 'ANY'
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return: the '_id' to look for in the database, or None if it cannot be obtained
        """
        _id = None
        # Special operation 'ANY', for SDN account associated to a VIM account: op_id as '_id'
        if op_type == 'ANY':
            _id = op_id
        # NS/NSI: Use op_id as '_id'
        elif self._is_service_type_HA(topic):
            _id = op_id
        # VIM/SDN/WIM/K8SCLUSTER: Split op_id to get Account ID and Operation Index, use Account ID as '_id'
        elif self._is_account_type_HA(topic):
            _id, _ = self._get_account_and_op_HA(op_id)
        return _id

    # Set DB _filter for querying any related process state
    def _get_waitfor_filter_HA(self, db_lcmop, topic, op_type, op_id):
        """
        :param db_lcmop: database content of the operation (NS/NSI) or of the account (VIM/WIM/SDN)
        :param topic: Can be "ns", "nsi", "vim", "wim", or "sdn"
        :param op_type: Operation type, or the special value 'ANY'
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return: dictionary with the database filter; empty if topic is neither service nor account type
        """
        _filter = {}
        # Special operation 'ANY', for SDN account associated to a VIM account: op_id as '_id'
        # In this special case, the timestamp is ignored
        if op_type == 'ANY':
            _filter = {'operationState': 'PROCESSING'}
        # Otherwise, get 'startTime' timestamp for this operation
        else:
            # NS/NSI
            if self._is_service_type_HA(topic):
                starttime_this_op = db_lcmop.get("startTime")
                instance_id_label = self.topic2instid_dict.get(topic)
                instance_id = db_lcmop.get(instance_id_label)
                _filter = {instance_id_label: instance_id,
                           'operationState': 'PROCESSING',
                           'startTime.lt': starttime_this_op}
            # VIM/WIM/SDN/K8scluster
            elif self._is_account_type_HA(topic):
                _, op_index = self._get_account_and_op_HA(op_id)
                _ops = db_lcmop['_admin']['operations']
                _this_op = _ops[int(op_index)]
                starttime_this_op = _this_op.get('startTime', None)
                _filter = {'operationState': 'PROCESSING',
                           'startTime.lt': starttime_this_op}
        return _filter

    # Get DB params for any topic and operation
    def _get_dbparams_for_lock_HA(self, topic, op_type, op_id):
        """
        :param topic: Can be "ns", "nsi", "vim", "wim", or "sdn"
        :param op_type: Operation type, can be "nslcmops", "nsilcmops", "create", "edit", "delete"
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return: tuple (q_filter, update_dict) to be used for locking the task in the database;
            (None, None) if topic is account type and op_id cannot be split
        """
        q_filter = {}
        update_dict = {}
        # NS/NSI
        if self._is_service_type_HA(topic):
            # Matches only while no worker has taken the operation
            q_filter = {'_id': op_id, '_admin.worker': None}
            update_dict = {'_admin.worker': self.worker_id}
        # VIM/WIM/SDN
        elif self._is_account_type_HA(topic):
            account_id, op_index = self._get_account_and_op_HA(op_id)
            if not account_id:
                return None, None
            if op_type == 'create':
                # Creating a VIM/WIM/SDN account implies setting '_admin.current_operation' = 0
                op_index = 0
            q_filter = {'_id': account_id, "_admin.operations.{}.worker".format(op_index): None}
            update_dict = {'_admin.operations.{}.worker'.format(op_index): self.worker_id,
                           '_admin.current_operation': op_index}
        return q_filter, update_dict

    def lock_HA(self, topic, op_type, op_id):
        """
        Lock a task, if possible, to indicate to the HA system that
        the task will be executed in this LCM instance.
        :param topic: Can be "ns", "nsi", "vim", "wim", or "sdn"
        :param op_type: Operation type, can be "nslcmops", "nsilcmops", "create", "edit", "delete"
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return:
        True=lock was successful => execute the task (not registered by any other LCM instance)
        False=lock failed => do NOT execute the task (already registered by another LCM instance)

        HA tasks and backward compatibility:
        If topic is "account type" (VIM/WIM/SDN) and op_id is None, 'op_id' was not provided by NBI.
        This means that the running NBI instance does not support HA.
        In such a case this method should always return True, to always execute
        the task in this instance of LCM, without querying the DB.
        """

        # Backward compatibility for VIM/WIM/SDN/k8scluster without op_id
        if self._is_account_type_HA(topic) and op_id is None:
            return True

        # Try to lock this task
        db_table_name = self.topic2dbtable_dict.get(topic)
        q_filter, update_dict = self._get_dbparams_for_lock_HA(topic, op_type, op_id)
        # NOTE(review): assumes set_one() returns None when no entry matches and fail_on_empty=False
        db_lock_task = self.db.set_one(db_table_name,
                                       q_filter=q_filter,
                                       update_dict=update_dict,
                                       fail_on_empty=False)
        if db_lock_task is None:
            self.logger.debug("Task {} operation={} already locked by another worker".format(topic, op_id))
            return False

        # Set 'detailed-status' to 'In progress' for VIM/WIM/SDN operations
        if self._is_account_type_HA(topic):
            detailed_status = 'In progress'
            account_id, op_index = self._get_account_and_op_HA(op_id)
            q_filter = {'_id': account_id}
            update_dict = {'_admin.operations.{}.detailed-status'.format(op_index): detailed_status}
            self.db.set_one(db_table_name,
                            q_filter=q_filter,
                            update_dict=update_dict,
                            fail_on_empty=False)
        return True

    def register_HA(self, topic, op_type, op_id, operationState, detailed_status):
        """
        Register a task, done when finished a VIM/WIM/SDN 'create' operation.
        :param topic: Can be "vim", "wim", or "sdn"
        :param op_type: Operation type, can be "create", "edit", "delete"
        :param op_id: Account ID + ':' + Operation Index
        :param operationState: value to store as 'operationState' of the operation
        :param detailed_status: value to store as 'detailed-status' of the operation
        :return: nothing
        """

        # Backward compatibility
        if not self._is_account_type_HA(topic) or (self._is_account_type_HA(topic) and op_id is None):
            return

        # Get Account ID and Operation Index
        account_id, op_index = self._get_account_and_op_HA(op_id)
        db_table_name = self.topic2dbtable_dict.get(topic)

        # If this is a 'delete' operation, the account may have been deleted (SUCCESS) or may still exist (FAILED)
        # If the account exist, register the HA task.
        # Update DB for HA tasks
        q_filter = {'_id': account_id}
        update_dict = {'_admin.operations.{}.operationState'.format(op_index): operationState,
                       '_admin.operations.{}.detailed-status'.format(op_index): detailed_status}
        # fail_on_empty=False: a missing account (already deleted) is not an error
        self.db.set_one(db_table_name,
                        q_filter=q_filter,
                        update_dict=update_dict,
                        fail_on_empty=False)

    async def waitfor_related_HA(self, topic, op_type, op_id=None):
        """
        Wait for any pending related HA tasks
        :param topic: Can be "ns", "nsi", "vim", "wim", or "sdn"
        :param op_type: Operation type, or the special value 'ANY'
        :param op_id: NS, NSI: Operation ID  VIM,WIM,SDN: Account ID + ':' + Operation Index
        :return: None. LcmException is raised if the related tasks do not finish before the timeout
        """

        # Backward compatibility
        if not (self._is_service_type_HA(topic) or self._is_account_type_HA(topic)) and (op_id is None):
            return

        # Get DB table name
        db_table_name = self.topic2dbtable_dict.get(topic)

        # Get instance ID
        _id = self._get_instance_id_HA(topic, op_type, op_id)
        _filter = {"_id": _id}
        db_lcmop = self.db.get_one(db_table_name,
                                   _filter,
                                   fail_on_empty=False)
        if not db_lcmop:
            return

        # Set DB _filter for querying any related process state
        _filter = self._get_waitfor_filter_HA(db_lcmop, topic, op_type, op_id)

        # For HA, get list of tasks from DB instead of from dictionary (in-memory) variable.
        timeout_wait_for_task = 3600   # Max time (seconds) to wait for a related task to finish
        # interval_wait_for_task = 30    #  A too long polling interval slows things down considerably
        interval_wait_for_task = 10       # Interval in seconds for polling related tasks
        time_left = timeout_wait_for_task
        old_num_related_tasks = 0
        while True:
            # Get related tasks (operations within the same instance as this) which are
            # still running (operationState='PROCESSING') and which were started before this task.
            # In the case of op_type='ANY', get any related tasks with operationState='PROCESSING', ignore timestamps.
            db_waitfor_related_task = self.db.get_list(db_table_name,
                                                       q_filter=_filter)
            new_num_related_tasks = len(db_waitfor_related_task)
            # If there are no related tasks, there is nothing to wait for, so return.
            if not new_num_related_tasks:
                return
            # If number of pending related tasks have changed,
            # update the 'detailed-status' field and log the change.
            # Do NOT update the 'detailed-status' for SDNC-associated-to-VIM operations ('ANY').
            if (op_type != 'ANY') and (new_num_related_tasks != old_num_related_tasks):
                step = "Waiting for {} related tasks to be completed.".format(new_num_related_tasks)
                update_dict = {}
                q_filter = {'_id': _id}
                # NS/NSI
                if self._is_service_type_HA(topic):
                    update_dict = {'detailed-status': step}
                # VIM/WIM/SDN
                elif self._is_account_type_HA(topic):
                    _, op_index = self._get_account_and_op_HA(op_id)
                    update_dict = {'_admin.operations.{}.detailed-status'.format(op_index): step}
                self.logger.debug("Task {} operation={} {}".format(topic, _id, step))
                self.db.set_one(db_table_name,
                                q_filter=q_filter,
                                update_dict=update_dict,
                                fail_on_empty=False)
                old_num_related_tasks = new_num_related_tasks
            time_left -= interval_wait_for_task
            if time_left < 0:
                raise LcmException(
                    "Timeout ({}) when waiting for related tasks to be completed".format(
                        timeout_wait_for_task))
            await asyncio.sleep(interval_wait_for_task)