# blob: aecac77beab97d3afae6a7b15600c58ee80b0c92 [file] [log] [blame]
#!/usr/bin/python3
# -*- coding: utf-8 -*-
import asyncio
import logging
import logging.handlers
import traceback
import ns
from lcm_utils import LcmException, LcmBase
from osm_common.dbbase import DbException
from time import time
__author__ = "Felipe Vicens, Pol Alemany, Alfonso Tierno"
class NetsliceLcm(LcmBase):
    """
    Life-cycle operations (instantiate / terminate) for network slice instances.

    A slice operation record ("nsilcmops") lists, in operationParams["nslcmops_ids"], the network service
    operations that compose it. Each of them is launched as an asyncio task through ns.NsLcm and the
    "nslcmops" records are then polled until all of them reach a final state.
    """

    # operationState values of an nslcmop that are treated as "this NS operation has finished"
    # TODO: (future improvement) other possible status: ROLLING_BACK,ROLLED_BACK
    _NS_FINAL_STATES = ("COMPLETED", "PARTIALLY_COMPLETED", "FAILED", "FAILED_TEMP")
    # Seconds to wait for previously registered related tasks of the same slice
    _RELATED_TASKS_TIMEOUT = 3600
    # Seconds to wait for all the NS operations of the slice (two hours)
    _NS_OPERATIONS_TIMEOUT = 2 * 3600
    # Seconds between two consecutive polls of the nslcmops records
    _POLL_INTERVAL = 5

    def __init__(self, db, msg, fs, lcm_tasks, ro_config, vca_config, loop):
        """
        Store the collaborators and build the NS life-cycle manager used for the slice's network services.
        :param db: database connector (get_one is used here); also handed to ns.NsLcm and LcmBase
        :param msg: messaging connector (aiowrite is used here); also handed to ns.NsLcm and LcmBase
        :param fs: storage connector; not used directly here, only handed to ns.NsLcm and LcmBase
        :param lcm_tasks: task registry (lookfor_related, register and remove are used here)
        :param ro_config: forwarded untouched to ns.NsLcm
        :param vca_config: forwarded untouched to ns.NsLcm
        :param loop: asyncio event loop; stored in self.loop and forwarded to ns.NsLcm
        :return: None
        """
        # logging
        self.logger = logging.getLogger('lcm.netslice')
        self.loop = loop
        self.lcm_tasks = lcm_tasks
        self.ns = ns.NsLcm(db, msg, fs, lcm_tasks, ro_config, vca_config, loop)

        super().__init__(db, msg, fs, self.logger)

    # TODO: check logging_text within the self.logger.info/debug

    async def _wait_ns_operations(self, nsir_id, nslcmop_ids, nsir_admin, db_nsir_update, status_prefix):
        """
        Poll the "nslcmops" records until every one is in a final state or the timeout expires.
        Every time the per-NS status list changes it is stored in nsir_admin["nsrs-detailed-list"] and the
        whole nsir_admin is written to the "nsis" record under "_admin".
        :param nsir_id: _id of the slice instance record to update
        :param nslcmop_ids: iterable with the _id of every NS operation to watch
        :param nsir_admin: "_admin" content of the slice record; modified in place
        :param db_nsir_update: pending update dictionary for the slice record; "_admin" is added to it
        :param status_prefix: text placed before each NS detailed-status in the stored list
        :return: the last per-NS status list if all operations finished, None if the timeout expired
        :raises: whatever self.db.get_one / self.update_db_2 raise; KeyError if an nslcmop lacks
                 "nsInstanceId" or "operationState"
        """
        # TODO: (future improvement) look another way check the tasks instead of keep asking
        # -> https://docs.python.org/3/library/asyncio-task.html#waiting-primitives
        remaining = self._NS_OPERATIONS_TIMEOUT
        previous_list = None
        while remaining > 0:
            all_finished = True
            nsrs_detailed_list = []
            for nslcmop_id in nslcmop_ids:
                nslcmop = self.db.get_one("nslcmops", {"_id": nslcmop_id})
                entry = {
                    "nsrId": nslcmop["nsInstanceId"],
                    "status": nslcmop["operationState"],
                    "detailed-status": status_prefix + "; {}".format(nslcmop.get("detailed-status")),
                }
                nsrs_detailed_list.append(entry)
                if entry["status"] not in self._NS_FINAL_STATES:
                    all_finished = False

            # Write to the database only when something changed since the previous poll
            if nsrs_detailed_list != previous_list:
                nsir_admin["nsrs-detailed-list"] = nsrs_detailed_list
                previous_list = nsrs_detailed_list
                db_nsir_update["_admin"] = nsir_admin
                self.update_db_2("nsis", nsir_id, db_nsir_update)

            if all_finished:
                return nsrs_detailed_list

            # No explicit loop argument: it was removed from asyncio.sleep in Python 3.10 and the running
            # loop is the one used anyway
            await asyncio.sleep(self._POLL_INTERVAL)
            remaining -= self._POLL_INTERVAL
        return None

    async def instantiate(self, nsir_id, nsilcmop_id):
        """
        Instantiate a network slice: launch the instantiation of every NS of the slice and wait for them.
        Errors are not propagated to the caller; they are logged and stored in the "nsis" and "nsilcmops"
        records. At the end a "nsi"/"instantiated" message is written when an operation state was reached,
        and the task is removed from the task registry.
        :param nsir_id: _id of the slice instance record ("nsis")
        :param nsilcmop_id: _id of the slice operation record ("nsilcmops")
        :return: None
        """
        logging_text = "Task netslice={} instantiate={} ".format(nsir_id, nsilcmop_id)
        self.logger.debug(logging_text + "Enter")
        # get all needed from database
        exc = None
        db_nsir = None
        db_nsilcmop = None
        db_nsir_update = {"_admin.nsilcmop": nsilcmop_id}
        db_nsilcmop_update = {}
        nsilcmop_operation_state = None
        try:
            # 'step' always describes what is being done; it is used in the error messages below
            step = "Getting nsir={} from db".format(nsir_id)
            db_nsir = self.db.get_one("nsis", {"_id": nsir_id})
            step = "Getting nsilcmop={} from db".format(nsilcmop_id)
            db_nsilcmop = self.db.get_one("nsilcmops", {"_id": nsilcmop_id})

            # look if previous tasks is in process
            task_name, task_dependency = self.lcm_tasks.lookfor_related("nsi", nsir_id, nsilcmop_id)
            if task_dependency:
                step = db_nsilcmop_update["detailed-status"] = \
                    "Waiting for related tasks to be completed: {}".format(task_name)
                self.logger.debug(logging_text + step)
                self.update_db_2("nsilcmops", nsilcmop_id, db_nsilcmop_update)
                _, pending = await asyncio.wait(task_dependency, timeout=self._RELATED_TASKS_TIMEOUT)
                if pending:
                    raise LcmException("Timeout waiting related tasks to be completed")

            # Empty list to keep track of network service records status in the netslice
            nsir_admin = db_nsir["_admin"]
            nsir_admin["nsrs-detailed-list"] = []

            # Slice status Creating
            db_nsir_update["detailed-status"] = "creating"
            db_nsir_update["operational-status"] = "init"
            self.update_db_2("nsis", nsir_id, db_nsir_update)

            # Iterate over the network services operation ids to instantiate NSs
            nslcmop_ids = db_nsilcmop["operationParams"].get("nslcmops_ids")
            for nslcmop_id in nslcmop_ids:
                nslcmop = self.db.get_one("nslcmops", {"_id": nslcmop_id})
                nsr_id = nslcmop.get("nsInstanceId")
                # Report the operation id, not the whole operation document
                step = "Launching ns={} instantiate={} task".format(nsr_id, nslcmop_id)
                task = asyncio.ensure_future(self.ns.instantiate(nsr_id, nslcmop_id))
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_instantiate", task)

            # Wait until Network Slice is ready
            step = nsir_status_detailed = " Waiting nsi ready. nsi_id={}".format(nsir_id)
            self.logger.debug(logging_text + step)
            nsrs_detailed_list = await self._wait_ns_operations(nsir_id, nslcmop_ids, nsir_admin,
                                                                db_nsir_update, nsir_status_detailed)
            if nsrs_detailed_list is None:
                raise LcmException("Timeout waiting nsi to be ready. nsi_id={}".format(nsir_id))

            step = "Network Slice Instance is ready. nsi_id={}".format(nsir_id)
            # Only the exact "FAILED" state aborts; "FAILED_TEMP" and "PARTIALLY_COMPLETED" do not
            if any(item["status"] == "FAILED" for item in nsrs_detailed_list):
                raise LcmException("Error deploying NSI: {}".format(nsir_id))

            db_nsir_update["operational-status"] = "running"
            db_nsir_update["detailed-status"] = "done"
            db_nsir_update["config-status"] = "configured"
            db_nsilcmop_update["operationState"] = nsilcmop_operation_state = "COMPLETED"
            db_nsilcmop_update["statusEnteredTime"] = time()
            db_nsilcmop_update["detailed-status"] = "done"

        except (LcmException, DbException) as e:
            self.logger.error(logging_text + "Exit Exception while '{}': {}".format(step, e))
            exc = e
        except asyncio.CancelledError:
            # The cancellation is recorded as a failure and not re-raised
            self.logger.error(logging_text + "Cancelled Exception while '{}'".format(step))
            exc = "Operation was cancelled"
        except Exception as e:
            exc = traceback.format_exc()
            self.logger.critical(logging_text + "Exit Exception {} while '{}': {}".format(type(e).__name__, step, e),
                                 exc_info=True)
        finally:
            if exc:
                if db_nsir:
                    db_nsir_update["detailed-status"] = "ERROR {}: {}".format(step, exc)
                    db_nsir_update["operational-status"] = "failed"
                if db_nsilcmop:
                    db_nsilcmop_update["detailed-status"] = "FAILED {}: {}".format(step, exc)
                    db_nsilcmop_update["operationState"] = nsilcmop_operation_state = "FAILED"
                    db_nsilcmop_update["statusEnteredTime"] = time()
            if db_nsir:
                # NOTE(review): nsiState is set to INSTANTIATED also when the operation failed
                db_nsir_update["_admin.nsiState"] = "INSTANTIATED"
                db_nsir_update["_admin.nsilcmop"] = None
                self.update_db_2("nsis", nsir_id, db_nsir_update)
            if db_nsilcmop:
                self.update_db_2("nsilcmops", nsilcmop_id, db_nsilcmop_update)
            if nsilcmop_operation_state:
                # Best effort notification: a failure here is only logged
                try:
                    await self.msg.aiowrite("nsi", "instantiated", {"nsir_id": nsir_id, "nsilcmop_id": nsilcmop_id,
                                                                    "operationState": nsilcmop_operation_state})
                except Exception as e:
                    self.logger.error(logging_text + "kafka_write notification Exception {}".format(e))
            self.logger.debug(logging_text + "Exit")
            self.lcm_tasks.remove("nsi", nsir_id, nsilcmop_id, "nsi_instantiate")

    async def terminate(self, nsir_id, nsilcmop_id):
        """
        Terminate a network slice: launch the termination of every NS of the slice and wait for them.
        Errors are not propagated to the caller; they are logged and stored in the "nsis" and "nsilcmops"
        records. At the end a "nsi"/"terminated" message is written when an operation state was reached,
        and the task is removed from the task registry.
        :param nsir_id: _id of the slice instance record ("nsis")
        :param nsilcmop_id: _id of the slice operation record ("nsilcmops")
        :return: None
        """
        logging_text = "Task nsi={} terminate={} ".format(nsir_id, nsilcmop_id)
        self.logger.debug(logging_text + "Enter")
        exc = None
        db_nsir = None
        db_nsilcmop = None
        db_nsir_update = {"_admin.nsilcmop": nsilcmop_id}
        db_nsilcmop_update = {}
        nsilcmop_operation_state = None
        try:
            # 'step' always describes what is being done; it is used in the error messages below
            step = "Getting nsir={} from db".format(nsir_id)
            db_nsir = self.db.get_one("nsis", {"_id": nsir_id})
            step = "Getting nsilcmop={} from db".format(nsilcmop_id)
            db_nsilcmop = self.db.get_one("nsilcmops", {"_id": nsilcmop_id})

            # TODO: Check if makes sense check the nsiState=NOT_INSTANTIATED when terminate
            # CASE: Instance was terminated but there is a second request to terminate the instance
            if db_nsir["_admin"]["nsiState"] == "NOT_INSTANTIATED":
                # The finally block still runs: the slice record is updated, but no message is sent
                # because no operation state has been set
                return

            # Slice status Terminating
            db_nsir_update["operational-status"] = "terminating"
            db_nsir_update["config-status"] = "terminating"
            self.update_db_2("nsis", nsir_id, db_nsir_update)

            # look if previous tasks is in process
            task_name, task_dependency = self.lcm_tasks.lookfor_related("nsi", nsir_id, nsilcmop_id)
            if task_dependency:
                step = db_nsilcmop_update["detailed-status"] = \
                    "Waiting for related tasks to be completed: {}".format(task_name)
                self.logger.debug(logging_text + step)
                self.update_db_2("nsilcmops", nsilcmop_id, db_nsilcmop_update)
                _, pending = await asyncio.wait(task_dependency, timeout=self._RELATED_TASKS_TIMEOUT)
                if pending:
                    raise LcmException("Timeout waiting related tasks to be completed")

            # Gets the list to keep track of network service records status in the netslice
            nsir_admin = db_nsir["_admin"]

            # Iterate over the network services operation ids to terminate NSs
            nslcmop_ids = db_nsilcmop["operationParams"].get("nslcmops_ids")
            for nslcmop_id in nslcmop_ids:
                nslcmop = self.db.get_one("nslcmops", {"_id": nslcmop_id})
                nsr_id = nslcmop["operationParams"].get("nsInstanceId")
                task = asyncio.ensure_future(self.ns.terminate(nsr_id, nslcmop_id))
                # Registered under the terminate label; the original reused "ns_instantiate" here, which
                # looks like a copy-paste slip. Presumably ns.terminate removes itself as "ns_terminate"
                # - TODO confirm against ns.py
                self.lcm_tasks.register("ns", nsr_id, nslcmop_id, "ns_terminate", task)

            # Wait until Network Slice is terminated
            step = nsir_status_detailed = " Waiting nsi terminated. nsi_id={}".format(nsir_id)
            self.logger.debug(logging_text + step)
            nsrs_detailed_list = await self._wait_ns_operations(nsir_id, nslcmop_ids, nsir_admin,
                                                                db_nsir_update, nsir_status_detailed)
            if nsrs_detailed_list is None:
                raise LcmException("Timeout waiting nsi to be terminated. nsi_id={}".format(nsir_id))

            step = "Network Slice Instance is terminated. nsi_id={}".format(nsir_id)
            # Only the exact "FAILED" state aborts; "FAILED_TEMP" and "PARTIALLY_COMPLETED" do not
            if any(item["status"] == "FAILED" for item in nsrs_detailed_list):
                raise LcmException("Error terminating NSI: {}".format(nsir_id))

            db_nsir_update["operational-status"] = "terminated"
            db_nsir_update["config-status"] = "configured"
            db_nsir_update["detailed-status"] = "done"
            db_nsilcmop_update["operationState"] = nsilcmop_operation_state = "COMPLETED"
            db_nsilcmop_update["statusEnteredTime"] = time()
            db_nsilcmop_update["detailed-status"] = "done"

        except (LcmException, DbException) as e:
            self.logger.error(logging_text + "Exit Exception while '{}': {}".format(step, e))
            exc = e
        except asyncio.CancelledError:
            # The cancellation is recorded as a failure and not re-raised
            self.logger.error(logging_text + "Cancelled Exception while '{}'".format(step))
            exc = "Operation was cancelled"
        except Exception as e:
            exc = traceback.format_exc()
            self.logger.critical(logging_text + "Exit Exception {} while '{}': {}".format(type(e).__name__, step, e),
                                 exc_info=True)
        finally:
            if exc:
                if db_nsir:
                    db_nsir_update["detailed-status"] = "ERROR {}: {}".format(step, exc)
                    db_nsir_update["operational-status"] = "failed"
                if db_nsilcmop:
                    db_nsilcmop_update["detailed-status"] = "FAILED {}: {}".format(step, exc)
                    db_nsilcmop_update["operationState"] = nsilcmop_operation_state = "FAILED"
                    db_nsilcmop_update["statusEnteredTime"] = time()
            if db_nsir:
                # NOTE(review): nsiState is set to TERMINATED also when the operation failed
                db_nsir_update["_admin.nsilcmop"] = None
                db_nsir_update["_admin.nsiState"] = "TERMINATED"
                self.update_db_2("nsis", nsir_id, db_nsir_update)
            if db_nsilcmop:
                self.update_db_2("nsilcmops", nsilcmop_id, db_nsilcmop_update)
            if nsilcmop_operation_state:
                # Best effort notification: a failure here is only logged
                try:
                    await self.msg.aiowrite("nsi", "terminated", {"nsir_id": nsir_id, "nsilcmop_id": nsilcmop_id,
                                                                  "operationState": nsilcmop_operation_state})
                except Exception as e:
                    self.logger.error(logging_text + "kafka_write notification Exception {}".format(e))
            self.logger.debug(logging_text + "Exit")
            self.lcm_tasks.remove("nsi", nsir_id, nsilcmop_id, "nsi_terminate")