2 # Copyright 2020 Telefonica Investigacion y Desarrollo, S.A.U.
4 # Licensed under the Apache License, Version 2.0 (the "License");
5 # you may not use this file except in compliance with the License.
6 # You may obtain a copy of the License at
8 # http://www.apache.org/licenses/LICENSE-2.0
10 # Unless required by applicable law or agreed to in writing, software
11 # distributed under the License is distributed on an "AS IS" BASIS,
12 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
14 # See the License for the specific language governing permissions and
15 # limitations under the License.
25 from grpclib
.client
import Channel
27 from osm_lcm
.frontend_pb2
import PrimitiveRequest
28 from osm_lcm
.frontend_pb2
import SshKeyRequest
, SshKeyReply
29 from osm_lcm
.frontend_grpc
import FrontendExecutorStub
30 from osm_lcm
.lcm_utils
import LcmBase
32 from osm_lcm
.data_utils
.database
.database
import Database
33 from osm_lcm
.data_utils
.filesystem
.filesystem
import Filesystem
35 from n2vc
.n2vc_conn
import N2VCConnector
36 from n2vc
.k8s_helm_conn
import K8sHelmConnector
37 from n2vc
.k8s_helm3_conn
import K8sHelm3Connector
38 from n2vc
.exceptions
import N2VCBadArgumentsException
, N2VCException
, N2VCExecutionException
40 from osm_lcm
.lcm_utils
import deep_get
def retryer(max_wait_time_var="_initial_retry_time", delay_time_var="_retry_delay"):
    """
    Build a decorator that retries a coroutine method while the connection is refused.

    The decorated coroutine is awaited again and again, sleeping between attempts,
    until it returns or the retry budget is used up. Only ConnectionRefusedError
    triggers a retry; any other exception is propagated immediately.

    :param str max_wait_time_var: name of the attribute, looked up in the ``__dict__``
        of the first positional argument, that holds the total retry budget in seconds
    :param str delay_time_var: name of the attribute that holds the pause between
        attempts in seconds; the same amount is subtracted from the budget on failure
    :returns: a decorator for ``async def`` methods
    :raises ConnectionRefusedError: by the decorated coroutine when the budget is
        exhausted without a successful call
    """
    def wrapper(func):
        retry_exceptions = (ConnectionRefusedError,)

        @functools.wraps(func)
        async def wrapped(*args, **kwargs):
            # default values for wait time and delay_time
            # NOTE(review): these two literals were not visible in the reviewed
            # excerpt - confirm them against the previous revision of the file.
            delay_time = 10
            max_wait_time = 300

            # obtain arguments from variable names; a missing or falsy attribute
            # keeps the default value
            self = args[0]
            if self.__dict__.get(max_wait_time_var):
                max_wait_time = self.__dict__.get(max_wait_time_var)
            if self.__dict__.get(delay_time_var):
                delay_time = self.__dict__.get(delay_time_var)

            wait_time = max_wait_time
            last_error = None
            while wait_time > 0:
                try:
                    return await func(*args, **kwargs)
                except retry_exceptions as e:
                    last_error = e
                    wait_time = wait_time - delay_time
                    await asyncio.sleep(delay_time)

            # Budget exhausted: raise instead of returning the exception class, so
            # callers never mistake the class object for a valid result.
            if last_error is not None:
                raise last_error
            raise ConnectionRefusedError("retry budget exhausted before the first attempt")
        return wrapped
    return wrapper
76 class LCMHelmConn(N2VCConnector
, LcmBase
):
77 _KUBECTL_OSM_NAMESPACE
= "osm"
78 _KUBECTL_OSM_CLUSTER_NAME
= "_system-osm-k8s"
79 _EE_SERVICE_PORT
= 50050
81 # Initial max retry time
82 _MAX_INITIAL_RETRY_TIME
= 600
83 # Max retry time for normal operations
85 # Time between retries, retry time after a connection error is raised
93 vca_config
: dict = None,
96 Initialize EE helm connector.
99 self
.db
= Database().instance
.db
100 self
.fs
= Filesystem().instance
.fs
102 # parent class constructor
103 N2VCConnector
.__init
__(
109 vca_config
=vca_config
,
110 on_update_db
=on_update_db
,
115 self
.log
.debug("Initialize helm N2VC connector")
116 self
.log
.debug("initial vca_config: {}".format(vca_config
))
118 # TODO - Obtain data from configuration
119 self
._ee
_service
_port
= self
._EE
_SERVICE
_PORT
121 self
._retry
_delay
= self
._EE
_RETRY
_DELAY
123 if self
.vca_config
and self
.vca_config
.get("eegrpcinittimeout"):
124 self
._initial
_retry
_time
= self
.vca_config
.get("eegrpcinittimeout")
125 self
.log
.debug("Initial retry time: {}".format(self
._initial
_retry
_time
))
127 self
._initial
_retry
_time
= self
._MAX
_INITIAL
_RETRY
_TIME
128 self
.log
.debug("Applied default retry time: {}".format(self
._initial
_retry
_time
))
130 if self
.vca_config
and self
.vca_config
.get("eegrpctimeout"):
131 self
._max
_retry
_time
= self
.vca_config
.get("eegrpctimeout")
132 self
.log
.debug("Retry time: {}".format(self
._max
_retry
_time
))
134 self
._max
_retry
_time
= self
._MAX
_RETRY
_TIME
135 self
.log
.debug("Applied default retry time: {}".format(self
._max
_retry
_time
))
137 # initialize helm connector for helmv2 and helmv3
138 self
._k
8sclusterhelm
2 = K8sHelmConnector(
139 kubectl_command
=self
.vca_config
.get("kubectlpath"),
140 helm_command
=self
.vca_config
.get("helmpath"),
147 self
._k
8sclusterhelm
3 = K8sHelm3Connector(
148 kubectl_command
=self
.vca_config
.get("kubectlpath"),
149 helm_command
=self
.vca_config
.get("helm3path"),
156 self
._system
_cluster
_id
= None
157 self
.log
.info("Helm N2VC connector initialized")
159 # TODO - ¿reuse_ee_id?
160 async def create_execution_environment(self
,
163 reuse_ee_id
: str = None,
164 progress_timeout
: float = None,
165 total_timeout
: float = None,
167 artifact_path
: str = None,
168 vca_type
: str = None,
169 *kargs
, **kwargs
) -> (str, dict):
171 Creates a new helm execution environment deploying the helm-chart indicated in the
173 :param str namespace: This param is not used, all helm charts are deployed in the osm
175 :param dict db_dict: where to write to database when the status changes.
176 It contains a dictionary with {collection: str, filter: {}, path: str},
177 e.g. {collection: "nsrs", filter: {_id: <nsd-id>, path:
178 "_admin.deployed.VCA.3"}
179 :param str reuse_ee_id: ee id from an older execution. TODO - right now this param is not used
180 :param float progress_timeout:
181 :param float total_timeout:
182 :param dict config: General variables to instantiate KDU
183 :param str artifact_path: path of package content
184 :param str vca_type: Type of vca, must be type helm or helm-v3
185 :returns str, dict: id of the new execution environment including namespace.helm_id
186 and credentials object set to None as all credentials should be osm kubernetes .kubeconfig
190 "create_execution_environment: namespace: {}, artifact_path: {}, db_dict: {}, "
191 "reuse_ee_id: {}".format(
192 namespace
, artifact_path
, db_dict
, reuse_ee_id
)
195 # Validate artifact-path is provided
196 if artifact_path
is None or len(artifact_path
) == 0:
197 raise N2VCBadArgumentsException(
198 message
="artifact_path is mandatory", bad_args
=["artifact_path"]
201 # Validate artifact-path exists and sync path
202 from_path
= os
.path
.split(artifact_path
)[0]
203 self
.fs
.sync(from_path
)
205 # remove / in charm path
206 while artifact_path
.find("//") >= 0:
207 artifact_path
= artifact_path
.replace("//", "/")
210 if self
.fs
.file_exists(artifact_path
):
211 helm_chart_path
= artifact_path
213 msg
= "artifact path does not exist: {}".format(artifact_path
)
214 raise N2VCBadArgumentsException(message
=msg
, bad_args
=["artifact_path"])
216 if artifact_path
.startswith("/"):
217 full_path
= self
.fs
.path
+ helm_chart_path
219 full_path
= self
.fs
.path
+ "/" + helm_chart_path
221 while full_path
.find("//") >= 0:
222 full_path
= full_path
.replace("//", "/")
225 # Call helm conn install
226 # Obtain system cluster id from database
227 system_cluster_uuid
= await self
._get
_system
_cluster
_id
()
228 # Add parameter osm if exist to global
229 if config
and config
.get("osm"):
230 if not config
.get("global"):
231 config
["global"] = {}
232 config
["global"]["osm"] = config
.get("osm")
234 self
.log
.debug("install helm chart: {}".format(full_path
))
235 if vca_type
== "helm":
236 helm_id
= self
._k
8sclusterhelm
2.generate_kdu_instance_name(
240 await self
._k
8sclusterhelm
2.install(system_cluster_uuid
, kdu_model
=full_path
,
241 kdu_instance
=helm_id
,
242 namespace
=self
._KUBECTL
_OSM
_NAMESPACE
,
245 timeout
=progress_timeout
)
247 helm_id
= self
._k
8sclusterhelm
2.generate_kdu_instance_name(
251 await self
._k
8sclusterhelm
3.install(system_cluster_uuid
, kdu_model
=full_path
,
252 kdu_instance
=helm_id
,
253 namespace
=self
._KUBECTL
_OSM
_NAMESPACE
,
256 timeout
=progress_timeout
)
258 ee_id
= "{}:{}.{}".format(vca_type
, self
._KUBECTL
_OSM
_NAMESPACE
, helm_id
)
260 except N2VCException
:
262 except Exception as e
:
263 self
.log
.error("Error deploying chart ee: {}".format(e
), exc_info
=True)
264 raise N2VCException("Error deploying chart ee: {}".format(e
))
266 async def register_execution_environment(self
, namespace
: str, credentials
: dict, db_dict
: dict,
267 progress_timeout
: float = None, total_timeout
: float = None,
268 *kargs
, **kwargs
) -> str:
272 async def install_configuration_sw(self
,
276 progress_timeout
: float = None,
277 total_timeout
: float = None,
285 async def add_relation(self
, ee_id_1
: str, ee_id_2
: str, endpoint_1
: str, endpoint_2
: str):
289 async def remove_relation(self
):
293 async def get_status(self
, namespace
: str, yaml_format
: bool = True):
294 # not used for this connector
297 async def get_ee_ssh_public__key(self
, ee_id
: str, db_dict
: dict, progress_timeout
: float = None,
298 total_timeout
: float = None) -> str:
300 Obtains ssh-public key from ee executing GetSShKey method from the ee.
302 :param str ee_id: the id of the execution environment returned by
303 create_execution_environment or register_execution_environment
305 :param float progress_timeout:
306 :param float total_timeout:
307 :returns: public key of the execution environment
311 "get_ee_ssh_public_key: ee_id: {}, db_dict: {}".format(
316 if ee_id
is None or len(ee_id
) == 0:
317 raise N2VCBadArgumentsException(
318 message
="ee_id is mandatory", bad_args
=["ee_id"]
322 # Obtain ip_addr for the ee service, it is resolved by dns from the ee name by kubernetes
323 version
, namespace
, helm_id
= self
._get
_ee
_id
_parts
(ee_id
)
324 ip_addr
= socket
.gethostbyname(helm_id
)
326 # Obtain ssh_key from the ee, this method will implement retries to allow the ee
327 # install libraries and start successfully
328 ssh_key
= await self
._get
_ssh
_key
(ip_addr
)
330 except Exception as e
:
331 self
.log
.error("Error obtaining ee ssh_key: {}".format(e
), exc_info
=True)
332 raise N2VCException("Error obtaining ee ssh_ke: {}".format(e
))
334 async def exec_primitive(self
, ee_id
: str, primitive_name
: str, params_dict
: dict, db_dict
: dict = None,
335 progress_timeout
: float = None, total_timeout
: float = None) -> str:
337 Execute a primitive in the execution environment
339 :param str ee_id: the one returned by create_execution_environment or
340 register_execution_environment with the format namespace.helm_id
341 :param str primitive_name: must be one defined in the software. There is one
342 called 'config', where, for the proxy case, the 'credentials' of VM are
344 :param dict params_dict: parameters of the action
345 :param dict db_dict: where to write into database when the status changes.
346 It contains a dict with
347 {collection: <str>, filter: {}, path: <str>},
348 e.g. {collection: "nslcmops", filter:
349 {_id: <nslcmop_id>, path: "_admin.VCA"}
350 It will be used to store information about intermediate notifications
351 :param float progress_timeout:
352 :param float total_timeout:
353 :returns str: primitive result, if ok. It raises exceptions in case of fail
356 self
.log
.info("exec primitive for ee_id : {}, primitive_name: {}, params_dict: {}, db_dict: {}".format(
357 ee_id
, primitive_name
, params_dict
, db_dict
361 if ee_id
is None or len(ee_id
) == 0:
362 raise N2VCBadArgumentsException(
363 message
="ee_id is mandatory", bad_args
=["ee_id"]
365 if primitive_name
is None or len(primitive_name
) == 0:
366 raise N2VCBadArgumentsException(
367 message
="action_name is mandatory", bad_args
=["action_name"]
369 if params_dict
is None:
373 version
, namespace
, helm_id
= self
._get
_ee
_id
_parts
(ee_id
)
374 ip_addr
= socket
.gethostbyname(helm_id
)
375 except Exception as e
:
376 self
.log
.error("Error getting ee ip ee: {}".format(e
))
377 raise N2VCException("Error getting ee ip ee: {}".format(e
))
379 if primitive_name
== "config":
381 # Execute config primitive, higher timeout to check the case ee is starting
382 status
, detailed_message
= await self
._execute
_config
_primitive
(ip_addr
, params_dict
, db_dict
=db_dict
)
383 self
.log
.debug("Executed config primitive ee_id_ {}, status: {}, message: {}".format(
384 ee_id
, status
, detailed_message
))
386 self
.log
.error("Error configuring helm ee, status: {}, message: {}".format(
387 status
, detailed_message
))
388 raise N2VCExecutionException(
389 message
="Error configuring helm ee_id: {}, status: {}, message: {}: ".format(
390 ee_id
, status
, detailed_message
392 primitive_name
=primitive_name
,
394 except Exception as e
:
395 self
.log
.error("Error configuring helm ee: {}".format(e
))
396 raise N2VCExecutionException(
397 message
="Error configuring helm ee_id: {}, {}".format(
400 primitive_name
=primitive_name
,
406 status
, detailed_message
= await self
._execute
_primitive
(ip_addr
, primitive_name
,
407 params_dict
, db_dict
=db_dict
)
408 self
.log
.debug("Executed primitive {} ee_id_ {}, status: {}, message: {}".format(
409 primitive_name
, ee_id
, status
, detailed_message
))
410 if status
!= "OK" and status
!= "PROCESSING":
412 "Execute primitive {} returned not ok status: {}, message: {}".format(
413 primitive_name
, status
, detailed_message
)
415 raise N2VCExecutionException(
416 message
="Execute primitive {} returned not ok status: {}, message: {}".format(
417 primitive_name
, status
, detailed_message
419 primitive_name
=primitive_name
,
421 except Exception as e
:
423 "Error executing primitive {}: {}".format(primitive_name
, e
)
425 raise N2VCExecutionException(
426 message
="Error executing primitive {} into ee={} : {}".format(
427 primitive_name
, ee_id
, e
429 primitive_name
=primitive_name
,
431 return detailed_message
433 async def deregister_execution_environments(self
):
437 async def delete_execution_environment(
440 db_dict
: dict = None,
441 total_timeout
: float = None,
445 Delete an execution environment
446 :param str ee_id: id of the execution environment to delete, included namespace.helm_id
447 :param dict db_dict: where to write into database when the status changes.
448 It contains a dict with
449 {collection: <str>, filter: {}, path: <str>},
450 e.g. {collection: "nsrs", filter:
451 {_id: <nsd-id>, path: "_admin.deployed.VCA.3"}
452 :param float total_timeout:
455 self
.log
.info("ee_id: {}".format(ee_id
))
459 raise N2VCBadArgumentsException(
460 message
="ee_id is mandatory", bad_args
=["ee_id"]
465 # Obtain cluster_uuid
466 system_cluster_uuid
= await self
._get
_system
_cluster
_id
()
469 version
, namespace
, helm_id
= self
._get
_ee
_id
_parts
(ee_id
)
471 # Uninstall chart, for backward compatibility we must assume that if there is no
472 # version it is helm-v2
473 if version
== "helm-v3":
474 await self
._k
8sclusterhelm
3.uninstall(system_cluster_uuid
, helm_id
)
476 await self
._k
8sclusterhelm
2.uninstall(system_cluster_uuid
, helm_id
)
477 self
.log
.info("ee_id: {} deleted".format(ee_id
))
478 except N2VCException
:
480 except Exception as e
:
481 self
.log
.error("Error deleting ee id: {}: {}".format(ee_id
, e
), exc_info
=True)
482 raise N2VCException("Error deleting ee id {}: {}".format(ee_id
, e
))
484 async def delete_namespace(self
, namespace
: str, db_dict
: dict = None, total_timeout
: float = None):
485 # method not implemented for this connector, execution environments must be deleted individually
488 async def install_k8s_proxy_charm(
494 progress_timeout
: float = None,
495 total_timeout
: float = None,
501 @retryer(max_wait_time_var
="_initial_retry_time", delay_time_var
="_retry_delay")
502 async def _get_ssh_key(self
, ip_addr
):
503 channel
= Channel(ip_addr
, self
._ee
_service
_port
)
505 stub
= FrontendExecutorStub(channel
)
506 self
.log
.debug("get ssh key, ip_addr: {}".format(ip_addr
))
507 reply
: SshKeyReply
= await stub
.GetSshKey(SshKeyRequest())
@retryer(max_wait_time_var="_initial_retry_time", delay_time_var="_retry_delay")
async def _execute_config_primitive(self, ip_addr, params, db_dict=None):
    """
    Run the "config" primitive against the execution environment.

    Connection-refused errors are retried using the ``_initial_retry_time`` budget
    and the ``_retry_delay`` pause configured on this instance.

    :param ip_addr: address passed through to ``_execute_primitive_internal``
    :param params: parameters of the primitive
    :param dict db_dict: optional database location forwarded unchanged
    :returns: whatever ``_execute_primitive_internal`` returns
    """
    outcome = await self._execute_primitive_internal(
        ip_addr, "config", params, db_dict=db_dict
    )
    return outcome
@retryer(max_wait_time_var="_max_retry_time", delay_time_var="_retry_delay")
async def _execute_primitive(self, ip_addr, primitive_name, params, db_dict=None):
    """
    Run a named primitive against the execution environment.

    Connection-refused errors are retried using the ``_max_retry_time`` budget
    and the ``_retry_delay`` pause configured on this instance.

    :param ip_addr: address passed through to ``_execute_primitive_internal``
    :param str primitive_name: name of the primitive to execute
    :param params: parameters of the primitive
    :param dict db_dict: optional database location forwarded unchanged
    :returns: whatever ``_execute_primitive_internal`` returns
    """
    outcome = await self._execute_primitive_internal(
        ip_addr, primitive_name, params, db_dict=db_dict
    )
    return outcome
520 async def _execute_primitive_internal(self
, ip_addr
, primitive_name
, params
, db_dict
=None):
522 channel
= Channel(ip_addr
, self
._ee
_service
_port
)
524 stub
= FrontendExecutorStub(channel
)
525 async with stub
.RunPrimitive
.open() as stream
:
526 primitive_id
= str(uuid
.uuid1())
528 self
.log
.debug("Execute primitive internal: id:{}, name:{}, params: {}".
529 format(primitive_id
, primitive_name
, params
))
530 await stream
.send_message(
531 PrimitiveRequest(id=primitive_id
, name
=primitive_name
, params
=yaml
.dump(params
)), end
=True)
532 async for reply
in stream
:
533 self
.log
.debug("Received reply: {}".format(reply
))
535 # If db_dict provided write notifs in database
537 self
._write
_op
_detailed
_status
(db_dict
, reply
.status
, reply
.detailed_message
)
539 return reply
.status
, reply
.detailed_message
541 return "ERROR", "No result received"
545 def _write_op_detailed_status(self
, db_dict
, status
, detailed_message
):
547 # write ee_id to database: _admin.deployed.VCA.x
549 the_table
= db_dict
["collection"]
550 the_filter
= db_dict
["filter"]
551 update_dict
= {"detailed-status": "{}: {}".format(status
, detailed_message
)}
552 # self.log.debug('Writing ee_id to database: {}'.format(the_path))
556 update_dict
=update_dict
,
559 except asyncio
.CancelledError
:
561 except Exception as e
:
562 self
.log
.error("Error writing detailedStatus to database: {}".format(e
))
564 async def _get_system_cluster_id(self
):
565 if not self
._system
_cluster
_id
:
566 db_k8cluster
= self
.db
.get_one("k8sclusters", {"name": self
._KUBECTL
_OSM
_CLUSTER
_NAME
})
567 k8s_hc_id
= deep_get(db_k8cluster
, ("_admin", "helm-chart-v3", "id"))
570 # backward compatibility for existing clusters that have not been initialized for helm v3
571 cluster_id
= db_k8cluster
.get("_id")
572 k8s_credentials
= yaml
.safe_dump(db_k8cluster
.get("credentials"))
573 k8s_hc_id
, uninstall_sw
= await self
._k
8sclusterhelm
3.init_env(k8s_credentials
,
574 reuse_cluster_uuid
=cluster_id
)
575 db_k8scluster_update
= {"_admin.helm-chart-v3.error_msg": None,
576 "_admin.helm-chart-v3.id": k8s_hc_id
,
577 "_admin.helm-chart-v3}.created": uninstall_sw
,
578 "_admin.helm-chart-v3.operationalState": "ENABLED"}
579 self
.update_db_2("k8sclusters", cluster_id
, db_k8scluster_update
)
580 except Exception as e
:
581 self
.log
.error("error initializing helm-v3 cluster: {}".format(str(e
)))
582 raise N2VCException("K8s system cluster '{}' has not been initialized for helm-chart-v3".format(
584 self
._system
_cluster
_id
= k8s_hc_id
585 return self
._system
_cluster
_id
587 def _get_ee_id_parts(self
, ee_id
):
589 Parses ee_id stored at database that can be either 'version:namespace.helm_id' or only
590 namespace.helm_id for backward compatibility
591 If exists helm version can be helm-v3 or helm (helm-v2 old version)
593 version
, _
, part_id
= ee_id
.rpartition(':')
594 namespace
, _
, helm_id
= part_id
.rpartition('.')
595 return version
, namespace
, helm_id