| peusterm | 79ef6ae | 2016-07-08 13:53:57 +0200 | [diff] [blame] | 1 | """
|
| 2 | Copyright (c) 2015 SONATA-NFV
|
| 3 | ALL RIGHTS RESERVED.
|
| 4 |
|
| 5 | Licensed under the Apache License, Version 2.0 (the "License");
|
| 6 | you may not use this file except in compliance with the License.
|
| 7 | You may obtain a copy of the License at
|
| 8 |
|
| 9 | http://www.apache.org/licenses/LICENSE-2.0
|
| 10 |
|
| 11 | Unless required by applicable law or agreed to in writing, software
|
| 12 | distributed under the License is distributed on an "AS IS" BASIS,
|
| 13 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
| 14 | See the License for the specific language governing permissions and
|
| 15 | limitations under the License.
|
| 16 |
|
| 17 | Neither the name of the SONATA-NFV [, ANY ADDITIONAL AFFILIATION]
|
| 18 | nor the names of its contributors may be used to endorse or promote
|
| 19 | products derived from this software without specific prior written
|
| 20 | permission.
|
| 21 |
|
| 22 | This work has been performed in the framework of the SONATA project,
|
| 23 | funded by the European Commission under Grant number 671517 through
|
| 24 | the Horizon 2020 and 5G-PPP programmes. The authors would like to
|
| 25 | acknowledge the contributions of their colleagues of the SONATA
|
| 26 | partner consortium (www.sonata-nfv.eu).
|
| 27 | """
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 28 |
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 29 | import logging
|
| stevenvanrossem | 51d4ae7 | 2016-08-10 13:22:53 +0200 | [diff] [blame] | 30 | import sys
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 31 | from mininet.node import OVSSwitch
|
| 32 | import ast
|
| stevenvanrossem | 9315da4 | 2016-04-11 12:10:06 +0200 | [diff] [blame] | 33 | import time
|
| stevenvanrossem | 300e1e5 | 2016-04-22 22:17:51 +0200 | [diff] [blame] | 34 | from prometheus_client import start_http_server, Summary, Histogram, Gauge, Counter, REGISTRY, CollectorRegistry, \
|
| 35 | pushadd_to_gateway, push_to_gateway, delete_from_gateway
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 36 | import threading
|
| stevenvanrossem | e131bf5 | 2016-07-14 11:42:09 +0200 | [diff] [blame] | 37 | from subprocess import Popen
|
| stevenvanrossem | b098cb5 | 2016-04-15 13:28:23 +0200 | [diff] [blame] | 38 | import os
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 39 |
|
| stevenvanrossem | 461941c | 2016-05-10 11:41:29 +0200 | [diff] [blame] | 40 |
|
# Configure the root logger at import time; messages at INFO level and above are emitted.
logging.basicConfig(level=logging.INFO)

"""
class to read openflow stats from the Ryu controller of the DCNetwork
"""

# Port used to build the pushgateway address ('localhost:<port>') and as the
# default host port of start_PushGateway().
PUSHGATEWAY_PORT = 9091
# Used in this file as the default host port of start_Prometheus().
# NOTE(review): the name suggests it is meant for cAdvisor - confirm.
CADVISOR_PORT = 8080
|
| 49 |
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 50 | class DCNetworkMonitor():
|
def __init__(self, net):
    """
    Prepare the Prometheus gauges, start both polling threads and launch the
    helper containers.

    :param net: network object kept as self.net; the other methods read its
        DCNetwork_graph and call its getNodeByName() / ryu_REST()
    """
    self.net = net

    # pushgateway address
    self.pushgateway = 'localhost:{0}'.format(PUSHGATEWAY_PORT)

    # supported Prometheus metrics: four gauges in one private registry,
    # all labelled by vnf name, vnf interface and flow id
    self.registry = CollectorRegistry()
    label_names = ('vnf_name', 'vnf_interface', 'flow_id')

    def new_gauge(name, description):
        # every gauge gets its own label list, exactly as if written out by hand
        return Gauge(name, description, list(label_names), registry=self.registry)

    self.prom_tx_packet_count = new_gauge('sonemu_tx_count_packets', 'Total number of packets sent')
    self.prom_rx_packet_count = new_gauge('sonemu_rx_count_packets', 'Total number of packets received')
    self.prom_tx_byte_count = new_gauge('sonemu_tx_count_bytes', 'Total number of bytes sent')
    self.prom_rx_byte_count = new_gauge('sonemu_rx_count_bytes', 'Total number of bytes received')

    # metric key -> gauge
    self.prom_metrics = {
        'tx_packets': self.prom_tx_packet_count,
        'rx_packets': self.prom_rx_packet_count,
        'tx_bytes': self.prom_tx_byte_count,
        'rx_bytes': self.prom_rx_byte_count,
    }

    # lists of installed metrics to monitor, each guarded by its own lock
    # each entry is a dict that can contain this data:
    #   switch_dpid, vnf_name, vnf_interface, previous_measurement,
    #   previous_monitor_time, metric_key, mon_port
    # (flow entries additionally carry 'cookie')
    self.monitor_lock = threading.Lock()
    self.monitor_flow_lock = threading.Lock()
    self.network_metrics = []
    self.flow_metrics = []

    # start monitoring threads; both loops run while this flag is True
    self.start_monitoring = True

    port_poller = threading.Thread(target=self.get_network_metrics)
    self.monitor_thread = port_poller
    port_poller.start()

    flow_poller = threading.Thread(target=self.get_flow_metrics)
    self.monitor_flow_thread = flow_poller
    flow_poller.start()

    # helper tools
    # cAdvisor, Prometheus pushgateway are started as external container, to gather monitoring metric in son-emu
    self.start_PushGateway()
    self.start_cAdvisor()
|
| stevenvanrossem | 8970680 | 2016-07-19 02:54:45 +0200 | [diff] [blame] | 101 |
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 102 |
|
| stevenvanrossem | ed711fd | 2016-04-11 16:59:29 +0200 | [diff] [blame] | 103 | # first set some parameters, before measurement can start
|
def setup_flow(self, vnf_name, vnf_interface=None, metric='tx_packets', cookie=0):
    """
    Register a flow metric so that the flow polling loop starts exporting it.

    :param vnf_name: name of the VNF node in self.net.DCNetwork_graph
    :param vnf_interface: interface of the VNF (the link's 'src_port_id'); when
        None, the interface of the first link to the first neighbour is used
    :param metric: metric key, e.g. 'tx_packets'; None falls back to 'tx_packets'
    :param cookie: cookie value stored with the entry and used to select flows
    :return: a status or error message string, or None when the node the VNF
        is attached to is not an OVSSwitch
    """
    graph = self.net.DCNetwork_graph

    # check if port is specified (vnf:port)
    if vnf_interface is None:
        # take first interface by default; list() keeps this working when
        # neighbors() hands back an iterator instead of a list
        connected_sw = list(graph.neighbors(vnf_name))[0]
        vnf_interface = graph[vnf_name][connected_sw][0]['src_port_id']

    flow_metric = {'vnf_name': vnf_name, 'vnf_interface': vnf_interface}

    # find the switch (and its port number) on the other end of this interface
    vnf_switch = None
    for connected_sw in graph.neighbors(vnf_name):
        link_dict = graph[vnf_name][connected_sw]
        for link in link_dict:
            if link_dict[link]['src_port_id'] == vnf_interface:
                # found the right link and connected switch
                vnf_switch = connected_sw
                flow_metric['mon_port'] = link_dict[link]['dst_port_nr']
                break

    if not vnf_switch:
        # no exception is active here, so log a plain error (logging.exception
        # would append a meaningless traceback placeholder)
        message = "vnf switch of {0}:{1} not found!".format(vnf_name, vnf_interface)
        logging.error(message)
        return message

    try:
        # default port direction to monitor
        if metric is None:
            metric = 'tx_packets'

        next_node = self.net.getNodeByName(vnf_switch)

        if not isinstance(next_node, OVSSwitch):
            logging.info("vnf: {0} is not connected to switch".format(vnf_name))
            return

        flow_metric['previous_measurement'] = 0
        flow_metric['previous_monitor_time'] = 0

        # the dpid attribute is a hex string; store it as an integer
        flow_metric['switch_dpid'] = int(str(next_node.dpid), 16)
        flow_metric['metric_key'] = metric
        flow_metric['cookie'] = cookie

        # the context manager guarantees the lock is released again
        with self.monitor_flow_lock:
            self.flow_metrics.append(flow_metric)

        message = 'Started monitoring flow:{3} {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric, cookie)
        logging.info(message)
        return message

    except Exception as ex:
        logging.exception("setup_flow error.")
        # str(ex) works on Python 2 and 3; ex.message does not exist on Python 3
        return str(ex)
|
| 160 |
|
def stop_flow(self, vnf_name, vnf_interface=None, metric=None, cookie=0):
    """
    Stop monitoring one flow metric and drop its series from the gauges.

    :param vnf_name: name of the VNF the metric was installed for
    :param vnf_interface: VNF interface; when None and a metric is given, the
        interface of the first link to the first neighbour is used
    :param metric: metric key the entry was registered with
    :param cookie: cookie the entry was registered with
    :return: a 'Stopped monitoring flow ...' message, or an 'Error stopping ...'
        message when no matching entry is installed
    :raises: whatever delete_from_gateway() raises; the lock is released first
    """
    # check if port is specified (vnf:port)
    if vnf_interface is None and metric is not None:
        # take first interface by default
        graph = self.net.DCNetwork_graph
        connected_sw = list(graph.neighbors(vnf_name))[0]
        vnf_interface = graph[vnf_name][connected_sw][0]['src_port_id']

    # Label values are looked up as strings (stop_metric matches the flow id
    # that was set as None under 'None'), so the cookie must be stringified
    # or the series is never found.
    label_key = (vnf_name, vnf_interface, str(cookie))

    # 'with' releases the lock even when the pushgateway call below fails;
    # a lock left held would block the flow polling loop forever
    with self.monitor_flow_lock:
        for flow_dict in self.flow_metrics:
            if flow_dict['vnf_name'] != vnf_name or flow_dict['vnf_interface'] != vnf_interface:
                continue
            if flow_dict['metric_key'] != metric or flow_dict['cookie'] != cookie:
                continue

            self.flow_metrics.remove(flow_dict)

            for collector in self.registry._collectors:
                if label_key in collector._metrics:
                    collector.remove(*label_key)

            # the whole job is deleted; remaining metrics are pushed again by
            # the polling loops
            delete_from_gateway(self.pushgateway, job='sonemu-SDNcontroller')

            message = 'Stopped monitoring flow {3}: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric, cookie)
            logging.info(message)
            return message

    return 'Error stopping monitoring flow: {0} on {1}:{2}'.format(metric, vnf_name, vnf_interface)
|
| 190 |
|
| stevenvanrossem | 461941c | 2016-05-10 11:41:29 +0200 | [diff] [blame] | 191 |
|
| 192 | # first set some parameters, before measurement can start
|
def setup_metric(self, vnf_name, vnf_interface=None, metric='tx_packets'):
    """
    Register a port metric so that the port polling loop starts exporting it.

    :param vnf_name: name of the VNF node in self.net.DCNetwork_graph
    :param vnf_interface: interface of the VNF (the link's 'src_port_id'); when
        None, the interface of the first link to the first neighbour is used
    :param metric: metric key, e.g. 'tx_packets'; None falls back to 'tx_packets'
    :return: a status or error message string, or None when the VNF has no
        neighbour, more than one neighbour, or is not attached to an OVSSwitch
    """
    graph = self.net.DCNetwork_graph

    # check if port is specified (vnf:port)
    if vnf_interface is None:
        # take first interface by default; list() keeps this working when
        # neighbors() hands back an iterator instead of a list
        connected_sw = list(graph.neighbors(vnf_name))[0]
        vnf_interface = graph[vnf_name][connected_sw][0]['src_port_id']

    network_metric = {'vnf_name': vnf_name, 'vnf_interface': vnf_interface}

    # find the switch port on the other end of this interface
    for connected_sw in graph.neighbors(vnf_name):
        link_dict = graph[vnf_name][connected_sw]
        for link in link_dict:
            if link_dict[link]['src_port_id'] == vnf_interface:
                # found the right link and connected switch
                network_metric['mon_port'] = link_dict[link]['dst_port_nr']
                break

    if 'mon_port' not in network_metric:
        # no exception is active here, so log a plain error
        message = "vnf interface {0}:{1} not found!".format(vnf_name, vnf_interface)
        logging.error(message)
        return message

    try:
        # default port direction to monitor
        if metric is None:
            metric = 'tx_packets'

        # materialise the neighbours so len() and indexing are always valid
        vnf_switch = list(graph.neighbors(str(vnf_name)))

        if len(vnf_switch) > 1:
            logging.info("vnf: {0} has multiple ports".format(vnf_name))
            return
        if not vnf_switch:
            logging.info("vnf: {0} is not connected".format(vnf_name))
            return

        next_node = self.net.getNodeByName(vnf_switch[0])

        if not isinstance(next_node, OVSSwitch):
            logging.info("vnf: {0} is not connected to switch".format(vnf_name))
            return

        network_metric['previous_measurement'] = 0
        network_metric['previous_monitor_time'] = 0

        # the dpid attribute is a hex string; store it as an integer
        network_metric['switch_dpid'] = int(str(next_node.dpid), 16)
        network_metric['metric_key'] = metric

        # the context manager guarantees the lock is released again
        with self.monitor_lock:
            self.network_metrics.append(network_metric)

        message = 'Started monitoring: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric)
        logging.info(message)
        return message

    except Exception as ex:
        logging.exception("setup_metric error.")
        # str(ex) works on Python 2 and 3; ex.message does not exist on Python 3
        return str(ex)
|
| stevenvanrossem | 9315da4 | 2016-04-11 12:10:06 +0200 | [diff] [blame] | 259 |
|
def stop_metric(self, vnf_name, vnf_interface=None, metric=None):
    """
    Stop monitoring one port metric, or every port metric of a VNF.

    With both vnf_interface and metric left at None, all installed port
    metrics of vnf_name are removed. Otherwise exactly the entry matching
    (vnf_name, vnf_interface, metric) is removed.

    :param vnf_name: name of the VNF the metric was installed for
    :param vnf_interface: VNF interface; when None and a metric is given, the
        interface of the first link to the first neighbour is used
    :param metric: metric key the entry was registered with
    :return: a 'Stopped monitoring ...' message, or an 'Error stopping ...'
        message when nothing matched
    :raises: whatever delete_from_gateway() raises; the lock is released first
    """
    # check if port is specified (vnf:port)
    if vnf_interface is None and metric is not None:
        # take first interface by default
        graph = self.net.DCNetwork_graph
        connected_sw = list(graph.neighbors(vnf_name))[0]
        vnf_interface = graph[vnf_name][connected_sw][0]['src_port_id']

    stop_whole_vnf = vnf_interface is None and metric is None

    # 'with' releases the lock even when the pushgateway call fails; a lock
    # left held would block the port polling loop forever
    with self.monitor_lock:
        if stop_whole_vnf:
            # delete everything from this vnf: drop ALL of its entries, not
            # just the first one, otherwise the rest keeps being exported
            kept = [entry for entry in self.network_metrics if entry['vnf_name'] != vnf_name]
            if len(kept) != len(self.network_metrics):
                self.network_metrics[:] = kept

                for collector in self.registry._collectors:
                    # iterate over a snapshot, remove() mutates the mapping
                    for name, interface, flow_id in list(collector._metrics):
                        # port metrics carry the flow id 'None'; series with
                        # another flow id are left alone instead of
                        # triggering a failing remove() for a label set that
                        # does not exist
                        if name == vnf_name and flow_id == 'None':
                            logging.info('3 name:{0} labels:{1} metrics:{2}'.format(
                                collector._name, collector._labelnames, collector._metrics))
                            collector.remove(name, interface, flow_id)

                delete_from_gateway(self.pushgateway, job='sonemu-SDNcontroller')
                logging.info('Stopped monitoring vnf: {0}'.format(vnf_name))
                return 'Stopped monitoring: {0}'.format(vnf_name)
        else:
            label_key = (vnf_name, vnf_interface, 'None')
            for metric_dict in self.network_metrics:
                if metric_dict['vnf_name'] != vnf_name or metric_dict['vnf_interface'] != vnf_interface:
                    continue
                if metric_dict['metric_key'] != metric:
                    continue

                self.network_metrics.remove(metric_dict)

                for collector in self.registry._collectors:
                    logging.info('{0}'.format(collector._metrics.values()))
                    if label_key in collector._metrics:
                        logging.info('2 name:{0} labels:{1} metrics:{2}'.format(
                            collector._name, collector._labelnames, collector._metrics))
                        collector.remove(*label_key)

                # 1 single monitor job for all metrics of the SDN controller:
                # only the grouping key (the job) can be deleted from the
                # pushgateway, so the complete job is removed here
                delete_from_gateway(self.pushgateway, job='sonemu-SDNcontroller')

                message = 'Stopped monitoring: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric)
                logging.info(message)
                return message

    return 'Error stopping monitoring metric: {0} on {1}:{2}'.format(metric, vnf_name, vnf_interface)
|
| stevenvanrossem | b098cb5 | 2016-04-15 13:28:23 +0200 | [diff] [blame] | 331 |
|
| stevenvanrossem | 9c8a412 | 2016-07-16 03:23:13 +0200 | [diff] [blame] | 332 |
|
| 333 |
|
| 334 |
|
| 335 |
|
| 336 | # get all metrics defined in the list and export it to Prometheus
|
def get_flow_metrics(self, interval=1):
    """
    Polling loop: query Ryu for the flow stats of every installed flow metric
    and hand each reply to set_flow_metric(). Runs until self.start_monitoring
    becomes false.

    A failure for one flow (REST call, parsing, export) is logged and the
    loop carries on, so a single error does not end the loop or leave
    monitor_flow_lock held.

    :param interval: seconds to sleep between two polling rounds (default 1)
    """
    try:
        string_types = basestring  # Python 2: covers str and unicode
    except NameError:
        string_types = str  # Python 3

    while self.start_monitoring:

        # 'with' guarantees the lock is released after every round
        with self.monitor_flow_lock:
            for flow_dict in self.flow_metrics:
                try:
                    data = {'cookie': flow_dict['cookie'],
                            'cookie_mask': flow_dict['cookie']}

                    # tx metrics select on the ingress port, rx metrics on the
                    # output port of the monitored switch port
                    if 'tx' in flow_dict['metric_key']:
                        data['match'] = {'in_port': flow_dict['mon_port']}
                    elif 'rx' in flow_dict['metric_key']:
                        data['out_port'] = flow_dict['mon_port']

                    # query Ryu
                    ret = self.net.ryu_REST('stats/flow', dpid=flow_dict['switch_dpid'], data=data)
                    if isinstance(ret, dict):
                        flow_stat_dict = ret
                    elif isinstance(ret, string_types):
                        # literal_eval only evaluates Python literals
                        flow_stat_dict = ast.literal_eval(ret.rstrip())
                    else:
                        flow_stat_dict = None

                    logging.debug('received flow stat:{0} '.format(flow_stat_dict))

                    if flow_stat_dict is None:
                        # nothing usable came back, skip this flow for this round
                        logging.warning('no flow stats received for switch {0}'.format(flow_dict['switch_dpid']))
                        continue

                    self.set_flow_metric(flow_dict, flow_stat_dict)
                except Exception:
                    # boundary of the polling loop: log and keep running
                    logging.exception('get_flow_metrics error.')

        time.sleep(interval)
|
| 369 |
|
def get_network_metrics(self, interval=1):
    """
    Polling loop: query Ryu once per switch for its port stats and hand the
    reply to set_network_metric() for every installed metric on that switch.
    Runs until self.start_monitoring becomes false.

    A failure for one switch (REST call, parsing, export) is logged and the
    loop carries on.

    :param interval: seconds to sleep between two polling rounds (default 1)
    """
    while self.start_monitoring:

        # 'with' guarantees the lock is released when the round ends
        with self.monitor_lock:
            # group metrics by dpid to optimize the rest api calls
            dpid_set = set(entry['switch_dpid'] for entry in self.network_metrics)

            for dpid in dpid_set:
                try:
                    # query Ryu; accept an already decoded dict as well as the
                    # textual form, like the flow polling loop does
                    ret = self.net.ryu_REST('stats/port', dpid=dpid)
                    if isinstance(ret, dict):
                        port_stat_dict = ret
                    else:
                        port_stat_dict = ast.literal_eval(ret)

                    for metric_dict in self.network_metrics:
                        if int(metric_dict['switch_dpid']) == int(dpid):
                            self.set_network_metric(metric_dict, port_stat_dict)
                except Exception:
                    # boundary of the polling loop: log and keep running
                    logging.exception('get_network_metrics error.')

        time.sleep(interval)
|
| 393 |
|
| stevenvanrossem | b098cb5 | 2016-04-15 13:28:23 +0200 | [diff] [blame] | 394 | # add metric to the list to export to Prometheus, parse the Ryu port-stats reply
|
def set_network_metric(self, metric_dict, port_stat_dict):
    """
    Export one port counter to Prometheus and compute its rate.

    The port-stats reply is searched for the monitored port; the counter is
    written to the gauge of the metric and the registry is pushed to the
    pushgateway. The rate is calculated as well, although it can also be
    queried from Prometheus.

    :param metric_dict: installed metric entry; 'previous_measurement' and
        'previous_monitor_time' are updated in place
    :param port_stat_dict: port-stats reply, keyed by the switch dpid as string
    :return: the rate (counter delta per second of port uptime) as float,
        None for the first sample of a metric (no rate can be computed yet),
        or an error message string when the port is not in the reply
    """
    # vnf tx is the datacenter switch rx and vice-versa
    metric_key = self.switch_tx_rx(metric_dict['metric_key'])
    switch_dpid = metric_dict['switch_dpid']
    vnf_name = metric_dict['vnf_name']
    vnf_interface = metric_dict['vnf_interface']
    mon_port = metric_dict['mon_port']

    for port_stat in port_stat_dict[str(switch_dpid)]:
        if int(port_stat['port_no']) != int(mon_port):
            continue

        port_uptime = port_stat['duration_sec'] + port_stat['duration_nsec'] * 10 ** (-9)
        this_measurement = int(port_stat[metric_key])

        # set prometheus metric
        self.prom_metrics[metric_dict['metric_key']].\
            labels({'vnf_name': vnf_name, 'vnf_interface': vnf_interface, 'flow_id': None}).\
            set(this_measurement)

        # 1 single monitor job for all metrics of the SDN controller; an
        # unreachable gateway is only worth a warning, as for flow metrics
        try:
            pushadd_to_gateway(self.pushgateway, job='sonemu-SDNcontroller', registry=self.registry)
        except Exception as e:
            logging.warning("Pushgateway not reachable: {0}".format(e))

        previous_monitor_time = metric_dict['previous_monitor_time']
        previous_measurement = metric_dict['previous_measurement']

        # remember this sample for the next round
        metric_dict['previous_measurement'] = this_measurement
        metric_dict['previous_monitor_time'] = port_uptime

        if previous_monitor_time <= 0 or previous_monitor_time >= port_uptime:
            # first measurement (or the port uptime went backwards): there is
            # no earlier sample to compare with. Simply return; sleeping,
            # releasing the caller's lock and re-entering the polling loop
            # from here would nest endless loops inside each other.
            return None

        time_delta = port_uptime - previous_monitor_time
        return (this_measurement - previous_measurement) / float(time_delta)

    # no exception is active here, so log a plain error
    message = 'metric {0} not found on {1}:{2}'.format(metric_key, vnf_name, vnf_interface)
    logging.error(message)
    return message
|
| 440 |
|
def set_flow_metric(self, metric_dict, flow_stat_dict):
    """
    Export one flow counter to Prometheus.

    The byte or packet counts of all flow entries in the reply are summed,
    written to the gauge of the metric (labelled with the cookie as flow id)
    and the registry is pushed to the pushgateway. A reply without any flow
    entry exports 0; a missing reply is logged and skipped.

    :param metric_dict: installed flow metric entry
    :param flow_stat_dict: flow-stats reply, keyed by the switch dpid as
        string, or None when no reply is available
    :return: None
    """
    metric_key = metric_dict['metric_key']
    switch_dpid = metric_dict['switch_dpid']
    vnf_name = metric_dict['vnf_name']
    vnf_interface = metric_dict['vnf_interface']
    cookie = metric_dict['cookie']

    if not flow_stat_dict or str(switch_dpid) not in flow_stat_dict:
        logging.warning('no flow stats for switch {0} (flow {1})'.format(switch_dpid, cookie))
        return

    # sum the counter over every flow entry that was returned
    counter = 0
    for flow_stat in flow_stat_dict[str(switch_dpid)]:
        if 'bytes' in metric_key:
            counter += flow_stat['byte_count']
        elif 'packet' in metric_key:
            counter += flow_stat['packet_count']

    self.prom_metrics[metric_dict['metric_key']]. \
        labels({'vnf_name': vnf_name, 'vnf_interface': vnf_interface, 'flow_id': cookie}). \
        set(counter)
    try:
        pushadd_to_gateway(self.pushgateway, job='sonemu-SDNcontroller', registry=self.registry)
    except Exception as e:
        # 'as' form is valid on Python 2.6+ and 3, like the other handlers here
        logging.warning("Pushgateway not reachable: {0} {1}".format(Exception, e))
|
| stevenvanrossem | 461941c | 2016-05-10 11:41:29 +0200 | [diff] [blame] | 468 |
|
| stevenvanrossem | c6abf13 | 2016-04-14 11:15:58 +0200 | [diff] [blame] | 469 |
|
def start_Prometheus(self, port=CADVISOR_PORT):
    """Launch the Prometheus docker container.

    :param port: host port published to the container's port 9090.
        NOTE(review): the default is CADVISOR_PORT although this starts
        Prometheus -- confirm that this is intended.
    :return: the ``Popen`` object of the spawned ``docker run`` command.
    """
    # prometheus.yml configuration file is located in the same directory as this file
    here = os.path.dirname(os.path.abspath(__file__))
    port_mapping = "{0}:9090".format(port)
    config_mount = "{0}/prometheus.yml:/etc/prometheus/prometheus.yml".format(here)
    rules_mount = "{0}/profile.rules:/etc/prometheus/profile.rules".format(here)

    cmd = ["docker", "run", "--rm"]
    cmd += ["-p", port_mapping]
    cmd += ["-v", config_mount]
    cmd += ["-v", rules_mount]
    cmd += ["--name", "prometheus"]
    cmd.append("prom/prometheus")

    logging.info('Start Prometheus container {0}'.format(cmd))
    return Popen(cmd)
|
| stevenvanrossem | c6abf13 | 2016-04-14 11:15:58 +0200 | [diff] [blame] | 483 |
|
def start_PushGateway(self, port=PUSHGATEWAY_PORT):
    """Launch the Prometheus Pushgateway docker container.

    :param port: host port published to the container's port 9091.
    :return: the ``Popen`` object of the spawned ``docker run -d`` command.
    """
    port_mapping = "{0}:9091".format(port)

    cmd = ["docker", "run", "-d"]
    cmd += ["-p", port_mapping]
    cmd += ["--name", "pushgateway"]
    cmd.append("prom/pushgateway")

    logging.info('Start Prometheus Push Gateway container {0}'.format(cmd))
    return Popen(cmd)
|
| 495 |
|
def start_cAdvisor(self, port=8080):
    """Launch the cAdvisor docker container.

    :param port: host port published to the container's port 8080.
    :return: the ``Popen`` object of the spawned ``docker run`` command.
    """
    # Host paths mounted into the container, in the order they are passed.
    volumes = (
        "/:/rootfs:ro",
        "/var/run:/var/run:rw",
        "/sys:/sys:ro",
        "/var/lib/docker/:/var/lib/docker:ro",
    )

    cmd = ["docker", "run", "--rm"]
    cmd.extend("--volume={0}".format(volume) for volume in volumes)
    cmd.append("--publish={0}:8080".format(port))
    cmd.append("--name=cadvisor")
    cmd.append("google/cadvisor:latest")

    logging.info('Start cAdvisor container {0}'.format(cmd))
    return Popen(cmd)
|
| stevenvanrossem | c6abf13 | 2016-04-14 11:15:58 +0200 | [diff] [blame] | 510 |
|
def stop(self):
    """Stop monitoring: clear the run flag and join both monitor threads."""
    # stop the monitoring thread
    self.start_monitoring = False
    for thread_attr in ('monitor_thread', 'monitor_flow_thread'):
        getattr(self, thread_attr).join()

    # these containers are used for monitoring but are started now outside of son-emu,
    # so their teardown is disabled and only kept here for reference:
    #
    # if self.prometheus_process is not None:
    #     logging.info('stopping prometheus container')
    #     self.prometheus_process.terminate()
    #     self.prometheus_process.kill()
    #     self._stop_container('prometheus')
    #
    # if self.pushgateway_process is not None:
    #     logging.info('stopping pushgateway container')
    #     self.pushgateway_process.terminate()
    #     self.pushgateway_process.kill()
    #     self._stop_container('pushgateway')
    #
    # if self.cadvisor_process is not None:
    #     logging.info('stopping cadvisor container')
    #     self.cadvisor_process.terminate()
    #     self.cadvisor_process.kill()
    #     self._stop_container('cadvisor')
|
| stevenvanrossem | b098cb5 | 2016-04-15 13:28:23 +0200 | [diff] [blame] | 537 |
|
def switch_tx_rx(self, metric=''):
    """Swap the direction in a metric name between switch and vnf view.

    When monitoring vnfs, the tx of the datacenter switch is actually the rx
    of the vnf, so the metric name is changed to be consistent with the vnf
    rx or tx.

    :param metric: metric name, e.g. 'tx_bytes'.
    :return: the name with every 'tx' replaced by 'rx' if it contains 'tx';
        otherwise with every 'rx' replaced by 'tx'; unchanged if it contains
        neither.
    """
    # 'tx' takes precedence: only the first direction found is replaced.
    for direction, opposite in (('tx', 'rx'), ('rx', 'tx')):
        if direction in metric:
            return metric.replace(direction, opposite)
    return metric
|
| 547 |
|
def _stop_container(self, name):
    """Stop and then remove the docker container called ``name``.

    Runs ``docker stop`` followed by ``docker rm`` and waits for each
    command to finish before continuing; exit codes are not checked.

    :param name: name of the container, as given to ``docker run --name``.
    """
    for action in ("stop", "rm"):
        docker_cmd = ["docker", action, name]
        Popen(docker_cmd).wait()
|
| 558 |
|