| peusterm | 79ef6ae | 2016-07-08 13:53:57 +0200 | [diff] [blame] | 1 | """
|
| 2 | Copyright (c) 2015 SONATA-NFV
|
| 3 | ALL RIGHTS RESERVED.
|
| 4 |
|
| 5 | Licensed under the Apache License, Version 2.0 (the "License");
|
| 6 | you may not use this file except in compliance with the License.
|
| 7 | You may obtain a copy of the License at
|
| 8 |
|
| 9 | http://www.apache.org/licenses/LICENSE-2.0
|
| 10 |
|
| 11 | Unless required by applicable law or agreed to in writing, software
|
| 12 | distributed under the License is distributed on an "AS IS" BASIS,
|
| 13 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
| 14 | See the License for the specific language governing permissions and
|
| 15 | limitations under the License.
|
| 16 |
|
| 17 | Neither the name of the SONATA-NFV [, ANY ADDITIONAL AFFILIATION]
|
| 18 | nor the names of its contributors may be used to endorse or promote
|
| 19 | products derived from this software without specific prior written
|
| 20 | permission.
|
| 21 |
|
| 22 | This work has been performed in the framework of the SONATA project,
|
| 23 | funded by the European Commission under Grant number 671517 through
|
| 24 | the Horizon 2020 and 5G-PPP programmes. The authors would like to
|
| 25 | acknowledge the contributions of their colleagues of the SONATA
|
| 26 | partner consortium (www.sonata-nfv.eu).
|
| 27 | """
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 28 |
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 29 | import logging
|
| 30 | from mininet.node import OVSSwitch
|
| 31 | import ast
|
| stevenvanrossem | 9315da4 | 2016-04-11 12:10:06 +0200 | [diff] [blame] | 32 | import time
|
| stevenvanrossem | 300e1e5 | 2016-04-22 22:17:51 +0200 | [diff] [blame] | 33 | from prometheus_client import start_http_server, Summary, Histogram, Gauge, Counter, REGISTRY, CollectorRegistry, \
|
| 34 | pushadd_to_gateway, push_to_gateway, delete_from_gateway
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 35 | import threading
|
| stevenvanrossem | e131bf5 | 2016-07-14 11:42:09 +0200 | [diff] [blame^] | 36 | from subprocess import Popen
|
| stevenvanrossem | b098cb5 | 2016-04-15 13:28:23 +0200 | [diff] [blame] | 37 | import os
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 38 |
|
| stevenvanrossem | 461941c | 2016-05-10 11:41:29 +0200 | [diff] [blame] | 39 |
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 40 | logging.basicConfig(level=logging.INFO)
|
| 41 |
|
| 42 | """
|
| stevenvanrossem | a24b437 | 2016-04-14 09:55:20 +0200 | [diff] [blame] | 43 | class to read openflow stats from the Ryu controller of the DCNetwork
|
| stevenvanrossem | c5a536a | 2016-02-16 14:52:39 +0100 | [diff] [blame] | 44 | """
|
| 45 |
|
class DCNetworkMonitor():
    """Read OpenFlow stats from the Ryu controller of the DCNetwork.

    Two background threads poll Ryu, sleeping one second between rounds: one
    reads port counters for the entries in ``network_metrics``, the other
    reads flow counters for the entries in ``flow_metrics``.  Every sample is
    written to a Prometheus gauge and pushed to the pushgateway under the
    single job ``sonemu-SDNcontroller``.
    """

    def __init__(self, net):
        """Create the gauges, launch cAdvisor and start both polling threads.

        :param net: the emulated network; this class uses its
            ``DCNetwork_graph``, ``getNodeByName()`` and ``ryu_REST()``.
        """
        self.net = net

        # TODO: these global variables should be part of a config file?
        # prometheus is started outside of son-emu, so no REST api address
        # (previously 'http://127.0.0.1:9090') is configured here

        # pushgateway is started outside of son-emu and son-emu is started with net=host
        # so localhost:9091 works
        self.pushgateway = 'localhost:9091'
        # when sdk is started with docker-compose, we could use
        # self.pushgateway = 'pushgateway:9091'

        # supported Prometheus metrics
        self.registry = CollectorRegistry()
        label_names = ['vnf_name', 'vnf_interface', 'flow_id']
        self.prom_tx_packet_count = Gauge('sonemu_tx_count_packets', 'Total number of packets sent',
                                          label_names, registry=self.registry)
        self.prom_rx_packet_count = Gauge('sonemu_rx_count_packets', 'Total number of packets received',
                                          label_names, registry=self.registry)
        self.prom_tx_byte_count = Gauge('sonemu_tx_count_bytes', 'Total number of bytes sent',
                                        label_names, registry=self.registry)
        self.prom_rx_byte_count = Gauge('sonemu_rx_count_bytes', 'Total number of bytes received',
                                        label_names, registry=self.registry)

        # metric name (as used by the setup_*/stop_* methods) -> gauge
        self.prom_metrics = {'tx_packets': self.prom_tx_packet_count,
                             'rx_packets': self.prom_rx_packet_count,
                             'tx_bytes': self.prom_tx_byte_count,
                             'rx_bytes': self.prom_rx_byte_count}

        # lists of installed metrics to monitor; each entry is a dict with the keys
        #   switch_dpid, vnf_name, vnf_interface, previous_measurement,
        #   previous_monitor_time, metric_key, mon_port
        # (flow entries additionally carry 'cookie')
        self.monitor_lock = threading.Lock()
        self.monitor_flow_lock = threading.Lock()
        self.network_metrics = []
        self.flow_metrics = []

        # helper tools
        # Prometheus pushgateway and DB are started as external container, outside of son-emu.
        # cAdvisor is launched before the threads so that a failing Popen does
        # not leave non-daemon polling threads behind.
        self.cadvisor_process = self.start_cadvisor()

        # start monitoring threads
        self.start_monitoring = True
        self.monitor_thread = threading.Thread(target=self.get_network_metrics)
        self.monitor_thread.start()

        self.monitor_flow_thread = threading.Thread(target=self.get_flow_metrics)
        self.monitor_flow_thread.start()

    def _find_switch_link(self, vnf_name, vnf_interface):
        """Locate the link that connects one interface of a VNF to its switch.

        :param vnf_name: node name of the VNF in ``net.DCNetwork_graph``.
        :param vnf_interface: ``src_port_id`` of the link to look for, or None
            to take the first link towards the first neighbor.
        :return: ``(vnf_interface, switch_name, mon_port)`` where ``mon_port``
            is the link's ``dst_port_nr``; ``switch_name`` and ``mon_port``
            are None when no link carries that interface.
        :raises IndexError: if ``vnf_interface`` is None and the VNF has no
            neighbors.
        """
        graph = self.net.DCNetwork_graph
        # list() keeps indexing valid when neighbors() hands back an iterator
        neighbors = list(graph.neighbors(vnf_name))

        if vnf_interface is None:
            # take first interface by default
            vnf_interface = graph[vnf_name][neighbors[0]][0]['src_port_id']

        for connected_sw in neighbors:
            link_dict = graph[vnf_name][connected_sw]
            for link in link_dict:
                if link_dict[link]['src_port_id'] == vnf_interface:
                    # found the right link and connected switch
                    return vnf_interface, connected_sw, link_dict[link]['dst_port_nr']

        return vnf_interface, None, None

    # first set some parameters, before measurement can start
    def setup_flow(self, vnf_name, vnf_interface=None, metric='tx_packets', cookie=0):
        """Start monitoring one flow counter on a VNF interface.

        :param vnf_name: name of the VNF.
        :param vnf_interface: interface of the VNF (first one when None).
        :param metric: one of the keys of ``self.prom_metrics``; None means
            ``'tx_packets'``.
        :param cookie: cookie of the flow entries to query.
        :return: a status or error message; None when the VNF is not attached
            to an OVSSwitch.
        """
        vnf_interface, vnf_switch, mon_port = self._find_switch_link(vnf_name, vnf_interface)
        if vnf_switch is None:
            message = "vnf switch of {0}:{1} not found!".format(vnf_name, vnf_interface)
            logging.error(message)
            return message

        try:
            # default port direction to monitor
            if metric is None:
                metric = 'tx_packets'

            # an unknown metric would only fail later, inside the polling thread
            if metric not in self.prom_metrics:
                message = "metric {0} is not supported".format(metric)
                logging.error(message)
                return message

            next_node = self.net.getNodeByName(vnf_switch)
            if not isinstance(next_node, OVSSwitch):
                logging.info("vnf: {0} is not connected to switch".format(vnf_name))
                return

            flow_metric = {
                'vnf_name': vnf_name,
                'vnf_interface': vnf_interface,
                'mon_port': mon_port,
                'previous_measurement': 0,
                'previous_monitor_time': 0,
                'switch_dpid': int(str(next_node.dpid), 16),
                'metric_key': metric,
                'cookie': cookie,
            }

            with self.monitor_flow_lock:
                self.flow_metrics.append(flow_metric)

            message = 'Started monitoring flow:{3} {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric, cookie)
            logging.info(message)
            return message

        except Exception as ex:
            logging.exception("setup_flow error.")
            return str(ex)

    def stop_flow(self, vnf_name, vnf_interface=None, metric=None, cookie=0):
        """Stop monitoring a flow counter that was installed with setup_flow.

        All four arguments must equal the values stored by ``setup_flow``
        (which stores the resolved interface and metric, never None).

        :return: a status message, or None when no such flow is monitored.
        """
        with self.monitor_flow_lock:
            for flow_dict in self.flow_metrics:
                if flow_dict['vnf_name'] == vnf_name and flow_dict['vnf_interface'] == vnf_interface \
                        and flow_dict['metric_key'] == metric and flow_dict['cookie'] == cookie:
                    break
            else:
                return None

            self.flow_metrics.remove(flow_dict)

            # gauges are keyed by label *strings* (stop_metric looks up the
            # literal 'None'), so the cookie has to be compared as text
            label_key = (vnf_name, vnf_interface, str(cookie))
            # the registry only holds the four gauges created in __init__
            for collector in self.prom_metrics.values():
                if label_key in collector._metrics:
                    collector.remove(*label_key)

            delete_from_gateway(self.pushgateway, job='sonemu-SDNcontroller')

        message = 'Stopped monitoring flow {3}: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric, cookie)
        logging.info(message)
        return message

    # first set some parameters, before measurement can start
    def setup_metric(self, vnf_name, vnf_interface=None, metric='tx_packets'):
        """Start monitoring one port counter on a VNF interface.

        :param vnf_name: name of the VNF.
        :param vnf_interface: interface of the VNF (first one when None).
        :param metric: one of the keys of ``self.prom_metrics``; None means
            ``'tx_packets'``.
        :return: a status or error message; None when the VNF has several
            neighbors, none, or is not attached to an OVSSwitch.
        """
        vnf_interface, found_switch, mon_port = self._find_switch_link(vnf_name, vnf_interface)
        if found_switch is None:
            message = "vnf interface {0}:{1} not found!".format(vnf_name,vnf_interface)
            logging.error(message)
            return message

        try:
            # default port direction to monitor
            if metric is None:
                metric = 'tx_packets'

            # an unknown metric would only fail later, inside the polling thread
            if metric not in self.prom_metrics:
                message = "metric {0} is not supported".format(metric)
                logging.error(message)
                return message

            vnf_switch = list(self.net.DCNetwork_graph.neighbors(str(vnf_name)))

            if len(vnf_switch) > 1:
                logging.info("vnf: {0} has multiple ports".format(vnf_name))
                return
            elif len(vnf_switch) == 0:
                logging.info("vnf: {0} is not connected".format(vnf_name))
                return

            next_node = self.net.getNodeByName(vnf_switch[0])
            if not isinstance(next_node, OVSSwitch):
                logging.info("vnf: {0} is not connected to switch".format(vnf_name))
                return

            network_metric = {
                'vnf_name': vnf_name,
                'vnf_interface': vnf_interface,
                'mon_port': mon_port,
                'previous_measurement': 0,
                'previous_monitor_time': 0,
                'switch_dpid': int(str(next_node.dpid), 16),
                'metric_key': metric,
            }

            with self.monitor_lock:
                self.network_metrics.append(network_metric)

            message = 'Started monitoring: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric)
            logging.info(message)
            return message

        except Exception as ex:
            logging.exception("setup_metric error.")
            return str(ex)

    def stop_metric(self, vnf_name, vnf_interface=None, metric=None):
        """Stop monitoring port counters installed with setup_metric.

        With both ``vnf_interface`` and ``metric`` left at None every port
        metric of the VNF is removed; otherwise only the entry matching all
        three values.

        :return: a status message, or None when nothing matched.
        """
        stop_all = vnf_interface is None and metric is None

        with self.monitor_lock:
            if stop_all:
                targets = [entry for entry in self.network_metrics
                           if entry['vnf_name'] == vnf_name]
            else:
                targets = [entry for entry in self.network_metrics
                           if entry['vnf_name'] == vnf_name
                           and entry['vnf_interface'] == vnf_interface
                           and entry['metric_key'] == metric][:1]

            if not targets:
                return None

            for entry in targets:
                self.network_metrics.remove(entry)

            # Unregistering a gauge would drop the complete metric with all of
            # its labels, so only the label sets of this vnf are removed.
            # The registry only holds the four gauges created in __init__.
            for collector in self.prom_metrics.values():
                if stop_all:
                    # iterate over a copy of the keys: remove() mutates _metrics
                    for name, interface, flow_id in list(collector._metrics):
                        # port metrics are stored under the flow_id label 'None';
                        # flow label sets belong to stop_flow
                        if name == vnf_name and flow_id == 'None':
                            logging.info('3 name:{0} labels:{1} metrics:{2}'.format(collector._name, collector._labelnames,
                                                                                   collector._metrics))
                            collector.remove(name, interface, 'None')
                else:
                    logging.info('{0}'.format(collector._metrics.values()))
                    if (vnf_name, vnf_interface, 'None') in collector._metrics:
                        logging.info('2 name:{0} labels:{1} metrics:{2}'.format(collector._name, collector._labelnames,
                                                                               collector._metrics))
                        collector.remove(vnf_name, vnf_interface, 'None')

            # 1 single monitor job for all metrics of the SDN controller:
            # only grouping keys defined when pushing can be deleted from the
            # pushgateway, not individual metric labels. Removing metrics
            # separately would need a separate grouping key, and probably a
            # different registry also.
            delete_from_gateway(self.pushgateway, job='sonemu-SDNcontroller')

        if stop_all:
            logging.info('Stopped monitoring vnf: {0}'.format(vnf_name))
            return 'Stopped monitoring: {0}'.format(vnf_name)

        message = 'Stopped monitoring: {2} on {0}:{1}'.format(vnf_name, vnf_interface, metric)
        logging.info(message)
        return message

    # get all metrics defined in the list and export it to Prometheus
    def get_flow_metrics(self):
        """Polling loop of the flow thread; runs until ``start_monitoring`` is False."""
        while self.start_monitoring:

            # 'with' guarantees the lock is released even if a query fails
            with self.monitor_flow_lock:
                for flow_dict in self.flow_metrics:
                    try:
                        data = {'cookie': flow_dict['cookie']}

                        if 'tx' in flow_dict['metric_key']:
                            data['match'] = {'in_port': flow_dict['mon_port']}
                        elif 'rx' in flow_dict['metric_key']:
                            data['out_port'] = flow_dict['mon_port']

                        # query Ryu
                        ret = self.net.ryu_REST('stats/flow', dpid=flow_dict['switch_dpid'], data=data)
                        flow_stat_dict = ast.literal_eval(ret)

                        logging.debug('received flow stat:{0} '.format(flow_stat_dict))
                        self.set_flow_metric(flow_dict, flow_stat_dict)
                    except Exception:
                        # one failing query must not end monitoring of all flows
                        logging.exception('flow monitoring error.')

            time.sleep(1)

    def get_network_metrics(self):
        """Polling loop of the port thread; runs until ``start_monitoring`` is False."""
        while self.start_monitoring:

            # 'with' guarantees the lock is released even if a query fails
            with self.monitor_lock:
                # group metrics by dpid to optimize the rest api calls
                dpid_set = set(metric_dict['switch_dpid'] for metric_dict in self.network_metrics)

                for dpid in dpid_set:
                    try:
                        # query Ryu
                        ret = self.net.ryu_REST('stats/port', dpid=dpid)
                        port_stat_dict = ast.literal_eval(ret)

                        metric_list = [metric_dict for metric_dict in self.network_metrics
                                       if int(metric_dict['switch_dpid']) == int(dpid)]

                        for metric_dict in metric_list:
                            self.set_network_metric(metric_dict, port_stat_dict)
                    except Exception:
                        # one failing switch must not end monitoring of all others
                        logging.exception('port monitoring error.')

            time.sleep(1)

    # add metric to the list to export to Prometheus, parse the Ryu port-stats reply
    def set_network_metric(self, metric_dict, port_stat_dict):
        """Export one port counter and update the entry's rate bookkeeping.

        :param metric_dict: an entry of ``self.network_metrics``.
        :param port_stat_dict: parsed Ryu port-stats reply, keyed by the dpid
            as a string.
        :return: the rate since the previous sample, None for the first sample
            (or after the port uptime went backwards), or an error message
            when the monitored port is not part of the reply.
        """
        # vnf tx is the datacenter switch rx and vice-versa
        metric_key = self.switch_tx_rx(metric_dict['metric_key'])
        switch_dpid = metric_dict['switch_dpid']
        vnf_name = metric_dict['vnf_name']
        vnf_interface = metric_dict['vnf_interface']
        previous_monitor_time = metric_dict['previous_monitor_time']
        mon_port = metric_dict['mon_port']

        for port_stat in port_stat_dict[str(switch_dpid)]:
            # compared as text so that a non-numeric port_no cannot raise
            # NOTE(review): Ryu may report reserved ports by name - confirm
            if str(port_stat['port_no']) != str(mon_port):
                continue

            port_uptime = port_stat['duration_sec'] + port_stat['duration_nsec'] * 10 ** (-9)
            this_measurement = int(port_stat[metric_key])

            # set prometheus metric
            self.prom_metrics[metric_dict['metric_key']].\
                labels({'vnf_name': vnf_name, 'vnf_interface': vnf_interface, 'flow_id': None}).\
                set(this_measurement)

            # 1 single monitor job for all metrics of the SDN controller
            pushadd_to_gateway(self.pushgateway, job='sonemu-SDNcontroller', registry=self.registry)

            # also the rate is calculated here, but not used for now
            # (rate can be easily queried from prometheus also)
            first_sample = previous_monitor_time <= 0 or previous_monitor_time >= port_uptime
            if first_sample:
                # A rate needs two samples. The lock is owned by the polling
                # loop that called us, so it must neither be released here nor
                # may that (endless) loop be re-entered.
                metric_rate = None
            else:
                time_delta = port_uptime - previous_monitor_time
                metric_rate = (this_measurement - metric_dict['previous_measurement']) / float(time_delta)

            metric_dict['previous_measurement'] = this_measurement
            metric_dict['previous_monitor_time'] = port_uptime
            return metric_rate

        message = 'metric {0} not found on {1}:{2}'.format(metric_key, vnf_name, vnf_interface)
        logging.error(message)
        return message

    def set_flow_metric(self, metric_dict, flow_stat_dict):
        """Export one flow counter to Prometheus.

        :param metric_dict: an entry of ``self.flow_metrics``.
        :param flow_stat_dict: parsed Ryu flow-stats reply, keyed by the dpid
            as a string.
        :return: None; nothing is exported when the reply holds no flow or the
            metric key names neither bytes nor packets.
        """
        metric_key = metric_dict['metric_key']
        switch_dpid = metric_dict['switch_dpid']
        vnf_name = metric_dict['vnf_name']
        vnf_interface = metric_dict['vnf_interface']
        cookie = metric_dict['cookie']

        flow_stats = flow_stat_dict.get(str(switch_dpid))
        if not flow_stats:
            logging.warning('no flow stats for flow {0} on {1}:{2}'.format(cookie, vnf_name, vnf_interface))
            return

        # TODO aggregate all found flow stats
        flow_stat = flow_stats[0]
        if 'bytes' in metric_key:
            counter = flow_stat['byte_count']
        elif 'packet' in metric_key:
            counter = flow_stat['packet_count']
        else:
            logging.error('flow metric {0} not supported on {1}:{2}'.format(metric_key, vnf_name, vnf_interface))
            return

        self.prom_metrics[metric_key]. \
            labels({'vnf_name': vnf_name, 'vnf_interface': vnf_interface, 'flow_id': cookie}). \
            set(counter)
        pushadd_to_gateway(self.pushgateway, job='sonemu-SDNcontroller', registry=self.registry)

    def start_Prometheus(self, port=9090):
        """Launch a Prometheus docker container and return its Popen handle.

        :param port: host port mapped to the container's port 9090.
        """
        # prometheus.yml configuration file is located in the same directory as this file
        here = os.path.dirname(os.path.abspath(__file__))
        cmd = ["docker",
               "run",
               "--rm",
               "-p", "{0}:9090".format(port),
               "-v", "{0}/prometheus.yml:/etc/prometheus/prometheus.yml".format(here),
               "-v", "{0}/profile.rules:/etc/prometheus/profile.rules".format(here),
               "--name", "prometheus",
               "prom/prometheus"
               ]
        logging.info('Start Prometheus container {0}'.format(cmd))
        return Popen(cmd)

    def start_PushGateway(self, port=9091):
        """Launch a detached pushgateway docker container and return the Popen handle.

        :param port: host port mapped to the container's port 9091.
        """
        cmd = ["docker",
               "run",
               "-d",
               "-p", "{0}:9091".format(port),
               "--name", "pushgateway",
               "prom/pushgateway"
               ]

        logging.info('Start Prometheus Push Gateway container {0}'.format(cmd))
        return Popen(cmd)

    def start_cadvisor(self, port=8090):
        """Launch a cAdvisor docker container and return its Popen handle.

        :param port: host port mapped to the container's port 8080.
        """
        cmd = ["docker",
               "run",
               "--rm",
               "--volume=/:/rootfs:ro",
               "--volume=/var/run:/var/run:rw",
               "--volume=/sys:/sys:ro",
               "--volume=/var/lib/docker/:/var/lib/docker:ro",
               "--publish={0}:8080".format(port),
               "--name=cadvisor",
               "google/cadvisor:latest"
               ]
        logging.info('Start cAdvisor container {0}'.format(cmd))
        return Popen(cmd)

    def stop(self):
        """Stop both polling threads and the cAdvisor container."""
        # stop the monitoring threads
        self.start_monitoring = False
        self.monitor_thread.join()
        self.monitor_flow_thread.join()

        # the Prometheus and pushgateway containers are started outside of
        # son-emu, so only cAdvisor is stopped here
        if self.cadvisor_process is not None:
            logging.info('stopping cadvisor container')
            self.cadvisor_process.terminate()
            self.cadvisor_process.kill()
            self._stop_container('cadvisor')

    def switch_tx_rx(self, metric=''):
        """Swap 'tx' and 'rx' in a metric name.

        When monitoring vnfs, the tx of the datacenter switch is actually the
        rx of the vnf, so the name is changed to be consistent with the vnf.

        :param metric: metric name such as ``'tx_packets'``.
        :return: the name with 'tx' replaced by 'rx', or else 'rx' by 'tx';
            unchanged when it contains neither.
        """
        if 'tx' in metric:
            metric = metric.replace('tx', 'rx')
        elif 'rx' in metric:
            metric = metric.replace('rx', 'tx')

        return metric

    def _stop_container(self, name):
        """Run ``docker stop`` and then ``docker rm`` for the named container, waiting for each."""
        for action in ("stop", "rm"):
            Popen(["docker", action, name]).wait()
|
| 533 |
|