blob: 3f76df9c4779efd954e81603bd91a3468af7369d [file] [log] [blame]
peustermcbcd4c22015-12-28 11:33:42 +01001"""
2Distributed Cloud Emulator (dcemulator)
3(c) 2015 by Manuel Peuster <manuel.peuster@upb.de>
4"""
peusterm7aae6852016-01-12 14:53:18 +01005from mininet.node import Docker
peustermea8db832016-03-08 10:25:58 +01006from mininet.link import Link
peustermcbcd4c22015-12-28 11:33:42 +01007import logging
peusterm60bf8b82016-04-06 14:12:35 +02008import time
9import json
peustermcbcd4c22015-12-28 11:33:42 +010010
# Module-wide logger used by the classes in this file.
LOG = logging.getLogger("dcemulator")
# NOTE: the logger level is forced to DEBUG as soon as this module is imported.
LOG.setLevel(logging.DEBUG)


# Start of switch dpid's used for data center switches. This value is
# incremented (as a module global) every time a data center requests a
# new dpid for its switch.
DCDPID_BASE = 1000
16
17
class EmulatorCompute(Docker):
    """
    Emulator specific compute node class.

    Inherits from Dockernet's Docker host class and represents a single
    container connected to a (logical) data center.
    Emulator specific helper functions can be added to it.
    """

    def __init__(
            self, name, dimage, **kwargs):
        """
        Remember emulator specific attributes and initialize the Docker host.

        :param name: name of the compute instance
        :param dimage: image argument handed to Docker.__init__
        :param kwargs: forwarded unchanged to Docker.__init__; the values
                       of "datacenter" and "flavor_name" are additionally
                       stored on this object (None if not given)
        """
        self.datacenter = kwargs.get("datacenter")  # pointer to current DC
        self.flavor_name = kwargs.get("flavor_name")
        LOG.debug("Starting compute instance %r in data center %r",
                  name, str(self.datacenter))
        # call original Docker.__init__
        Docker.__init__(self, name, dimage, **kwargs)

    def getNetworkStatus(self):
        """
        Helper method to receive information about the virtual networks
        this compute instance is connected to.

        :return: list of tuples (name, IP, MAC, isUp, status), one tuple
                 per interface returned by self.intfList()
        """
        return [(str(intf), intf.IP(), intf.MAC(), intf.isUp(), intf.status())
                for intf in self.intfList()]

    def getStatus(self):
        """
        Helper method to receive information about this compute instance.

        :return: dict with name, network status, image, resource limit
                 attributes, container state/id and the label of the
                 assigned data center (None if there is no data center)
        """
        status = {}
        status["name"] = self.name
        status["network"] = self.getNetworkStatus()
        status["image"] = self.dimage
        status["cpu_quota"] = self.cpu_quota
        status["cpu_period"] = self.cpu_period
        status["cpu_shares"] = self.cpu_shares
        status["cpuset"] = self.cpuset
        status["mem_limit"] = self.mem_limit
        status["memswap_limit"] = self.memswap_limit
        # Inspect the container only once: this saves a second API call and
        # guarantees that "state" and "id" stem from the same snapshot.
        # NOTE(review): self.dcli / self.dc are presumably the Docker client
        # and container handle provided by the Docker base class - confirm.
        container_info = self.dcli.inspect_container(self.dc)
        status["state"] = container_info["State"]
        status["id"] = container_info["Id"]
        status["datacenter"] = (None if self.datacenter is None
                                else self.datacenter.label)
        return status
peusterm7aae6852016-01-12 14:53:18 +010063
64
class Datacenter(object):
    """
    Represents a logical data center to which compute resources
    (Docker containers) can be added at runtime.

    Will also implement resource bookkeeping in later versions.
    """

    # used to generate the short internal names ("dc1", "dc2", ...)
    DC_COUNTER = 1

    def __init__(self, label, metadata=None, resource_log_path=None):
        """
        :param label: user defined name (can be longer than the internal name)
        :param metadata: dict to store arbitrary metadata
                         (e.g. latitude and longitude); a new empty dict is
                         created for each data center if omitted
        :param resource_log_path: path to which resource information should
                                  be logged (e.g. for experiments).
                                  None = no logging
        """
        self.net = None  # DCNetwork to which we belong
        # each node (DC) has a short internal name used by Mininet
        # this is caused by Mininets naming limitations for switches etc.
        self.name = "dc%d" % Datacenter.DC_COUNTER
        Datacenter.DC_COUNTER += 1
        # use this for user defined names that can be longer than self.name
        self.label = label
        # Never share one default dict between instances: a mutable default
        # argument would make metadata changes of one DC visible in all DCs.
        self.metadata = {} if metadata is None else metadata
        self.resource_log_path = resource_log_path
        # first prototype assumes one "bigswitch" per DC
        self.switch = None
        # keep track of running containers
        self.containers = {}
        # pointer to assigned resource model
        self._resource_model = None

    def __repr__(self):
        return self.label

    def _get_next_dc_dpid(self):
        """
        Increment the module-wide dpid counter and return the new value.
        """
        global DCDPID_BASE
        DCDPID_BASE += 1
        return DCDPID_BASE

    def _log_resource_event(self, action, name, flavor_name,
                            cpu_limit, mem_limit, disk_limit, container=None):
        """
        Append one JSON encoded line describing a resource event to the
        resource log. Does nothing if no resource_log_path is configured.

        :param action: action string written to the log entry
        :param name: name of the affected container
        :param flavor_name: flavor name written to the log entry
        :param cpu_limit: cpu limit written to the log entry
        :param mem_limit: memory limit written to the log entry
        :param disk_limit: disk limit written to the log entry
        :param container: if given, its getStatus() result is stored
                          under the key "compute"
        """
        if self.resource_log_path is None:
            return
        # The entry is built after the check above so that the status
        # queries below are only executed if logging is enabled.
        entry = dict()
        entry["t"] = time.time()
        entry["name"] = name
        if container is not None:
            entry["compute"] = container.getStatus()
        entry["flavor_name"] = flavor_name
        entry["action"] = action
        entry["cpu_limit"] = cpu_limit
        entry["mem_limit"] = mem_limit
        entry["disk_limit"] = disk_limit
        entry["rm_state"] = (None if self._resource_model is None
                             else self._resource_model.get_state_dict())
        # append to logfile
        with open(self.resource_log_path, "a") as f:
            f.write("%s\n" % json.dumps(entry))

    def create(self):
        """
        Each data center is represented by a single switch to which
        compute resources can be connected at run time.

        TODO: This will be changed in the future to support multiple networks
        per data center
        """
        self.switch = self.net.addSwitch(
            "%s.s1" % self.name, dpid=hex(self._get_next_dc_dpid())[2:])
        LOG.debug("created data center switch: %s", str(self.switch))

    def start(self):
        pass

    def startCompute(self, name, image=None, command=None, network=None, flavor_name="tiny"):
        """
        Create a new container as compute resource and connect it to this
        data center.
        :param name: name (string)
        :param image: image name (string), defaults to "ubuntu"
        :param command: command (string)
        :param network: networks list({"ip": "10.0.0.254/8"}, {"ip": "11.0.0.254/24"})
                        or a single network dict; the given object is not modified
        :param flavor_name: name of the flavor for this compute container
        :return: the object returned by self.net.addDocker
        :raises Exception: if a container with the given name already exists
        """
        assert name is not None
        # no duplications
        if any(c.name == name for c in self.net.getAllContainers()):
            raise Exception("Container with name %s already exists." % name)
        # set default parameter
        if image is None:
            image = "ubuntu"
        if network is None:
            network = {}  # {"ip": "10.0.0.254/8"}
        if isinstance(network, dict):
            network = [network]  # if we have only one network, put it in a list
        if isinstance(network, list) and len(network) < 1:
            # at least one (default) network; rebind instead of appending
            # so that the list object of the caller is left untouched
            network = [{}]

        # allocate in resource model and compute resource limits for new container
        cpu_limit = mem_limit = disk_limit = -1
        cpu_period = cpu_quota = None
        if self._resource_model is not None:
            # call allocate in resource model to calculate resource limit for this container
            (cpu_limit, mem_limit, disk_limit) = alloc = self._resource_model.allocate(name, flavor_name)
            LOG.debug("Allocation result: %r", str(alloc))
            # check if we have a cpu_limit given by the used resource model
            if cpu_limit > 0:
                # calculate cpu period and quota for CFS
                # (see: https://www.kernel.org/doc/Documentation/scheduler/sched-bwc.txt)
                # TODO consider multi core machines etc! non trivial!
                # Attention minimum cpu_quota is 1ms (micro)
                cpu_period = 100000  # lets consider a fixed period of 100000 microseconds for now
                cpu_quota = cpu_period * cpu_limit  # calculate the fraction of cpu time for this container
                LOG.debug(
                    "CPU limit: cpu_quota = cpu_period * cpu_limit = %f * %f = %f",
                    cpu_period, cpu_limit, cpu_quota)
                # ATTENTION >= 1000 to avoid a invalid argument system error ... no idea why
                if cpu_quota < 1000:
                    cpu_quota = 1000
                    LOG.warning("Increased CPU quota for %r to avoid system error.", name)
            # check if we have a mem_limit given by the used resource model
            if mem_limit > 0:
                LOG.debug("MEM limit: mem_limit = %f MB", mem_limit)
                # ATTENTION minimum mem_limit per container is 4MB
                if mem_limit < 4:
                    mem_limit = 4
                    LOG.warning("Increased MEM limit for %r because it was less than 4.0 MB.", name)
        # create the container
        d = self.net.addDocker(
            "%s" % (name),
            dimage=image,
            dcmd=command,
            datacenter=self,
            flavor_name=flavor_name,
            cpu_period=int(cpu_period) if cpu_limit > 0 else None,  # set cpu limits if needed
            cpu_quota=int(cpu_quota) if cpu_limit > 0 else None,
            mem_limit="%dm" % int(mem_limit) if mem_limit > 0 else None,  # set mem limits if needed
            memswap_limit="%dm" % int(mem_limit) if mem_limit > 0 else None  # lets set swap to mem limit for now
        )
        # connect all given networks
        for nw in network:
            # TODO we cannot use TCLink here (see: https://github.com/mpeuster/dockernet/issues/3)
            self.net.addLink(d, self.switch, params1=nw, cls=Link)
        # do bookkeeping
        self.containers[name] = d

        # write resource log if a path is given
        self._log_resource_event(
            "allocate", name, flavor_name,
            cpu_limit, mem_limit, disk_limit, container=d)
        return d  # we might use UUIDs for naming later on

    def stopCompute(self, name):
        """
        Stop and remove a container from this data center.
        :param name: name of the container (string)
        :return: True
        :raises Exception: if no container with the given name is known
        """
        assert name is not None
        if name not in self.containers:
            raise Exception("Container with name %s not found." % name)
        LOG.debug("Stopping compute instance %r in data center %r", name, str(self))
        self.net.removeLink(
            link=None, node1=self.containers[name], node2=self.switch)
        self.net.removeDocker("%s" % (name))
        del self.containers[name]
        # call resource model and free resources
        if self._resource_model is not None:
            self._resource_model.free(name)

        # write resource log if a path is given
        self._log_resource_event("free", name, None, -1, -1, -1)
        return True

    def listCompute(self):
        """
        Return a list of all running containers assigned to this
        data center.
        """
        # values() instead of itervalues(): available in Python 2 and 3
        return list(self.containers.values())

    def getStatus(self):
        """
        Return a dict with status information about this DC.
        """
        return {
            "label": self.label,
            "internalname": self.name,
            "switch": self.switch.name,
            "n_running_containers": len(self.containers),
            "metadata": self.metadata
        }

    def assignResourceModel(self, rm):
        """
        Assign a resource model to this DC.
        :param rm: a BaseResourceModel object
        :return:
        :raises Exception: if a resource model was already assigned
        """
        if self._resource_model is not None:
            raise Exception("There is already an resource model assigned to this DC.")
        self._resource_model = rm
        self.net.rm_registrar.register(self, rm)
        LOG.info("Assigned RM: %r to DC: %r", rm, self)
peusterm3444ae42016-03-16 20:46:41 +0100269 LOG.info("Assigned RM: %r to DC: %r" % (rm, self))
peusterm42f08be2016-03-10 21:56:34 +0100270