2 # -*- coding: utf-8 -*-
4 from constants import TESTBED_ID
16 from nepi.util import server
17 from nepi.util import parallel
# Signals a node that never answered liveness checks; wait_provisioning
# raises it once its timeout is exceeded.
19 class UnresponsiveNodeError(RuntimeError):
# NOTE(review): the assignments that open these two mappings are not visible
# in this excerpt; the methods below read them as self.BASEFILTERS and
# self.TAGFILTERS.
24 # Map Node attribute to plcapi filter name
25 'hostname' : 'hostname',
29 # Map Node attribute to (<tag name>, <plcapi filter expression>)
30 # There are replacements that are applied with string formatting,
31 # so '%' has to be escaped as '%%'.
# The only replacement key used in the entries below is 'timeframe';
# find_candidates and fetch_node_info fill it in from self.timeframe.
# NOTE(review): the leading ']' / '[' in the filter expressions are presumably
# PLCAPI's ">=" / "<=" field modifiers -- confirm against the PLCAPI docs.
32 'architecture' : ('arch','value'),
33 'operatingSystem' : ('fcdistro','value'),
34 'pl_distro' : ('pldistro','value'),
35 'minReliability' : ('reliability%(timeframe)s', ']value'),
36 'maxReliability' : ('reliability%(timeframe)s', '[value'),
37 'minBandwidth' : ('bw%(timeframe)s', ']value'),
38 'maxBandwidth' : ('bw%(timeframe)s', '[value'),
# Files on the node used by the background dependency installer: the pid
# file that wait_dependencies polls and the log it reads back afterwards.
DEPENDS_PIDFILE = '/tmp/nepi-depends.pid'
DEPENDS_LOGFILE = '/tmp/nepi-depends.log'

# rpmfusion "free" repository release packages. install_dependencies picks
# the F12 package when operatingSystem is 'f12' and the generic one otherwise.
RPM_FUSION_URL = 'http://download1.rpmfusion.org/free/fedora/rpmfusion-free-release-stable.noarch.rpm'
RPM_FUSION_URL_F12 = 'http://download1.rpmfusion.org/free/fedora/releases/12/Everything/x86_64/os/rpmfusion-free-release-12-1.noarch.rpm'
# Sets up a node description with no selection criteria and no allocated
# host yet.
# NOTE(review): several lines of this method, including whatever is done
# with `api`, are not visible in this excerpt; other methods use self._api.
46 def __init__(self, api=None):
# Selection attributes: None means "no constraint" (applicable_filters
# and find_candidates only consider attributes that are not None).
53 self.architecture = None
54 self.operatingSystem = None
58 self.minReliability = None
59 self.maxReliability = None
60 self.minBandwidth = None
61 self.maxBandwidth = None
62 self.min_num_external_ifaces = None
63 self.max_num_external_ifaces = None
66 # Applications and routes add requirements to connected nodes
67 self.required_packages = set()
68 self.required_vsys = set()
# When true, install_dependencies installs the rpmfusion repository first.
70 self.rpmFusion = False
# Variable name -> list of values; every value is exported by
# _nepi_testbed_environment_setup.
71 self.env = collections.defaultdict(list)
73 # Testbed-derived attributes
75 self.ident_path = None
76 self.server_key = None
79 # Those are filled when an actual node is allocated
def _nepi_testbed_environment_setup(self):
    """
    Build the shell snippet that prepares the remote environment.

    Every entry of self.pythonpath (taken relative to ${HOME} and
    shell-escaped) is appended to both PYTHONPATH and PATH. After that,
    each value listed in self.env is exported under its variable name,
    in order; the values are emitted verbatim, without escaping.

    Returns the commands as one string, separated by ' ; '.
    """
    # PYTHONPATH and PATH receive the same entries, so build them once.
    extra_path = ':'.join(
        ["${HOME}/" + server.shell_escape(entry) for entry in self.pythonpath])

    pieces = [
        'export PYTHONPATH=$PYTHONPATH:%s' % (extra_path,),
        ' ; export PATH=$PATH:%s' % (extra_path,),
    ]
    for envkey, envvals in self.env.items():
        for envval in envvals:
            pieces.append(' ; export %s=%s' % (envkey, envval))

    # Joining a list, rather than writing into a cStringIO buffer, also
    # copes with non-ASCII unicode values.
    return ''.join(pieces)
def build_filters(self, target_filters, filter_map):
    """
    Copy this node's defined attributes into a filter dictionary.

    For every attribute name in `filter_map` whose value on this object
    is not None, stores that value in `target_filters` under the filter
    name that `filter_map` associates with the attribute.

    `target_filters` is modified in place and also returned.
    """
    for attr_name in filter_map:
        attr_value = getattr(self, attr_name, None)
        if attr_value is None:
            # unset or missing attribute: contributes no filter
            continue
        target_filters[filter_map[attr_name]] = attr_value
    return target_filters
# Collects the names of the BASEFILTERS / TAGFILTERS attributes that are
# currently set (not None) on this node.
# NOTE(review): callers read this without calling it (see find_candidates),
# so it is presumably a property; the decorator and the expression that
# wraps the two filter() results are not visible in this excerpt.
# The `+` between the filter() results relies on Python 2, where filter()
# returns a list.
105 def applicable_filters(self):
106 has = lambda att : getattr(self,att,None) is not None
108 filter(has, self.BASEFILTERS.iterkeys())
109 + filter(has, self.TAGFILTERS.iterkeys())
# Queries the PLC API for nodes matching this node's filters and narrows the
# set of candidate node ids step by step: base filters, per-tag filters,
# vsys tags, interface count and finally hostname resolution.
# filter_slice_id: added to the base filters under the '|slice_ids' key.
# NOTE(review): several lines of this method (including its return) are not
# visible in this excerpt; the comments describe only the visible lines.
112 def find_candidates(self, filter_slice_id=None):
113 print >>sys.stderr, "Finding candidates for", self.make_filter_description()
115 fields = ('node_id',)
116 replacements = {'timeframe':self.timeframe}
118 # get initial candidates (no tag filters)
119 basefilters = self.build_filters({}, self.BASEFILTERS)
# rootfilters keeps the plain attribute filters, taken before the slice and
# health restrictions below are added to basefilters
120 rootfilters = basefilters.copy()
122 basefilters['|slice_ids'] = (filter_slice_id,)
124 # only pick healthy nodes
125 basefilters['run_level'] = 'boot'
126 basefilters['boot_state'] = 'boot'
127 basefilters['node_type'] = 'regular' # nepi can only handle regular nodes (for now)
128 basefilters['>last_contact'] = int(time.time()) - 5*3600 # allow 5h out of contact, for timezone discrepancies
130 # keyword-only "pseudofilters"
133 extra['peer'] = self.site
135 candidates = set(map(operator.itemgetter('node_id'),
136 self._api.GetNodes(filters=basefilters, fields=fields, **extra)))
138 # filter by tag, one tag at a time
139 applicable = self.applicable_filters
140 for tagfilter in self.TAGFILTERS.iteritems():
141 attr, (tagname, expr) = tagfilter
143 # don't bother if there's no filter defined
144 if attr in applicable:
# the loop variable is reused here to hold the query for this tag
145 tagfilter = rootfilters.copy()
146 tagfilter['tagname'] = tagname % replacements
147 tagfilter[expr % replacements] = getattr(self,attr)
148 tagfilter['node_id'] = list(candidates)
# keep only the nodes that are still candidates and also match this tag
150 candidates &= set(map(operator.itemgetter('node_id'),
151 self._api.GetNodeTags(filters=tagfilter, fields=fields)))
153 # filter by vsys tags - special case since it doesn't follow
154 # the usual semantics
155 if self.required_vsys:
# maps each vsys tag value to the set of node ids that carry it
156 newcandidates = collections.defaultdict(set)
158 vsys_tags = self._api.GetNodeTags(
160 node_id = list(candidates),
161 fields = ['node_id','value'])
# NOTE(review): itemgetter receives a single list argument here, while the
# other calls in this method pass the keys as separate arguments -- confirm
# that this is intended.
164 operator.itemgetter(['node_id','value']),
167 required_vsys = self.required_vsys
168 for node_id, value in vsys_tags:
169 if value in required_vsys:
170 newcandidates[value].add(node_id)
172 # take only those that have all the required vsys tags
173 newcandidates = reduce(
174 lambda accum, new : accum & new,
175 newcandidates.itervalues(),
178 # filter by iface count
179 if self.min_num_external_ifaces is not None or self.max_num_external_ifaces is not None:
180 # fetch interfaces for all, in one go
181 filters = basefilters.copy()
182 filters['node_id'] = list(candidates)
# NOTE(review): the call below passes basefilters, not the `filters` copy
# built just above with the node_id restriction -- looks unintended; confirm.
183 ifaces = dict(map(operator.itemgetter('node_id','interface_ids'),
184 self._api.GetNodes(filters=basefilters, fields=('node_id','interface_ids')) ))
186 # filter candidates by interface count
# nodes missing from `ifaces` count as having zero interfaces
187 if self.min_num_external_ifaces is not None and self.max_num_external_ifaces is not None:
188 predicate = ( lambda node_id :
189 self.min_num_external_ifaces <= len(ifaces.get(node_id,())) <= self.max_num_external_ifaces )
190 elif self.min_num_external_ifaces is not None:
191 predicate = ( lambda node_id :
192 self.min_num_external_ifaces <= len(ifaces.get(node_id,())) )
194 predicate = ( lambda node_id :
195 len(ifaces.get(node_id,())) <= self.max_num_external_ifaces )
197 candidates = set(filter(predicate, candidates))
199 # make sure hostnames are resolvable
201 print >>sys.stderr, " Found", len(candidates), "candidates. Checking for reachability..."
203 hostnames = dict(map(operator.itemgetter('node_id','hostname'),
204 self._api.GetNodes(list(candidates), ['node_id','hostname'])
# "reachable" here means the hostname resolves (socket.gethostbyname)
206 def resolvable(node_id):
208 addr = socket.gethostbyname(hostnames[node_id])
209 return addr is not None
212 candidates = set(parallel.pfilter(resolvable, candidates,
215 print >>sys.stderr, " Found", len(candidates), "reachable candidates."
# Builds a one-line "name: value; name: value" summary of the filters that
# are currently active; find_candidates prints it to stderr.
# NOTE(review): some lines of this method are not visible in this excerpt.
219 def make_filter_description(self):
221 Makes a human-readable description of filtering conditions
225 # start from the plain attribute filters (no tag filters)
226 filters = self.build_filters({}, self.BASEFILTERS)
228 # keyword-only "pseudofilters"
230 filters['peer'] = self.site
232 # filter by tag, one tag at a time
233 applicable = self.applicable_filters
234 for tagfilter in self.TAGFILTERS.iteritems():
235 attr, (tagname, expr) = tagfilter
237 # don't bother if there's no filter defined
238 if attr in applicable:
# described under the attribute name, not under the PLC tag name
239 filters[attr] = getattr(self,attr)
241 # filter by vsys tags - special case since it doesn't follow
242 # the usual semantics
243 if self.required_vsys:
244 filters['vsys'] = ','.join(list(self.required_vsys))
246 # filter by iface count
247 if self.min_num_external_ifaces is not None or self.max_num_external_ifaces is not None:
248 filters['num_ifaces'] = '-'.join([
# an unset (None) bound is shown as '0' / 'inf'
# NOTE(review): because of the `or`, a maximum of 0 is also shown as 'inf'
249 str(self.min_num_external_ifaces or '0'),
250 str(self.max_num_external_ifaces or 'inf')
# '%s: %s'.__mod__ formats each (name, value) pair
253 return '; '.join(map('%s: %s'.__mod__,filters.iteritems()))
def assign_node_id(self, node_id):
    """
    Bind this object to a concrete node and load that node's details.

    Stores `node_id` in self._node_id and then calls fetch_node_info().
    """
    self._node_id = node_id
    self.fetch_node_info()
# Reverts the attribute changes made by fetch_node_info, using the values it
# saved in self.__orig_attrs.
# NOTE(review): one line of this method is not visible in this excerpt.
259 def unassign_node(self):
261 self.__dict__.update(self.__orig_attrs)
# Loads the assigned node's record and tags from the PLC API and overwrites
# this object's filter attributes with the node's values. The previous
# values are collected in orig_attrs, stored as self.__orig_attrs at the end
# so that unassign_node can restore them.
# NOTE(review): some lines (e.g. where orig_attrs is created and where
# `value` is computed inside the two loops) are not visible in this excerpt.
263 def fetch_node_info(self):
266 info = self._api.GetNodes(self._node_id)[0]
# tag name -> tag value for this node
267 tags = dict( (t['tagname'],t['value'])
268 for t in self._api.GetNodeTags(node_id=self._node_id, fields=('tagname','value')) )
# the interface bounds are cleared here and set again from the node record
# further down, when it lists its interfaces
270 orig_attrs['min_num_external_ifaces'] = self.min_num_external_ifaces
271 orig_attrs['max_num_external_ifaces'] = self.max_num_external_ifaces
272 self.min_num_external_ifaces = None
273 self.max_num_external_ifaces = None
276 replacements = {'timeframe':self.timeframe}
277 for attr, tag in self.BASEFILTERS.iteritems():
280 if hasattr(self, attr):
281 orig_attrs[attr] = getattr(self, attr)
282 setattr(self, attr, value)
283 for attr, (tag,_) in self.TAGFILTERS.iteritems():
# expand the %(timeframe)s placeholder in the tag name
284 tag = tag % replacements
287 if hasattr(self, attr):
288 orig_attrs[attr] = getattr(self, attr)
289 setattr(self, attr, value)
291 if 'peer_id' in info:
292 orig_attrs['site'] = self.site
293 self.site = self._api.peer_map[info['peer_id']]
# an allocated node has a definite interface count, so min and max coincide
295 if 'interface_ids' in info:
296 self.min_num_external_ifaces = \
297 self.max_num_external_ifaces = len(info['interface_ids'])
299 if 'ssh_rsa_key' in info:
300 orig_attrs['server_key'] = self.server_key
301 self.server_key = info['ssh_rsa_key']
303 self.__orig_attrs = orig_attrs
306 if self.home_path is None:
307 raise AssertionError, "Misconfigured node: missing home path"
308 if self.ident_path is None or not os.access(self.ident_path, os.R_OK):
309 raise AssertionError, "Misconfigured node: missing slice SSH key"
310 if self.slicename is None:
311 raise AssertionError, "Misconfigured node: unspecified slice"
# Starts a `yum -y install` of self.required_packages on the node through
# rspawn.remote_spawn, optionally preceded by installing the rpmfusion
# repository package. Does nothing when no packages are required.
# Raises RuntimeError ("Failed to set up application: ...").
# NOTE(review): several lines, including the condition guarding that raise,
# are not visible in this excerpt.
313 def install_dependencies(self):
314 if self.required_packages:
315 # TODO: make dependent on the experiment somehow...
316 pidfile = self.DEPENDS_PIDFILE
317 logfile = self.DEPENDS_LOGFILE
319 # If we need rpmfusion, we must install the repo definition and the gpg keys
321 if self.operatingSystem == 'f12':
322 # Fedora 12 requires a different rpmfusion package
323 RPM_FUSION_URL = self.RPM_FUSION_URL_F12
325 # This one works for f13+
326 RPM_FUSION_URL = self.RPM_FUSION_URL
# `rpm -i` only runs when `rpm -q` reports that the package named by the URL
# is not installed yet; the trailing && chains into the yum command below
329 '( rpm -q $(rpm -q -p %(RPM_FUSION_URL)s) || rpm -i %(RPM_FUSION_URL)s ) &&'
331 'RPM_FUSION_URL' : RPM_FUSION_URL
336 # Start process in a "daemonized" way, using nohup and heavy
337 # stdin/out redirection to avoid connection issues
338 (out,err),proc = rspawn.remote_spawn(
# the command finishes by echoing SUCCESS or FAILURE; wait_dependencies
# looks for SUCCESS on the last line of the log
339 "( %(rpmfusion)s yum -y install %(packages)s && echo SUCCESS || echo FAILURE )" % {
340 'packages' : ' '.join(self.required_packages),
341 'rpmfusion' : rpmFusion,
345 stderr = rspawn.STDOUT,
347 host = self.hostname,
349 user = self.slicename,
351 ident_key = self.ident_path,
352 server_key = self.server_key,
357 raise RuntimeError, "Failed to set up application: %s %s" % (out,err,)
# Polls is_alive() until the node responds, sleeping between attempts with a
# delay that grows by a factor of 1.5 up to 30 seconds.
# timeout: total slept time (in seconds, as passed to time.sleep) after which
#          UnresponsiveNodeError is raised; defaults to 20*60.
# NOTE(review): the initial values of sleeptime / totaltime are on lines that
# are not visible in this excerpt.
359 def wait_provisioning(self, timeout = 20*60):
360 # recently provisioned nodes may not be up yet
363 while not self.is_alive():
364 time.sleep(sleeptime)
365 totaltime += sleeptime
366 sleeptime = min(30.0, sleeptime*1.5)
368 if totaltime > timeout:
369 # PlanetLab has a 15' delay on configuration propagation
370 # If we're above that delay, the unresponsiveness is not due
372 raise UnresponsiveNodeError, "Unresponsive host %s" % (self.hostname,)
# Waits for the installer started by install_dependencies to finish and then
# checks its log for success. Does nothing when no packages are required.
# pidmax:   number of attempts made to obtain the installer's pid
# probe:    starting value of the polling interval used while the installer
#           runs; it is multiplied by 1.5 on each round
# probemax: upper bound for that interval
# pidprobe: NOTE(review) its use is not visible in this excerpt
# Raises RuntimeError with one of three messages: the pidfile could not be
# obtained, "Failed to install dependencies: ..." or the build log variant
# raised when the log's last line is not SUCCESS.
# NOTE(review): the conditions guarding the raises are on lines that are not
# visible in this excerpt.
374 def wait_dependencies(self, pidprobe=1, probe=0.5, pidmax=10, probemax=10):
375 if self.required_packages:
376 pidfile = self.DEPENDS_PIDFILE
380 for probenum in xrange(pidmax):
381 pidtuple = rspawn.remote_check_pid(
383 host = self.hostname,
385 user = self.slicename,
387 ident_key = self.ident_path,
388 server_key = self.server_key
396 raise RuntimeError, "Failed to obtain pidfile for dependency installer"
398 # wait for it to finish
399 while rspawn.RUNNING is rspawn.remote_status(
401 host = self.hostname,
403 user = self.slicename,
405 ident_key = self.ident_path,
406 server_key = self.server_key
409 probe = min(probemax, 1.5*probe)
# fetch the installer's log from the node
412 logfile = self.DEPENDS_LOGFILE
414 (out,err),proc = server.popen_ssh_command(
415 "cat %s" % (server.shell_escape(logfile),),
416 host = self.hostname,
418 user = self.slicename,
420 ident_key = self.ident_path,
421 server_key = self.server_key
425 raise RuntimeError, "Failed to install dependencies: %s %s" % (out,err,)
# the install command echoes SUCCESS or FAILURE last, so only the final
# line of the log is compared
427 success = out.strip().rsplit('\n',1)[-1].strip() == 'SUCCESS'
429 raise RuntimeError, "Failed to install dependencies - buildlog:\n%s\n%s" % (out,err,)
432 # Make sure all the paths are created where
433 # they have to be created for deployment
434 (out,err),proc = server.eintr_retry(server.popen_ssh_command)(
436 host = self.hostname,
438 user = self.slicename,
440 ident_key = self.ident_path,
441 server_key = self.server_key
446 elif not err and out.strip() == 'ALIVE':
# Turns `routes` into "add ..." rules and feeds them to /vsys/vroute.in on
# the node over SSH.
# routes: iterable of (dest, prefix, nexthop, metric) tuples
# devs:   candidate devices; a route is matched to a device through
#         dev.routes_here(route)
# Raises RuntimeError when a route cannot be bound to any device, or when the
# remote command exits non-zero or produces anything on stderr.
# NOTE(review): several lines of this method (e.g. the loops and the creation
# of `rules`) are not visible in this excerpt.
452 def configure_routes(self, routes, devs):
454 Add the specified routes to the node's routing table
460 if dev.routes_here(route):
462 dest, prefix, nexthop, metric = route
464 "add %s%s gw %s %s" % (
# the "/prefix" suffix is left out for an empty/zero prefix and for /32
466 (("/%d" % (prefix,)) if prefix and prefix != 32 else ""),
475 raise RuntimeError, "Route %s cannot be bound to any virtual interface " \
476 "- PL can only handle rules over virtual interfaces. Candidates are: %s" % (route,devs)
478 print >>sys.stderr, "Setting up routes for", self.hostname
# /vsys/vroute.out is copied to stderr in the background, so anything it
# emits ends up in `err` and triggers the failure check below
480 (out,err),proc = server.popen_ssh_command(
# NOTE(review): the command string has no %(home)s placeholder, so the
# `home` value passed to the % operator is unused
481 "( sudo -S bash -c 'cat /vsys/vroute.out >&2' & ) ; sudo -S bash -c 'cat > /vsys/vroute.in' ; sleep 0.1" % dict(
482 home = server.shell_escape(self.home_path)),
483 host = self.hostname,
485 user = self.slicename,
487 ident_key = self.ident_path,
488 server_key = self.server_key,
# the rules are sent on stdin, one per line
489 stdin = '\n'.join(rules)
492 if proc.wait() or err:
493 raise RuntimeError, "Could not set routes (%s) errors: %s%s" % (rules,out,err)