2 # -*- coding: utf-8 -*-
4 from nepi.core.attributes import Attribute, AttributesMap
5 from nepi.util import validation
6 from nepi.util.constants import ApplicationStatus as AS, TestbedStatus as TS, TIME_NOW, DeploymentConfiguration as DC
7 from nepi.util.parser._xml import XmlExperimentParser
# Matches a netref placeholder of the form  {#[<label>]<expr>#}  where
# <expr> is an optional component selector (".addr[N]", ".route[N]" or
# ".trace[ID]") followed by one character and "[<attribute>]".
# Named groups: label, expr, component, attribute.
# NOTE(review): the separator in front of "[<attribute>]" is an unescaped "."
# (matches any character) - presumably a literal dot was intended; confirm
# before tightening, since existing experiment files may rely on it.
ATTRIBUTE_PATTERN_BASE = re.compile(r"\{#\[(?P<label>[-a-zA-Z0-9._]*)\](?P<expr>(?P<component>\.addr\[[0-9]+\]|\.route\[[0-9]+\]|\.trace\[[-a-zA-Z0-9._]+\])?.\[(?P<attribute>[-a-zA-Z0-9._]*)\])#}")
# %-template used to rewrite a netref so that it points at a guid label;
# expects the keys "guid" and "expr".
ATTRIBUTE_PATTERN_GUID_SUB = r"{#[%(guid)s]%(expr)s#}"
# Splits a compound component into kind and index, eg: 'addr[0]' -> ('addr', '0').
COMPONENT_PATTERN = re.compile(r"(?P<kind>[a-z]*)\[(?P<index>.*)\]")
23 def _undefer(deferred):
24 if hasattr(deferred, '_get'):
25 return deferred._get()
30 class TestbedController(object):
31 def __init__(self, testbed_id, testbed_version):
32 self._testbed_id = testbed_id
33 self._testbed_version = testbed_version
37 return self._testbed_id
40 def testbed_version(self):
41 return self._testbed_version
45 raise NotImplementedError
def defer_configure(self, name, value):
    """Instruct setting a configuration attribute for the testbed instance.

    Interface stub: concrete testbed controllers must override it.

    Args:
        name: name of the configuration attribute.
        value: value to assign to it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_create(self, guid, factory_id):
    """Instruct the creation of an element.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the element to create.
        factory_id: identifier of the factory used to create it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_create_set(self, guid, name, value):
    """Instruct setting an initial attribute on an element.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the element.
        name: attribute name.
        value: initial attribute value.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_factory_set(self, guid, name, value):
    """Instruct setting an attribute on a factory.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid the factory attribute is set for.
        name: attribute name.
        value: attribute value.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_connect(self, guid1, connector_type_name1, guid2,
        connector_type_name2):
    """Instruct the creation of a connection between the given connectors.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid1: guid of the first element.
        connector_type_name1: connector type name on the first element.
        guid2: guid of the second element.
        connector_type_name2: connector type name on the second element.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_cross_connect(self,
        guid, connector_type_name,
        cross_guid, cross_testbed_guid,
        cross_testbed_id, cross_factory_id,
        cross_connector_type_name):
    """Instruct the creation of a connection between the given connectors
    of different testbed instances.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the local element.
        connector_type_name: connector type name on the local element.
        cross_guid: guid of the element in the other testbed.
        cross_testbed_guid: guid of the other testbed.
        cross_testbed_id: testbed id of the other testbed.
        cross_factory_id: factory id of the remote element.
        cross_connector_type_name: connector type name on the remote element.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_add_trace(self, guid, trace_id):
    """Instruct the addition of a trace.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the element the trace is added to.
        trace_id: identifier of the trace.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_add_address(self, guid, address, netprefix, broadcast):
    """Instruct the addition of an address.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the element the address is added to.
        address: the address itself.
        netprefix: network prefix of the address.
        broadcast: broadcast value of the address.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def defer_add_route(self, guid, destination, netprefix, nexthop, metric=0):
    """Instruct the addition of a route.

    Interface stub: concrete testbed controllers must override it.

    Args:
        guid: guid of the element the route is added to.
        destination: route destination.
        netprefix: network prefix of the destination.
        nexthop: next hop of the route.
        metric: route metric; defaults to 0.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
92 """After do_setup the testbed initial configuration is done"""
93 raise NotImplementedError
97 After do_create all instructed elements are created and
100 raise NotImplementedError
def do_connect_init(self):
    """Life-cycle hook for the internal connections between testbed elements.

    Interface stub: concrete testbed controllers must override it.
    NOTE(review): presumably this only *initiates* the internal
    connections, with do_connect_compl completing them - confirm against
    a concrete controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_connect_compl(self):
    """Life-cycle hook for the internal connections between testbed elements.

    Interface stub: concrete testbed controllers must override it.
    NOTE(review): presumably this *completes* the internal connections
    started by do_connect_init - confirm against a concrete controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_preconfigure(self):
    """Early configuration hook.

    Done just before resolving netrefs, after connection and before cross
    connections. Useful for early stages of configuration, for setting up
    anything that might be required for netref resolution.

    Interface stub: concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_configure(self):
    """Configuration hook: after do_configure, elements are configured.

    Interface stub: concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_prestart(self):
    """Pre-start hook: elements are prestart-configured before do_start.

    Interface stub: concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_cross_connect_init(self, cross_data):
    """Cross-connection initiation hook.

    After do_cross_connect_init, initiation of all external connections
    between different testbed elements is performed.

    Interface stub: concrete testbed controllers must override it.

    Args:
        cross_data: data about the elements of other testbeds this testbed
            is connected to, as supplied by the experiment controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def do_cross_connect_compl(self, cross_data):
    """Cross-connection completion hook.

    After do_cross_connect_compl, completion of all external connections
    between different testbed elements is performed.

    Interface stub: concrete testbed controllers must override it.

    Args:
        cross_data: data about the elements of other testbeds this testbed
            is connected to, as supplied by the experiment controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
147 raise NotImplementedError
150 raise NotImplementedError
154 On testbed recovery (if recovery is a supported policy), the controller
155 instance will be re-created and the following sequence invoked:
158 defer_X - programming the testbed with persisted execution values
159 (not design values). Execution values (ExecImmutable attributes)
160 should be enough to recreate the testbed's state.
162 <cross-connection methods>
164 Start will not be called, and after cross connection invocations,
165 the testbed is supposed to be fully functional again.
167 raise NotImplementedError
def set(self, guid, name, value, time=TIME_NOW):
    """Interface stub for setting attribute ``name`` of element ``guid``.

    Concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def get(self, guid, name, time=TIME_NOW):
    """Interface stub for reading attribute ``name`` of element ``guid``.

    Concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def get_route(self, guid, index, attribute):
    """Interface stub for querying one attribute of a routing entry.

    Concrete testbed controllers must override it.

    Args:
        guid: guid of box to query
        index: number of routing entry to fetch
        attribute: one of Destination, NextHop, NetPrefix

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def get_address(self, guid, index, attribute='Address'):
    """Interface stub for querying one attribute of an address.

    Concrete testbed controllers must override it.

    Args:
        guid: guid of box to query
        index: number of interface to select
        attribute: one of Address, NetPrefix, Broadcast

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def get_attribute_list(self, guid, filter_flags=None, exclude=False):
    """Interface stub for listing the attributes of element ``guid``.

    Concrete testbed controllers must override it.
    NOTE(review): ``filter_flags`` / ``exclude`` presumably select or
    exclude attributes by flag - confirm against a concrete controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def get_factory_id(self, guid):
    """Interface stub for looking up the factory id of element ``guid``.

    Concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def action(self, time, guid, action):
    """Interface stub for performing ``action`` on element ``guid``.

    Concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def status(self, guid):
    """Interface stub for reporting the status of element ``guid``.

    Concrete testbed controllers must override it.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
207 def testbed_status(self):
208 raise NotImplementedError
def trace(self, guid, trace_id, attribute='value'):
    """Interface stub for fetching trace ``trace_id`` of element ``guid``.

    Concrete testbed controllers must override it.

    Args:
        guid: guid of the element owning the trace.
        trace_id: identifier of the trace.
        attribute: which aspect of the trace to fetch; defaults to 'value'.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
def traces_info(self):
    """Interface stub for describing the traces of the testbed.

    Concrete testbed controllers must override it. The result is a
    dictionary of dictionaries; the per-trace information includes
    ``filesize`` (size in bytes).
    NOTE(review): the remaining keys of the structure are not spelled out
    here - confirm against a concrete controller.

    Raises:
        NotImplementedError: always, in this base class.
    """
    raise NotImplementedError()
227 raise NotImplementedError
229 class ExperimentController(object):
230 def __init__(self, experiment_xml, root_dir):
231 self._experiment_design_xml = experiment_xml
232 self._experiment_execute_xml = None
233 self._testbeds = dict()
234 self._deployment_config = dict()
235 self._netrefs = collections.defaultdict(set)
236 self._testbed_netrefs = collections.defaultdict(set)
237 self._cross_data = dict()
238 self._root_dir = root_dir
239 self._netreffed_testbeds = set()
240 self._guids_in_testbed_cache = dict()
241 self._failed_testbeds = set()
242 self._started_time = None
243 self._stopped_time = None
244 self._testbed_order = []
246 self._logger = logging.getLogger('nepi.core.execute')
247 level = logging.ERROR
248 if os.environ.get("NEPI_CONTROLLER_LOGLEVEL",
249 DC.ERROR_LEVEL) == DC.DEBUG_LEVEL:
250 level = logging.DEBUG
251 self._logger.setLevel(level)
253 if experiment_xml is None and root_dir is not None:
255 self.load_experiment_xml()
256 self.load_execute_xml()
258 self.persist_experiment_xml()
def experiment_design_xml(self):
    """Return the design description (XML text) of the experiment."""
    design_xml = self._experiment_design_xml
    return design_xml
def experiment_execute_xml(self):
    """Return the execution description (XML text), or None if not set yet."""
    execute_xml = self._experiment_execute_xml
    return execute_xml
def started_time(self):
    """Return the timestamp recorded at start, or None if never started."""
    started = self._started_time
    return started
def stopped_time(self):
    """Return the timestamp recorded at stop, or None if never stopped."""
    stopped = self._stopped_time
    return stopped
279 for testbed_guid in self._testbeds.keys():
280 _guids = self._guids_in_testbed(testbed_guid)
def persist_experiment_xml(self):
    """Write the design XML to ``experiment-design.xml`` in the root directory.

    The file is overwritten if it already exists. The handle is managed by
    a ``with`` block so it is flushed and closed even if the write fails.
    """
    xml_path = os.path.join(self._root_dir, "experiment-design.xml")
    with open(xml_path, "w") as f:
        f.write(self._experiment_design_xml)
def persist_execute_xml(self):
    """Write the execute XML to ``experiment-execute.xml`` in the root directory.

    The file is overwritten if it already exists. The handle is managed by
    a ``with`` block so it is flushed and closed even if the write fails.
    """
    xml_path = os.path.join(self._root_dir, "experiment-execute.xml")
    with open(xml_path, "w") as f:
        f.write(self._experiment_execute_xml)
def load_experiment_xml(self):
    """Load the design XML from ``experiment-design.xml`` in the root directory.

    The text read replaces ``self._experiment_design_xml``. The handle is
    managed by a ``with`` block so it is always closed.
    """
    xml_path = os.path.join(self._root_dir, "experiment-design.xml")
    with open(xml_path, "r") as f:
        self._experiment_design_xml = f.read()
def load_execute_xml(self):
    """Load the execute XML from ``experiment-execute.xml`` in the root directory.

    The text read replaces ``self._experiment_execute_xml``. The handle is
    managed by a ``with`` block so it is always closed.
    """
    xml_path = os.path.join(self._root_dir, "experiment-execute.xml")
    with open(xml_path, "r") as f:
        self._experiment_execute_xml = f.read()
309 def trace(self, guid, trace_id, attribute='value'):
310 testbed = self._testbed_for_guid(guid)
312 return testbed.trace(guid, trace_id, attribute)
313 raise RuntimeError("No element exists with guid %d" % guid)
315 def traces_info(self):
317 for guid, testbed in self._testbeds.iteritems():
318 tinfo = testbed.traces_info()
320 traces_info[guid] = testbed.traces_info()
324 def _parallel(callables):
327 def wrapped(*p, **kw):
331 logging.exception("Exception occurred in asynchronous thread:")
332 excs.append(sys.exc_info())
334 wrapped = functools.wraps(callable)(wrapped)
336 # functools.partial not wrappable
339 threads = [ threading.Thread(target=wrap(callable)) for callable in callables ]
340 for thread in threads:
342 for thread in threads:
345 eTyp, eVal, eLoc = exc
346 raise eTyp, eVal, eLoc
349 self._started_time = time.time()
352 def _start(self, recover = False):
353 parser = XmlExperimentParser()
356 xml = self._experiment_execute_xml
358 xml = self._experiment_design_xml
359 data = parser.from_xml_to_data(xml)
361 # instantiate testbed controllers
362 to_recover, to_restart = self._init_testbed_controllers(data, recover)
363 all_restart = set(to_restart)
366 # persist testbed connection data, for potential recovery
367 self._persist_testbed_proxies()
369 # recover recoverable controllers
370 for guid in to_recover:
372 self._testbeds[guid].do_setup()
373 self._testbeds[guid].recover()
375 self._logger.exception("During recovery of testbed %s", guid)
378 self._failed_testbeds.add(guid)
380 def steps_to_configure(self, allowed_guids):
381 # perform setup in parallel for all test beds,
382 # wait for all threads to finish
384 self._logger.debug("ExperimentController: Starting parallel do_setup")
385 self._parallel([testbed.do_setup
386 for guid,testbed in self._testbeds.iteritems()
387 if guid in allowed_guids])
389 # perform create-connect in parallel, wait
390 # (internal connections only)
391 self._logger.debug("ExperimentController: Starting parallel do_create")
392 self._parallel([testbed.do_create
393 for guid,testbed in self._testbeds.iteritems()
394 if guid in allowed_guids])
396 self._logger.debug("ExperimentController: Starting parallel do_connect_init")
397 self._parallel([testbed.do_connect_init
398 for guid,testbed in self._testbeds.iteritems()
399 if guid in allowed_guids])
401 self._logger.debug("ExperimentController: Starting parallel do_connect_fin")
402 self._parallel([testbed.do_connect_compl
403 for guid,testbed in self._testbeds.iteritems()
404 if guid in allowed_guids])
406 self._logger.debug("ExperimentController: Starting parallel do_preconfigure")
407 self._parallel([testbed.do_preconfigure
408 for guid,testbed in self._testbeds.iteritems()
409 if guid in allowed_guids])
412 # Store testbed order
413 self._testbed_order.append(allowed_guids)
415 steps_to_configure(self, to_restart)
417 if self._netreffed_testbeds:
418 self._logger.debug("ExperimentController: Resolving netreffed testbeds")
# initially resolve netrefs
420 self.do_netrefs(data, fail_if_undefined=False)
422 # rinse and repeat, for netreffed testbeds
423 netreffed_testbeds = set(self._netreffed_testbeds)
425 to_recover, to_restart = self._init_testbed_controllers(data, recover)
426 all_restart.update(to_restart)
429 # persist testbed connection data, for potential recovery
430 self._persist_testbed_proxies()
432 # recover recoverable controllers
433 for guid in to_recover:
435 self._testbeds[guid].do_setup()
436 self._testbeds[guid].recover()
438 self._logger.exception("During recovery of testbed %s", guid)
441 self._failed_testbeds.add(guid)
# configure dependent testbeds
444 steps_to_configure(self, to_restart)
446 all_restart = [ self._testbeds[guid] for guid in all_restart ]
# intermediate netref step: unresolved references are still tolerated here
449 self._logger.debug("ExperimentController: Resolving do_netrefs")
450 self.do_netrefs(data, fail_if_undefined=False)
# Only now that netref dependencies have been resolved is it safe to
# program cross_connections
454 self._logger.debug("ExperimentController: Programming testbed cross-connections")
455 self._program_testbed_cross_connections(data)
# perform do_configure in parallel for all testbeds
458 # (it's internal configuration for each)
459 self._logger.debug("ExperimentController: Starting parallel do_configure")
460 self._parallel([testbed.do_configure
461 for testbed in all_restart])
465 #print >>sys.stderr, "DO IT"
469 # cross-connect (cannot be done in parallel)
470 self._logger.debug("ExperimentController: Starting cross-connect")
471 for guid, testbed in self._testbeds.iteritems():
472 cross_data = self._get_cross_data(guid)
473 testbed.do_cross_connect_init(cross_data)
474 for guid, testbed in self._testbeds.iteritems():
475 cross_data = self._get_cross_data(guid)
476 testbed.do_cross_connect_compl(cross_data)
480 # Last chance to configure (parallel on all testbeds)
481 self._logger.debug("ExperimentController: Starting parallel do_prestart")
482 self._parallel([testbed.do_prestart
483 for testbed in all_restart])
485 # final netref step, fail if anything's left unresolved
486 self.do_netrefs(data, fail_if_undefined=True)
491 # update execution xml with execution-specific values
# TODO: BUG: serializing every attribute value breaks on non-ASCII values (e.g. tun_key)
493 self._update_execute_xml()
494 self.persist_execute_xml()
496 # start experiment (parallel start on all testbeds)
497 self._logger.debug("ExperimentController: Starting parallel do_start")
498 self._parallel([testbed.start
499 for testbed in all_restart])
503 def _clear_caches(self):
504 # Cleaning cache for safety.
505 self._guids_in_testbed_cache = dict()
507 def _persist_testbed_proxies(self):
508 TRANSIENT = (DC.RECOVER,)
510 # persist access configuration for all testbeds, so that
511 # recovery mode can reconnect to them if it becomes necessary
512 conf = ConfigParser.RawConfigParser()
513 for testbed_guid, testbed_config in self._deployment_config.iteritems():
514 testbed_guid = str(testbed_guid)
515 conf.add_section(testbed_guid)
516 for attr in testbed_config.get_attribute_list():
517 if attr not in TRANSIENT:
518 value = testbed_config.get_attribute_value(attr)
519 if value is not None:
520 conf.set(testbed_guid, attr, value)
522 f = open(os.path.join(self._root_dir, 'deployment_config.ini'), 'w')
526 def _load_testbed_proxies(self):
528 Attribute.STRING : 'get',
529 Attribute.BOOL : 'getboolean',
530 Attribute.ENUM : 'get',
531 Attribute.DOUBLE : 'getfloat',
532 Attribute.INTEGER : 'getint',
535 TRANSIENT = (DC.RECOVER,)
537 # deferred import because proxy needs
538 # our class definitions to define proxies
539 import nepi.util.proxy as proxy
541 conf = ConfigParser.RawConfigParser()
542 conf.read(os.path.join(self._root_dir, 'deployment_config.ini'))
543 for testbed_guid in conf.sections():
544 testbed_config = proxy.AccessConfiguration()
545 testbed_guid = str(testbed_guid)
546 for attr in testbed_config.get_attribute_list():
547 if attr not in TRANSIENT:
548 getter = getattr(conf, TYPEMAP.get(
549 testbed_config.get_attribute_type(attr),
552 value = getter(testbed_guid, attr)
553 testbed_config.set_attribute_value(attr, value)
554 except ConfigParser.NoOptionError:
558 def _unpersist_testbed_proxies(self):
560 os.remove(os.path.join(self._root_dir, 'deployment_config.ini'))
562 # Just print exceptions, this is just cleanup
563 self._logger.exception("Loading testbed configuration")
565 def _update_execute_xml(self):
567 # For all elements in testbed,
# - gather immutable execute-readable attribute lists
570 # Generate new design description from design xml
571 # (Wait for attributes lists - implicit syncpoint)
573 # For all elements in testbed,
574 # - gather all immutable execute-readable attribute
575 # values, asynchronously
576 # (Wait for attribute values - implicit syncpoint)
578 # For all elements in testbed,
579 # - inject non-None values into new design
580 # Generate execute xml from new design
582 attribute_lists = dict(
583 (testbed_guid, collections.defaultdict(dict))
584 for testbed_guid in self._testbeds
587 for testbed_guid, testbed in self._testbeds.iteritems():
588 guids = self._guids_in_testbed(testbed_guid)
590 attribute_lists[testbed_guid][guid] = \
591 testbed.get_attribute_list_deferred(guid, Attribute.ExecImmutable)
593 parser = XmlExperimentParser()
594 execute_data = parser.from_xml_to_data(self._experiment_design_xml)
596 attribute_values = dict(
597 (testbed_guid, collections.defaultdict(dict))
598 for testbed_guid in self._testbeds
601 for testbed_guid, testbed_attribute_lists in attribute_lists.iteritems():
602 testbed = self._testbeds[testbed_guid]
603 for guid, attribute_list in testbed_attribute_lists.iteritems():
604 attribute_list = _undefer(attribute_list)
605 attribute_values[testbed_guid][guid] = dict(
606 (attribute, testbed.get_deferred(guid, attribute))
607 for attribute in attribute_list
610 for testbed_guid, testbed_attribute_values in attribute_values.iteritems():
611 for guid, attribute_values in testbed_attribute_values.iteritems():
612 for attribute, value in attribute_values.iteritems():
613 value = _undefer(value)
614 if value is not None:
615 execute_data.add_attribute_data(guid, attribute, value)
617 self._experiment_execute_xml = parser.to_xml(data=execute_data)
620 for testbed in self._testbeds.values():
622 self._unpersist_testbed_proxies()
623 self._stopped_time = time.time()
# reload previously persisted testbed access configurations
627 self._failed_testbeds.clear()
628 self._load_testbed_proxies()
630 # re-program testbeds that need recovery
631 self._start(recover = True)
def is_finished(self, guid):
    """Tell whether element ``guid`` has finished.

    Returns:
        True when the owning testbed reports ``AS.STATUS_FINISHED`` for
        the element, False otherwise.

    Raises:
        RuntimeError: if no testbed is available for ``guid``.
    """
    testbed = self._testbed_for_guid(guid)
    if testbed is None:
        # Report the missing element explicitly instead of failing with an
        # AttributeError on None.
        raise RuntimeError("No element exists with guid %d" % guid)
    return testbed.status(guid) == AS.STATUS_FINISHED
def _testbed_recovery_policy(self, guid, data = None):
    """Return the recovery policy attribute of testbed ``guid``.

    Args:
        guid: guid of the testbed.
        data: already-parsed experiment data to read from. When omitted,
            the design XML is parsed on the spot.

    Returns:
        Whatever ``data.get_attribute_data(guid, DC.RECOVERY_POLICY)``
        yields.
    """
    if data is None:
        # Only parse when the caller did not hand in parsed data; parsing
        # unconditionally would throw the caller's data away.
        parser = XmlExperimentParser()
        data = parser.from_xml_to_data(self._experiment_design_xml)

    return data.get_attribute_data(guid, DC.RECOVERY_POLICY)
646 def status(self, guid):
647 if guid in self._testbeds:
649 # report testbed status
650 if guid in self._failed_testbeds:
651 return TS.STATUS_FAILED
654 return self._testbeds[guid].status()
656 return TS.STATUS_UNRESPONSIVE
659 testbed = self._testbed_for_guid(guid)
660 if testbed is not None:
661 return testbed.status(guid)
663 return AS.STATUS_UNDETERMINED
def set(self, guid, name, value, time = TIME_NOW):
    """Set attribute ``name`` of element ``guid`` through its testbed.

    Delegates to the ``set`` method of the owning testbed controller.

    Raises:
        RuntimeError: if no testbed is available for ``guid``.
    """
    testbed = self._testbed_for_guid(guid)
    if testbed is None:
        # Only a missing element is an error; a successful set must not
        # fall through to the raise.
        raise RuntimeError("No element exists with guid %d" % guid)
    testbed.set(guid, name, value, time)
def get(self, guid, name, time = TIME_NOW):
    """Read attribute ``name`` of element ``guid`` through its testbed.

    Delegates to the ``get`` method of the owning testbed controller.

    Raises:
        RuntimeError: if no testbed is available for ``guid``.
    """
    testbed = self._testbed_for_guid(guid)
    if testbed is None:
        # Report the missing element explicitly instead of failing with an
        # AttributeError on None.
        raise RuntimeError("No element exists with guid %d" % guid)
    return testbed.get(guid, name, time)
def get_deferred(self, guid, name, time = TIME_NOW):
    """Read attribute ``name`` of element ``guid`` as a deferred result.

    Delegates to the ``get_deferred`` method of the owning testbed
    controller and returns whatever it returns.

    Raises:
        RuntimeError: if no testbed is available for ``guid``.
    """
    testbed = self._testbed_for_guid(guid)
    if testbed is None:
        # Report the missing element explicitly instead of failing with an
        # AttributeError on None.
        raise RuntimeError("No element exists with guid %d" % guid)
    return testbed.get_deferred(guid, name, time)
684 def get_factory_id(self, guid):
685 testbed = self._testbed_for_guid(guid)
687 return testbed.get_factory_id(guid)
688 raise RuntimeError("No element exists with guid %d" % guid)
690 def get_testbed_id(self, guid):
691 testbed = self._testbed_for_guid(guid)
693 return testbed.testbed_id
694 raise RuntimeError("No element exists with guid %d" % guid)
696 def get_testbed_version(self, guid):
697 testbed = self._testbed_for_guid(guid)
699 return testbed.testbed_version
700 raise RuntimeError("No element exists with guid %d" % guid)
704 ordered_testbeds = set()
706 def shutdown_testbed(guid):
708 testbed = self._testbeds[guid]
709 ordered_testbeds.add(guid)
712 exceptions.append(sys.exc_info())
714 self._logger.debug("ExperimentController: Starting parallel shutdown")
716 for testbed_guids in reversed(self._testbed_order):
717 self._parallel([functools.partial(shutdown_testbed, guid)
718 for guid in testbed_guids])
719 remaining_guids = set(self._testbeds) - ordered_testbeds
721 self._parallel([functools.partial(shutdown_testbed, guid)
722 for guid in remaining_guids])
724 for exc_info in exceptions:
725 raise exc_info[0], exc_info[1], exc_info[2]
727 def _testbed_for_guid(self, guid):
728 for testbed_guid in self._testbeds.keys():
729 if guid in self._guids_in_testbed(testbed_guid):
730 if testbed_guid in self._failed_testbeds:
732 return self._testbeds[testbed_guid]
735 def _guids_in_testbed(self, testbed_guid):
736 if testbed_guid not in self._testbeds:
738 if testbed_guid not in self._guids_in_testbed_cache:
739 self._guids_in_testbed_cache[testbed_guid] = \
740 set(self._testbeds[testbed_guid].guids)
741 return self._guids_in_testbed_cache[testbed_guid]
def _netref_component_split(component):
    """Split a compound netref component into its kind and index.

    eg: 'addr[0]' -> ('addr', '0')

    Returns:
        ``(kind, index)`` when ``component`` matches COMPONENT_PATTERN,
        otherwise ``(component, None)``.
    """
    match = COMPONENT_PATTERN.match(component)
    if match is None:
        # Simple (non-indexed) component, e.g. the empty string used for
        # plain attribute references.
        return component, None
    return match.group("kind"), match.group("index")
751 _NETREF_COMPONENT_GETTERS = {
753 lambda testbed, guid, index, name:
754 testbed.get_address(guid, int(index), name),
756 lambda testbed, guid, index, name:
757 testbed.get_route(guid, int(index), name),
759 lambda testbed, guid, index, name:
760 testbed.trace(guid, index, attribute = name),
762 lambda testbed, guid, index, name:
763 testbed.get(guid, name),
766 def resolve_netref_value(self, value, failval = None):
769 for match in ATTRIBUTE_PATTERN_BASE.finditer(value):
770 label = match.group("label")
771 if label.startswith('GUID-'):
772 ref_guid = int(label[5:])
774 expr = match.group("expr")
775 component = (match.group("component") or "")[1:] # skip the dot
776 attribute = match.group("attribute")
778 # split compound components into component kind and index
779 # eg: 'addr[0]' -> ('addr', '0')
780 component, component_index = self._netref_component_split(component)
782 # find object and resolve expression
783 for ref_testbed_guid, ref_testbed in self._testbeds.iteritems():
784 if component not in self._NETREF_COMPONENT_GETTERS:
785 raise ValueError, "Malformed netref: %r - unknown component" % (expr,)
786 elif ref_guid not in self._guids_in_testbed(ref_testbed_guid):
789 ref_value = self._NETREF_COMPONENT_GETTERS[component](
790 ref_testbed, ref_guid, component_index, attribute)
792 value = rv = value.replace(match.group(), ref_value)
795 # unresolvable netref
802 def do_netrefs(self, data, fail_if_undefined = False):
804 for (testbed_guid, guid), attrs in self._netrefs.items():
805 testbed = self._testbeds.get(testbed_guid)
806 if testbed is not None:
807 for name in set(attrs):
808 value = testbed.get(guid, name)
809 if isinstance(value, basestring):
810 ref_value = self.resolve_netref_value(value)
811 if ref_value is not None:
812 testbed.set(guid, name, ref_value)
814 elif fail_if_undefined:
815 raise ValueError, "Unresolvable netref in: %r=%r" % (name,value,)
817 del self._netrefs[(testbed_guid, guid)]
820 for testbed_guid, attrs in self._testbed_netrefs.items():
821 tb_data = dict(data.get_attribute_data(testbed_guid))
823 for name in set(attrs):
824 value = tb_data.get(name)
825 if isinstance(value, basestring):
826 ref_value = self.resolve_netref_value(value)
827 if ref_value is not None:
828 data.set_attribute_data(testbed_guid, name, ref_value)
830 elif fail_if_undefined:
831 raise ValueError, "Unresolvable netref in: %r" % (value,)
833 del self._testbed_netrefs[testbed_guid]
836 def _init_testbed_controllers(self, data, recover = False):
837 blacklist_testbeds = set(self._testbeds)
838 element_guids = list()
840 data_guids = data.guids
844 # gather label associations
845 for guid in data_guids:
846 if not data.is_testbed_data(guid):
847 (testbed_guid, factory_id) = data.get_box_data(guid)
848 label = data.get_attribute_data(guid, "label")
849 if label is not None:
850 if label in label_guids:
851 raise RuntimeError, "Label %r is not unique" % (label,)
852 label_guids[label] = guid
854 # create testbed controllers
855 for guid in data_guids:
856 if data.is_testbed_data(guid):
857 if guid not in self._testbeds:
859 self._create_testbed_controller(
860 guid, data, element_guids, recover)
863 blacklist_testbeds.add(guid)
868 policy = self._testbed_recovery_policy(guid, data=data)
869 if policy == DC.POLICY_RECOVER:
870 self._create_testbed_controller(
871 guid, data, element_guids, False)
873 elif policy == DC.POLICY_RESTART:
874 self._create_testbed_controller(
875 guid, data, element_guids, False)
879 self._failed_testbeds.add(guid)
883 # queue programmable elements
884 # - that have not been programmed already (blacklist_testbeds)
885 # - including recovered or restarted testbeds
886 # - but those that have no unresolved netrefs
887 for guid in data_guids:
888 if not data.is_testbed_data(guid):
889 (testbed_guid, factory_id) = data.get_box_data(guid)
890 if testbed_guid not in blacklist_testbeds:
891 element_guids.append(guid)
# replace references to element labels with their guids
894 self._resolve_labels(data, data_guids, label_guids)
896 # program testbed controllers
898 self._program_testbed_controllers(element_guids, data)
900 return to_recover, to_restart
902 def _resolve_labels(self, data, data_guids, label_guids):
903 netrefs = self._netrefs
904 testbed_netrefs = self._testbed_netrefs
905 for guid in data_guids:
906 for name, value in data.get_attribute_data(guid):
907 if isinstance(value, basestring):
909 for match in ATTRIBUTE_PATTERN_BASE.finditer(value):
910 label = match.group("label")
911 if not label.startswith('GUID-'):
912 ref_guid = label_guids.get(label)
913 if ref_guid is not None:
914 value = value.replace(
916 ATTRIBUTE_PATTERN_GUID_SUB % dict(
917 guid = 'GUID-%d' % (ref_guid,),
918 expr = match.group("expr"),
921 data.set_attribute_data(guid, name, value)
923 # memorize which guid-attribute pairs require
924 # postprocessing, to avoid excessive controller-testbed
925 # communication at configuration time
926 # (which could require high-latency network I/O)
927 if not data.is_testbed_data(guid):
928 (testbed_guid, factory_id) = data.get_box_data(guid)
929 netrefs[(testbed_guid, guid)].add(name)
931 testbed_netrefs[guid].add(name)
937 def _create_testbed_controller(self, guid, data, element_guids, recover):
938 (testbed_id, testbed_version) = data.get_testbed_data(guid)
939 deployment_config = self._deployment_config.get(guid)
941 # deferred import because proxy needs
942 # our class definitions to define proxies
943 import nepi.util.proxy as proxy
945 if deployment_config is None:
947 deployment_config = proxy.AccessConfiguration()
949 for (name, value) in data.get_attribute_data(guid):
950 if value is not None and deployment_config.has_attribute(name):
951 # if any deployment config attribute has a netref, we can't
952 # create this controller yet
953 if isinstance(value, basestring) and ATTRIBUTE_PATTERN_BASE.search(value):
954 # remember to re-issue this one
955 self._netreffed_testbeds.add(guid)
958 # copy deployment config attribute
959 deployment_config.set_attribute_value(name, value)
962 self._deployment_config[guid] = deployment_config
964 if deployment_config is not None:
965 # force recovery mode
966 deployment_config.set_attribute_value("recover",recover)
968 testbed = proxy.create_testbed_controller(testbed_id, testbed_version,
970 for (name, value) in data.get_attribute_data(guid):
971 testbed.defer_configure(name, value)
972 self._testbeds[guid] = testbed
973 if guid in self._netreffed_testbeds:
974 self._netreffed_testbeds.remove(guid)
976 def _program_testbed_controllers(self, element_guids, data):
977 def resolve_create_netref(data, guid, name, value):
978 # Try to resolve create-time netrefs, if possible
979 if isinstance(value, basestring) and ATTRIBUTE_PATTERN_BASE.search(value):
981 nuvalue = self.resolve_netref_value(value)
983 # Any trouble means we're not in shape to resolve the netref yet
985 if nuvalue is not None:
986 # Only if we succeed we remove the netref deferral entry
988 data.set_attribute_data(guid, name, value)
989 if (testbed_guid, guid) in self._netrefs:
990 self._netrefs[(testbed_guid, guid)].discard(name)
993 for guid in element_guids:
994 (testbed_guid, factory_id) = data.get_box_data(guid)
995 testbed = self._testbeds.get(testbed_guid)
996 if testbed is not None:
998 testbed.defer_create(guid, factory_id)
1000 for (name, value) in data.get_attribute_data(guid):
1001 value = resolve_create_netref(data, guid, name, value)
1002 testbed.defer_create_set(guid, name, value)
1004 for guid in element_guids:
1005 (testbed_guid, factory_id) = data.get_box_data(guid)
1006 testbed = self._testbeds.get(testbed_guid)
1007 if testbed is not None:
1009 for trace_id in data.get_trace_data(guid):
1010 testbed.defer_add_trace(guid, trace_id)
1012 for (address, netprefix, broadcast) in data.get_address_data(guid):
1014 testbed.defer_add_address(guid, address, netprefix,
1017 for (destination, netprefix, nexthop, metric) in data.get_route_data(guid):
1018 testbed.defer_add_route(guid, destination, netprefix, nexthop, metric)
1019 # store connections data
1020 for (connector_type_name, other_guid, other_connector_type_name) \
1021 in data.get_connection_data(guid):
1022 (other_testbed_guid, other_factory_id) = data.get_box_data(
1024 if testbed_guid == other_testbed_guid:
1025 # each testbed should take care of enforcing internal
# connection symmetry, so each connection is only
1027 # added in one direction
1028 testbed.defer_connect(guid, connector_type_name,
1029 other_guid, other_connector_type_name)
1031 def _program_testbed_cross_connections(self, data):
1032 data_guids = data.guids
1033 for guid in data_guids:
1034 if not data.is_testbed_data(guid):
1035 (testbed_guid, factory_id) = data.get_box_data(guid)
1036 testbed = self._testbeds.get(testbed_guid)
1037 if testbed is not None:
1038 for (connector_type_name, cross_guid, cross_connector_type_name) \
1039 in data.get_connection_data(guid):
1040 (testbed_guid, factory_id) = data.get_box_data(guid)
1041 (cross_testbed_guid, cross_factory_id) = data.get_box_data(
1043 if testbed_guid != cross_testbed_guid:
1044 cross_testbed = self._testbeds[cross_testbed_guid]
1045 cross_testbed_id = cross_testbed.testbed_id
1046 testbed.defer_cross_connect(guid, connector_type_name, cross_guid,
1047 cross_testbed_guid, cross_testbed_id, cross_factory_id,
1048 cross_connector_type_name)
1049 # save cross data for later
1050 self._logger.debug("ExperimentController: adding cross_connection data tbd=%d:guid=%d - tbd=%d:guid=%d" % \
1051 (testbed_guid, guid, cross_testbed_guid, cross_guid))
1052 self._add_crossdata(testbed_guid, guid, cross_testbed_guid,
1055 def _add_crossdata(self, testbed_guid, guid, cross_testbed_guid, cross_guid):
1056 if testbed_guid not in self._cross_data:
1057 self._cross_data[testbed_guid] = dict()
1058 if cross_testbed_guid not in self._cross_data[testbed_guid]:
1059 self._cross_data[testbed_guid][cross_testbed_guid] = set()
1060 self._cross_data[testbed_guid][cross_testbed_guid].add(cross_guid)
1062 def _get_cross_data(self, testbed_guid):
1064 if not testbed_guid in self._cross_data:
1067 # fetch attribute lists in one batch
1068 attribute_lists = dict()
1069 for cross_testbed_guid, guid_list in \
1070 self._cross_data[testbed_guid].iteritems():
1071 cross_testbed = self._testbeds[cross_testbed_guid]
1072 for cross_guid in guid_list:
1073 attribute_lists[(cross_testbed_guid, cross_guid)] = \
1074 cross_testbed.get_attribute_list_deferred(cross_guid)
1076 # fetch attribute values in another batch
1077 for cross_testbed_guid, guid_list in \
1078 self._cross_data[testbed_guid].iteritems():
1079 cross_data[cross_testbed_guid] = dict()
1080 cross_testbed = self._testbeds[cross_testbed_guid]
1081 for cross_guid in guid_list:
1082 elem_cross_data = dict(
1084 _testbed_guid = cross_testbed_guid,
1085 _testbed_id = cross_testbed.testbed_id,
1086 _testbed_version = cross_testbed.testbed_version)
1087 cross_data[cross_testbed_guid][cross_guid] = elem_cross_data
1088 attribute_list = attribute_lists[(cross_testbed_guid,cross_guid)]
1089 for attr_name in attribute_list:
1090 attr_value = cross_testbed.get_deferred(cross_guid, attr_name)
1091 elem_cross_data[attr_name] = attr_value
1093 # undefer all values - we'll have to serialize them probably later
1094 for cross_testbed_guid, testbed_cross_data in cross_data.iteritems():
1095 for cross_guid, elem_cross_data in testbed_cross_data.iteritems():
1096 for attr_name, attr_value in elem_cross_data.iteritems():
1097 elem_cross_data[attr_name] = _undefer(attr_value)
1101 class ExperimentSuite(object):
def __init__(self, experiment_xml, access_config, repetitions,
        duration, wait_guids):
    """Store the parameters of a suite of repeated experiment runs.

    Args:
        experiment_xml: experiment description handed to each run.
        access_config: access configuration whose attributes are copied
            for each run.
        repetitions: number of runs in the suite.
        duration: minimum duration of a run.
        wait_guids: guids that must finish before a run is over.
    """
    # what to run
    self._experiment_xml = experiment_xml
    self._access_config = access_config
    # how to run it
    self._repetitions = repetitions
    self._duration = duration
    self._wait_guids = wait_guids
    # bookkeeping: controllers per run, index of the current run, status
    self._experiments = {}
    self._current = None
    self._status = TS.STATUS_ZERO
1115 self._status = TS.STATUS_STARTED
1116 self._thread = threading.Thread(target = self._run_experiment_suite)
1117 self._thread.start()
1124 def _run_experiment_suite(self):
1125 for i in xrange[0, self.repetitions]:
1127 self._run_one_experiment()
1129 def _run_one_experiment(self):
1130 access_config = proxy.AccessConfiguration()
1131 for attr in self._access_config.attributes:
1132 access_config.set_attribute_value(attr.name, attr.value)
1133 access_config.set_attribute_value(DC.DEPLOYMENT_MODE, DC.MODE_DAEMON)
1134 root_dir = "%s_%d" % (
1135 access_config.get_attribute_value(DC.ROOT_DIRECTORY),
1137 access_config.set_attribute_value(DC.ROOT_DIRECTORY, root_dir)
1138 controller = proxy.create_experiment_controller(self._experiment_xml,
1140 self._experiments[self._current] = controller
1142 started_at = time.time()
1143 # wait until all specified guids have finished execution
1144 if self._wait_guids:
1145 while all(itertools.imap(controller.is_finished, self._wait_guids):
1147 # wait until the minimum experiment duration time has elapsed
1149 while (time.time() - started_at) < self._duration:
1153 controller.shutdown()