X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=nm.py;h=7236cc811c916ab07c2ccf70172510ae84510d7e;hb=8a73c41fa38f330fd125d85d693d1390ea2477a4;hp=85c9004fedf6f606f42a09f894509974ed38dbeb;hpb=6d65ae5c5fd545f02a92582b3ff8d961b46da0d4;p=nodemanager.git diff --git a/nm.py b/nm.py index 85c9004..7236cc8 100755 --- a/nm.py +++ b/nm.py @@ -1,5 +1,7 @@ #!/usr/bin/python - +# +# $Id$ +# $URL$ # # Useful information can be found at https://svn.planet-lab.org/wiki/NodeManager # @@ -17,6 +19,7 @@ import socket import os import sys import resource +import glob import logger import tools @@ -29,17 +32,23 @@ id="$Id$" savedargv = sys.argv[:] # NOTE: modules listed here should also be loaded in this order +# see the priority set in each module - lower comes first known_modules=['net','conf_files', 'sm', 'bwmon'] plugin_path = "/usr/share/NodeManager/plugins" +default_period=600 +default_random=301 + parser = optparse.OptionParser() parser.add_option('-d', '--daemon', action='store_true', dest='daemon', default=False, help='run daemonized') parser.add_option('-s', '--startup', action='store_true', dest='startup', default=False, help='run all sliver startup scripts') parser.add_option('-f', '--config', action='store', dest='config', default='/etc/planetlab/plc_config', help='PLC configuration file') parser.add_option('-k', '--session', action='store', dest='session', default='/etc/planetlab/session', help='API session key (or file)') -parser.add_option('-p', '--period', action='store', dest='period', default=600, help='Polling interval (sec)') -parser.add_option('-r', '--random', action='store', dest='random', default=301, help='Range for additional random polling interval (sec)') +parser.add_option('-p', '--period', action='store', dest='period', default=default_period, + help='Polling interval (sec) - default %d'%default_period) +parser.add_option('-r', '--random', action='store', dest='random', default=default_random, + help='Range for additional random polling interval (sec) -- default %d'%default_random) parser.add_option('-v', '--verbose', action='store_true', dest='verbose', default=False, help='more verbose log') parser.add_option('-P', '--path', action='store', dest='path', default=plugin_path, help='Path to plugins directory') @@ -50,28 +59,39 @@ parser.add_option('-m', '--module', action='store', dest='module', default='', h # Deal with plugins directory if os.path.exists(options.path): sys.path.append(options.path) - known_modules += [i[:-3] for i in os.listdir(options.path) if i.endswith(".py") and (i[:-3] not in known_modules)] + plugins = [ os.path.split(os.path.splitext(x)[0])[1] for x in glob.glob( os.path.join(options.path,'*.py') ) ] + known_modules += plugins modules = [] def GetSlivers(config, plc): '''Run call backs defined in modules''' try: - logger.log("Syncing w/ PLC") + logger.log("nm: Syncing w/ PLC") + # retrieve GetSlivers from PLC data = plc.GetSlivers() - if (options.verbose): logger.log_slivers(data) + # use the magic 'default' slice to retrieve system-wide defaults getPLCDefaults(data, config) + # tweak the 'vref' attribute from GetSliceFamily + setSliversVref (data) + # always dump it for debug purposes + # used to be done only in verbose; very helpful though, and tedious to obtain, + # so let's dump this unconditionnally + logger.log_slivers(data) + logger.verbose("nm: Sync w/ PLC done") except: - logger.log_exc() + logger.log_exc("nm: failed in GetSlivers") # XXX So some modules can at least boostrap. logger.log("nm: Can't contact PLC to GetSlivers(). Continuing.") data = {} # Invoke GetSlivers() functions from the callback modules for module in modules: +# logger.log('trigerring GetSlivers callback for module %s'%module.__name__) try: callback = getattr(module, 'GetSlivers') callback(data, config, plc) - except: logger.log_exc() + except: + logger.log_exc("nm: GetSlivers failed to run callback for module %r"%module) def getPLCDefaults(data, config): @@ -83,10 +103,32 @@ def getPLCDefaults(data, config): attr_dict = {} for attr in slice.get('attributes'): attr_dict[attr['tagname']] = attr['value'] if len(attr_dict): - logger.verbose("Found default slice overrides.\n %s" % attr_dict) + logger.verbose("nm: Found default slice overrides.\n %s" % attr_dict) config.OVERRIDES = attr_dict - elif 'OVERRIDES' in dir(config): del config.OVERRIDES + return + # NOTE: if an _default slice existed, it would have been found above and + # the routine would return. Thus, if we've gotten here, then no default + # slice is bound to this node. + if 'OVERRIDES' in dir(config): del config.OVERRIDES + +def setSliversVref (data): + ''' + Tweak the 'vref' attribute in all slivers based on the 'GetSliceFamily' key + ''' + # GetSlivers exposes the result of GetSliceFamily() as an separate key in data + # It is safe to override the attributes with this, as this method has the right logic + for sliver in data.get('slivers'): + try: + slicefamily=sliver.get('GetSliceFamily') + for att in sliver['attributes']: + if att['tagname']=='vref': + att['value']=slicefamily + continue + sliver['attributes'].append({ 'tagname':'vref','value':slicefamily}) + except: + logger.log_exc("nm: Could not overwrite 'vref' attribute from 'GetSliceFamily'",name=sliver['name']) + def run(): try: @@ -111,7 +153,7 @@ def run(): if options.module: assert options.module in known_modules running_modules=[options.module] - logger.verbose('Running single module %s'%options.module) + logger.verbose('nm: Running single module %s'%options.module) else: running_modules=known_modules for module in running_modules: @@ -122,6 +164,15 @@ def run(): except ImportError, err: print "Warning while loading module %s:" % module, err + default_priority=100 + # sort on priority (lower first) + def sort_module_priority (m1,m2): + return getattr(m1,'priority',default_priority) - getattr(m2,'priority',default_priority) + modules.sort(sort_module_priority) + + logger.verbose('modules priorities and order:') + for module in modules: logger.verbose ('%s: %s'%(getattr(module,'priority',default_priority),module.__name__)) + # Load /etc/planetlab/session if os.path.exists(options.session): session = file(options.session).read().strip() @@ -134,29 +185,29 @@ def run(): plc = PLCAPI(config.plc_api_uri, config.cacert, session, timeout=iperiod/2) #check auth - logger.log("Checking Auth.") + logger.log("nm: Checking Auth.") while plc.check_authentication() != True: try: plc.update_session() - logger.log("Authentication Failure. Retrying") + logger.log("nm: Authentication Failure. Retrying") except: - logger.log("Retry Failed. Waiting") + logger.log("nm: Retry Failed. Waiting") time.sleep(iperiod) - logger.log("Authentication Succeeded!") + logger.log("nm: Authentication Succeeded!") while True: # Main NM Loop - logger.verbose('mainloop - nm:getSlivers - period=%d random=%d'%(iperiod,irandom)) + logger.verbose('nm: mainloop - calling GetSlivers - period=%d random=%d'%(iperiod,irandom)) GetSlivers(config, plc) delay=iperiod + random.randrange(0,irandom) - logger.verbose('mainloop - sleeping for %d s'%delay) + logger.verbose('nm: mainloop - sleeping for %d s'%delay) time.sleep(delay) - except: logger.log_exc() + except: logger.log_exc("nm: failed in run") if __name__ == '__main__': - logger.log("Entering nm.py "+id) + logger.log("======================================== Entering nm.py "+id) run() else: # This is for debugging purposes. Open a copy of Python and import nm