X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=logger.py;h=3d3400ee854cd2b0a766954c454649072f68feec;hb=refs%2Fheads%2Fplanetstack;hp=c4f6ce6354cff1fb40beb3d714335d02fd689571;hpb=33f472e3e3589569f0272f7f53d07b011d2a5490;p=nodemanager.git diff --git a/logger.py b/logger.py index c4f6ce6..3d3400e 100644 --- a/logger.py +++ b/logger.py @@ -1,5 +1,3 @@ -# $Id$ -# $URL$ """A very simple logger that tries to be concurrency-safe.""" @@ -9,21 +7,24 @@ import traceback import subprocess import select -LOG_FILE = '/var/log/nm' -LOG_SLIVERS = '/var/log/getslivers.txt' +LOG_FILE = '/var/log/nodemanager' +LOG_SLIVERS = '/var/lib/nodemanager/getslivers.txt' +LOG_DATABASE = '/var/lib/nodemanager/database.txt' -# Thierry - trying to debug this for 4.2 # basically define 3 levels LOG_NONE=0 LOG_NODE=1 LOG_VERBOSE=2 # default is to log a reasonable amount of stuff for when running on operational nodes -LOG_LEVEL=1 +LOG_LEVEL=LOG_NODE def set_level(level): global LOG_LEVEL - assert level in [LOG_NONE,LOG_NODE,LOG_VERBOSE] - LOG_LEVEL=level + try: + assert level in [LOG_NONE,LOG_NODE,LOG_VERBOSE] + LOG_LEVEL=level + except: + logger.log("Failed to set LOG_LEVEL to %s"%level) def verbose(msg): log('(v) '+msg,LOG_VERBOSE) @@ -43,7 +44,7 @@ def log(msg,level=LOG_NODE): def log_exc(msg="",name=None): """Log the traceback resulting from an exception.""" - if name: + if name: log("%s: EXCEPTION caught <%s> \n %s" %(name, msg, traceback.format_exc())) else: log("EXCEPTION caught <%s> \n %s" %(msg, traceback.format_exc())) @@ -55,7 +56,9 @@ def log_exc(msg="",name=None): def log_missing_data (msg,key): log("%s: could not find the %s key in data (PLC connection down?) - IGNORED"%(msg,key)) -def log_data_in_file (data, file, message=""): +def log_data_in_file (data, file, message="",level=LOG_NODE): + if (level > LOG_LEVEL): + return import pprint, time try: f=open(file,'w') @@ -65,21 +68,24 @@ def log_data_in_file (data, file, message=""): pp=pprint.PrettyPrinter(stream=f,indent=2) pp.pprint(data) f.close() + verbose("logger:.log_data_in_file Owerwrote %s"%file) except: - log_verbose('log_data_in_file failed - file=%s - message=%r'%(file,message)) + log_exc('logger.log_data_in_file failed - file=%s - message=%r'%(file,message)) def log_slivers (data): log_data_in_file (data, LOG_SLIVERS, "raw GetSlivers") +def log_database (db): + log_data_in_file (db, LOG_DATABASE, "raw database") #################### child processes -# avoid waiting until the process returns; +# avoid waiting until the process returns; # that makes debugging of hanging children hard class Buffer: def __init__ (self,message='log_call: '): self.buffer='' self.message=message - + def add (self,c): self.buffer += c if c=='\n': self.flush() @@ -92,14 +98,16 @@ class Buffer: # time out in seconds - avoid hanging subprocesses - default is 5 minutes default_timeout_minutes=5 +# returns a bool that is True when everything goes fine and the retcod is 0 def log_call(command,timeout=default_timeout_minutes*60,poll=1): message=" ".join(command) log("log_call: running command %s" % message) verbose("log_call: timeout=%r s" % timeout) verbose("log_call: poll=%r s" % poll) trigger=time.time()+timeout - try: - child = subprocess.Popen(command, bufsize=1, + result = False + try: + child = subprocess.Popen(command, bufsize=1, stdout=subprocess.PIPE, stderr=subprocess.STDOUT, close_fds=True) buffer = Buffer() while True: @@ -112,17 +120,19 @@ def log_call(command,timeout=default_timeout_minutes*60,poll=1): if returncode != None: buffer.flush() # child is done and return 0 - if returncode == 0: - log("log_call: command completed (%s)" % message) + if returncode == 0: + log("log_call:end command (%s) completed" % message) + result=True break # child has failed else: - log("log_call: command return=%d (%s)" %(returncode,message)) - raise Exception("log_call: failed with returncode %d"%returncode) + log("log_call:end command (%s) returned with code %d" %(message,returncode)) + break # no : still within timeout ? if time.time() >= trigger: buffer.flush() child.terminate() - raise Exception("log_call: terminated command - exceeded timeout %d s"%timeout) + log("log_call:end terminating command (%s) - exceeded timeout %d s"%(message,timeout)) + break except: log_exc("failed to run command %s" % message) - + return result