2 """A very simple logger that tries to be concurrency-safe."""
# Main log file; log() appends timestamped messages to it.
LOG_FILE = "/var/log/nodemanager"
# Snapshot file overwritten by log_slivers() with the raw GetSlivers data.
LOG_SLIVERS = "/var/lib/nodemanager/getslivers.txt"
# Snapshot file overwritten by log_database() with the raw database.
LOG_DATABASE = "/var/lib/nodemanager/database.txt"
14 # basically define 3 levels
18 # default is to log a reasonable amount of stuff for when running on operational nodes
24 assert level in [LOG_NONE,LOG_NODE,LOG_VERBOSE]
27 logger.log("Failed to set LOG_LEVEL to %s"%level)
30 log('(v) '+msg,LOG_VERBOSE)
32 def log(msg,level=LOG_NODE):
33 """Write <msg> to the log file if level >= current log level (default LOG_NODE)."""
34 if (level > LOG_LEVEL):
37 fd = os.open(LOG_FILE, os.O_WRONLY | os.O_CREAT | os.O_APPEND, 0600)
38 if not msg.endswith('\n'): msg += '\n'
39 os.write(fd, '%s: %s' % (time.asctime(time.gmtime()), msg))
45 def log_exc(msg="",name=None):
46 """Log traceback resulting from an exception."""
48 if name: printout += "%s: "%name
49 printout += "EXCEPTION caught <%s> \n %s" %(msg, traceback.format_exc())
52 def log_trace(msg="",name=None):
53 """Log current stack"""
55 if name: printout += "%s: "%name
56 printout += "LOGTRACE\n"
57 for frame in traceback.format_stack():
58 printout += "..."+frame
62 ########## snapshot data to a file
def log_missing_data(msg, key):
    """Log a one-line notice that <key> could not be found in the data.

    For some reason the various modules are still triggered even when the
    data from PLC cannot be reached; in that case this short message is
    shown instead of the exception stack.

    msg -- prefix for the log line
    key -- name of the key that is missing from the data
    """
    notice = "%s: could not find the %s key in data (PLC connection down?) - IGNORED" % (msg, key)
    # logged at the default level of log()
    log(notice)
69 def log_data_in_file (data, file, message="",level=LOG_NODE):
70 if (level > LOG_LEVEL):
75 now=time.strftime("Last update: %Y.%m.%d at %H:%M:%S %Z", time.localtime())
77 if message: f.write('Message:'+message+'\n')
78 pp=pprint.PrettyPrinter(stream=f,indent=2)
81 verbose("logger:.log_data_in_file Owerwrote %s"%file)
83 log_exc('logger.log_data_in_file failed - file=%s - message=%r'%(file,message))
def log_slivers(data):
    """Snapshot <data> into the LOG_SLIVERS file, tagged as "raw GetSlivers"."""
    log_data_in_file(data, file=LOG_SLIVERS, message="raw GetSlivers")
def log_database(db):
    """Snapshot <db> into the LOG_DATABASE file, tagged as "raw database"."""
    log_data_in_file(db, file=LOG_DATABASE, message="raw database")
90 #################### child processes
91 # avoid waiting until the process returns;
92 # that makes debugging of hanging children hard
95 def __init__ (self,message='log_call: '):
101 if c=='\n': self.flush()
105 log (self.message + self.buffer)
# Default timeout for log_call, expressed in minutes (log_call multiplies it
# by 60 to get seconds) - avoids hanging on subprocesses that never return.
default_timeout_minutes = 5
111 # returns a bool that is True when everything goes fine and the return code is 0
112 def log_call(command,timeout=default_timeout_minutes*60,poll=1):
113 message=" ".join(command)
114 log("log_call: running command %s" % message)
115 verbose("log_call: timeout=%r s" % timeout)
116 verbose("log_call: poll=%r s" % poll)
117 trigger=time.time()+timeout
120 child = subprocess.Popen(command, bufsize=1,
121 stdout=subprocess.PIPE, stderr=subprocess.STDOUT, close_fds=True)
124 # see if anything can be read within the poll interval
125 (r,w,x)=select.select([child.stdout],[],[],poll)
126 if r: buffer.add(child.stdout.read(1))
128 returncode=child.poll()
130 if returncode != None:
132 # child is done and return 0
134 log("log_call:end command (%s) completed" % message)
139 log("log_call:end command (%s) returned with code %d" %(message,returncode))
141 # no : still within timeout ?
142 if time.time() >= trigger:
145 log("log_call:end terminating command (%s) - exceeded timeout %d s"%(message,timeout))
147 except: log_exc("failed to run command %s" % message)