import os
import time
import traceback
import threading
import threadpool
import sets

from datetime import datetime, timedelta

from pcucontrol import reboot
from monitor import config
from monitor.database.info.model import FindbadPCURecordSync, FindbadPCURecord, session
from monitor import database
from monitor import util
from monitor.wrapper import plc, plccache
from nodequery import pcu_select
from monitor.common import nmap_port_status
from monitor.scanapi import *
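
# Module-level state shared by the scanning threads.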
plc_lock = threading.Lock()
global_round = 1
count = 0

# this will be called when an exception occurs within a thread
def handle_exception(request, result):
    print "Exception occurred in request %s" % request.requestID
    for i in result:
        print "Result: %s" % i

def checkPCUs(l_pcus, cohash):
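    """Probe each PCU in l_pcus whose recorded round is behind the current
    global round (or every PCU when --force is given), using a pool of
    worker threads; each result is saved through scanpcu.record."""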
    global count

    tp = threadpool.ThreadPool(10)
    scanpcu = ScanPCU(global_round)

    # CREATE all the work requests
    for pcuname in l_pcus:
        pcu_id = int(pcuname)
        fbnodesync = FindbadPCURecordSync.findby_or_create(plc_pcuid=pcu_id, if_new_set={'round' : 0})

        node_round = fbnodesync.round
        if node_round < global_round or config.force:
            # recreate node stats when refreshed
            #print "%s" % nodename
            req = threadpool.WorkRequest(scanpcu.collectInternal, [int(pcuname), cohash], {},
                                         None, scanpcu.record, handle_exception)
            tp.putRequest(req)
        else:
            # We just skip it, since it's "up to date"
            count += 1
            print "%d %s %s" % (count, pcu_id, node_round)

    # WAIT while all the work requests are processed.
    begin = time.time()
    while 1:
        try:
            time.sleep(1)
            tp.poll()
            # if it takes more than one hour, give up
            if time.time() - begin > (60*60*1):
                print "findbadpcus.py has run out of time!!!!!!"
                os._exit(1)
        except KeyboardInterrupt:
            break
        except threadpool.NoResultsPending:
            print "All results collected."
            break
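
    # Summarize how many PCU records (sync and full) are now in the database.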
    print FindbadPCURecordSync.query.count()
    print FindbadPCURecord.query.count()


def main():
    global global_round

    l_pcus = plccache.l_pcus
    cohash = {}

    fbsync = FindbadPCURecordSync.findby_or_create(plc_pcuid=0,
                                                   if_new_set={'round' : global_round})

    global_round = fbsync.round
    api = plc.getAuthAPI()
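
    # Decide which PCUs to probe, based on the command-line selection options.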
    if config.site is not None:
        site = api.GetSites(config.site)
        l_nodes = api.GetNodes(site[0]['node_ids'], ['pcu_ids'])
        pcus = []
        for node in l_nodes:
            pcus += node['pcu_ids']
        # clear out duplicate pcu ids
        l_pcus = [pcu for pcu in sets.Set(pcus)]
    elif config.sitelist:
        site_list = config.sitelist.split(',')
        sites = api.GetSites(site_list)
        node_ids = []
        for s in sites:
            node_ids += s['node_ids']
        l_nodes = api.GetNodes(node_ids, ['pcu_ids'])
        pcus = []
        for node in l_nodes:
            pcus += node['pcu_ids']
        l_pcus = [pcu for pcu in sets.Set(pcus)]
    elif config.pcuselect is not None:
        n, pcus = pcu_select(config.pcuselect)
        l_pcus = [pcu for pcu in sets.Set(pcus)]
    elif config.nodelist is None and config.pcuid is None:
        print "Calling API GetPCUs() : cachecalls(%s)" % config.cachecalls
        l_pcus = [pcu['pcu_id'] for pcu in l_pcus]
    elif config.nodelist is not None:
        l_pcus = util.file.getListFromFile(config.nodelist)
        l_pcus = [int(pcu) for pcu in l_pcus]
    elif config.pcuid is not None:
        l_pcus = [config.pcuid]
        l_pcus = [int(pcu) for pcu in l_pcus]

    if config.increment:
        # update global round number to force refreshes across all nodes
        global_round += 1

    checkPCUs(l_pcus, cohash)

    if config.increment:
        # update global round number to force refreshes across all nodes
        fbsync.round = global_round


if __name__ == '__main__':
    import logging
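
    # Log DEBUG and above from the "monitor" logger to monitor.log.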
    logger = logging.getLogger("monitor")
    logger.setLevel(logging.DEBUG)
    fh = logging.FileHandler("monitor.log", mode='a')
    fh.setLevel(logging.DEBUG)
    formatter = logging.Formatter('%(asctime)s %(levelname)s %(message)s')
    fh.setFormatter(formatter)
    logger.addHandler(fh)

    from monitor import parser as parsermodule
    parser = parsermodule.getParser()
    parser.set_defaults(nodelist=None, pcuid=None, pcuselect=None,
                        site=None, sitelist=None, increment=False,
                        force=False, cachecalls=True, cachenodes=False,
                        dbname="findbadpcus")
    parser.add_option("-f", "--nodelist", dest="nodelist", metavar="FILE",
                      help="Provide the input file for the node list")
    parser.add_option("", "--site", dest="site", metavar="SITE",
                      help="Get all pcus associated with the given site's nodes")
    parser.add_option("", "--pcuselect", dest="pcuselect", metavar="QUERY",
                      help="Query string to apply to the findbad pcus")
    parser.add_option("", "--pcuid", dest="pcuid", metavar="ID",
                      help="Provide the id for a single pcu")
    parser.add_option("", "--cachenodes", action="store_true",
                      help="Cache node lookup from PLC")
    parser.add_option("", "--dbname", dest="dbname", metavar="NAME",
                      help="Specify the name of the database to which the information is saved")
    parser.add_option("", "--nocachecalls", action="store_false", dest="cachecalls",
                      help="Refresh the cached values")
    parser.add_option("-i", "--increment", action="store_true", dest="increment",
                      help="Increment round number to force refresh or retry")
    parser.add_option("", "--force", action="store_true", dest="force",
                      help="Force probe without incrementing global 'round'.")
    parser = parsermodule.getParser(['defaults'], parser)
    config = parsermodule.parse_args(parser)
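
    # Typical invocations (illustrative; the option names are defined above):
    #   ./findbadpcus.py                        # probe every PCU known to plccache
    #   ./findbadpcus.py --site <site>          # only PCUs behind one site's nodes
    #   ./findbadpcus.py --pcuid <id> --force   # re-probe a single PCU even if up to date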

    if hasattr(config, 'cachecalls') and not config.cachecalls:
        # NOTE: if explicitly asked, refresh cached values.
        print "Reloading PLCCache"

    try:
        # NOTE: evidently, there is a bizarre interaction between iLO and ssh
        # when LANG is set... Do not know why. Unsetting LANG fixes the problem.
        if 'LANG' in os.environ:
            del os.environ['LANG']
        main()
    except Exception, err:
        traceback.print_exc()
        print "Exception: %s" % err
        print "Saving data... exiting."