1 import turbogears as tg
2 from turbogears import controllers, expose, flash, exception_handler
3 from turbogears import widgets
4 from cherrypy import request, response
6 # from monitorweb import model
8 # log = logging.getLogger("monitorweb.controllers")
10 from monitor.database.info.model import *
11 #from monitor.database.zabbixapi.model import *
12 #from monitor.database.dborm import zab_session as session
13 #from monitor.database.dborm import zab_metadata as metadata
14 from monitor_xmlrpc import MonitorXmlrpcServer
16 from monitor import reboot
17 from monitor import scanapi
20 from monitor.wrapper.plccache import plcdb_hn2lb as site_hn2lb
22 from monitorweb.templates.links import *
25 # make it easier to group objects without invoking the elixir auto-write feature.
29 def query_to_dict(query):
30 """ take a url query string and chop it up """
32 query_fields = query.split('&')
33 for f in query_fields:
34 (k,v) = urllib.splitvalue(f)
39 def format_ports(data, pcumodel=None):
44 supported_ports=reboot.model_to_object(pcumodel).supported_ports
46 # ports of a production node
47 supported_ports=[22,80,806]
49 if data and len(data.keys()) > 0 :
50 for port in supported_ports:
52 state = data[str(port)]
56 if state == "filtered":
59 retval.append( (port, state) )
62 retval = [( "Closed/Filtered", "state" )]
64 if filtered_length == len(supported_ports):
65 retval = [( "All Filtered", "state" )]
69 def format_pcu_shortstatus(pcu):
72 if pcu.reboot_trial_status == str(0):
74 elif pcu.reboot_trial_status == "NetDown" or pcu.reboot_trial_status == "Not_Run":
75 status = pcu.reboot_trial_status
81 def prep_pcu_for_display(pcu):
86 agg.loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
88 agg.loginbase = "unknown"
90 agg.pcuhist = HistoryPCURecord.query.get(pcu.plc_pcuid)
92 agg.ports = format_ports(pcu.port_status, pcu.plc_pcu_stats['model'])
93 agg.status = format_pcu_shortstatus(pcu)
95 #print pcu.entry_complete
96 agg.entry_complete_str = pcu.entry_complete
97 #pcu.entry_complete_str += "".join([ f[0] for f in pcu.entry_complete.split() ])
98 if pcu.dns_status == "NOHOSTNAME":
99 agg.dns_short_status = 'NoHost'
100 elif pcu.dns_status == "DNS-OK":
101 agg.dns_short_status = 'Ok'
102 elif pcu.dns_status == "DNS-NOENTRY":
103 agg.dns_short_status = 'NoEntry'
104 elif pcu.dns_status == "NO-DNS-OR-IP":
105 agg.dns_short_status = 'NoHostOrIP'
106 elif pcu.dns_status == "DNS-MISMATCH":
107 agg.dns_short_status = 'Mismatch'
110 class NodeWidget(widgets.Widget):
113 def prep_node_for_display(node, pcuhash=None, preppcu=True, asofdate=None):
117 if node.plc_pcuid and preppcu:
119 pcu = pcuhash[node.plc_pcuid]
121 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)
124 agg.pcu_status = pcu.reboot_trial_status
125 agg.pcu_short_status = format_pcu_shortstatus(pcu)
126 agg.pcu = prep_pcu_for_display(pcu)
128 agg.pcu_short_status = "none"
129 agg.pcu_status = "nodata"
133 agg.pcu_status = "nopcu"
134 agg.pcu_short_status = "none"
138 if node.kernel_version:
139 agg.kernel = node.kernel_version.split()[2]
144 agg.loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
146 agg.loginbase = "unknown"
149 agg.site = HistorySiteRecord.by_loginbase(agg.loginbase)
152 agg.site = agg.site.get_as_of(asofdate)
155 # TODO: need a cleaner fix for this...
156 agg.site = HistorySiteRecord.by_loginbase("pl")
158 agg.site = HistorySiteRecord.by_loginbase("ple")
160 agg.history = HistoryNodeRecord.by_hostname(node.hostname)
162 agg.history = agg.history.get_as_of(asofdate)
164 agg.ports = format_ports(node.port_status)
167 exists = node.plc_node_stats['last_contact']
169 # TODO: this should not assign to the fb object!
170 node.plc_node_stats = {'last_contact' : None}
175 class Root(controllers.RootController, MonitorXmlrpcServer):
176 @expose(template="monitorweb.templates.welcome")
178 # log.debug("Happy TurboGears Controller Responding For Duty")
179 flash("Welcome To MyOps!")
180 return dict(now=time.ctime())
182 @expose(template="monitorweb.templates.nodelist", allow_json=True)
183 def node3(self, filter=None):
184 nhquery = HistoryNodeRecord.query.all()
188 if nh.status == filter:
195 fb = FindbadNodeRecord.get_latest_by(hostname=q.hostname)
198 return dict(now=time.ctime(), query=rquery)
200 @expose(template="monitorweb.templates.nodelist", allow_json=True)
201 def node2(self, filter=None):
202 nhquery = HistoryNodeRecord.query.all()
206 if nh.status == filter:
213 fb = FindbadNodeRecord.get_latest_by(hostname=q.hostname)
214 agg = prep_node_for_display(fb)
217 #fbquery = FindbadNodeRecord.get_all_latest()
218 #fbpcus = FindbadPCURecord.get_all_latest()
219 #def fbtohash(fbpculist):
221 # for p in fbpculist:
224 # pcuhash = fbtohash(fbpcus)
227 # for node in fbquery:
228 # # NOTE: reformat some fields.
229 # agg = prep_node_for_display(node, pcuhash)
230 # if not agg.history:
234 # if agg.history.status == filter:
239 widget = NodeWidget(template='monitorweb.templates.node_template')
240 return dict(now=time.ctime(), query=rquery, nodewidget=widget)
242 @expose(template="monitorweb.templates.nodelist")
243 def node(self, filter='boot'):
244 print "NODE------------------"
245 print "befor-len: ", len( [ i for i in session] )
246 session.flush(); session.clear()
247 print "after-len: ", len( [ i for i in session] )
248 fbquery = FindbadNodeRecord.get_all_latest()
250 filtercount = {'down' : 0, 'boot': 0, 'debug' : 0, 'diagnose' : 0, 'disabled': 0,
251 'neverboot' : 0, 'pending' : 0, 'all' : 0, None : 0}
253 # NOTE: reformat some fields.
254 agg = prep_node_for_display(node)
259 if agg.history.status in ['down', 'offline']:
260 if node.plc_node_stats and node.plc_node_stats['last_contact'] != None:
261 filtercount['down'] += 1
263 filtercount['neverboot'] += 1
264 elif agg.history.status in ['good', 'online']:
265 filtercount['boot'] += 1
266 elif agg.history.status in ['debug', 'monitordebug']:
267 filtercount['debug'] += 1
269 if filtercount.has_key(agg.history.status):
270 filtercount[agg.history.status] += 1
274 if filter == "neverboot":
275 if not node.plc_node_stats or node.plc_node_stats['last_contact'] == None:
277 elif filter == "all":
279 elif filter == agg.history.status:
281 elif filter == 'boot':
285 widget = NodeWidget(template='monitorweb.templates.node_template')
286 return dict(now=time.ctime(), query=query, fc=filtercount, nodewidget=widget)
288 def nodeaction_handler(self, tg_exceptions=None):
289 """Handle any kind of error."""
290 print "NODEACTION_HANDLER------------------"
292 if 'pcuid' in request.params:
293 pcuid = request.params['pcuid']
295 refurl = request.headers.get("Referer",link("pcu"))
298 # TODO: do this more intelligently...
299 uri_fields = urllib.splitquery(refurl)
300 if uri_fields[1] is not None:
301 val = query_to_dict(uri_fields[1])
304 elif 'hostname' in val:
305 pcuid = FindbadNodeRecord.get_latest_by(hostname=val['hostname']).plc_pcuid
311 cherry_trail = cherrypy._cputil.get_object_trail()
312 for i in cherry_trail:
316 return self.pcuview(None, pcuid, **dict(exceptions=tg_exceptions))
318 def nodeaction(self, **data):
319 print "NODEACTION------------------"
320 for item in data.keys():
321 print "%s %s" % ( item, data[item] )
323 if 'hostname' in data:
324 hostname = data['hostname']
326 flash("No hostname given in submitted data")
329 if 'submit' in data or 'type' in data:
331 action = data['submit']
333 action = data['type']
335 flash("No submit action given in submitted data")
338 if action == "Reboot":
339 print "REBOOT: %s" % hostname
340 ret = reboot.reboot_str(str(hostname))
342 if ret: raise RuntimeError("Error using PCU: " + str(ret))
343 flash("Reboot appeared to work. Allow at most 5 minutes. Then run ExternalScan to check current status.")
345 elif action == "ExternalScan":
346 scanapi.externalprobe(str(hostname))
347 flash("External Scan Successful!")
348 elif action == "InternalScan":
349 scanapi.internalprobe(str(hostname))
350 flash("Internal Scan Successful!")
353 raise RuntimeError("Unknown action given")
356 @expose(template="monitorweb.templates.simpleview")
357 def simpleview(self, **data):
358 return self.pre_view(**data)
360 @expose(template="monitorweb.templates.detailview")
361 def detailview(self, **data):
362 return self.pre_view(**data)
364 def pre_view(self, **data):
365 session.flush(); session.clear()
383 if len(obj.split(".")) > 1: hostname = obj
386 if 'loginbase' in data:
387 loginbase = data['loginbase']
389 if 'hostname' in data:
390 hostname = data['hostname']
393 try: pcuid = int(data['pcuid'])
397 try: since = int(since)
401 print "pcuid: %s" % pcuid
402 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
403 loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
406 node = FindbadNodeRecord.get_latest_by(hostname=hostname)
407 loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
410 actions = ActionRecord.query.filter_by(loginbase=loginbase
411 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
412 ).order_by(ActionRecord.date_created.desc())
413 actions = [ a for a in actions ]
414 sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
415 # NOTE: because a single pcu may be assigned to multiple hosts,
416 # track unique pcus by their plc_pcuid, then turn dict into list
418 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
419 # NOTE: reformat some fields.
420 agg = prep_node_for_display(node)
423 pcus[agg.pcu.pcu.plc_pcuid] = agg.pcu
425 for pcuid_key in pcus:
426 pcuquery += [pcus[pcuid_key]]
428 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions, since=since, exceptions=exceptions)
431 # TODO: add form validation
432 @expose(template="monitorweb.templates.pcuview")
433 @exception_handler(nodeaction_handler,"isinstance(tg_exceptions,RuntimeError)")
434 def pcuview(self, loginbase=None, pcuid=None, hostname=None, since=20, **data):
435 session.flush(); session.clear()
442 try: since = int(since)
448 if 'submit' in data.keys() or 'type' in data.keys():
449 if hostname: data['hostname'] = hostname
450 self.nodeaction(**data)
451 if 'exceptions' in data:
452 exceptions = data['exceptions']
456 if len(obj.split(".")) > 1: hostname = obj
460 print "pcuid: %s" % pcuid
461 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
462 loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
465 node = FindbadNodeRecord.get_latest_by(hostname=hostname)
466 loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
469 actions = ActionRecord.query.filter_by(loginbase=loginbase
470 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
471 ).order_by(ActionRecord.date_created.desc())
472 actions = [ a for a in actions ]
473 sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
475 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
476 # NOTE: reformat some fields.
477 agg = prep_node_for_display(node)
479 if agg.pcu: #.pcu.plc_pcuid: # not None
480 #pcu = FindbadPCURecord.get_latest_by(plc_pcuid=agg.plc_pcuid)
481 #prep_pcu_for_display(pcu)
482 pcus[agg.pcu.pcu.plc_pcuid] = agg.pcu
484 for pcuid_key in pcus:
485 pcuquery += [pcus[pcuid_key]]
487 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions, since=since, exceptions=exceptions)
489 @expose(template="monitorweb.templates.pcuhistory")
490 def pcuhistory(self, pcu_id=None):
493 fbnode = HistoryPCURecord.get_by(plc_pcuid=pcu_id)
494 l = fbnode.versions[-100:]
497 #prep_node_for_display(node)
500 return dict(query=query, pcu_id=pcu_id)
502 @expose(template="monitorweb.templates.nodescanhistory")
503 def nodescanhistory(self, hostname=None, length=10):
504 try: length = int(length)
507 fbnode = FindbadNodeRecord.get_by(hostname=hostname)
508 # TODO: add links for earlier history if desired.
509 l = fbnode.versions[-length:]
513 agg = prep_node_for_display(node, pcuhash=None, preppcu=False, asofdate=node.timestamp)
516 if 'length' in request.params:
517 del request.params['length']
518 return dict(query=query, hostname=hostname, params=request.params)
520 @expose(template="monitorweb.templates.nodehistory")
521 def nodehistory(self, hostname=None):
524 fbnode = HistoryNodeRecord.get_by(hostname=hostname)
525 l = fbnode.versions[-100:]
528 #prep_node_for_display(node)
531 return dict(query=query, hostname=hostname)
533 @expose(template="monitorweb.templates.sitehistory")
534 def sitehistory(self, loginbase=None):
537 fbsite = HistorySiteRecord.get_by(loginbase=loginbase)
538 # TODO: add links for earlier history if desired.
539 l = fbsite.versions[-100:]
543 return dict(query=query, loginbase=loginbase)
546 @expose(template="monitorweb.templates.pculist")
547 def pcu(self, filter='all'):
548 print "PCUVIEW------------------"
549 print "befor-len: ", len( [ i for i in session] )
550 session.flush(); session.clear()
551 print "after-len: ", len( [ i for i in session] )
552 fbquery = FindbadPCURecord.get_all_latest()
554 filtercount = {'ok' : 0, 'NetDown': 0, 'Not_Run' : 0, 'pending' : 0, 'all' : 0}
558 if node.reboot_trial_status == str(0):
559 filtercount['ok'] += 1
560 elif node.reboot_trial_status == 'NetDown' or node.reboot_trial_status == 'Not_Run':
561 filtercount[node.reboot_trial_status] += 1
563 filtercount['pending'] += 1
565 pcuagg = prep_pcu_for_display(node)
570 elif filter == "ok" and node.reboot_trial_status == str(0):
572 elif filter == node.reboot_trial_status:
574 elif filter == "pending":
575 # TODO: look in message logs...
576 if node.reboot_trial_status != str(0) and \
577 node.reboot_trial_status != 'NetDown' and \
578 node.reboot_trial_status != 'Not_Run':
582 return dict(query=query, fc=filtercount)
584 @expose(template="monitorweb.templates.sitelist")
585 def site(self, filter='all'):
586 print "SITE------------------"
587 print "befor-len: ", len( [ i for i in session] )
588 session.flush(); session.clear()
589 print "after-len: ", len( [ i for i in session] )
590 filtercount = {'good' : 0, 'down': 0, 'online':0, 'offline' : 0, 'new' : 0, 'pending' : 0, 'all' : 0}
591 fbquery = HistorySiteRecord.query.all()
595 filtercount['all'] += 1
596 if site.new and site.slices_used == 0 and not site.enabled:
597 filtercount['new'] += 1
598 elif not site.enabled:
599 filtercount['pending'] += 1
600 elif site.status in ['good', 'online']:
601 filtercount['good'] += 1
602 elif site.status in ['down', 'offline']:
603 filtercount['down'] += 1
608 elif filter == 'new' and site.new and site.slices_used == 0 and not site.enabled:
610 elif filter == "pending" and not site.enabled:
612 elif filter == 'good' and site.status in ['good', 'online']:
614 elif filter == 'down' and site.status in ['down', 'offline']:
617 return dict(query=query, fc=filtercount)
618 @expose(template="monitorweb.templates.sitesummary")
619 def sitesummary(self, loginbase="princeton"):
621 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
622 agg = prep_node_for_display(node)
625 return dict(nodequery=nodequery, loginbase=loginbase)
627 @expose(template="monitorweb.templates.summary")
628 def summary(self, since=7):
630 sumdata['nodes'] = {}
631 sumdata['sites'] = {}
634 def summarize(query, type):
636 if o.status not in sumdata[type]:
637 sumdata[type][o.status] = 0
638 sumdata[type][o.status] += 1
640 fbquery = HistorySiteRecord.query.all()
641 summarize(fbquery, 'sites')
642 fbquery = HistoryPCURecord.query.all()
643 summarize(fbquery, 'pcus')
644 fbquery = HistoryNodeRecord.query.all()
645 summarize(fbquery, 'nodes')
647 if 'monitordebug' in sumdata['nodes']:
648 d = sumdata['nodes']['monitordebug']
649 del sumdata['nodes']['monitordebug']
650 sumdata['nodes']['failboot'] = d
652 return dict(sumdata=sumdata, setorder=['good', 'offline', 'down', 'online'])
654 @expose(template="monitorweb.templates.actionsummary")
655 def actionsummary(self, since=7):
656 from monitor.wrapper.emailTxt import mailtxt
658 types = filter(lambda x: 'notice' in x, dir(mailtxt))
661 try: since = int(since)
665 acts = ActionRecord.query.filter(ActionRecord.action_type==t
666 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since))
667 results[t] = acts.count()
668 return dict(results=results)
670 @expose(template="monitorweb.templates.actionlist")
671 def actionlist(self, action_type='down_notice', since=7, loginbase=None):
673 try: since = int(since)
677 acts = ActionRecord.query.filter_by(loginbase=loginbase
678 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
679 ).order_by(ActionRecord.date_created.desc())
681 acts = ActionRecord.query.filter(ActionRecord.action_type==action_type
682 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
683 ).order_by(ActionRecord.date_created.desc())
684 query = [ a for a in acts ]
686 return dict(actions=query, action_type=action_type, since=since)