1 import turbogears as tg
2 from turbogears import controllers, expose, flash, exception_handler
3 from turbogears import widgets
4 from cherrypy import request, response
6 # from monitorweb import model
8 # log = logging.getLogger("monitorweb.controllers")
10 from monitor.database.info.model import *
11 #from monitor.database.zabbixapi.model import *
12 #from monitor.database.dborm import zab_session as session
13 #from monitor.database.dborm import zab_metadata as metadata
14 from monitor_xmlrpc import MonitorXmlrpcServer
16 from monitor import reboot
17 from monitor import scanapi
20 from monitor.wrapper.plccache import plcdb_hn2lb as site_hn2lb
22 from monitorweb.templates.links import *
class ObjectQueryFields(widgets.WidgetsList):
    """Placeholder WidgetsList for object query forms; it declares no fields."""
# Field declarations for the node query form; getNodeQueryForm() passes an
# instance of this class to QueryForm as its `fields`.
# NOTE(review): this listing carries line-number residue and is missing lines
# (for example the end of the `options=[...]` call) -- confirm against the
# original file before relying on it.
30 class NodeQueryFields(widgets.WidgetsList):
31 """The WidgetsList defines the fields of the form."""
# Radio selector for the query type: 'nodes' (all nodes) or 'nodehistory'
# (history of a single node). The two site options are commented out.
33 object = widgets.RadioButtonList(label="Query Type", options=[('nodes', 'All Nodes'),
34 ('nodehistory', 'Single Node History'),
35 #('sites', 'All Sites'),
36 #('sitehistory', 'Single Site History'),
# Hostname read by Root.query() when the 'nodehistory' query type is selected.
38 nodehistory_hostname = widgets.TextField(label="Hostname Node History", attrs={'size':30})
# One checkbox per node attribute offered on the form.
40 hostname = widgets.CheckBox(label="Hostname")
41 firewall = widgets.CheckBox(label="Firewall?")
42 dns_status = widgets.CheckBox(label="DNS Status")
43 external_dns_status = widgets.CheckBox(label="Hostname Resolves?")
44 kernel_version = widgets.CheckBox(label="Kernel")
45 observed_status = widgets.CheckBox(label="Observed Status")
46 port_status = widgets.CheckBox(label="Port Status")
# When both 'rpms' and 'rpmvalue' are submitted, Root.query() keeps only the
# RPM names that contain the 'rpmvalue' text.
47 rpms = widgets.CheckBox(label="RPM")
48 rpmvalue = widgets.TextField(label="RPM Pattern")
# TableForm subclass instantiated by getNodeQueryForm(). The lines below are
# fragments of a Kid (xmlns:py="http://purl.org/kid/ns#") form template: it
# renders the hidden fields, then one table row per field (row class
# alternating 'even'/'odd') with the field's label, widget, error text and help
# text, and finally the submit button.
# NOTE(review): the template's opening and closing lines, and several of its
# inner lines, are not visible in this listing -- confirm against the original.
50 class QueryForm(widgets.TableForm):
52 <form xmlns:py="http://purl.org/kid/ns#"
59 <div py:for="field in hidden_fields"
60 py:replace="field.display(value_for(field), **params_for(field))"
62 <table border="0" cellspacing="0" cellpadding="2" py:attrs="table_attrs">
63 <tr py:for="i, field in enumerate(fields)"
64 class="${i%2 and 'odd' or 'even'}"
67 <label class="fieldlabel" for="${field.field_id}" py:content="field.label" />
70 <span py:replace="field.display(value_for(field), **params_for(field))" />
71 <span py:if="error_for(field)" class="fielderror" py:content="error_for(field)" />
72 <span py:if="field.help_text" class="fieldhelp" py:content="field.help_text" />
77 <td py:content="submit.display(submit_text)" />
def getNodeQueryForm():
    """Return a new QueryForm over the NodeQueryFields widgets.

    The form submits to the ``query`` action.  A fresh form (and a fresh
    field list) is built on every call.
    """
    return QueryForm(fields=NodeQueryFields(), action="query")
# make it easier to group objects without invoking the elixir auto-write feature.
def query_to_dict(query):
    """Split a URL query string into a dict of field name -> raw value.

    ``query`` is the part of a URL after ``?`` (for example
    ``"hostname=a.b.c&pcuid=12"``).  Fields are separated by ``&`` and each
    field is split on its first ``=``.  A field without ``=`` maps to
    ``None``; empty fields (as in ``"a=1&&b=2"`` or an empty query string)
    are skipped.  Values are returned as-is: no percent-decoding is done.
    When a name is repeated, the last occurrence wins.
    """
    val = {}
    for field in query.split('&'):
        if not field:
            continue
        # str.partition yields the same (name, value-or-None) split as the
        # legacy urllib.splitvalue helper, without depending on urllib.
        key, sep, value = field.partition('=')
        val[key] = value if sep else None
    return val
# Build a list of (port, state) tuples from the port-scan results in `data`.
#   data     -- mapping indexed by the port number as a string (data[str(port)]).
#   pcumodel -- optional PCU model; its supported ports are taken from
#               reboot.model_to_object(pcumodel).supported_ports.
# NOTE(review): the initialisation of retval/filtered_length, the branch
# keywords, the fallback when a port is absent from `data`, and the return
# statement are not visible in this listing -- confirm against the original.
100 def format_ports(data, pcumodel=None):
105 supported_ports=reboot.model_to_object(pcumodel).supported_ports
107 # ports of a production node
108 supported_ports=[22,80,806]
# Only look at individual ports when some scan data is present.
110 if data and len(data.keys()) > 0 :
111 for port in supported_ports:
113 state = data[str(port)]
# "filtered" ports are presumably counted in filtered_length (increment not visible).
117 if state == "filtered":
120 retval.append( (port, state) )
# Placeholder entries that replace the per-port list in the summary cases.
123 retval = [( "Closed/Filtered", "state" )]
# Every supported port was filtered.
125 if filtered_length == len(supported_ports):
126 retval = [( "All Filtered", "state" )]
# Derive a short status string for a PCU record from its reboot_trial_status.
# NOTE(review): the default value, the value used for the str(0) case, the
# final branch and the return statement are not visible in this listing.
130 def format_pcu_shortstatus(pcu):
# reboot_trial_status is compared as a string; str(0) is "0".
133 if pcu.reboot_trial_status == str(0):
# "NetDown" and "Not_Run" are used verbatim as the short status.
135 elif pcu.reboot_trial_status == "NetDown" or pcu.reboot_trial_status == "Not_Run":
136 status = pcu.reboot_trial_status
# Collect display attributes for a PCU record on a separate `agg` object:
# site login base, PCU history record, formatted port list, short status,
# entry_complete string and an abbreviated DNS status.
# NOTE(review): the creation of `agg`, the try/except keywords and the return
# statement are not visible in this listing -- confirm against the original.
142 def prep_pcu_for_display(pcu):
# Look up the owning site's login_base through the PCU's site_id.
147 agg.loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
# Presumably the value used when the lookup above fails.
149 agg.loginbase = "unknown"
151 agg.pcuhist = HistoryPCURecord.query.get(pcu.plc_pcuid)
# Ports are formatted against the PCU model's supported ports.
153 agg.ports = format_ports(pcu.port_status, pcu.plc_pcu_stats['model'])
154 agg.status = format_pcu_shortstatus(pcu)
156 #print pcu.entry_complete
157 agg.entry_complete_str = pcu.entry_complete
158 #pcu.entry_complete_str += "".join([ f[0] for f in pcu.entry_complete.split() ])
# Abbreviate the DNS status. No dns_short_status is assigned in the visible
# code for a dns_status outside the five values below.
159 if pcu.dns_status == "NOHOSTNAME":
160 agg.dns_short_status = 'NoHost'
161 elif pcu.dns_status == "DNS-OK":
162 agg.dns_short_status = 'Ok'
163 elif pcu.dns_status == "DNS-NOENTRY":
164 agg.dns_short_status = 'NoEntry'
165 elif pcu.dns_status == "NO-DNS-OR-IP":
166 agg.dns_short_status = 'NoHostOrIP'
167 elif pcu.dns_status == "DNS-MISMATCH":
168 agg.dns_short_status = 'Mismatch'
# Widget subclass that Root.node2() and Root.nodeslow() instantiate with the
# 'monitorweb.templates.node_template' template.
# NOTE(review): the class body is not visible in this listing.
171 class NodeWidget(widgets.Widget):
# Prepare a node history record for display by storing the login_base of its
# site (looked up from node.plc_siteid) on `agg`.
# NOTE(review): the creation of `agg`, the try/except keywords and the return
# are not visible in this listing. "unknown" is presumably the initial value
# and "exception" the value used when the lookup fails -- confirm.
174 def prep_nodehist(node):
177 agg.loginbase = "unknown"
179 agg.loginbase = PlcSite.query.get(node.plc_siteid).plc_site_stats['login_base']
181 agg.loginbase = "exception"
# Collect display attributes for a FindbadNodeRecord on a separate `agg` object.
#   node     -- the node record to describe.
#   pcuhash  -- optional mapping of plc_pcuid -> PCU record, indexed below.
#   preppcu  -- when false, no PCU details are gathered for the node.
#   asofdate -- optional date passed to get_as_of() on the site and node history.
# NOTE(review): the creation of `agg`, most branch keywords (if/else/try/except)
# and the return statement are not visible in this listing -- confirm.
186 def prep_node_for_display(node, pcuhash=None, preppcu=True, asofdate=None):
# PCU details are gathered only for nodes that have a PCU and when requested.
190 if node.plc_pcuid and preppcu:
192 pcu = pcuhash[node.plc_pcuid]
194 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)
197 agg.pcu_status = pcu.reboot_trial_status
198 agg.pcu_short_status = format_pcu_shortstatus(pcu)
199 agg.pcu = prep_pcu_for_display(pcu)
# Presumably the values used when no PCU record was found.
201 agg.pcu_short_status = "none"
202 agg.pcu_status = "nodata"
# Presumably the values used when the node has no PCU or preppcu is false.
206 agg.pcu_status = "nopcu"
207 agg.pcu_short_status = "none"
# The displayed kernel is the third whitespace-separated token of kernel_version.
211 if node.kernel_version:
212 agg.kernel = node.kernel_version.split()[2]
# Site login_base via the node's site_id; "unknown" is presumably the failure value.
217 agg.loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
219 agg.loginbase = "unknown"
# Site history record, optionally as of `asofdate`, with "pl" / "ple" as
# alternative login bases (the conditions selecting them are not visible).
222 agg.site = HistorySiteRecord.by_loginbase(agg.loginbase)
225 agg.site = agg.site.get_as_of(asofdate)
228 # TODO: need a cleaner fix for this...
229 agg.site = HistorySiteRecord.by_loginbase("pl")
231 agg.site = HistorySiteRecord.by_loginbase("ple")
# Node history record, optionally as of `asofdate`.
233 agg.history = HistoryNodeRecord.by_hostname(node.hostname)
235 agg.history = agg.history.get_as_of(asofdate)
# Node ports are formatted against the default production-node port list.
237 agg.ports = format_ports(node.port_status)
# Probe for 'last_contact'; the assignment below replaces plc_node_stats on
# the record itself (presumably when the probe fails -- see the TODO).
240 exists = node.plc_node_stats['last_contact']
242 # TODO: this should not assign to the fb object!
243 node.plc_node_stats = {'last_contact' : None}
# Root controller of the web application; also inherits MonitorXmlrpcServer.
# NOTE(review): this listing carries line-number residue, has lost its
# indentation and is missing many short lines (loop headers, else/try/except,
# list initialisers, appends). The comments below describe only what the
# visible lines show -- confirm details against the original file.
248 class Root(controllers.RootController, MonitorXmlrpcServer):
# Welcome page: flashes a greeting and gives the template the current time.
# (The handler's def line is not visible in this listing.)
249 @expose(template="monitorweb.templates.welcome")
251 # log.debug("Happy TurboGears Controller Responding For Duty")
252 flash("Welcome To MyOps!")
253 return dict(now=time.ctime())
# Node list: compares each HistoryNodeRecord's status with `filter` and looks
# up the latest FindbadNodeRecord by hostname; the result is returned as `query`.
255 @expose(template="monitorweb.templates.nodelist", allow_json=True)
256 def node3(self, filter=None):
257 nhquery = HistoryNodeRecord.query.all()
261 if nh.status == filter:
268 fb = FindbadNodeRecord.get_latest_by(hostname=q.hostname)
271 return dict(now=time.ctime(), query=rquery)
# Same selection as node3, but each record goes through prep_node_for_display
# and a NodeWidget is handed to the template.
273 @expose(template="monitorweb.templates.nodelist", allow_json=True)
274 def node2(self, filter=None):
275 nhquery = HistoryNodeRecord.query.all()
279 if nh.status == filter:
286 fb = FindbadNodeRecord.get_latest_by(hostname=q.hostname)
287 agg = prep_node_for_display(fb)
290 widget = NodeWidget(template='monitorweb.templates.node_template')
291 return dict(now=time.ctime(), query=rquery, nodewidget=widget)
# Ad-hoc query page driven by the submitted form data:
#   object == "nodes"       -> all latest FindbadNodeRecords
#   object == "nodehistory" -> the last 500 versions of the record for
#                              data['nodehistory_hostname']
# Each row has its plc_node_stats merged in; when both 'rpmvalue' and 'rpms'
# are submitted, the rpms text is reduced to the entries containing rpmvalue.
293 @expose(template="monitorweb.templates.query", allow_json=True)
294 def query(self, **data):
302 if 'object' in data and data['object'] == "nodes":
303 fbquery = FindbadNodeRecord.get_all_latest()
304 elif 'object' in data and data['object'] == "nodehistory":
305 hostname = data['nodehistory_hostname']
306 data['date_checked'] = 'date_checked'
307 fbrecord = FindbadNodeRecord.get_by(hostname=hostname)
308 fbquery = fbrecord.versions[-500:]
312 # NOTE: reformat some fields.
313 if type(node) is not type(FindbadNodeRecord):
314 agg = node.__dict__.copy()
317 agg.update(agg['plc_node_stats'])
318 if 'rpmvalue' in data and 'rpms' in data:
320 rpm_list = agg['rpms'].split()
321 rpm_list = filter(lambda x: data['rpmvalue'] in x, rpm_list)
322 agg['rpms'] = " ".join(rpm_list)
# `fields` has the non-column form entries removed before it reaches the template.
330 del fields['rpmvalue']
331 del fields['nodehistory_hostname']
333 return dict(now=time.ctime(), query=query, fields=fields, data=data, queryform=getNodeQueryForm())
# Fast node list built from HistoryNodeRecord through prep_nodehist.
335 @expose(template="monitorweb.templates.nodefast", allow_json=True)
336 def node(self, filter=None):
337 nhquery = HistoryNodeRecord.query.all()
341 if nh.status == filter:
342 agg = prep_nodehist(nh)
345 agg = prep_nodehist(nh)
348 return dict(now=time.ctime(), query=query)
# Node list over all latest FindbadNodeRecords with per-status counts in
# `filtercount` (passed to the template as `fc`). The session is flushed and
# cleared first, and its size is printed before and after.
350 @expose(template="monitorweb.templates.nodelist")
351 def nodeslow(self, filter='boot'):
352 print "NODE------------------"
353 print "befor-len: ", len( [ i for i in session] )
354 session.flush(); session.clear()
355 print "after-len: ", len( [ i for i in session] )
356 fbquery = FindbadNodeRecord.get_all_latest()
358 filtercount = {'down' : 0, 'boot': 0, 'debug' : 0, 'diagnose' : 0, 'disabled': 0,
359 'neverboot' : 0, 'pending' : 0, 'all' : 0, None : 0}
361 # NOTE: reformat some fields.
362 agg = prep_node_for_display(node)
# 'down'/'offline' nodes count as 'down' when a last_contact is recorded; the
# 'neverboot' increment below is presumably the other case.
367 if agg.history.status in ['down', 'offline']:
368 if node.plc_node_stats and node.plc_node_stats['last_contact'] != None:
369 filtercount['down'] += 1
371 filtercount['neverboot'] += 1
372 elif agg.history.status in ['good', 'online']:
373 filtercount['boot'] += 1
374 elif agg.history.status in ['debug', 'monitordebug']:
375 filtercount['debug'] += 1
377 if filtercount.has_key(agg.history.status):
378 filtercount[agg.history.status] += 1
# Selection of the nodes to show for the requested filter (the statements
# that add a node to the result are not visible).
382 if filter == "neverboot":
383 if not node.plc_node_stats or node.plc_node_stats['last_contact'] == None:
385 elif filter == "all":
387 elif filter == agg.history.status:
389 elif filter == 'boot':
393 widget = NodeWidget(template='monitorweb.templates.node_template')
394 return dict(now=time.ctime(), query=query, fc=filtercount, nodewidget=widget)
# Error handler attached to pcuview through @exception_handler for
# RuntimeError. It takes the pcuid from the request parameters or from the
# query string of the Referer URL (resolving a hostname to its plc_pcuid), then
# renders pcuview again with the exceptions passed along.
396 def nodeaction_handler(self, tg_exceptions=None):
397 """Handle any kind of error."""
398 print "NODEACTION_HANDLER------------------"
400 if 'pcuid' in request.params:
401 pcuid = request.params['pcuid']
403 refurl = request.headers.get("Referer",link("pcu"))
406 # TODO: do this more intelligently...
407 uri_fields = urllib.splitquery(refurl)
408 if uri_fields[1] is not None:
409 val = query_to_dict(uri_fields[1])
412 elif 'hostname' in val:
413 pcuid = FindbadNodeRecord.get_latest_by(hostname=val['hostname']).plc_pcuid
419 cherry_trail = cherrypy._cputil.get_object_trail()
420 for i in cherry_trail:
424 return self.pcuview(None, pcuid, **dict(exceptions=tg_exceptions))
# Run the action named by data['submit'] or data['type'] against
# data['hostname']: "Reboot", "ExternalScan" or "InternalScan".
# Raises RuntimeError when reboot.reboot_str returns a truthy value, and with
# "Unknown action given" (presumably for any other action name).
426 def nodeaction(self, **data):
427 print "NODEACTION------------------"
428 for item in data.keys():
429 print "%s %s" % ( item, data[item] )
431 if 'hostname' in data:
432 hostname = data['hostname']
434 flash("No hostname given in submitted data")
437 if 'submit' in data or 'type' in data:
439 action = data['submit']
441 action = data['type']
443 flash("No submit action given in submitted data")
446 if action == "Reboot":
447 print "REBOOT: %s" % hostname
448 ret = reboot.reboot_str(str(hostname))
450 if ret: raise RuntimeError("Error using PCU: " + str(ret))
451 flash("Reboot appeared to work. Allow at most 5 minutes. Then run ExternalScan to check current status.")
453 elif action == "ExternalScan":
454 scanapi.externalprobe(str(hostname))
455 flash("External Scan Successful!")
456 elif action == "InternalScan":
457 scanapi.internalprobe(str(hostname))
458 flash("Internal Scan Successful!")
461 raise RuntimeError("Unknown action given")
# simpleview and detailview render the same pre_view() data with different templates.
464 @expose(template="monitorweb.templates.simpleview")
465 def simpleview(self, **data):
466 return self.pre_view(**data)
468 @expose(template="monitorweb.templates.detailview")
469 def detailview(self, **data):
470 return self.pre_view(**data)
# Shared data gathering for simpleview/detailview. Builds a list of login
# bases from a pcuid, a hostname (exact, or a LIKE pattern) or a loginbase
# (exact, or a LIKE pattern), then collects for each one: the ActionRecords
# created in the last `since` days (newest first), the site history record,
# the prepared node records, and the PCUs de-duplicated by plc_pcuid.
# "*" in the search object is replaced by "%", presumably as the LIKE wildcard.
472 def pre_view(self, **data):
473 session.flush(); session.clear()
480 # if objtype is not None, then treat 'hostname' or 'loginbase' as a search pattern
495 fields = obj.split(":")
498 obj = fields[1].replace("*", "%")
501 if len(obj.split(".")) > 1 or objtype == "node":
506 if 'loginbase' in data:
507 loginbase = data['loginbase']
509 if 'hostname' in data:
510 hostname = data['hostname']
513 try: pcuid = int(data['pcuid'])
517 try: since = int(since)
521 print "pcuid: %s" % pcuid
522 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
523 loginbase_list += [ PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base'] ]
527 nodes = [ FindbadNodeRecord.get_latest_by(hostname=hostname) ]
529 nodes = FindbadNodeRecord.query.filter(FindbadNodeRecord.hostname.like(hostname))
532 lb = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
533 if lb not in loginbase_list:
534 loginbase_list += [ lb ]
538 loginbase_list = [ loginbase ]
540 loginbase_list = HistorySiteRecord.query.filter(HistorySiteRecord.loginbase.like(loginbase))
541 loginbase_list = [ l.loginbase for l in loginbase_list ]
545 for loginbase in loginbase_list:
546 actions = ActionRecord.query.filter_by(loginbase=loginbase
547 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
548 ).order_by(ActionRecord.date_created.desc())
549 actions_list += [ a for a in actions ]
550 site = HistorySiteRecord.by_loginbase(loginbase)
552 sitequery.append(site)
553 # NOTE: because a single pcu may be assigned to multiple hosts,
554 # track unique pcus by their plc_pcuid, then turn dict into list
556 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
557 # NOTE: reformat some fields.
558 agg = prep_node_for_display(node)
561 pcus[agg.pcu.pcu.plc_pcuid] = agg.pcu
563 for pcuid_key in pcus:
564 pcuquery += [pcus[pcuid_key]]
566 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions_list, since=since, exceptions=exceptions)
# Site/PCU/node view for a single login base, which is derived from `pcuid`
# or `hostname` when one of them is given. When the request carries 'submit'
# or 'type', nodeaction() is run first; a RuntimeError is routed to
# nodeaction_handler by the decorator below. `since` is a number of days.
569 # TODO: add form validation
570 @expose(template="monitorweb.templates.pcuview")
571 @exception_handler(nodeaction_handler,"isinstance(tg_exceptions,RuntimeError)")
572 def pcuview(self, loginbase=None, pcuid=None, hostname=None, since=20, **data):
573 session.flush(); session.clear()
580 try: since = int(since)
586 if 'submit' in data.keys() or 'type' in data.keys():
587 if hostname: data['hostname'] = hostname
588 self.nodeaction(**data)
589 if 'exceptions' in data:
590 exceptions = data['exceptions']
594 if len(obj.split(".")) > 1: hostname = obj
598 print "pcuid: %s" % pcuid
599 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
600 loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
603 node = FindbadNodeRecord.get_latest_by(hostname=hostname)
604 loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
607 actions = ActionRecord.query.filter_by(loginbase=loginbase
608 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
609 ).order_by(ActionRecord.date_created.desc())
610 actions = [ a for a in actions ]
611 sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
613 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
614 # NOTE: reformat some fields.
615 agg = prep_node_for_display(node)
617 if agg.pcu: #.pcu.plc_pcuid: # not None
618 #pcu = FindbadPCURecord.get_latest_by(plc_pcuid=agg.plc_pcuid)
619 #prep_pcu_for_display(pcu)
620 pcus[agg.pcu.pcu.plc_pcuid] = agg.pcu
622 for pcuid_key in pcus:
623 pcuquery += [pcus[pcuid_key]]
625 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions, since=since, exceptions=exceptions)
# History page for one PCU: works from the last 100 versions of its HistoryPCURecord.
627 @expose(template="monitorweb.templates.pcuhistory")
628 def pcuhistory(self, pcu_id=None):
631 fbnode = HistoryPCURecord.get_by(plc_pcuid=pcu_id)
632 l = fbnode.versions[-100:]
635 #prep_node_for_display(node)
638 return dict(query=query, pcu_id=pcu_id)
# Scan history for one node: the last `length` versions of its
# FindbadNodeRecord, each prepared as of its own timestamp and without PCU
# details. 'length' is removed from request.params before they are returned.
640 @expose(template="monitorweb.templates.nodescanhistory")
641 def nodescanhistory(self, hostname=None, length=10):
642 try: length = int(length)
645 fbnode = FindbadNodeRecord.get_by(hostname=hostname)
646 # TODO: add links for earlier history if desired.
647 l = fbnode.versions[-length:]
651 agg = prep_node_for_display(node, pcuhash=None, preppcu=False, asofdate=node.timestamp)
654 if 'length' in request.params:
655 del request.params['length']
656 return dict(query=query, hostname=hostname, params=request.params)
# History page for one node: works from the last 100 versions of its HistoryNodeRecord.
658 @expose(template="monitorweb.templates.nodehistory")
659 def nodehistory(self, hostname=None):
662 fbnode = HistoryNodeRecord.get_by(hostname=hostname)
663 l = fbnode.versions[-100:]
666 #prep_node_for_display(node)
669 return dict(query=query, hostname=hostname)
# History page for one site: works from the last 100 versions of its HistorySiteRecord.
671 @expose(template="monitorweb.templates.sitehistory")
672 def sitehistory(self, loginbase=None):
675 fbsite = HistorySiteRecord.get_by(loginbase=loginbase)
676 # TODO: add links for earlier history if desired.
677 l = fbsite.versions[-100:]
681 return dict(query=query, loginbase=loginbase)
# PCU list over all latest FindbadPCURecords with per-status counts in
# `filtercount`. A reboot_trial_status of str(0) counts as 'ok'; 'NetDown' and
# 'Not_Run' are counted under their own names; the 'pending' increment is
# presumably the remaining case.
684 @expose(template="monitorweb.templates.pculist")
685 def pcu(self, filter='all'):
686 print "PCUVIEW------------------"
687 print "befor-len: ", len( [ i for i in session] )
688 session.flush(); session.clear()
689 print "after-len: ", len( [ i for i in session] )
690 fbquery = FindbadPCURecord.get_all_latest()
692 filtercount = {'ok' : 0, 'NetDown': 0, 'Not_Run' : 0, 'pending' : 0, 'all' : 0}
696 if node.reboot_trial_status == str(0):
697 filtercount['ok'] += 1
698 elif node.reboot_trial_status == 'NetDown' or node.reboot_trial_status == 'Not_Run':
699 filtercount[node.reboot_trial_status] += 1
701 filtercount['pending'] += 1
703 pcuagg = prep_pcu_for_display(node)
# Selection of the PCUs to show for the requested filter (the statements that
# add a PCU to the result are not visible).
708 elif filter == "ok" and node.reboot_trial_status == str(0):
710 elif filter == node.reboot_trial_status:
712 elif filter == "pending":
713 # TODO: look in message logs...
714 if node.reboot_trial_status != str(0) and \
715 node.reboot_trial_status != 'NetDown' and \
716 node.reboot_trial_status != 'Not_Run':
720 return dict(query=query, fc=filtercount)
# Site list over all HistorySiteRecords with counts in `filtercount`: 'new'
# (new, no slices used, not enabled), 'pending' (not enabled), 'good'
# (status good/online) and 'down' (status down/offline), tested in that order.
722 @expose(template="monitorweb.templates.sitelist")
723 def site(self, filter='all'):
724 print "SITE------------------"
725 print "befor-len: ", len( [ i for i in session] )
726 session.flush(); session.clear()
727 print "after-len: ", len( [ i for i in session] )
728 filtercount = {'good' : 0, 'down': 0, 'online':0, 'offline' : 0, 'new' : 0, 'pending' : 0, 'all' : 0}
729 fbquery = HistorySiteRecord.query.all()
733 filtercount['all'] += 1
734 if site.new and site.slices_used == 0 and not site.enabled:
735 filtercount['new'] += 1
736 elif not site.enabled:
737 filtercount['pending'] += 1
738 elif site.status in ['good', 'online']:
739 filtercount['good'] += 1
740 elif site.status in ['down', 'offline']:
741 filtercount['down'] += 1
# Selection of the sites to show for the requested filter (the statements that
# add a site to the result are not visible).
746 elif filter == 'new' and site.new and site.slices_used == 0 and not site.enabled:
748 elif filter == "pending" and not site.enabled:
750 elif filter == 'good' and site.status in ['good', 'online']:
752 elif filter == 'down' and site.status in ['down', 'offline']:
755 return dict(query=query, fc=filtercount)
# Per-site summary: prepares every FindbadNodeRecord of `loginbase` for display.
756 @expose(template="monitorweb.templates.sitesummary")
757 def sitesummary(self, loginbase="princeton"):
759 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
760 agg = prep_node_for_display(node)
763 return dict(nodequery=nodequery, loginbase=loginbase)
# Overall summary: counts records per status for sites, PCUs and nodes, and
# reports the nodes' 'monitordebug' count under the key 'failboot' instead.
765 @expose(template="monitorweb.templates.summary")
766 def summary(self, since=7):
768 sumdata['nodes'] = {}
769 sumdata['sites'] = {}
# Tally o.status for the records of `query` into sumdata[type].
772 def summarize(query, type):
774 if o.status not in sumdata[type]:
775 sumdata[type][o.status] = 0
776 sumdata[type][o.status] += 1
778 fbquery = HistorySiteRecord.query.all()
779 summarize(fbquery, 'sites')
780 fbquery = HistoryPCURecord.query.all()
781 summarize(fbquery, 'pcus')
782 fbquery = HistoryNodeRecord.query.all()
783 summarize(fbquery, 'nodes')
785 if 'monitordebug' in sumdata['nodes']:
786 d = sumdata['nodes']['monitordebug']
787 del sumdata['nodes']['monitordebug']
788 sumdata['nodes']['failboot'] = d
790 return dict(sumdata=sumdata, setorder=['good', 'offline', 'down', 'online'])
# Action summary: for every attribute name of mailtxt that contains 'notice',
# counts the ActionRecords of that action_type created in the last `since` days.
792 @expose(template="monitorweb.templates.actionsummary")
793 def actionsummary(self, since=7):
794 from monitor.wrapper.emailTxt import mailtxt
796 types = filter(lambda x: 'notice' in x, dir(mailtxt))
799 try: since = int(since)
803 acts = ActionRecord.query.filter(ActionRecord.action_type==t
804 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since))
805 results[t] = acts.count()
806 return dict(results=results)
# Action list: ActionRecords created in the last `since` days, newest first,
# selected either by `loginbase` or by `action_type` (the condition choosing
# between the two queries is not visible).
808 @expose(template="monitorweb.templates.actionlist")
809 def actionlist(self, action_type='down_notice', since=7, loginbase=None):
811 try: since = int(since)
815 acts = ActionRecord.query.filter_by(loginbase=loginbase
816 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
817 ).order_by(ActionRecord.date_created.desc())
819 acts = ActionRecord.query.filter(ActionRecord.action_type==action_type
820 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
821 ).order_by(ActionRecord.date_created.desc())
822 query = [ a for a in acts ]
824 return dict(actions=query, action_type=action_type, since=since)