1c4efe978823df71321e8f66cdb708fc8190b062
[monitor.git] / web / MonitorWeb / monitorweb / controllers.py
1 import turbogears as tg
2 from turbogears import controllers, expose, flash, exception_handler
3 from turbogears import widgets
4 from cherrypy import request, response
5 import cherrypy
6 # from monitorweb import model
7 # import logging
8 # log = logging.getLogger("monitorweb.controllers")
9 import re
10 from monitor.database.info.model import *
11 from monitor.database.zabbixapi.model import *
12 from monitor.database.dborm import zab_session as session
13 from monitor.database.dborm import zab_metadata as metadata
14 from monitor_xmlrpc import MonitorXmlrpcServer
15
16 from monitor import reboot
17 from monitor import scanapi
18
19 from monitor.wrapper.plccache import plcdb_id2lb as site_id2lb
20 from monitor.wrapper.plccache import plcdb_hn2lb as site_hn2lb
21 from monitor.wrapper.plccache import plcdb_lb2hn as site_lb2hn
22
23 from monitorweb.templates.links import *
24
25
26
def query_to_dict(query):
        """Split a URL query string into a dict of its fields.

        ``query`` is the text after the ``?`` of a URL, e.g. ``"a=1&b=2"``.
        Fields are separated on ``&`` and each field is split on its first
        ``=``.  A field without ``=`` maps to ``None``.  Empty fields (an
        empty query, or a stray ``&``) are skipped.  When a key repeats, the
        last occurrence wins.  No percent-decoding is performed.
        """
        val = {}
        for field in query.split('&'):
                if not field:
                        continue
                # Plain string splitting instead of urllib.splitvalue: this
                # module never imports urllib itself.
                if '=' in field:
                        key, value = field.split('=', 1)
                else:
                        key, value = field, None
                val[key] = value
        return val
36
def format_ports(data, pcumodel=None):
        """Summarise a port-scan result as a list of ``(port, state)`` tuples.

        data     -- mapping of port number (as a string) to its state string;
                    may be None or empty.
        pcumodel -- optional PCU model name.  When given, the ports to report
                    come from ``reboot.model_to_object(pcumodel).supported_ports``;
                    otherwise the ports of a production node (22, 80, 806).

        Returns one tuple per supported port, using the state "unknown" for
        ports missing from ``data``.  Two placeholder results exist:
        ``[("Closed/Filtered", "state")]`` when there is nothing to report and
        ``[("All Filtered", "state")]`` when every supported port is filtered.
        """
        if pcumodel:
                supported_ports = reboot.model_to_object(pcumodel).supported_ports
        else:
                # ports of a production node
                supported_ports = [22, 80, 806]

        retval = []
        filtered_length = 0
        if data:
                for port in supported_ports:
                        try:
                                state = data[str(port)]
                        except KeyError:
                                state = "unknown"

                        if state == "filtered":
                                filtered_length += 1

                        retval.append((port, state))

        # Check "nothing to report" first: with an empty supported_ports list
        # the filtered count (0) would otherwise equal the port count (0) and
        # be misreported as "All Filtered".
        if not retval:
                return [("Closed/Filtered", "state")]

        if filtered_length == len(supported_ports):
                return [("All Filtered", "state")]

        return retval
66
def format_pcu_shortstatus(pcu):
        """Map a PCU record's ``reboot_trial_status`` to a short label.

        Returns "Ok" when the status equals ``str(0)``, the status itself when
        it is "NetDown" or "Not_Run", and "error" for anything else, including
        a missing (falsy) ``pcu``.
        """
        if not pcu:
                return "error"

        if pcu.reboot_trial_status == str(0):
                return "Ok"

        if pcu.reboot_trial_status == "NetDown" or pcu.reboot_trial_status == "Not_Run":
                return pcu.reboot_trial_status

        return "error"
78
def prep_pcu_for_display(pcu):
        """Decorate a PCU record, in place, with display-only attributes.

        Sets ``loginbase`` ("unknown" when the site lookup fails), ``ports``,
        ``status`` and ``entry_complete_str``.  ``dns_short_status`` is set
        only when ``dns_status`` is one of the values listed below; any other
        value leaves it untouched.  Returns None.
        """
        # (dns_status value, short label shown to the user)
        dns_labels = (
                ("NOHOSTNAME", 'NoHost'),
                ("DNS-OK", 'Ok'),
                ("DNS-NOENTRY", 'NoEntry'),
                ("NO-DNS-OR-IP", 'NoHostOrIP'),
                ("DNS-MISMATCH", 'Mismatch'),
        )

        try:
                pcu.loginbase = site_id2lb[pcu.plc_pcu_stats['site_id']]
        except:
                pcu.loginbase = "unknown"

        pcu.ports = format_ports(pcu.port_status, pcu.plc_pcu_stats['model'])
        pcu.status = format_pcu_shortstatus(pcu)
        pcu.entry_complete_str = pcu.entry_complete

        for dns_value, short_label in dns_labels:
                if pcu.dns_status == dns_value:
                        pcu.dns_short_status = short_label
                        break
102
class NodeWidget(widgets.Widget):
        """Widget subclass that adds nothing of its own; the template is supplied by the caller at construction time."""
105
def prep_node_for_display(node):
        """Decorate a node record, in place, with display-only attributes.

        Attributes set on ``node``:
          pcu, pcu_status, pcu_short_status -- from the latest PCU record for
              ``node.plc_pcuid``; "nopcu"/"none" when the node has no PCU id,
              "nodata"/"none" when no PCU record is found.
          kernel    -- third whitespace-separated token of ``kernel_version``,
              or "" when that is unavailable.
          loginbase -- looked up from the node's site_id, "unknown" on failure.
          site      -- site history record for ``loginbase``, falling back to
              the record for "pl".
          history   -- node history record for ``node.hostname``.
          ports     -- formatted port status (see format_ports).
        ``plc_node_stats`` is replaced by ``{'last_contact': None}`` when it
        has no usable 'last_contact' entry.  Returns None.
        """
        if node.plc_pcuid:
                pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)
                if pcu:
                        node.pcu_status = pcu.reboot_trial_status
                        node.pcu_short_status = format_pcu_shortstatus(pcu)
                        node.pcu = pcu
                        prep_pcu_for_display(node.pcu)
                else:
                        node.pcu_short_status = "none"
                        node.pcu_status = "nodata"
                        node.pcu = None
        else:
                node.pcu_status = "nopcu"
                node.pcu_short_status = "none"
                node.pcu = None

        # Guard against a kernel_version with fewer than three tokens, which
        # used to raise IndexError and break the whole page.
        kernel_fields = (node.kernel_version or "").split()
        if len(kernel_fields) > 2:
                node.kernel = kernel_fields[2]
        else:
                node.kernel = ""

        try:
                node.loginbase = site_id2lb[node.plc_node_stats['site_id']]
        except Exception:
                # best effort: stats may be missing or the site id unknown
                node.loginbase = "unknown"

        if node.loginbase:
                node.site = HistorySiteRecord.by_loginbase(node.loginbase)
                if node.site is None:
                        # TODO: need a cleaner fix for this...
                        node.site = HistorySiteRecord.by_loginbase("pl")

        node.history = HistoryNodeRecord.by_hostname(node.hostname)

        node.ports = format_ports(node.port_status)

        # Callers index plc_node_stats['last_contact'] directly, so make sure
        # the key always exists.
        try:
                node.plc_node_stats['last_contact']
        except (KeyError, TypeError):
                node.plc_node_stats = {'last_contact' : None}
150
151
152
153 class Root(controllers.RootController, MonitorXmlrpcServer):
154         @expose(template="monitorweb.templates.welcome")
155         def index(self):
156                 import time
157                 # log.debug("Happy TurboGears Controller Responding For Duty")
158                 flash("Your application is now running")
159                 return dict(now=time.ctime())
160
161         @expose(template="monitorweb.templates.pcuview")
162         def nodeview(self, hostname=None):
163                 nodequery=[]
164                 if hostname:
165                         for node in FindbadNodeRecord.get_latest_by(hostname=hostname):
166                                 # NOTE: reformat some fields.
167                                 prep_node_for_display(node)
168                                 nodequery += [node]
169
170                 return self.pcuview(None, None, hostname) # dict(nodequery=nodequery)
171
172         @expose(template="monitorweb.templates.nodelist")
173         def node(self, filter='boot'):
174                 import time
175                 fbquery = FindbadNodeRecord.get_all_latest()
176                 query = []
177                 filtercount = {'down' : 0, 'boot': 0, 'debug' : 0, 'diagnose' : 0, 'disabled': 0, 
178                                                 'neverboot' : 0, 'pending' : 0, 'all' : 0, None : 0}
179                 for node in fbquery:
180                         # NOTE: reformat some fields.
181                         prep_node_for_display(node)
182
183                         node.history.status
184
185                         if node.history.status in ['down', 'offline']:
186                                 if node.plc_node_stats and node.plc_node_stats['last_contact'] != None:
187                                         filtercount['down'] += 1
188                                 else:
189                                         filtercount['neverboot'] += 1
190                         elif node.history.status in ['good', 'online']:
191                                 filtercount['boot'] += 1
192                         elif node.history.status in ['debug', 'monitordebug']:
193                                 filtercount['debug'] += 1
194                         else:
195                                 filtercount[node.history.status] += 1
196                                 
197                         ## NOTE: count filters
198                         #if node.observed_status != 'DOWN':
199                         #       print node.hostname, node.observed_status
200                         #       if node.observed_status == 'DEBUG':
201                         #               if node.plc_node_stats['boot_state'] in ['debug', 'diagnose', 'disabled']:
202                         #                       filtercount[node.plc_node_stats['boot_state']] += 1
203                         #               else:
204                         #                       filtercount['debug'] += 1
205                         #                       
206                         #       else:
207                         #               filtercount[node.observed_status] += 1
208                         #else:
209                         #       if node.plc_node_stats and node.plc_node_stats['last_contact'] != None:
210                         #               filtercount[node.observed_status] += 1
211                         #       else:
212                         #               filtercount['neverboot'] += 1
213
214                         # NOTE: apply filter
215                         if filter == "neverboot":
216                                 if not node.plc_node_stats or node.plc_node_stats['last_contact'] == None:
217                                         query.append(node)
218                         elif filter == "all":
219                                 query.append(node)
220                         elif filter == node.history.status:
221                                 query.append(node)
222                         elif filter == 'boot':
223                                 query.append(node)
224
225                         #if filter == node.observed_status:
226                         #       if filter == "DOWN":
227                         #               if node.plc_node_stats['last_contact'] != None:
228                         #                       query.append(node)
229                         #       else:
230                         #               query.append(node)
231                         #elif filter == "neverboot":
232                         #       if not node.plc_node_stats or node.plc_node_stats['last_contact'] == None:
233                         #               query.append(node)
234                         #elif filter == "pending":
235                         #       # TODO: look in message logs...
236                         #       pass
237                         #elif filter == node.plc_node_stats['boot_state']:
238                         #       query.append(node)
239                         #elif filter == "all":
240                         #       query.append(node)
241                                 
242                 widget = NodeWidget(template='monitorweb.templates.node_template')
243                 return dict(now=time.ctime(), query=query, fc=filtercount, nodewidget=widget)
244         
245         def nodeaction_handler(self, tg_exceptions=None):
246                 """Handle any kind of error."""
247                 print "NODEACTION_HANDLER------------------"
248
249                 if 'pcuid' in request.params:
250                         pcuid = request.params['pcuid']
251                 else:
252                         refurl = request.headers.get("Referer",link("pcu"))
253                         print refurl
254
255                         # TODO: do this more intelligently...
256                         uri_fields = urllib.splitquery(refurl)
257                         if uri_fields[1] is not None:
258                                 val = query_to_dict(uri_fields[1])
259                                 if 'pcuid' in val:
260                                         pcuid = val['pcuid']
261                                 elif 'hostname' in val:
262                                         pcuid = FindbadNodeRecord.get_latest_by(hostname=val['hostname']).plc_pcuid
263                                 else:
264                                         pcuid=None
265                         else:
266                                 pcuid=None
267
268                 cherry_trail = cherrypy._cputil.get_object_trail()
269                 for i in cherry_trail:
270                         print "trail: ", i
271
272                 print pcuid
273                 return self.pcuview(None, pcuid, **dict(exceptions=tg_exceptions))
274
275         def nodeaction(self, **data):
276                 print "NODEACTION------------------"
277                 for item in data.keys():
278                         print "%s %s" % ( item, data[item] )
279
280                 if 'hostname' in data:
281                         hostname = data['hostname']
282                 else:
283                         flash("No hostname given in submitted data")
284                         return
285
286                 if 'submit' in data or 'type' in data:
287                         try:
288                                 action = data['submit']
289                         except:
290                                 action = data['type']
291                 else:
292                         flash("No submit action given in submitted data")
293                         return
294
295                 if action == "Reboot":
296                         print "REBOOT: %s" % hostname
297                         ret = reboot.reboot_str(str(hostname))
298                         print ret
299                         if ret: raise RuntimeError("Error using PCU: " + str(ret))
300                         flash("Reboot appeared to work.  Allow at most 5 minutes.  Then run ExternalScan to check current status.")
301
302                 elif action == "ExternalScan":
303                         scanapi.externalprobe(str(hostname))
304                         flash("External Scan Successful!")
305                 elif action == "InternalScan":
306                         scanapi.internalprobe(str(hostname))
307                         flash("Internal Scan Successful!")
308                 else:
309                         # unknown action
310                         raise RuntimeError("Unknown action given")
311                 return
312
313         # TODO: add form validation
314         @expose(template="monitorweb.templates.pcuview")
315         @exception_handler(nodeaction_handler,"isinstance(tg_exceptions,RuntimeError)")
316         def pcuview(self, loginbase=None, pcuid=None, hostname=None, **data):
317                 print "PCUVIEW------------------"
318                 session.clear()
319                 sitequery=[]
320                 pcuquery=[]
321                 nodequery=[]
322                 actions=[]
323                 exceptions = None
324
325                 for key in data:
326                         print key, data[key]
327
328                 if 'submit' in data.keys() or 'type' in data.keys():
329                         if hostname: data['hostname'] = hostname
330                         self.nodeaction(**data)
331                 if 'exceptions' in data:
332                         exceptions = data['exceptions']
333
334                 if loginbase:
335                         actions = ActionRecord.query.filter_by(loginbase=loginbase
336                                                         ).filter(ActionRecord.date_created >= datetime.now() - timedelta(7)
337                                                         ).order_by(ActionRecord.date_created.desc())
338                         actions = [ a for a in actions ]
339                         sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
340                         pcus = {}
341                         for plcnode in site_lb2hn[loginbase]:
342                                         node = FindbadNodeRecord.get_latest_by(hostname=plcnode['hostname'])
343                                         # NOTE: reformat some fields.
344                                         prep_node_for_display(node)
345                                         nodequery += [node]
346                                         if node.plc_pcuid:      # not None
347                                                 pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)
348                                                 prep_pcu_for_display(pcu)
349                                                 pcus[node.plc_pcuid] = pcu
350
351                         for pcuid_key in pcus:
352                                 pcuquery += [pcus[pcuid_key]]
353
354                 if pcuid and hostname is None:
355                         print "pcuid: %s" % pcuid
356                         pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
357                         # NOTE: count filter
358                         prep_pcu_for_display(pcu)
359                         pcuquery += [pcu]
360                         if 'site_id' in pcu.plc_pcu_stats:
361                                 sitequery = [HistorySiteRecord.by_loginbase(pcu.loginbase)]
362                                 
363                         if 'nodenames' in pcu.plc_pcu_stats:
364                                 for nodename in pcu.plc_pcu_stats['nodenames']: 
365                                         print "query for %s" % nodename
366                                         node = FindbadNodeRecord.get_latest_by(hostname=nodename)
367                                         print "%s" % node.port_status
368                                         print "%s" % node.to_dict()
369                                         if node:
370                                                 prep_node_for_display(node)
371                                                 nodequery += [node]
372
373                 if hostname and pcuid is None:
374                                 node = FindbadNodeRecord.get_latest_by(hostname=hostname)
375                                 # NOTE: reformat some fields.
376                                 prep_node_for_display(node)
377                                 sitequery = [node.site]
378                                 nodequery += [node]
379                                 if node.plc_pcuid:      # not None
380                                         pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)
381                                         prep_pcu_for_display(pcu)
382                                         pcuquery += [pcu]
383                         
384                 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions, exceptions=exceptions)
385
386         @expose(template="monitorweb.templates.nodehistory")
387         def nodehistory(self, hostname=None):
388                 query = []
389                 if hostname:
390                         fbnode = FindbadNodeRecord.get_by(hostname=hostname)
391                         # TODO: add links for earlier history if desired.
392                         l = fbnode.versions[-100:]
393                         l.reverse()
394                         for node in l:
395                                 prep_node_for_display(node)
396                                 query.append(node)
397                 return dict(query=query, hostname=hostname)
398
399         @expose(template="monitorweb.templates.sitehistory")
400         def sitehistory(self, loginbase=None):
401                 query = []
402                 if loginbase:
403                         fbsite = HistorySiteRecord.get_by(loginbase=loginbase)
404                         # TODO: add links for earlier history if desired.
405                         l = fbsite.versions[-100:]
406                         l.reverse()
407                         for site in l:
408                                 query.append(site)
409                 return dict(query=query, loginbase=loginbase)
410
411
412         @expose(template="monitorweb.templates.pculist")
413         def pcu(self, filter='all'):
414                 import time
415                 fbquery = FindbadPCURecord.get_all_latest()
416                 query = []
417                 filtercount = {'ok' : 0, 'NetDown': 0, 'Not_Run' : 0, 'pending' : 0, 'all' : 0}
418                 for node in fbquery:
419
420                         # NOTE: count filter
421                         if node.reboot_trial_status == str(0):
422                                 filtercount['ok'] += 1
423                         elif node.reboot_trial_status == 'NetDown' or node.reboot_trial_status == 'Not_Run':
424                                 filtercount[node.reboot_trial_status] += 1
425                         else:
426                                 filtercount['pending'] += 1
427
428                         prep_pcu_for_display(node)
429
430                         # NOTE: apply filter
431                         if filter == "all":
432                                 query.append(node)
433                         elif filter == "ok" and node.reboot_trial_status == str(0):
434                                 query.append(node)
435                         elif filter == node.reboot_trial_status:
436                                 query.append(node)
437                         elif filter == "pending":
438                                 # TODO: look in message logs...
439                                 if node.reboot_trial_status != str(0) and \
440                                         node.reboot_trial_status != 'NetDown' and \
441                                         node.reboot_trial_status != 'Not_Run':
442
443                                         query.append(node)
444                                 
445                 return dict(query=query, fc=filtercount)
446
447         @expose(template="monitorweb.templates.siteview")
448         def siteview(self, loginbase='pl'):
449                 # get site query
450                 sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
451                 nodequery = []
452                 for plcnode in site_lb2hn[loginbase]:
453                         for node in FindbadNodeRecord.get_latest_by(hostname=plcnode['hostname']):
454                                 # NOTE: reformat some fields.
455                                 prep_node_for_display(node)
456                                 nodequery += [node]
457                 return dict(sitequery=sitequery, nodequery=nodequery, fc={})
458
459         @expose(template="monitorweb.templates.sitelist")
460         def site(self, filter='all'):
461                 filtercount = {'good' : 0, 'down': 0, 'online':0, 'offline' : 0, 'new' : 0, 'pending' : 0, 'all' : 0}
462                 fbquery = HistorySiteRecord.query.all()
463                 query = []
464                 for site in fbquery:
465                         # count filter
466                         filtercount['all'] += 1
467                         if site.new and site.slices_used == 0 and not site.enabled:
468                                 filtercount['new'] += 1
469                         elif not site.enabled:
470                                 filtercount['pending'] += 1
471                         elif site.status in ['good', 'online']:
472                                 filtercount['good'] += 1
473                         elif site.status in ['down', 'offline']:
474                                 filtercount['down'] += 1
475
476                         # apply filter
477                         if filter == "all":
478                                 query.append(site)
479                         elif filter == 'new' and site.new and site.slices_used == 0 and not site.enabled:
480                                 query.append(site)
481                         elif filter == "pending" and not site.enabled:
482                                 query.append(site)
483                         elif filter == 'good' and site.status in ['good', 'online']:
484                                 query.append(site)
485                         elif filter == 'down' and site.status in ['down', 'offline']:
486                                 query.append(site)
487                                 
488                 return dict(query=query, fc=filtercount)
489
490         @expose(template="monitorweb.templates.actionlist")
491         def action(self, filter='all'):
492                 session.bind = metadata.bind
493                 filtercount = {'active' : 0, 'acknowledged': 0, 'all' : 0}
494                 # With Acknowledgement
495                 sql_ack = 'SELECT DISTINCT h.host,t.description,t.priority,t.lastchange,a.message,e.eventid '+ \
496               ' FROM triggers t,hosts h,items i,functions f, hosts_groups hg,escalations e,acknowledges a ' + \
497               ' WHERE f.itemid=i.itemid ' + \
498                   ' AND h.hostid=i.hostid ' + \
499                   ' AND hg.hostid=h.hostid ' + \
500                   ' AND t.triggerid=f.triggerid ' + \
501                   ' AND t.triggerid=e.triggerid ' + \
502                   ' AND a.eventid=e.eventid ' + \
503                   ' AND t.status=' + str(defines.TRIGGER_STATUS_ENABLED) + \
504                   ' AND i.status=' + str(defines.ITEM_STATUS_ACTIVE) + \
505                   ' AND h.status=' + str(defines.HOST_STATUS_MONITORED) + \
506                   ' AND t.value=' + str(defines.TRIGGER_VALUE_TRUE) + \
507               ' ORDER BY t.lastchange DESC';
508
509                 # WithOUT Acknowledgement
510                 sql_noack = 'SELECT DISTINCT h.host,t.description,t.priority,t.lastchange,e.eventid ' + \
511               ' FROM triggers t,hosts h,items i,functions f, hosts_groups hg,escalations e,acknowledges a ' + \
512               ' WHERE f.itemid=i.itemid ' + \
513                   ' AND h.hostid=i.hostid ' + \
514                   ' AND hg.hostid=h.hostid ' + \
515                   ' AND t.triggerid=f.triggerid ' + \
516                   ' AND t.triggerid=e.triggerid ' + \
517                   ' AND e.eventid not in (select eventid from acknowledges) ' + \
518                   ' AND t.status=' + str(defines.TRIGGER_STATUS_ENABLED) + \
519                   ' AND i.status=' + str(defines.ITEM_STATUS_ACTIVE) + \
520                   ' AND h.status=' + str(defines.HOST_STATUS_MONITORED) + \
521                   ' AND t.value=' + str(defines.TRIGGER_VALUE_TRUE) + \
522               ' ORDER BY t.lastchange DESC';
523                 # for i in session.execute(sql): print i
524
525                 query=[]
526                 replace = re.compile(' {.*}')
527                 for sql,ack in [(sql_ack,True), (sql_noack,False)]:
528                         result = session.execute(sql)
529                         for row in result:
530                                 try:
531                                         newrow = [ site_hn2lb[row[0].lower()] ] + [ r for r in row ]
532                                 except:
533                                         print site_hn2lb.keys()
534                                         newrow = [ "unknown" ] + [ r for r in row ]
535
536                                 newrow[2] = replace.sub("", newrow[2]) # strip {.*} expressions
537
538                                 # NOTE: filter count
539                                 filtercount['all'] += 1
540                                 if not ack: # for unacknowledged
541                                         filtercount['active'] += 1
542                                         if filter == 'active':
543                                                 query.append(newrow)
544                                 else:
545                                         filtercount['acknowledged'] += 1
546                                         if filter == 'acknowledged':
547                                                 query.append(newrow)
548                                         
549                                 if filter != "acknowledged" and filter != "active":
550                                         query.append(newrow)
551
552                 return dict(query=query, fc=filtercount)