added references to google gadgets
[monitor.git] / web / MonitorWeb / monitorweb / controllers.py
1 import turbogears as tg
2 from turbogears import controllers, expose, flash, exception_handler
3 from turbogears import widgets
4 from cherrypy import request, response
5 import cherrypy
6 # from monitorweb import model
7 # import logging
8 # log = logging.getLogger("monitorweb.controllers")
9 import re
10 from monitor.database.info.model import *
11 #from monitor.database.zabbixapi.model import *
12 #from monitor.database.dborm import zab_session as session
13 #from monitor.database.dborm import zab_metadata as metadata
14 from monitor_xmlrpc import MonitorXmlrpcServer
15
16 from monitor import reboot
17 from monitor import scanapi
18 import time
19
20 from monitor.wrapper.plccache import plcdb_hn2lb as site_hn2lb
21
22 from monitorweb.templates.links import *
23
24
class aggregate:
        """Bare attribute container used to group values for display.

        Grouping values on one of these, rather than on a database record,
        avoids invoking the elixir auto-write feature.
        """
27
28
def query_to_dict(query):
        """Split a URL query string into a dict of field name -> value.

        Fields are separated by '&' and each field is split at its first '='.
        A field without '=' maps to None.  Empty fields (an empty query
        string or a doubled '&') are skipped.  Values are not URL-decoded.
        """
        val = {}
        for field in query.split('&'):
                if not field:
                        continue
                # str.partition keeps this helper free of urllib, which is not
                # among this module's explicit imports.
                key, sep, value = field.partition('=')
                if sep:
                        val[key] = value
                else:
                        val[key] = None

        return val
38
def format_ports(data, pcumodel=None):
        """Build the list of (port, state) pairs shown for a node or PCU.

        data     -- mapping of port number (as a string) to its state, or
                    None/empty when nothing is known
        pcumodel -- optional PCU model name; when given, the ports to report
                    come from reboot.model_to_object(pcumodel).supported_ports,
                    otherwise the ports of a production node are used

        Returns one (port, state) tuple per supported port, with "unknown" for
        ports missing from data.  Returns [("Closed/Filtered", "state")] when
        there is nothing to report and [("All Filtered", "state")] when every
        supported port is "filtered".
        """
        if pcumodel:
                supported_ports = reboot.model_to_object(pcumodel).supported_ports
        else:
                # ports of a production node
                supported_ports = [22, 80, 806]

        retval = []
        if data:
                for port in supported_ports:
                        retval.append((port, data.get(str(port), "unknown")))

        # Also covers an empty supported_ports list, which must not be
        # reported as "All Filtered".
        if not retval:
                return [("Closed/Filtered", "state")]

        filtered_length = len([state for (port, state) in retval if state == "filtered"])
        if filtered_length == len(retval):
                return [("All Filtered", "state")]

        return retval
68
def format_pcu_shortstatus(pcu):
        """Collapse a PCU record's reboot_trial_status into a short label.

        Returns "Ok" when the status is the string "0", the status itself when
        it is "NetDown" or "Not_Run", and "error" for anything else, including
        a missing (falsy) pcu.
        """
        if not pcu:
                return "error"

        if pcu.reboot_trial_status == str(0):
                return "Ok"

        if pcu.reboot_trial_status in ("NetDown", "Not_Run"):
                return pcu.reboot_trial_status

        return "error"
80
def prep_pcu_for_display(pcu):
        """Wrap a PCU record in an aggregate carrying display-ready fields.

        Sets on the returned aggregate: pcu, loginbase ("unknown" when the
        site lookup fails), ports, status, entry_complete_str and
        dns_short_status.
        """
        agg = aggregate()
        agg.pcu = pcu

        try:
                site = PlcSite.query.get(pcu.plc_pcu_stats['site_id'])
                agg.loginbase = site.plc_site_stats['login_base']
        except Exception:
                # best effort: a missing site or stats entry must not break the page
                agg.loginbase = "unknown"

        agg.ports = format_ports(pcu.port_status, pcu.plc_pcu_stats['model'])
        agg.status = format_pcu_shortstatus(pcu)

        agg.entry_complete_str = pcu.entry_complete

        dns_labels = {
                "NOHOSTNAME": 'NoHost',
                "DNS-OK": 'Ok',
                "DNS-NOENTRY": 'NoEntry',
                "NO-DNS-OR-IP": 'NoHostOrIP',
                "DNS-MISMATCH": 'Mismatch',
        }
        # Always set the attribute: an unrecognised dns_status used to leave
        # dns_short_status undefined on the aggregate.
        agg.dns_short_status = dns_labels.get(pcu.dns_status, "unknown")
        return agg
107
class NodeWidget(widgets.Widget):
        """Widget subclass that adds nothing of its own to widgets.Widget."""
110
def prep_node_for_display(node, pcuhash=None):
        """Wrap a node record in an aggregate carrying display-ready fields.

        node    -- node record to prepare
        pcuhash -- optional mapping of plc_pcuid to PCU record; when it is
                   empty or None the PCU record is fetched with
                   FindbadPCURecord.get_latest_by

        Sets on the returned aggregate: node, pcu, pcu_status,
        pcu_short_status, kernel, loginbase, site, history and ports.

        Side effect: when node.plc_node_stats['last_contact'] cannot be read,
        node.plc_node_stats is replaced by {'last_contact': None}.
        """
        agg = aggregate()
        agg.node = node

        if node.plc_pcuid:
                if pcuhash:
                        # .get(): the node may reference a PCU that has no
                        # record in the hash; treat that as "nodata" below.
                        pcu = pcuhash.get(node.plc_pcuid)
                else:
                        pcu = FindbadPCURecord.get_latest_by(plc_pcuid=node.plc_pcuid)

                if pcu:
                        agg.pcu_status = pcu.reboot_trial_status
                        agg.pcu_short_status = format_pcu_shortstatus(pcu)
                        agg.pcu = prep_pcu_for_display(pcu)
                else:
                        agg.pcu_short_status = "none"
                        agg.pcu_status = "nodata"
                        agg.pcu = None
        else:
                agg.pcu_status = "nopcu"
                agg.pcu_short_status = "none"
                agg.pcu = None

        # The kernel label is the third whitespace-separated field of
        # kernel_version; stay empty when the string is shorter than that.
        agg.kernel = ""
        if node.kernel_version:
                fields = node.kernel_version.split()
                if len(fields) > 2:
                        agg.kernel = fields[2]

        try:
                site = PlcSite.query.get(node.plc_node_stats['site_id'])
                agg.loginbase = site.plc_site_stats['login_base']
        except Exception:
                # best effort: a missing site or stats entry must not break the page
                agg.loginbase = "unknown"

        agg.site = None
        if agg.loginbase:
                agg.site = HistorySiteRecord.by_loginbase(agg.loginbase)
                if agg.site is None:
                        # TODO: need a cleaner fix for this...
                        agg.site = HistorySiteRecord.by_loginbase("pl")
                        if not agg.site:
                                agg.site = HistorySiteRecord.by_loginbase("ple")

        agg.history = HistoryNodeRecord.by_hostname(node.hostname)

        agg.ports = format_ports(node.port_status)

        try:
                node.plc_node_stats['last_contact']
        except Exception:
                # TODO: this should not assign to the fb object!
                node.plc_node_stats = {'last_contact' : None}

        return agg
165
166
167 class Root(controllers.RootController, MonitorXmlrpcServer):
168         @expose(template="monitorweb.templates.welcome")
169         def index(self):
170                 # log.debug("Happy TurboGears Controller Responding For Duty")
171                 flash("Welcome To MyOps!")
172                 return dict(now=time.ctime())
173
174         @expose(template="monitorweb.templates.nodelist")
175         def node2(self, filter='boot'):
176
177                 fbquery = FindbadNodeRecord.get_all_latest()
178                 fbpcus = FindbadPCURecord.get_all_latest()
179                 def fbtohash(fbpculist):
180                         h = {}
181                         for p in fbpculist:
182                                 h[p.plc_pcuid] = p
183
184                 pcuhash = fbtohash(fbpcus)
185
186                 query = []
187                 for node in fbquery:
188                         # NOTE: reformat some fields.
189                         agg = prep_node_for_display(node, pcuhash)
190
191                         if not agg.history:
192                                 continue
193
194                         query.append(agg)
195                                 
196                 widget = NodeWidget(template='monitorweb.templates.node_template')
197                 return dict(now=time.ctime(), query=query, nodewidget=widget)
198
199         @expose(template="monitorweb.templates.nodelist")
200         def node(self, filter='boot'):
201                 print "NODE------------------"
202                 print "befor-len: ", len( [ i for i in session] )
203                 session.flush(); session.clear()
204                 print "after-len: ", len( [ i for i in session] )
205                 fbquery = FindbadNodeRecord.get_all_latest()
206                 query = []
207                 filtercount = {'down' : 0, 'boot': 0, 'debug' : 0, 'diagnose' : 0, 'disabled': 0, 
208                                                 'neverboot' : 0, 'pending' : 0, 'all' : 0, None : 0}
209                 for node in fbquery:
210                         # NOTE: reformat some fields.
211                         agg = prep_node_for_display(node)
212
213                         if not agg.history:
214                                 continue
215
216                         if agg.history.status in ['down', 'offline']:
217                                 if node.plc_node_stats and node.plc_node_stats['last_contact'] != None:
218                                         filtercount['down'] += 1
219                                 else:
220                                         filtercount['neverboot'] += 1
221                         elif agg.history.status in ['good', 'online']:
222                                 filtercount['boot'] += 1
223                         elif agg.history.status in ['debug', 'monitordebug']:
224                                 filtercount['debug'] += 1
225                         else:
226                                 if filtercount.has_key(agg.history.status):
227                                         filtercount[agg.history.status] += 1
228                                 
229
230                         # NOTE: apply filter
231                         if filter == "neverboot":
232                                 if not node.plc_node_stats or node.plc_node_stats['last_contact'] == None:
233                                         query.append(agg)
234                         elif filter == "all":
235                                 query.append(agg)
236                         elif filter == agg.history.status:
237                                 query.append(agg)
238                         elif filter == 'boot':
239                                 query.append(agg)
240
241                                 
242                 widget = NodeWidget(template='monitorweb.templates.node_template')
243                 return dict(now=time.ctime(), query=query, fc=filtercount, nodewidget=widget)
244         
245         def nodeaction_handler(self, tg_exceptions=None):
246                 """Handle any kind of error."""
247                 print "NODEACTION_HANDLER------------------"
248
249                 if 'pcuid' in request.params:
250                         pcuid = request.params['pcuid']
251                 else:
252                         refurl = request.headers.get("Referer",link("pcu"))
253                         print refurl
254
255                         # TODO: do this more intelligently...
256                         uri_fields = urllib.splitquery(refurl)
257                         if uri_fields[1] is not None:
258                                 val = query_to_dict(uri_fields[1])
259                                 if 'pcuid' in val:
260                                         pcuid = val['pcuid']
261                                 elif 'hostname' in val:
262                                         pcuid = FindbadNodeRecord.get_latest_by(hostname=val['hostname']).plc_pcuid
263                                 else:
264                                         pcuid=None
265                         else:
266                                 pcuid=None
267
268                 cherry_trail = cherrypy._cputil.get_object_trail()
269                 for i in cherry_trail:
270                         print "trail: ", i
271
272                 print pcuid
273                 return self.pcuview(None, pcuid, **dict(exceptions=tg_exceptions))
274
275         def nodeaction(self, **data):
276                 print "NODEACTION------------------"
277                 for item in data.keys():
278                         print "%s %s" % ( item, data[item] )
279
280                 if 'hostname' in data:
281                         hostname = data['hostname']
282                 else:
283                         flash("No hostname given in submitted data")
284                         return
285
286                 if 'submit' in data or 'type' in data:
287                         try:
288                                 action = data['submit']
289                         except:
290                                 action = data['type']
291                 else:
292                         flash("No submit action given in submitted data")
293                         return
294
295                 if action == "Reboot":
296                         print "REBOOT: %s" % hostname
297                         ret = reboot.reboot_str(str(hostname))
298                         print ret
299                         if ret: raise RuntimeError("Error using PCU: " + str(ret))
300                         flash("Reboot appeared to work.  Allow at most 5 minutes.  Then run ExternalScan to check current status.")
301
302                 elif action == "ExternalScan":
303                         scanapi.externalprobe(str(hostname))
304                         flash("External Scan Successful!")
305                 elif action == "InternalScan":
306                         scanapi.internalprobe(str(hostname))
307                         flash("Internal Scan Successful!")
308                 else:
309                         # unknown action
310                         raise RuntimeError("Unknown action given")
311                 return
312
313         # TODO: add form validation
314         @expose(template="monitorweb.templates.pcuview")
315         @exception_handler(nodeaction_handler,"isinstance(tg_exceptions,RuntimeError)")
316         def pcuview(self, loginbase=None, pcuid=None, hostname=None, since=20, **data):
317                 print "PCUVIEW------------------"
318                 print "befor-len: ", len( [ i for i in session] )
319                 session.flush(); session.clear()
320                 print "after-len: ", len( [ i for i in session] )
321                 sitequery=[]
322                 pcuquery=[]
323                 nodequery=[]
324                 actions=[]
325                 exceptions = None
326
327                 try: since = int(since)
328                 except: since = 7
329
330                 for key in data:
331                         print key, data[key]
332
333                 if 'submit' in data.keys() or 'type' in data.keys():
334                         if hostname: data['hostname'] = hostname
335                         self.nodeaction(**data)
336                 if 'exceptions' in data:
337                         exceptions = data['exceptions']
338
339                 if pcuid:
340                         print "pcuid: %s" % pcuid
341                         pcu = FindbadPCURecord.get_latest_by(plc_pcuid=pcuid)
342                         loginbase = PlcSite.query.get(pcu.plc_pcu_stats['site_id']).plc_site_stats['login_base']
343
344                 if hostname:
345                         node = FindbadNodeRecord.get_latest_by(hostname=hostname)
346                         loginbase = PlcSite.query.get(node.plc_node_stats['site_id']).plc_site_stats['login_base']
347
348                 if loginbase:
349                         actions = ActionRecord.query.filter_by(loginbase=loginbase
350                                                         ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
351                                                         ).order_by(ActionRecord.date_created.desc())
352                         actions = [ a for a in actions ]
353                         sitequery = [HistorySiteRecord.by_loginbase(loginbase)]
354                         pcus = {}
355                         for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
356                                         # NOTE: reformat some fields.
357                                         agg = prep_node_for_display(node)
358                                         nodequery += [agg]
359                                         if agg.pcu: #.pcu.plc_pcuid:    # not None
360                                                 #pcu = FindbadPCURecord.get_latest_by(plc_pcuid=agg.plc_pcuid)
361                                                 #prep_pcu_for_display(pcu)
362                                                 pcus[agg.pcu.pcu.plc_pcuid] = agg.pcu
363
364                         for pcuid_key in pcus:
365                                 pcuquery += [pcus[pcuid_key]]
366
367                 return dict(sitequery=sitequery, pcuquery=pcuquery, nodequery=nodequery, actions=actions, since=since, exceptions=exceptions)
368
369         @expose(template="monitorweb.templates.pcuhistory")
370         def pcuhistory(self, pcu_id=None):
371                 query = []
372                 if pcu_id:
373                         fbnode = HistoryPCURecord.get_by(plc_pcuid=pcu_id)
374                         l = fbnode.versions[-100:]
375                         l.reverse()
376                         for pcu in l:
377                                 #prep_node_for_display(node)
378                                 query.append(pcu)
379
380                 return dict(query=query, pcu_id=pcu_id)
381
382         @expose(template="monitorweb.templates.nodehistory")
383         def nodehistory(self, hostname=None):
384                 query = []
385                 if hostname:
386                         #fbnode = FindbadNodeRecord.get_by(hostname=hostname)
387                         ## TODO: add links for earlier history if desired.
388                         #l = fbnode.versions[-100:]
389                         #l.reverse()
390                         #for node in l:
391                         #       prep_node_for_display(node)
392                         #       query.append(node)
393
394                         fbnode = HistoryNodeRecord.get_by(hostname=hostname)
395                         l = fbnode.versions[-100:]
396                         l.reverse()
397                         for node in l:
398                                 #prep_node_for_display(node)
399                                 query.append(node)
400
401                 return dict(query=query, hostname=hostname)
402
403         @expose(template="monitorweb.templates.sitehistory")
404         def sitehistory(self, loginbase=None):
405                 query = []
406                 if loginbase:
407                         fbsite = HistorySiteRecord.get_by(loginbase=loginbase)
408                         # TODO: add links for earlier history if desired.
409                         l = fbsite.versions[-100:]
410                         l.reverse()
411                         for site in l:
412                                 query.append(site)
413                 return dict(query=query, loginbase=loginbase)
414
415
416         @expose(template="monitorweb.templates.pculist")
417         def pcu(self, filter='all'):
418                 print "PCUVIEW------------------"
419                 print "befor-len: ", len( [ i for i in session] )
420                 session.flush(); session.clear()
421                 print "after-len: ", len( [ i for i in session] )
422                 fbquery = FindbadPCURecord.get_all_latest()
423                 query = []
424                 filtercount = {'ok' : 0, 'NetDown': 0, 'Not_Run' : 0, 'pending' : 0, 'all' : 0}
425                 for node in fbquery:
426
427                         # NOTE: count filter
428                         if node.reboot_trial_status == str(0):
429                                 filtercount['ok'] += 1
430                         elif node.reboot_trial_status == 'NetDown' or node.reboot_trial_status == 'Not_Run':
431                                 filtercount[node.reboot_trial_status] += 1
432                         else:
433                                 filtercount['pending'] += 1
434
435                         pcuagg = prep_pcu_for_display(node)
436
437                         # NOTE: apply filter
438                         if filter == "all":
439                                 query.append(pcuagg)
440                         elif filter == "ok" and node.reboot_trial_status == str(0):
441                                 query.append(pcuagg)
442                         elif filter == node.reboot_trial_status:
443                                 query.append(pcuagg)
444                         elif filter == "pending":
445                                 # TODO: look in message logs...
446                                 if node.reboot_trial_status != str(0) and \
447                                         node.reboot_trial_status != 'NetDown' and \
448                                         node.reboot_trial_status != 'Not_Run':
449
450                                         query.append(pcuagg)
451                                 
452                 return dict(query=query, fc=filtercount)
453
454         @expose(template="monitorweb.templates.sitelist")
455         def site(self, filter='all'):
456                 print "SITE------------------"
457                 print "befor-len: ", len( [ i for i in session] )
458                 session.flush(); session.clear()
459                 print "after-len: ", len( [ i for i in session] )
460                 filtercount = {'good' : 0, 'down': 0, 'online':0, 'offline' : 0, 'new' : 0, 'pending' : 0, 'all' : 0}
461                 fbquery = HistorySiteRecord.query.all()
462                 query = []
463                 for site in fbquery:
464                         # count filter
465                         filtercount['all'] += 1
466                         if site.new and site.slices_used == 0 and not site.enabled:
467                                 filtercount['new'] += 1
468                         elif not site.enabled:
469                                 filtercount['pending'] += 1
470                         elif site.status in ['good', 'online']:
471                                 filtercount['good'] += 1
472                         elif site.status in ['down', 'offline']:
473                                 filtercount['down'] += 1
474
475                         # apply filter
476                         if filter == "all":
477                                 query.append(site)
478                         elif filter == 'new' and site.new and site.slices_used == 0 and not site.enabled:
479                                 query.append(site)
480                         elif filter == "pending" and not site.enabled:
481                                 query.append(site)
482                         elif filter == 'good' and site.status in ['good', 'online']:
483                                 query.append(site)
484                         elif filter == 'down' and site.status in ['down', 'offline']:
485                                 query.append(site)
486                                 
487                 return dict(query=query, fc=filtercount)
488         @expose(template="monitorweb.templates.sitesummary")
489         def sitesummary(self, loginbase="princeton"):
490                 nodequery = []
491                 for node in FindbadNodeRecord.query.filter_by(loginbase=loginbase):
492                         agg = prep_node_for_display(node)
493                         nodequery += [agg]
494                 
495                 return dict(nodequery=nodequery, loginbase=loginbase)
496
497         @expose(template="monitorweb.templates.summary")
498         def summary(self, since=7):
499                 sumdata = {}
500                 sumdata['nodes'] = {}
501                 sumdata['sites'] = {}
502                 sumdata['pcus'] = {}
503
504                 def summarize(query, type):
505                         for o in query:
506                                 if o.status not in sumdata[type]:
507                                         sumdata[type][o.status] = 0
508                                 sumdata[type][o.status] += 1
509
510                 fbquery = HistorySiteRecord.query.all()
511                 summarize(fbquery, 'sites')
512                 fbquery = HistoryPCURecord.query.all()
513                 summarize(fbquery, 'pcus')
514                 fbquery = HistoryNodeRecord.query.all()
515                 summarize(fbquery, 'nodes')
516
517                 if 'monitordebug' in sumdata['nodes']:
518                         d = sumdata['nodes']['monitordebug']
519                         del sumdata['nodes']['monitordebug']
520                         sumdata['nodes']['failboot'] = d
521                 
522                 return dict(sumdata=sumdata, setorder=['good', 'offline', 'down', 'online']) 
523
524         @expose(template="monitorweb.templates.actionsummary")
525         def actionsummary(self, since=7):
526                 from monitor.wrapper.emailTxt import mailtxt
527
528                 types = filter(lambda x: 'notice' in x, dir(mailtxt))
529                 results = {}
530
531                 try: since = int(since)
532                 except: since = 7
533
534                 for  t in types:
535                         acts = ActionRecord.query.filter(ActionRecord.action_type==t
536                                         ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since))
537                         results[t] = acts.count()
538                 return dict(results=results)
539
540         @expose(template="monitorweb.templates.actionlist")
541         def actionlist(self, action_type='down_notice', since=7, loginbase=None):
542
543                 try: since = int(since)
544                 except: since = 7
545
546                 if loginbase:
547                         acts = ActionRecord.query.filter_by(loginbase=loginbase
548                                 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
549                                 ).order_by(ActionRecord.date_created.desc())
550                 else:
551                         acts = ActionRecord.query.filter(ActionRecord.action_type==action_type
552                                 ).filter(ActionRecord.date_created >= datetime.now() - timedelta(since)
553                                 ).order_by(ActionRecord.date_created.desc())
554                 query = [ a for a in acts ]
555                 
556                 return dict(actions=query, action_type=action_type, since=since)