updated module import statements. not sure how I missed these before.
[monitor.git] / zabbix / zabbixsite.py
1 #!/usr/bin/python
2
3 from os import getcwd
4 from os.path import dirname, exists, join
5 import sys
6 import md5
7 import glob
8
9 from monitor import config
10 from monitor.database.dborm import zab_session as session
11 from monitor.database.zabbixapi.model import *
12 from monitor.database.zabbixapi.emailZabbix import *
13 from monitor.database.zabbixapi import defines
14 from monitor.util.file import *
15
16
17
# Name templates for the per-site Zabbix objects.  Each one is filled in
# with the site's loginbase through %-formatting.
HOSTGROUP_NAME = "%s_hostgroup"
USERGROUP_NAME = "%s_usergroup"

DISCOVERY_RULE_NAME = "discovery rule for %s"
DISCOVERY_ACTION_NAME = "Auto-discover %s action"
ESCALATION_ACTION_NAME = "Escalation Action for %s"
24
def delete_site(loginbase):
    """Delete the Zabbix objects named after the given site.

    Looks up, by their loginbase-derived names, the site's user group,
    host group (together with every host listed in it), discovery rule,
    discovery action and escalation action, and deletes each one that
    exists.  Users in the user group are not deleted yet (see the TODO
    below).

    loginbase -- site identifier substituted into the *_NAME templates.
    """
    user_group = UsrGrp.get_by(name=USERGROUP_NAME % loginbase)
    if user_group:
        for _member in user_group.user_list:
            # TODO: remove the user from the group and, if it is a member
            # of no other groups, delete the user (user.delete()).
            continue
        user_group.delete()

    host_group = HostGroup.get_by(name=HOSTGROUP_NAME % loginbase)
    if host_group:
        # NOTE: the hosts of a group are listed in host_group.host_list;
        # they are removed before the group itself.
        for member_host in host_group.host_list:
            member_host.delete()
        host_group.delete()

    # The discovery rule and the two actions are all handled the same way:
    # look the record up by name and delete it when present.
    named_records = (
        (DiscoveryRule, DISCOVERY_RULE_NAME),
        (Action, DISCOVERY_ACTION_NAME),
        (Action, ESCALATION_ACTION_NAME),
    )
    for model, name_template in named_records:
        record = model.get_by(name=name_template % loginbase)
        if record:
            record.delete()
63
64
# NOTE: !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
##     These functions can ONLY be run when the server and GUI are offline.
##     Any change to the db while they are running risks a failed commit,
##         and therefore an error.
# NOTE: !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!
def setup_global():
    """Apply the site-independent Zabbix configuration.

    Steps, in order:
      * require an 'Email' media type and, when none is configured with
        config.from_email yet, point it at the local SMTP server;
      * reformat the mail templates with the monitor hostname and the
        support address;
      * rename the stock "ZABBIX Server" host and, for every
        zabbix_server *.xml.in template, pass its %-formatted contents to
        dumpFile under the same name minus the trailing ".in";
      * make sure the RebootNode and NMap scripts exist.

    Must only be run while the Zabbix server and GUI are offline.

    Raises Exception when the db has no 'Email' media type.
    """
    ############################### MAIL
    print("checking for MediaType Email")
    if not MediaType.get_by(description="Email"):
        print("ERROR:  There is no defined media type for 'Email'")
        raise Exception("No Email Media type in Zabbix db")

    print("checking for correct configuration")
    if not MediaType.get_by(smtp_email=config.from_email):
        email_media = MediaType.get_by(description="Email")
        # NOTE: assumes smtp server is local to this machine.
        print("updating email server configuration")
        email_media.smtp_server = 'localhost'
        # HELO name is the monitor hostname without its first label.
        domain_labels = config.MONITOR_HOSTNAME.split('.')[1:]
        email_media.smtp_helo = ".".join(domain_labels)
        email_media.smtp_email = config.from_email

    ############################# EMAIL
    mailtxt.reformat({
        'hostname': config.MONITOR_HOSTNAME,
        'support_email': config.support_email,
    })

    ############################### CENTRAL SERVER
    print("checking zabbix server host info")
    default_server = Host.get_by(host="ZABBIX Server")
    if default_server:
        # TODO: verify that deleting the default entry works; it has failed
        # once on a fresh install, so the host is only renamed for now.
        default_server.host = "unused default server"

        # NOTE: creating a host and assigning a template cannot work due to
        #       the item, trigger and action copying that the php code does
        #       during a host add.
        # NOTE: Instead, reformat any *xml.in templates and import those
        #       during /etc/plc.d/monitor sync
        pattern = "%s/zabbix/templates/*.xml.in" % config.MONITOR_SCRIPT_ROOT
        for template_path in glob.glob(pattern):
            if 'zabbix_server' not in template_path:
                continue
            template_text = loadFile(template_path)
            substitutions = {
                'hostname': config.MONITOR_HOSTNAME,
                'ip': config.MONITOR_IP,
            }
            # [:-3] drops the trailing ".in" from the template name.
            dumpFile(template_path[:-3], template_text % substitutions)

    ##################### SCRIPTS
    ## TODO: add calls to check/reset the boot states.
    print("checking scripts")
    Script.find_or_create(
        name="RebootNode",
        set_if_new={
            'command': "%s/reboot.py {HOST.CONN}" % config.MONITOR_SCRIPT_ROOT,
            'host_access': 3,  # r/w
        })
    Script.find_or_create(
        name="NMap",
        set_if_new={
            'command': "/usr/bin/nmap -A {HOST.CONN}",
            'host_access': 2,  # r/o
        })
130
def merge_iplist(iplist):
    """Collapse a comma-separated IPv4 list into a compact range list.

    Addresses that share their first three octets and whose last octets
    are consecutive are merged into a single ``a.b.c.y-z`` entry; all
    other addresses are emitted on their own.  Entries are ordered
    numerically and duplicates are dropped.

    iplist -- string of dotted-quad addresses separated by commas;
              surrounding whitespace and empty entries are ignored.

    Returns the merged list as a comma-separated string ("" when the
    input holds no addresses).

    Raises ValueError for an entry that is not a dotted quad of integers.
    """
    addresses = set()
    for entry in iplist.split(','):
        entry = entry.strip()
        if not entry:
            continue
        fields = entry.split('.')
        if len(fields) != 4:
            raise ValueError("not a dotted-quad address: %r" % entry)
        # int() raises ValueError on a non-numeric octet.
        addresses.add(tuple([int(field) for field in fields]))

    # Sorting the integer tuples orders addresses numerically, so that
    # x.x.x.2 comes before x.x.x.10 (a plain string sort would not).
    runs = []  # each run is [first-three-octets, first_last, final_last]
    for octets in sorted(addresses):
        prefix, last = octets[:3], octets[3]
        if runs and runs[-1][0] == prefix and last - runs[-1][2] == 1:
            # Directly follows the previous address: extend that run.
            runs[-1][2] = last
        else:
            runs.append([prefix, last, last])

    merged = []
    for prefix, start, end in runs:
        network = ".".join([str(octet) for octet in prefix])
        if start == end:
            merged.append("%s.%d" % (network, start))
        else:
            merged.append("%s.%d-%d" % (network, start, end))
    return ",".join(merged)
147
def setup_site(loginbase, techemail, piemail, iplist):
        """Create or update the per-site Zabbix objects for one site.

        Using find_or_create lookups, sets up in order: the site's user
        group (with a user for config.cc_email), the "MyPLC Hosts" and
        per-site host groups, the discovery rule, the discovery action and
        the escalation action.  For objects that already exist, the ip
        range of the discovery rule and of the discovery action's IP
        condition are brought up to date with iplist.

        loginbase -- site identifier substituted into the *_NAME templates.
        techemail -- currently unused; only referenced by the commented-out
                     user loop below.
        piemail   -- currently unused; only referenced by the commented-out
                     user loop below.
        iplist    -- ip range string for the site; stored as the discovery
                     rule's iprange and as the value of the discovery
                     action's host-IP condition.  At most 255 characters.

        Raises Exception when iplist is longer than 255 characters.
        """

        # TODO: remove old nodes that are no longer in the plcdb.
        # TODO: remove old users that are no longer in the plcdb.
        # TODO: consider creating two user groups for Tech & PI emails

        # NOTE: setup default values for EMAIL
        mailtxt.reformat({'hostname' : config.MONITOR_HOSTNAME, 
                                          'support_email' : config.support_email})

        # NOTE: verify arguments
        if len(iplist) > 255:
                raise Exception("iplist length is too long!")

        BI_WEEKLY_ESC_PERIOD = int(60*60*24)
        DISCOVERY_DELAY = 3600
        # NOTE(review): the two assignments below override the values set
        # just above with the ones marked "testing" -- confirm which pair
        # is meant to be in effect.
        BI_WEEKLY_ESC_PERIOD = int(240) # testing...
        DISCOVERY_DELAY = 120 # testing

        # User Group
        site_user_group = UsrGrp.find_or_create(name=USERGROUP_NAME % loginbase)
        # Only the cc address gets a user for now; the tech and PI addresses
        # are left out by the commented-out loop header.
        #for user in set(techemail + piemail + [config.cc_email]):
        for user in set([config.cc_email]):
                if not user: continue
                # USER
                # The initial password is the md5 hex digest of the alias.
                u = User.find_or_create(alias=user, type=1,
                                                                set_if_new={'passwd' : md5.md5(user).hexdigest()},
                                                                # exec_if_new avoids creating a Media object that
                                                                # will not actually be used, if the user already exists
                                                                # NOTE(review): mediatypeid=1 is presumably the
                                                                # 'Email' media type -- confirm
                                                                exec_if_new=lambda obj: \
                                                                obj.media_list.append( Media(mediatypeid=1, sendto=user)))

                if site_user_group not in u.usrgrp_list:
                        u.append_group(site_user_group)

        # HOST GROUP
        plc_host_group = HostGroup.find_or_create(name="MyPLC Hosts")
        print "myplc groupid: ", plc_host_group.groupid
        site_host_group = HostGroup.find_or_create(name=HOSTGROUP_NAME % loginbase)
        print "site groupid: ", site_host_group.groupid
        # NOTE(review): get_by is tested for a false result elsewhere in
        # this file; if the template host is missing, plctemplate.hostid
        # below fails when a new discovery action is built -- confirm the
        # template is always imported first.
        plctemplate = Host.get_by(host="Template_Linux_PLC_Host")
        escalation_action_name = ESCALATION_ACTION_NAME % loginbase
        discovery_action_name = DISCOVERY_ACTION_NAME % loginbase
        discovery_rule_name = DISCOVERY_RULE_NAME % loginbase

        # ADD hg to ug
        if site_host_group not in site_user_group.hostgroup_list:
                site_user_group.append_hostgroup(site_host_group)

        # DISCOVERY RULE & CHECK
        # A new rule gets one check for the agent key "system.uname" on
        # port 10050.
        dr = DiscoveryRule.find_or_create(name=discovery_rule_name,
                          delay=DISCOVERY_DELAY,
                          proxy_hostid=0,
                          set_if_new = {'iprange':iplist},
                          exec_if_new=lambda obj: \
                                obj.discoverycheck_list.append( DiscoveryCheck(type=9, 
                                                                                key_="system.uname", ports=10050) )
                        )
        # Keep the ip range of an already existing rule up to date.
        if dr.iprange != iplist:
                dr.iprange = iplist
                

        # DISCOVERY ACTION for these servers
        a = Action.find_or_create(name=discovery_action_name,
                        eventsource=defines.EVENT_SOURCE_DISCOVERY,
                        status=defines.DRULE_STATUS_ACTIVE,
                        evaltype=defines.ACTION_EVAL_TYPE_AND_OR)
        # An action without conditions is treated as newly created and gets
        # its conditions and operations filled in here.
        if len(a.actioncondition_list) == 0:
                a.actioncondition_list=[
                                        # Host IP Matches
                                        ActionCondition(
                                                conditiontype=defines.CONDITION_TYPE_DHOST_IP,
                                                operator=defines.CONDITION_OPERATOR_EQUAL,
                                                value=iplist),
                                        # AND, Service type is Zabbix agent
                                        ActionCondition(
                                                conditiontype=defines.CONDITION_TYPE_DSERVICE_TYPE,
                                                operator=defines.CONDITION_OPERATOR_EQUAL,
                                                value=defines.SVC_AGENT),
                                        # AND, Received system.uname value like 'Linux'
                                        ActionCondition(
                                                conditiontype=defines.CONDITION_TYPE_DVALUE,
                                                operator=defines.CONDITION_OPERATOR_LIKE,
                                                value="Linux"),
                                        # AND, Discovery status is Discover
                                        ActionCondition(
                                                conditiontype=defines.CONDITION_TYPE_DSTATUS,
                                                operator=defines.CONDITION_OPERATOR_EQUAL,
                                                value=defines.DOBJECT_STATUS_DISCOVER),
                                ]
                                # THEN
                a.actionoperation_list=[
                                        # Send Email
                                        ActionOperation(
                                                operationtype=defines.OPERATION_TYPE_MESSAGE,
                                                shortdata=mailtxt.node_discovered_subject,
                                                longdata=mailtxt.node_discovered,
                                                object=defines.OPERATION_OBJECT_GROUP, 
                                                objectid=site_user_group.usrgrpid, 
                                                esc_period=0, esc_step_to=1, esc_step_from=1, 
                                        ),
                                        # Add Host
                                        ActionOperation(
                                                operationtype=defines.OPERATION_TYPE_HOST_ADD,
                                                object=0, objectid=0,
                                                esc_period=0, esc_step_from=1, esc_step_to=1),
                                        # Add To Group PLC Hosts
                                        ActionOperation(
                                                operationtype=defines.OPERATION_TYPE_GROUP_ADD,
                                                object=0, objectid=plc_host_group.groupid,
                                                esc_period=0, esc_step_from=1, esc_step_to=1),
                                        # Add To Group LoginbaseSiteGroup
                                        ActionOperation(
                                                operationtype=defines.OPERATION_TYPE_GROUP_ADD,
                                                object=0, objectid=site_host_group.groupid,
                                                esc_period=0, esc_step_from=1, esc_step_to=1),
                                        # Link to Template 'Template_Linux_PLC_Host'
                                        ActionOperation(
                                                operationtype=defines.OPERATION_TYPE_TEMPLATE_ADD,
                                                object=0, objectid=plctemplate.hostid,
                                                esc_period=0, esc_step_from=1, esc_step_to=1),
                                ]
        else:
                # TODO: verify iplist is up-to-date
                # NOTE: len(a.actioncondition_list) > 0
                #ip_condition  = a.actioncondition_list[0]
                # Pick the host-IP condition by type rather than by position.
                # NOTE(review): the [0] raises IndexError when the action has
                # conditions but none of type CONDITION_TYPE_DHOST_IP; it also
                # relies on filter() returning a list (Python 2).
                ip_condition = filter(lambda x: x.conditiontype == defines.CONDITION_TYPE_DHOST_IP, a.actioncondition_list)[0]
                # NOTE(review): the two prints and the assert only re-check
                # what the filter above already guarantees -- they look like
                # leftover debugging.
                print ip_condition.conditiontype
                print defines.CONDITION_TYPE_DHOST_IP
                assert ip_condition.conditiontype == defines.CONDITION_TYPE_DHOST_IP
                if ip_condition.value != iplist:
                        ip_condition.value = iplist

        # ESCALATION ACTION for these servers
        # NOTE(review): the "three days" remark on esc_period does not
        # obviously match either value assigned to BI_WEEKLY_ESC_PERIOD
        # above -- confirm the intended period and its unit.
        ea = Action.find_or_create(name=escalation_action_name,
                        eventsource=defines.EVENT_SOURCE_TRIGGERS,
                        status=defines.ACTION_STATUS_ENABLED,
                        evaltype=defines.ACTION_EVAL_TYPE_AND_OR,
                        esc_period=BI_WEEKLY_ESC_PERIOD,        # three days
                        recovery_msg=1,
                        set_if_new={
                                'r_shortdata':"Thank you for maintaining {HOSTNAME}!",
                                'r_longdata': mailtxt.thankyou_nodeup, }
                        )
        if len(ea.actioncondition_list) == 0:
                        # THEN this is a new entry
                print "SETTING UP ESCALATION ACTION"
                # Conditions: trigger value is TRUE, trigger name is like
                # "is unreachable", and the host group is this site's group.
                ea.actioncondition_list=[
                                ActionCondition(conditiontype=defines.CONDITION_TYPE_TRIGGER_VALUE, 
                                                                operator=defines.CONDITION_OPERATOR_EQUAL, 
                                                                value=defines.TRIGGER_VALUE_TRUE),
                                ActionCondition(conditiontype=defines.CONDITION_TYPE_TRIGGER_NAME, 
                                                                operator=defines.CONDITION_OPERATOR_LIKE, 
                                                                value="is unreachable"),
                                ActionCondition(conditiontype=defines.CONDITION_TYPE_HOST_GROUP, 
                                                                operator=defines.CONDITION_OPERATOR_EQUAL, 
                                                                value=site_host_group.groupid),
                        ]
                # Every operation below carries an OperationConditionNotAck()
                # condition.  Message operations go to the site user group;
                # command operations run checkslices.py on the monitor host.
                ea.actionoperation_list=[
                                # STAGE 1
                                # first notice, sent at steps 3 and 7
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE,
                                        shortdata=mailtxt.nodedown_one_subject,
                                        longdata=mailtxt.nodedown_one,
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        esc_period=0, esc_step_to=3, esc_step_from=3, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ),
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE,
                                        shortdata=mailtxt.nodedown_one_subject,
                                        longdata=mailtxt.nodedown_one,
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        esc_period=0, esc_step_to=7, esc_step_from=7, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ),
                                # STAGE 2
                                # "disablesite" command at step 10, second
                                # notice at steps 10 and 14
                                ActionOperation(operationtype=defines.OPERATION_TYPE_COMMAND, 
                                        esc_step_from=10, esc_step_to=10, 
                                        esc_period=0,
                                        shortdata="",
                                        longdata="%s:%s/checkslices.py {HOSTNAME} disablesite" % ( config.MONITOR_HOSTNAME, config.MONITOR_SCRIPT_ROOT ), 
                                        operationcondition_list=[ OperationConditionNotAck() ]),
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE, 
                                        shortdata=mailtxt.nodedown_two_subject,
                                        longdata=mailtxt.nodedown_two,
                                        esc_step_from=10, esc_step_to=10, 
                                        esc_period=0, 
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ), 
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE, 
                                        shortdata=mailtxt.nodedown_two_subject,
                                        longdata=mailtxt.nodedown_two,
                                        esc_step_from=14, esc_step_to=14, 
                                        esc_period=0, 
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ), 

                                # STAGE 3
                                # "disableslices" command and third notice,
                                # both at step 17
                                ActionOperation(operationtype=defines.OPERATION_TYPE_COMMAND, 
                                        esc_step_from=17, esc_step_to=17, 
                                        esc_period=0, 
                                        shortdata="",
                                        longdata="%s:%s/checkslices.py {HOSTNAME} disableslices" % ( config.MONITOR_HOSTNAME, config.MONITOR_SCRIPT_ROOT ), 
                                        # TODO: send notice to users of slices
                                        operationcondition_list=[ OperationConditionNotAck() ]),
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE, 
                                        shortdata=mailtxt.nodedown_three_subject,
                                        longdata=mailtxt.nodedown_three,
                                        esc_step_from=17, esc_step_to=17, 
                                        esc_period=0, 
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ), 
                                # STAGE 4++
                                # "forever" command and fourth notice from
                                # step 21 on, with their own esc_period of
                                # 3.5 * BI_WEEKLY_ESC_PERIOD
                                # NOTE(review): esc_step_to=0 presumably means
                                # "no final step" -- confirm
                                ActionOperation(operationtype=defines.OPERATION_TYPE_COMMAND, 
                                        esc_step_from=21, esc_step_to=0, 
                                        esc_period=int(BI_WEEKLY_ESC_PERIOD*3.5),
                                        shortdata="",
                                        longdata="%s:%s/checkslices.py {HOSTNAME} forever" % ( config.MONITOR_HOSTNAME, config.MONITOR_SCRIPT_ROOT), 
                                        operationcondition_list=[ OperationConditionNotAck() ]),
                                ActionOperation(operationtype=defines.OPERATION_TYPE_MESSAGE, 
                                        shortdata=mailtxt.nodedown_four_subject,
                                        longdata=mailtxt.nodedown_four,
                                        esc_step_from=21, esc_step_to=0, 
                                        esc_period=int(BI_WEEKLY_ESC_PERIOD*3.5),
                                        object=defines.OPERATION_OBJECT_GROUP, 
                                        objectid=site_user_group.usrgrpid, 
                                        operationcondition_list=[ OperationConditionNotAck() ] ), 
                        ]
378
def _main():
    """Script entry point: apply the global setup, then flush the session."""
    setup_global()
    session.flush()


if __name__ == "__main__":
    _main()