add two cases for resolving nodes that run out of disk space during boot-strap
[monitor.git] / config.d / init-bootman-sequence.py
1 #!/usr/bin/python
2 from monitor.database.info.model import *
3
4 def getSequences():
5
6                 # TODO: This can be replaced with a DB definition at a future time.
7                 #               This would make it possible for an admin to introduce new
8                 #               patterns without touching code.
9                 
10                 sequences = {}
11                 # restart_bootmanager_boot
12                 for n in ["bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-update3-disk-update4-done",
13                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-disk-update4-update3-exception-protoerror-update-protoerror-debug-done",
14                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-implementerror-bootupdatefail-update-debug-done",
15
16                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-exception-protoerror-update-protoerror-debug-done",
17
18                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-exception-protoerror-protoerror2-protoerror-protoerror2-debug-validate-done",
19                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-disk-update4-update3-exception-protoerror-update-debug-done",
20                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-exception-chrootfail-update-debug-done",
21                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-exception-protoerror-protoerror-debug-validate-done",
22                                 "bminit-cfg-auth-protoerror-exception-update-debug-validate-exception-done",
23                                 "bminit-cfg-auth-getplc-update-debug-done",
24                                 "bminit-cfg-auth-protoerror2-debug-done",
25                                 "bminit-cfg-auth-getplc-exception-protoerror-update-protoerror-debug-done",
26                                 "bminit-cfg-auth-protoerror-exception-update-protoerror-debug-done",
27                                 "bminit-cfg-auth-protoerror-exception-update-bootupdatefail-authfail-debug-done",
28                                 "bminit-cfg-auth-protoerror-exception-update-debug-done",
29                                 "bminit-cfg-auth-getplc-exception-protoerror-update-debug-done",
30                                 "bminit-cfg-auth-getplc-implementerror-update-debug-done",
31                                 "bminit-cfg-auth-authfail2-protoerror2-debug-done",
32                                 ]:
33                         sequences.update({n : "restart_bootmanager_boot"})
34
35                 #       conn.restart_bootmanager('reinstall')
36                 for n in [ "bminit-cfg-auth-getplc-installinit-validate-exception-modulefail-update-debug-done",
37                                 "bminit-cfg-auth-getplc-update-installinit-validate-exception-modulefail-update-debug-done",
38                                 "bminit-cfg-auth-getplc-installinit-validate-bmexceptmount-exception-noinstall-update-debug-done",
39                                 "bminit-cfg-auth-getplc-update-installinit-validate-bmexceptmount-exception-noinstall-update-debug-done",
40                                 "bminit-cfg-auth-getplc-installinit-validate-bmexceptvgscan-exception-noinstall-update-debug-done",
41                                 "bminit-cfg-auth-getplc-update-installinit-validate-exception-noinstall-update-debug-done",
42                                 "bminit-cfg-auth-getplc-hardware-installinit-installdisk-bziperror-exception-update-debug-done",
43                                 "bminit-cfg-auth-getplc-update-hardware-installinit-installdisk-installbootfs-exception-update-debug-done",
44                                 "bminit-cfg-auth-getplc-update-installinit-validate-bmexceptvgscan-exception-noinstall-update-debug-done",
45                                 "bminit-cfg-auth-getplc-hardware-installinit-installdisk-installbootfs-exception-update-debug-done",
46                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-nofilereference-update-debug-done",
47                                 "bminit-cfg-auth-getplc-update-hardware-installinit-installdisk-exception-mkfsfail-update-debug-done",
48                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-exception-chrootfail-update-debug-done",
49                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-exception-chrootfail-update-debug-done",
50                                 "bminit-cfg-auth-getplc-update-hardware-installinit-installdisk-installbootfs-installcfg-installstop-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-kernelcopyfail-exception-update-debug-done",
51                                 "bminit-cfg-auth-getplc-hardware-installinit-installdisk-installbootfs-installcfg-installstop-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-kernelcopyfail-exception-update-debug-done",
52                                 "bminit-cfg-auth-getplc-installinit-validate-exception-noinstall-update-debug-done",
53                                 # actual solution appears to involve removing the bad files, and
54                                 # continually trying to boot the node.
55                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-implementerror-update-debug-done",
56                                 "bminit-cfg-auth-getplc-installinit-validate-exception-bmexceptmount-exception-noinstall-update-debug-done",
57                                 "bminit-cfg-auth-getplc-update-installinit-validate-exception-bmexceptmount-exception-noinstall-update-debug-done",
58                                 "bminit-cfg-auth-getplc-update-installinit-validate-bmexceptvgscan-exception-noinstall-update-debug-validate-bmexceptvgscan-done",
59                                 "bminit-cfg-auth-getplc-update-installinit-validate-exception-noinstall-update-debug-validate-done",
60                                 "bminit-cfg-auth-getplc-installinit-validate-bmexceptvgscan-exception-noinstall-update-debug-validate-bmexceptvgscan-done",
61                                 "bminit-cfg-auth-getplc-installinit-validate-bmexceptvgscan-exception-noinstall-debug-validate-bmexceptvgscan-done",
62                                 "bminit-cfg-auth-getplc-update-installinit-validate-bmexceptvgscan-exception-noinstall-debug-validate-bmexceptvgscan-done",
63                                 "bminit-cfg-auth-getplc-update-installinit-validate-exception-missingkernel-debug-validate-done",
64                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-implementerror-nospace-debug-validate-done",
65                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-disk-update4-update3-update3-nospace-nospace-nospace-nospace-nospace-nospace-nospace-nospace-implementerror-nospace-debug-validate-done",
66                                 ]:
67                         sequences.update({n : "restart_bootmanager_rins"})
68
69                 # repair_node_keys
70                 for n in ["bminit-cfg-auth-bootcheckfail-authfail-exception-update-bootupdatefail-authfail-debug-validate-exception-done",
71                                         "bminit-cfg-auth-bootcheckfail-authfail-exception-update-bootupdatefail-authfail-debug-done",
72                                         "bminit-cfg-auth-bootcheckfail-authfail-exception-update-debug-validate-exception-done",
73                                         "bminit-cfg-auth-bootcheckfail-authfail-exception-authfail-debug-validate-exception-done",
74                                         "bminit-cfg-auth-authfail-debug-done",
75                                         "bminit-cfg-auth-authfail2-authfail-debug-done",
76                                 ]:
77                         sequences.update({n: "repair_node_keys"})
78
79                 #   conn.restart_node('reinstall')
80                 for n in ["bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-exception-chrootfail-update-debug-done",
81                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-update3-disk-update4-exception-chrootfail-update-debug-done",
82                                 "bminit-cfg-auth-getplc-hardware-installinit-installdisk-installbootfs-installcfg-exception-chrootfail-update-debug-done",
83                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-writeerror-exception-chrootfail-update-debug-done",
84                                 "bminit-cfg-auth-getplc-update-hardware-installinit-exception-bmexceptrmfail-update-debug-done",
85                                 "bminit-cfg-auth-getplc-hardware-installinit-exception-bmexceptrmfail-update-debug-done",
86                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-disk-update4-update3-implementerror-bootupdatefail-update-debug-done",
87                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-readonlyfs-update-debug-done",
88                                 "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-update3-nospace-exception-update-debug-done",
89                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-nospace-update-debug-done",
90                                 "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-update-debug-done",
91                                 "bminit-cfg-auth-getplc-update-hardware-installinit-installdisk-installbootfs-exception-downloadfail-update-debug-done",
92                                 ]:
93                         sequences.update({n : "restart_node_rins"})
94
95                 #       restart_node_boot
96                 for n in ["bminit-cfg-auth-getplc-implementerror-bootupdatefail-update-debug-done",
97                                  "bminit-cfg-auth-implementerror-bootcheckfail-update-debug-done",
98                                  "bminit-cfg-auth-implementerror-bootcheckfail-update-implementerror-bootupdatefail-done",
99                                  "bminit-cfg-auth-getplc-update-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-nospace-update-debug-done",
100                                  "bminit-cfg-auth-getplc-hardware-installinit-installdisk-installbootfs-exception-downloadfail-update-debug-done",
101                                  "bminit-cfg-auth-getplc-update-installinit-validate-implementerror-update-debug-done",
102                                  "bminit-cfg-auth-getplc-exception-update-bootupdatefail-debug-done",
103                                  ]:
104                         sequences.update({n: "restart_node_boot"})
105
106                 # fsck_repair
107                 for n in ["bminit-cfg-auth-getplc-update-installinit-validate-fsckabort-exception-fsckfail-bmexceptmount-exception-noinstall-update-debug-validate-fsckabort-exception-fsckfail-bmexceptmount-done",
108                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail-exception-noinstall-update-debug-validate-exception-fsckfail-done",
109                                   "bminit-cfg-auth-getplc-update-installinit-validate-exception-fsckfail-exception-noinstall-update-debug-validate-exception-fsckfail-done",
110                                   "bminit-cfg-auth-getplc-update-installinit-validate-exception-fsckfail2-exception-noinstall-update-debug-validate-exception-fsckfail2-done",
111                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail2-exception-debug-validate-done",
112                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail2-exception-debug-validate-exception-fsckfail2-done",
113                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail2-exception-debug-validate-exception-fsckfail-done",
114                                   "bminit-cfg-auth-getplc-update-installinit-validate-fsckabort-exception-fsckfail-exception-debug-validate-fsckabort-exception-fsckfail-done",
115                                   "bminit-cfg-auth-getplc-update-installinit-validate-exception-fsckfail2-exception-debug-validate-exception-fsckfail2-done",
116                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail-exception-debug-validate-exception-fsckfail2-done",
117                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail-exception-debug-validate-exception-fsckfail-done",
118                                   "bminit-cfg-auth-getplc-installinit-validate-exception-fsckfail-exception-debug-validate-done",
119                                   "bminit-cfg-auth-getplc-update-installinit-validate-exception-fsckfail-exception-debug-validate-exception-fsckfail-done",
120                                   "bminit-cfg-auth-getplc-update-debug-validate-exception-fsckfail-done",
121                                 ]:
122                         sequences.update({n : "fsck_repair"})
123
124                 # nodeconfig_notice
125                 for n in ["bminit-cfg-exception-nocfg-update-bootupdatefail-nonode-debug-done",
126                                   "bminit-cfg-exception-update-bootupdatefail-nonode-debug-done",
127                                   "bminit-cfg-exception-update-bootupdatefail-nonode-debug-validate-exception-done",
128                                   "bminit-cfg-exception-nocfg-update-bootupdatefail-nonode-debug-validate-exception-done",
129                                   "bminit-cfg-auth-bootcheckfail-nonode-exception-update-bootupdatefail-nonode-debug-done",
130                                   "bminit-cfg-exception-noconfig-nonode-debug-validate-exception-done",
131                                   "bminit-cfg-exception-noconfig-update-debug-validate-exception-done",
132                                   "bminit-cfg-exception-noparseconfig-debug-validate-exception-done",
133                                   "bminit-cfg-exception-noconfig-debug-validate-exception-done",
134                                   "bminit-cfg-auth-authfail2-nonode-debug-done",
135                                 ]:
136                         sequences.update({n : "nodeconfig_notice"})
137
138                 for n in [ "bminit-cfg-exception-nodehostname-update-debug-done", 
139                                    "bminit-cfg-update-exception-nodehostname-update-debug-validate-exception-done",
140                                    "bminit-cfg-update-exception-nodehostname-update-debug-done", 
141                                    "bminit-cfg-exception-nodehostname-debug-validate-bmexceptvgscan-done",
142                                    "bminit-cfg-exception-nodehostname-debug-validate-exception-done",
143                                 ]:
144                         sequences.update({n : "nodenetwork_email"})
145
146                 # noblockdevice_notice
147                 for n in ["bminit-cfg-auth-getplc-update-hardware-exception-noblockdev-hardwarerequirefail-update-debug-done",
148                                 "bminit-cfg-auth-getplc-update-hardware-noblockdev-exception-hardwarerequirefail-update-debug-validate-bmexceptvgscan-done",
149                                 "bminit-cfg-auth-getplc-hardware-exception-noblockdev-hardwarerequirefail-update-debug-done",
150                                 "bminit-cfg-auth-getplc-update-hardware-noblockdev-exception-hardwarerequirefail-update-debug-done",
151                                 "bminit-cfg-auth-getplc-hardware-noblockdev-exception-hardwarerequirefail-update-debug-done",
152                                 "bminit-cfg-auth-getplc-hardware-noblockdev-exception-hardwarerequirefail-debug-validate-bmexceptvgscan-done",
153                                 "bminit-cfg-auth-getplc-update-hardware-noblockdev-exception-hardwarerequirefail-debug-validate-bmexceptvgscan-done",
154                                 ]:
155                         sequences.update({n : "noblockdevice_notice"})
156
157                 # update_bootcd_email
158                 for n in [ "bminit-cfg-auth-getplc-hardware-exception-hardwarerequirefail-update-debug-done",
159                                 ]:
160                         sequences.update({n : "update_bootcd_email"})
161
162                 for n in [ "bminit-cfg-auth-getplc-installinit-validate-rebuildinitrd-netcfg-update3-implementerror-nofilereference-update-debug-done",
163                                 ]:
164                         sequences.update({n: "unknownsequence_notice"})
165
166                 # minimalhardware_notice
167                 for n in [ "bminit-cfg-auth-getplc-hardware-exception-disktoosmall-hardwarerequirefail-update-debug-done",
168                                         "bminit-cfg-auth-getplc-hardware-disktoosmall-exception-hardwarerequirefail-update-debug-done",
169                                         "bminit-cfg-auth-getplc-update-hardware-exception-hardwarerequirefail-debug-validate-bmexceptvgscan-done",
170                                         "bminit-cfg-auth-getplc-hardware-exception-hardwarerequirefail-debug-validate-bmexceptvgscan-done",
171                                 ]:
172                         sequences.update({n: "minimalhardware_notice"})
173
174                 # baddisk_notice
175                 sequences.update({"bminit-cfg-auth-getplc-update-hardware-exception-hardwarerequirefail-update-debug-done" : "baddisk_notice"})
176
177                 # baddns_notice
178                 for n in [ 
179                  "bminit-cfg-update-implementerror-bootupdatefail-dnserror-update-implementerror-bootupdatefail-dnserror-done",
180                         "bminit-cfg-auth-implementerror-bootcheckfail-dnserror-update-implementerror-bootupdatefail-dnserror-done",
181                         ]:
182                         sequences.update( { n : "baddns_notice"})
183
184                 return sequences
185
186 sequences = getSequences()
187
188 for s in sequences:
189         bms = BootmanSequenceRecord.get_by(sequence=s)
190         if not bms:
191                 bms = BootmanSequenceRecord(sequence=s, action=sequences[s])
192                 bms.flush()
193
194 session.flush()