improve error handling and reporting for hpilos.
[pcucontrol.git] / pcucontrol / util / command.py
import errno
import fcntl
import os
import signal
import subprocess
import sys
import time
import traceback
from select import select
8
# Set to 1 to have SSH.runE() echo each command and its result to stdout.
DEBUG = 0


class ExceptionTimeout(Exception):
        """Raised when a started command shows no sign of output before its timeout."""


class ExceptionReadTimeout(Exception):
        """Raised when a stream being read stays silent past its timeout."""


# Base timeout in seconds: used as-is for ssh's ConnectTimeout below and
# doubled for the default `timeout` arguments in this module.
COMMAND_TIMEOUT = 60

# Default "-o key=value" options for the ssh/scp command lines built by SSH.
ssh_options = {
        'StrictHostKeyChecking': 'no',
        'BatchMode': 'yes',
        'PasswordAuthentication': 'no',
        'ConnectTimeout': str(COMMAND_TIMEOUT),
}
18
class Sopen(subprocess.Popen):
        """subprocess.Popen whose kill() takes any signal and tolerates a dead child."""

        def kill(self, sig = signal.SIGTERM):
                """Send `sig` (default SIGTERM) to the child process.

                Does nothing when the child has already been reaped, and silently
                ignores the OSError raised when the process no longer exists.
                """
                # Once poll()/wait() has collected the exit status, the kernel may
                # hand the PID to an unrelated process; never signal it after that.
                if self.returncode is not None:
                        return
                try:
                        # NOTE: this also kills parent... so doesn't work like I want.
                        # NOTE: adding 'exec' before the cmd removes the extra sh, and
                        #               partially addresses this problem.
                        #os.killpg(os.getpgid(self.pid), signal.SIGKILL)
                        os.kill(self.pid, sig)
                except OSError:
                        # no such process, due to it already exiting...
                        pass
30
31
def read_t(stream, count=1, timeout=COMMAND_TIMEOUT*2):
        """Read from `stream`, giving up when it stays silent for `timeout` seconds.

        With count == 1 the stream is drained one unit at a time until EOF and
        everything read is returned as a single string.  With any other count,
        the function waits once for the stream to become readable and returns
        the result of a single stream.read(count).

        `timeout` bounds each individual wait, not the whole read.

        Raises ExceptionReadTimeout when a wait expires.  Read errors other
        than "no data right now" / "interrupted" are propagated to the caller.
        """
        if count != 1:
                ready, _, _ = select([stream], [], [], timeout)
                if not ready:
                        raise ExceptionReadTimeout("TIMEOUT reading from command")
                return stream.read(count)

        # errno values that only mean "try again"; anything else is a real
        # failure and retrying it would hide the error or spin forever.
        transient = (errno.EAGAIN, errno.EWOULDBLOCK, errno.EINTR)

        pieces = []
        while True:
                ready, _, _ = select([stream], [], [], timeout)
                if not ready:
                        print("timeout!")
                        raise ExceptionReadTimeout("TIMEOUT reading from command")

                try:
                        outbytes = stream.read(count)
                except IOError:
                        # sys.exc_info() keeps this handler valid syntax on
                        # every Python 2 release as well as Python 3.
                        err = sys.exc_info()[1]
                        if err.errno not in transient:
                                raise
                        print('no content yet.')
                        # due to no content.
                        # the select timeout should catch this.
                        continue

                if not outbytes:
                        # empty read means EOF
                        break
                pieces.append(outbytes)

        # one join instead of repeated string concatenation
        return "".join(pieces)
61
class CMD:
        """Run shell commands with timeouts and capture their stdout and stderr.

        The most recently started child process is kept in `self.s`; system()
        additionally stores the captured streams in `self.output`/`self.error`.
        """

        def __init__(self):
                pass

        def _output_ready(self, s, timeout):
                """Wait up to `timeout` seconds for the child `s` to show activity.

                Returns True when select() reports stdout readable (data or EOF)
                or an exceptional condition on stderr, False when the wait expired.
                """
                readable, writable, exceptional = select([s.stdout], [], [s.stderr], timeout)
                return bool(readable or writable or exceptional)

        def _abort(self, s):
                """SIGKILL the child `s` and release its three pipes (best effort)."""
                s.kill(signal.SIGKILL)
                for pipe in (s.stdout, s.stdin, s.stderr):
                        try:
                                pipe.close()
                        except (IOError, OSError):
                                # cleanup must not mask the timeout being reported
                                pass

        def run_noexcept(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run `cmd` like run(), but report failures in the result instead of raising.

                Returns (stdout, stderr) on success, ("", "ScriptTimeout") when the
                command produced nothing before `timeout`, ("", "RunningScriptTimeout")
                when its output stalled, and ("", str(err)) for any other exception.
                A KeyboardInterrupt terminates the interpreter with exit status 1.
                """
                try:
                        # CMD.run is named explicitly so that subclasses which
                        # override run() do not get their wrapping applied here.
                        return CMD.run(self, cmd, timeout)
                except ExceptionTimeout:
                        # print_exc() writes the traceback itself and returns None,
                        # so its result must not be printed.
                        traceback.print_exc()
                        return ("", "ScriptTimeout")
                except ExceptionReadTimeout:
                        traceback.print_exc()
                        return ("", "RunningScriptTimeout")
                except KeyboardInterrupt:
                        print("Interrupted, exiting...")
                        sys.exit(1)
                except Exception:
                        #from monitor.common import email_exception
                        #email_exception()
                        # sys.exc_info() keeps this handler valid syntax on
                        # every Python 2 release as well as Python 3.
                        return ("", str(sys.exc_info()[1]))

        def system(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run `cmd` via self.run() and return the child's exit status.

                The captured stdout/stderr are stored in self.output/self.error.
                Exceptions raised by run() propagate unchanged.
                """
                (o, e) = self.run(cmd, timeout)
                self.output = o
                self.error = e
                if self.s.returncode is None:
                        self.s.wait()
                return self.s.returncode

        def run(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run the shell command string `cmd` and return (stdout, stderr), stripped.

                Raises ExceptionTimeout when the command shows no output within
                `timeout` seconds, and ExceptionReadTimeout when reading stdout
                stalls for 30 seconds.  In both cases the child is SIGKILLed first.
                """
                s = Sopen(cmd, shell=True, stdin=subprocess.PIPE, stdout=subprocess.PIPE,
                          stderr=subprocess.PIPE, close_fds=True)
                self.s = s
                (f_in, f_out, f_err) = (s.stdin, s.stdout, s.stderr)

                if not self._output_ready(s, timeout):
                        # Reached a timeout!  Nuke process so it does not hang.
                        print("TIMEOUT!!!!!!!!!!!!!!!!!!!")
                        self._abort(s)
                        raise ExceptionTimeout("TIMEOUT Running: %s" % cmd)

                # Make stdout non-blocking so read_t() can apply its own timeout
                # between reads instead of blocking inside read().
                flags = fcntl.fcntl(f_out, fcntl.F_GETFL)
                fcntl.fcntl(f_out, fcntl.F_SETFL, flags | os.O_NONBLOCK)

                try:
                        o_value = read_t(f_out, 1, 30)
                except ExceptionReadTimeout:
                        self._abort(s)
                        raise ExceptionReadTimeout("TIMEOUT: failed to read from cmd: %s" % cmd)

                # NOTE(review): stderr is read with a plain blocking read() and no
                # timeout, only after stdout has reached EOF.
                e_value = f_err.read()

                o_value = o_value.strip()
                e_value = e_value.strip()

                f_out.close()
                f_in.close()
                f_err.close()
                # Only signal a child that has not been reaped yet; after a
                # successful poll() the PID no longer belongs to us.
                if s.poll() is None:
                        s.kill(signal.SIGKILL)

                return (o_value, e_value)

        def runargs(self, args, timeout=COMMAND_TIMEOUT*2):
                """Run `args` through the shell and return (stdout, stderr), stripped.

                stderr is only collected when stdout turned out empty.  Raises
                ExceptionTimeout (after SIGKILLing the child) when nothing shows up
                within `timeout` seconds.

                NOTE(review): `args` is passed to Popen with shell=True; per the
                subprocess documentation a sequence then contributes only its first
                item as the command on POSIX - confirm callers pass a string.
                """
                #print "CMD.run(%s)" % " ".join(args)
                s = Sopen(args, shell=True, stdin=subprocess.PIPE, stdout=subprocess.PIPE,
                          stderr=subprocess.PIPE, close_fds=True)
                self.s = s
                (f_in, f_out, f_err) = (s.stdin, s.stdout, s.stderr)

                if not self._output_ready(s, timeout):
                        # Reached a timeout!  Nuke process so it does not hang.
                        self._abort(s)
                        # (args,) keeps the formatting correct even for a tuple
                        raise ExceptionTimeout("TIMEOUT Running: %s" % (args,))

                o_value = f_out.read()
                e_value = ""
                if o_value == "":       # An error has occurred
                        e_value = f_err.read()

                o_value = o_value.strip()
                e_value = e_value.strip()

                f_out.close()
                f_in.close()
                f_err.close()
                # Only signal a child that has not been reaped yet.
                if s.poll() is None:
                        s.kill(signal.SIGKILL)

                return (o_value, e_value)
159
160
class SSH(CMD):
        """Run commands on a remote host by shelling out to ssh/scp through CMD.

        Methods differ in whether the remote command is wrapped in single
        quotes (run, run_noexcept, runE) or appended as-is (run_noexcept2,
        system2), and in whether failures raise or are returned.
        """

        def __init__(self, user, host, port=22, options = ssh_options):
                # NOTE: the default `options` is the shared module-level dict;
                # this class only reads it.
                self.options = options
                self.user = user
                self.host = host
                self.port = port

        def __options_to_str(self):
                """Render self.options as a string of "-o key=value " arguments."""
                return "".join(["-o %s=%s " % (o, v) for o, v in self.options.items()])

        def _ssh_cmd(self, cmd, quote=True, prefix=""):
                """Build the local ssh command line that runs `cmd` on the remote host.

                quote  -- wrap `cmd` in single quotes
                prefix -- text placed in front of "ssh" (e.g. "exec ")
                """
                if quote:
                        cmd = "'%s'" % cmd
                return "%sssh -p %s %s %s@%s %s" % (prefix, self.port, self.__options_to_str(),
                                                    self.user, self.host, cmd)

        def run(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run `cmd` (single-quoted) remotely; returns/raises like CMD.run()."""
                #print "SSH.run(%s)" % cmd
                return CMD.run(self, self._ssh_cmd(cmd), timeout)

        def get_file(self, rmt_filename, local_filename=None):
                """Copy `rmt_filename` from the remote host with scp.

                `local_filename` defaults to "./".  Returns the (stdout, stderr)
                pair of CMD.run_noexcept().
                """
                if local_filename is None:
                        local_filename = "./"
                cmd = "scp -P %s -B %s %s@%s:%s %s" % (self.port, self.__options_to_str(),
                                                       self.user, self.host,
                                                       rmt_filename, local_filename)
                # output :
                #       errors will be on stderr,
                #   success will have a blank stderr...
                return CMD.run_noexcept(self, cmd)

        def run_noexcept(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run `cmd` (single-quoted) remotely without raising; see CMD.run_noexcept().

                Accepts the same optional `timeout` as CMD.run_noexcept().
                """
                #print "SSH.run_noexcept(%s)" % cmd
                return CMD.run_noexcept(self, self._ssh_cmd(cmd), timeout)

        def run_noexcept2(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Like run_noexcept(), but `cmd` is unquoted and ssh is started via "exec".

                Always sets self.ret to -1.
                """
                r = CMD.run_noexcept(self, self._ssh_cmd(cmd, quote=False, prefix="exec "), timeout)
                self.ret = -1

                return r

        def system2(self, cmd, timeout=COMMAND_TIMEOUT*2):
                """Run `cmd` (unquoted) remotely and return the ssh exit status.

                Captured stdout/stderr are stored in self.output/self.error.
                """
                cmd = self._ssh_cmd(cmd, quote=False)
                #print "SSH.system2(%s)" % cmd
                # CMD.system() would dispatch to self.run, i.e. SSH.run, and wrap
                # this already complete ssh command in a second ssh.  Run it
                # through CMD.run directly instead.
                (o, e) = CMD.run(self, cmd, timeout)
                self.output = o
                self.error = e
                if self.s.returncode is None:
                        self.s.wait()
                return self.s.returncode

        def runE(self, cmd):
                """Run `cmd` (single-quoted) remotely with no timeout and return one string.

                Returns the stripped stdout, or the stripped stderr when stdout
                was empty.  With DEBUG == 1 the command and result are echoed.
                """
                cmd = self._ssh_cmd(cmd)
                if DEBUG == 1:
                        sys.stdout.write(cmd + " ")

                # subprocess replaces the deprecated os.popen3(); communicate()
                # drains both pipes together and reaps the child.
                child = subprocess.Popen(cmd, shell=True, stdin=subprocess.PIPE,
                                         stdout=subprocess.PIPE, stderr=subprocess.PIPE,
                                         close_fds=True)
                (out, err) = child.communicate()

                value = out
                if value == "": # An error has occurred
                        value = err
                value = value.strip()

                if DEBUG == 1:
                        print(" == %s" % value)
                return value
231                 
class MyTimer:
        """Simple wall-clock stopwatch based on time.time().

        `start` holds the reference timestamp and `stop` the most recent
        measurement time (None until end() or diff() is first called).
        """

        def __init__(self):
                self.start = time.time()
                # Kept under a name different from the end() method: storing the
                # timestamp as `self.end` would replace the method on the instance
                # and make every later end() call fail.
                self.stop = None

        def end(self):
                """Return the seconds elapsed since `start`, leaving `start` unchanged."""
                self.stop = time.time()
                return self.stop - self.start

        def diff(self):
                """Return the seconds elapsed since `start` and restart the timer from now."""
                self.stop = time.time()
                t = self.stop - self.start
                self.start = self.stop
                return t