clean up slice-fs-* steps, nicer output, and show contents when it's wrong
[tests.git] / system / TestNode.py
index 18b4239..28b013a 100644 (file)
@@ -1,8 +1,32 @@
-import os, sys, time, base64
-import xmlrpclib
+# Thierry Parmentelat <thierry.parmentelat@inria.fr>
+# Copyright (C) 2010 INRIA 
+#
+import sys, os, os.path, time, base64
 
 import utils
 from TestUser import TestUser
+from TestBoxQemu import TestBoxQemu
+from TestSsh import TestSsh
+from Completer import CompleterTask
+
+class CompleterTaskNodeSsh (CompleterTask):
+    # Completer task: runs a command through TestSsh, succeeds when its exit status matches 'expected'
+    def __init__ (self, hostname, qemuname, local_key, command=None, message=None, boot_state="boot", expected=True, dry_run=False):
+        self.hostname = hostname
+        self.qemuname = qemuname
+        self.local_key = local_key
+        self.boot_state = boot_state
+        self.expected = expected
+        self.dry_run = dry_run
+        self.command = "hostname;uname -a" if command is None else command
+        self.message = message or "cannot reach %s in %s mode"%(self.hostname, self.boot_state)
+        self.test_ssh = TestSsh (self.hostname, key=self.local_key)
+    def run (self, silent):
+        ssh_command = self.test_ssh.actual_command(self.command)
+        status = utils.system (ssh_command, silent=silent, dry_run=self.dry_run)
+        return (status == 0) if self.expected else (status != 0)
+    def failure_message (self):
+        return self.message
 
 class TestNode:
 
@@ -10,10 +34,52 @@ class TestNode:
        self.test_plc=test_plc
        self.test_site=test_site
        self.node_spec=node_spec
-
+        
     def name(self):
         return self.node_spec['node_fields']['hostname']
+    
+    def dry_run (self):
+        return self.test_plc.options.dry_run   # dry-run flag, as found in the test_plc options
+    @staticmethod
+    def is_qemu_model (model):
+        return "qemu" in model   # a model counts as qemu as soon as its name contains "qemu"
+    def is_qemu (self):
+        return TestNode.is_qemu_model(self.node_spec['node_fields']['model'])   # decided on this node's 'model' field
+
+    @staticmethod
+    def is_real_model (model):
+        return not TestNode.is_qemu_model(model)   # any model that is not qemu is taken as real
+    def is_real (self):
+        return TestNode.is_real_model (self.node_spec['node_fields']['model'])   # decided on this node's 'model' field
+
+    def buildname(self):
+        return self.test_plc.options.buildname   # build name, as found in the test_plc options
         
+    def nodedir (self):
+        # name of the directory that holds the node-dependent files
+        # the prefix tells qemu nodes ("qemu-") from real ones ("real-")
+        flavour = "qemu" if self.is_qemu() else "real"
+        return "%s-%s"%(flavour,self.name())
+
+    # returns the hostname of the box hosting this node; 'localhost' for real nodes
+    def host_box (self):
+        if self.is_real ():
+            return 'localhost'
+        else:
+            try:
+                return self.node_spec['host_box']
+            except KeyError:   # only a missing 'host_box' entry falls back to localhost
+                utils.header("WARNING : qemu nodes need a host box")
+                return 'localhost'
+
+    # returns the TestBoxQemu instance for host_box() - created on first call, then cached in .test_box_value
+    def test_box (self):
+        try:
+            return self.test_box_value
+        except AttributeError:   # first call: nothing cached yet
+            self.test_box_value = TestBoxQemu (self.host_box(),self.buildname())
+            return self.test_box_value
+
     def create_node (self):
         ownername = self.node_spec['owner']
         user_spec = self.test_site.locate_user(ownername)
@@ -21,33 +87,48 @@ class TestNode:
         userauth = test_user.auth()
         utils.header("node %s created by user %s"%(self.name(),test_user.name()))
         rootauth=self.test_plc.auth_root()
-        server = self.test_plc.server
-        server.AddNode(userauth,
-                       self.test_site.site_spec['site_fields']['login_base'],
-                       self.node_spec['node_fields'])
+        server = self.test_plc.apiserver
+        node_id=server.AddNode(userauth,
+                               self.test_site.site_spec['site_fields']['login_base'],
+                               self.node_spec['node_fields'])
+        server.SetNodePlainBootstrapfs(userauth,
+                                       self.node_spec['node_fields']['hostname'],
+                                       'YES')
         # create as reinstall to avoid user confirmation
-        server.UpdateNode(userauth, self.name(), {'boot_state':'rins'})
-        # populate network interfaces - primary
-        server.AddNodeNetwork(userauth,self.name(),
-                                            self.node_spec['network_fields'])
+        server.UpdateNode(userauth, self.name(), {'boot_state':'reinstall'})
+
+        if not self.test_plc.has_addresses_api():
+#            print 'USING OLD INTERFACE'
+            # populate network interfaces - primary
+            server.AddInterface(userauth,self.name(),
+                                self.node_spec['interface_fields'])
+        else:
+#            print 'USING NEW INTERFACE with separate ip addresses'
+            # this is for setting the 'dns' stuff that now goes with the node
+            server.UpdateNode (userauth, self.name(), self.node_spec['node_fields_nint'])
+            interface_id = server.AddInterface (userauth, self.name(),self.node_spec['interface_fields_nint'])
+            server.AddIpAddress (userauth, interface_id, self.node_spec['ipaddress_fields'])
+            route_fields=self.node_spec['route_fields']
+            route_fields['interface_id']=interface_id
+            server.AddRoute (userauth, node_id, self.node_spec['route_fields'])
+            pass
         # populate network interfaces - others
         if self.node_spec.has_key('extra_interfaces'):
             for interface in self.node_spec['extra_interfaces']:
-                server.AddNodeNetwork(userauth,self.name(),
-                                                    interface['network_fields'])
-                if interface.has_key('attributes'):
-                    for (attribute,value) in interface['attributes'].iteritems():
+                server.AddInterface(userauth,self.name(), interface['interface_fields'])
+                if interface.has_key('settings'):
+                    for (attribute,value) in interface['settings'].iteritems():
                         # locate node network
-                        nn = server.GetNodeNetworks(userauth,{'ip':interface['network_fields']['ip']})[0]
-                        nnid=nn['nodenetwork_id']
+                        interface = server.GetInterfaces(userauth,{'ip':interface['interface_fields']['ip']})[0]
+                        interface_id=interface['interface_id']
                         # locate or create node network attribute type
                         try:
-                            nnst = server.GetNodeNetworkSettingTypes(userauth,{'name':attribute})[0]
+                            interface_tagtype = server.GetTagTypes(userauth,{'name':attribute})[0]
                         except:
-                            nnst = server.AddNodeNetworkSettingType(rootauth,{'category':'test',
-                                                                          'name':attribute})
+                            interface_tagtype = server.AddTagType(rootauth,{'category':'test',
+                                                                            'tagname':attribute})
                         # attach value
-                        server.AddNodeNetworkSetting(userauth,nnid,attribute,value)
+                        server.AddInterfaceTag(userauth,interface_id,attribute,value)
 
     def delete_node (self):
         # uses the right auth as far as poss.
@@ -58,50 +139,210 @@ class TestNode:
             auth = test_user.auth()
         except:
             auth=self.test_plc.auth_root()
-        self.test_plc.server.DeleteNode(auth,self.name())
-
-    def conffile(self,image,hostname,path):
-        template='%s/template-vmplayer/node.vmx'%(path)
-        actual='%s/vmplayer-%s/node.vmx'%(path,hostname)
-        sed_command="sed -e s,@BOOTCD@,%s,g %s > %s"%(image,template,actual)
-        utils.header('Creating %s from %s'%(actual,template))
-        utils.system(sed_command)
-
-    def create_boot_cd(self,path):
-        node_spec=self.node_spec
-        hostname=node_spec['node_fields']['hostname']
-        utils.header('Initializing vmplayer area for node %s'%hostname)
-        clean_dir="rm -rf %s/vmplayer-%s"%(path,hostname)
-        mkdir_command="mkdir -p %s/vmplayer-%s"%(path,hostname)
-        tar_command="tar -C %s/template-vmplayer -cf - . | tar -C %s/vmplayer-%s -xf -"%(path,path,hostname)
-        utils.system(clean_dir)
-        utils.system(mkdir_command)
-        utils.system(tar_command);
-        utils.header('Creating boot medium for node %s'%hostname)
-        encoded=self.test_plc.server.GetBootMedium(self.test_plc.auth_root(), hostname, 'node-iso', '')
+        self.test_plc.apiserver.DeleteNode(auth,self.name())
+
+    # Do most of the stuff locally - will be pushed on host_box - *not* the plc - later if needed
+    def qemu_local_init(self):
+        "all nodes : init a clean local directory for holding node-dep stuff like iso image..."
+        nodedir = self.nodedir()
+        utils.system("rm -rf %s"%nodedir)
+        utils.system("mkdir %s"%nodedir)
+        # real nodes are done at this point; qemu nodes also get the template-qemu files
+        return (not self.is_qemu()) or utils.system("rsync -v -a --exclude .svn template-qemu/ %s/"%nodedir)==0
+
+    def bootcd(self):
+        "all nodes: invoke GetBootMedium and store result locally"
+        utils.header("Calling GetBootMedium for %s"%self.name())
+        # qemu nodes are given two extra boot medium options
+        options = ['serial','no-hangcheck'] if self.is_qemu() else []
+        encoded=self.test_plc.apiserver.GetBootMedium(self.test_plc.auth_root(), 
+                                                      self.name(), 'node-iso', '', options)
         if (encoded == ''):
-            raise Exception, 'boot.iso not found'
-        file=open(path+'/vmplayer-'+hostname+'/boot_file.iso','w')
-        file.write(base64.b64decode(encoded))
+            raise Exception, 'GetBootmedium failed'
+
+        filename="%s/%s.iso"%(self.nodedir(),self.name())
+        utils.header('Storing boot medium into %s'%filename)
+        if self.dry_run():
+            print "Dry_run: skipped writing of iso image"
+            return True
+        # the decoded image is binary: write it in binary mode, and close the file explicitly
+        iso=open(filename,'wb')
+        iso.write(base64.b64decode(encoded))
+        iso.close()
+        return True
+
+    def nodestate_reinstall (self):
+        "all nodes: mark PLCAPI boot_state as reinstall"
+        auth=self.test_plc.auth_root()
+        self.test_plc.apiserver.UpdateNode(auth, self.name(), {'boot_state':'reinstall'})
+        return True
+    
+    def nodestate_safeboot (self):
+        "all nodes: mark PLCAPI boot_state as safeboot"
+        auth=self.test_plc.auth_root()
+        self.test_plc.apiserver.UpdateNode(auth, self.name(), {'boot_state':'safeboot'})
+        return True
+    
+    def nodestate_boot (self):
+        "all nodes: mark PLCAPI boot_state as boot"
+        auth=self.test_plc.auth_root()
+        self.test_plc.apiserver.UpdateNode(auth, self.name(), {'boot_state':'boot'})
+        return True
+
+    def nodestate_show (self):
+        "all nodes: show PLCAPI boot_state"
+        if self.dry_run():
+            print "Dry_run: skipped getting current node state"
+            return True
+        nodes=self.test_plc.apiserver.GetNodes(self.test_plc.auth_root(), self.name(), ['boot_state'])
+        print self.name(),':',nodes[0]['boot_state']
+        return True
+    
+    def qemu_local_config(self):
+        "all nodes: compute qemu config qemu.conf and store it locally"
+        if not self.is_qemu():
+            return True   # nothing to store for real nodes - still a success, as in the other steps
+        mac=self.node_spec['interface_fields']['mac']
+        hostname=self.node_spec['node_fields']['hostname']
+        ip=self.node_spec['interface_fields']['ip']
+        auth=self.test_plc.auth_root()
+        target_arch=self.test_plc.apiserver.GetPlcRelease(auth)['build']['target-arch']
+        conf_filename="%s/qemu.conf"%(self.nodedir())
+        if self.dry_run():
+            print "dry_run: skipped actual storage of qemu.conf"
+            return True
+        utils.header('Storing qemu config for %s in %s'%(self.name(),conf_filename))
+        file=open(conf_filename,'w')
+        file.write('MACADDR=%s\n'%mac)
+        file.write('NODE_ISO=%s.iso\n'%self.name())
+        file.write('HOSTNAME=%s\n'%hostname)
+        file.write('IP=%s\n'%ip)
+        file.write('TARGET_ARCH=%s\n'%target_arch)
         file.close()
-        utils.header('boot cd created for %s'%hostname)
-        self.conffile('boot_file.iso',hostname, path)
+        return True
+
+    def qemu_clean (self):
+        utils.header("Cleaning up qemu for host %s on box %s"%(self.name(),self.test_box().hostname()))
+        # calls rmdir on the test box for the node directory, passing the dry-run flag along
+        self.test_box().rmdir(self.nodedir(), dry_run=self.dry_run())
+        return True
 
-    def start_node (self,options):
+    def qemu_export (self):
+        "all nodes: push local node-dep directory on the qemu box"
+        test_box=self.test_box()
+        # nothing to push when the qemu box is the local box
+        if test_box.is_local():
+            return True
+        utils.header ("Cleaning any former sequel of %s on %s"%(self.name(),self.host_box()))
+        utils.header ("Transferring configuration files for node %s onto %s"%(self.name(),self.host_box()))
+        return test_box.copy(self.nodedir(),recursive=True,dry_run=self.dry_run())==0
+            
+    def qemu_start (self):
+        "all nodes: start the qemu instance (also runs qemu-bridge-init start)"
         model=self.node_spec['node_fields']['model']
-        if model.find("vmware") >= 0:
-            self.start_vmware(options)
-        elif model.find("qemu") >= 0:
-            self.start_qemu(options)
+        # only qemu nodes actually get started; any other model is just reported as a real node
+        if self.is_qemu():
+            self.start_qemu()
         else:
-            utils.header("TestNode.start_node : ignoring model %s"%model)
+            utils.header("TestNode.qemu_start : %s model %s taken as real node"%(self.name(),model))
+        return True
 
-    def start_vmware (self,options):
-        hostname=self.node_spec['node_fields']['hostname']
-        path=options.path
-        display=options.display
-        utils.header('Starting vmplayer for node %s on %s'%(hostname,display))
-        utils.system('cd %s/vmplayer-%s ; DISPLAY=%s vmplayer node.vmx < /dev/null >/dev/null 2>/dev/null &'%(path,hostname,display))
+    def qemu_timestamp (self):
+        "all nodes: record the current time in the node directory's timestamp file, through the test box"
+        test_box = self.test_box()
+        test_box.run_in_buildname("mkdir -p %s"%self.nodedir(), dry_run=self.dry_run())
+        now=int(time.time())
+        return test_box.run_in_buildname("echo %d > %s/timestamp"%(now,self.nodedir()), dry_run=self.dry_run())==0
+
+    def start_qemu (self):
+        # runs qemu-bridge-init, then qemu-start-node, through the test box - both calls honour dry-run
+        test_box = self.test_box()
+        utils.header("Starting qemu node %s on %s"%(self.name(),test_box.hostname()))
+        test_box.run_in_buildname("%s/qemu-bridge-init start >> %s/log.txt"%(self.nodedir(),self.nodedir()),
+                                  dry_run=self.dry_run())
+        # kick it off in background, as it would otherwise hang - NOTE(review): '2>&1 >>' keeps stderr out of log.txt, confirm
+        test_box.run_in_buildname("%s/qemu-start-node 2>&1 >> %s/log.txt"%(self.nodedir(),self.nodedir()), dry_run=self.dry_run())
+
+    def list_qemu (self):
+        test_box=self.test_box()
+        utils.header("Listing qemu for host %s on box %s"%(self.name(),test_box.hostname()))
+        test_box.run_in_buildname("%s/qemu-kill-node -l %s"%(self.nodedir(),self.name()), dry_run=self.dry_run())
+        return True
+
+    def kill_qemu (self):
+        # runs the node's qemu-kill-node script through the test box
+        test_box = self.test_box()
+        node_name = self.name()
+        utils.header("Stopping qemu for node %s on box %s"%(node_name,test_box.hostname()))
+        kill_command="%s/qemu-kill-node %s"%(self.nodedir(),node_name)
+        test_box.run_in_buildname(kill_command, dry_run=self.dry_run())
+        return True
+
+    def gather_qemu_logs (self):
+        if self.is_qemu():   # real nodes have no qemu log to fetch
+            remote_log="%s/log.txt"%self.nodedir()
+            local_log="logs/node.qemu.%s.txt"%self.name()
+            self.test_box().test_ssh.fetch(remote_log,local_log,dry_run=self.dry_run())
+        return True   # same outcome for qemu and real nodes (qemu nodes used to fall through and return None)
+
+    def keys_clear_known_hosts (self):
+        "remove test nodes entries from the local known_hosts file"
+        TestSsh(self.name()).clear_known_hosts()   # TestSsh built on this node's hostname only - no key is passed
+        return True
+
+    def create_test_ssh(self):
+        # builds the TestSsh object used for entering this node
+        # the key used to be keys/<vservername>.rsa, assuming testplc.fetch_keys() had been run
+        # but fetch_keys doesn't grab the root key anymore
+        # so the admin key is used instead
+        key = "keys/key_admin.rsa"
+        return TestSsh(self.name(), buildname=self.buildname(),
+                       key=key)
+
+    def check_hooks (self):
+        # runs all the hook scripts located under hooks/node for this node
+        # returns True only if every one of them is reported as successful
+        extensions = [ 'py','pl','sh' ]
+        path='hooks/node'
+        scripts=utils.locate_hooks_scripts ('node '+self.name(), path,extensions)
+        # build the full list first, so that no script gets skipped after a failure
+        outcomes = [ self.check_hooks_script (script) for script in scripts ]
+        return all (outcomes)
+
+    def check_hooks_script (self,local_script):
+        # push the script on the node's root context
+        script_name=os.path.basename(local_script)
+        utils.header ("NODE hook %s (%s)"%(script_name,self.name()))
+        test_ssh=self.create_test_ssh()
+        test_ssh.copy_home(local_script)
+        succeeded = test_ssh.run("./"+script_name) == 0
+        if succeeded:
+            utils.header ("SUCCESS: node hook %s OK"%script_name)
+        else:
+            utils.header ("WARNING: node hooks check script %s FAILED (ignored)"%script_name)
+        # a failing hook is only reported, the outcome is True either way
+        return True
+
+    def has_libvirt (self):
+        # True when the rpm query for libvirt-client, run through this node's TestSsh, exits with 0
+        return self.create_test_ssh().run ("rpm -q --quiet libvirt-client")==0
+
+    def _check_system_slice (self, slicename,dry_run=False):
+        # checks for system slice <PLC_SLICE_PREFIX>_<slicename> through this node's TestSsh (virsh or vserver-stat)
+        vservername="%s_%s"%(self.test_plc.plc_spec['settings']['PLC_SLICE_PREFIX'],slicename)
+        test_ssh=self.create_test_ssh()
+        if self.has_libvirt():
+            utils.header("Checking system slice %s using virsh"%slicename)
+            return test_ssh.run("virsh --connect lxc:// list | grep -q ' %s '"%vservername,
+                                dry_run=dry_run)==0
+        else:
+            # format the command *before* wrapping it, so that '%' only applies to our own template
+            (retcod,output)=utils.output_of(test_ssh.actual_command("cat /vservers/%s/etc/slicefamily 2> /dev/null"%vservername))
+            # get last line only as ssh pollutes the output
+            slicefamily=output.split("\n")[-1]
+            utils.header("Found slicefamily '%s'for slice %s"%(slicefamily,slicename))
+            if retcod != 0: return False
+            utils.header("Checking system slice %s using vserver-stat"%slicename)
+            return test_ssh.run("vserver-stat | grep %s"%vservername,dry_run=dry_run)==0
+        
         
-    def start_qemu (self, options):
-        utils.header ("TestNode.start_qemu: not implemented yet")