X-Git-Url: http://git.onelab.eu/?a=blobdiff_plain;f=system%2FTestPlc.py;h=463e79410eda680e1053ffe0d88a71b1f15525a4;hb=1c87dd36c45ad0896491f51aa8bdf63f8668da25;hp=8e947b9f7551014ee3a44252f03c0952d3a9202d;hpb=083f275498458649d2bb099fc93f76b5d91e0618;p=tests.git diff --git a/system/TestPlc.py b/system/TestPlc.py index 8e947b9..463e794 100644 --- a/system/TestPlc.py +++ b/system/TestPlc.py @@ -16,11 +16,10 @@ from TestUser import TestUser from TestKey import TestKey from TestSlice import TestSlice from TestSliver import TestSliver -from TestBox import TestBox +from TestBoxQemu import TestBoxQemu from TestSsh import TestSsh from TestApiserver import TestApiserver from TestSliceSfa import TestSliceSfa -from TestUserSfa import TestUserSfa # step methods must take (self) and return a boolean (options is a member of the class) @@ -39,14 +38,11 @@ def standby_generic (func): return actual def node_mapper (method): - def actual(self): + def actual(self,*args, **kwds): overall=True node_method = TestNode.__dict__[method.__name__] - for site_spec in self.plc_spec['sites']: - test_site = TestSite (self,site_spec) - for node_spec in site_spec['nodes']: - test_node = TestNode (self,test_site,node_spec) - if not node_method(test_node): overall=False + for test_node in self.all_nodes(): + if not node_method(test_node, *args, **kwds): overall=False return overall # restore the doc text actual.__doc__=method.__doc__ @@ -86,33 +82,38 @@ SEPSFA='' class TestPlc: default_steps = [ - 'display', 'resources_pre', SEP, - 'delete_vs','create_vs','install', 'configure', 'start', SEP, - 'fetch_keys', 'store_keys', 'clear_known_hosts', SEP, + 'show', SEP, + 'vs_delete','timestamp_vs','vs_create', SEP, + 'plc_install', 'plc_configure', 'plc_start', SEP, + 'keys_fetch', 'keys_store', 'keys_clear_known_hosts', SEP, 'initscripts', 'sites', 'nodes', 'slices', 'nodegroups', 'leases', SEP, - 'reinstall_node', 'init_node','bootcd', 'configure_qemu', 'export_qemu', 'kill_all_qemus', 'start_node', SEP, - 'install_sfa', 'configure_sfa', 'cross_configure_sfa', 'import_sfa', 'start_sfa', SEPSFA, - 'configure_sfi@1', 'add_user_sfa@1', 'add_sfa@1', 'create_sfa@1', SEPSFA, - 'update_user_sfa@1', 'update_sfa@1', 'view_sfa@1', SEPSFA, - # we used to run plcsh_stress_test, and then nodes_ssh_debug and nodes_ssh_boot + 'nodestate_reinstall', 'qemu_local_init','bootcd', 'qemu_local_config', SEP, + 'qemu_export', 'qemu_kill_mine', 'qemu_start', 'timestamp_qemu', SEP, + 'sfa_install_all', 'sfa_configure', 'cross_sfa_configure', 'sfa_start', 'sfa_import', SEPSFA, + 'sfi_configure@1', 'sfa_add_user@1', 'sfa_add_slice@1', 'sfa_discover@1', SEPSFA, + 'sfa_create_slice@1', 'sfa_check_slice_plc@1', SEPSFA, + 'sfa_update_user@1', 'sfa_update_slice@1', 'sfa_view@1', 'sfa_utest@1',SEPSFA, + # we used to run plcsh_stress_test, and then ssh_node_debug and ssh_node_boot # but as the stress test might take a while, we sometimes missed the debug mode.. - 'nodes_ssh_debug', 'plcsh_stress_test@1', SEP, - 'nodes_ssh_boot', 'check_slice', 'check_initscripts', SEP, - 'check_slice_sfa@1', 'delete_slice_sfa@1', 'delete_user_sfa@1', SEPSFA, - 'check_tcp', 'check_hooks@1', SEP, - 'force_gather_logs', 'force_resources_post', SEP, + 'ssh_node_debug@1', 'plcsh_stress_test@1', SEP, + 'ssh_node_boot@1', 'ssh_slice', 'check_initscripts', SEP, + 'ssh_slice_sfa@1', 'sfa_delete_slice@1', 'sfa_delete_user@1', SEPSFA, + 'check_tcp', 'check_sys_slice', SEP, + 'force_gather_logs', SEP, ] other_steps = [ - 'show_boxes', 'resources_list','resources_release','resources_release_plc','resources_release_qemu',SEP, - 'stop', 'vs_start', SEP, - 'clean_initscripts', 'clean_nodegroups','clean_all_sites', SEP, - 'clean_sites', 'clean_nodes', 'clean_slices', 'clean_keys', SEP, - 'clean_leases', 'list_leases', SEP, + 'export', 'show_boxes', SEP, + 'check_hooks', 'plc_stop', 'vs_start', 'vs_stop', SEP, + 'delete_initscripts', 'delete_nodegroups','delete_all_sites', SEP, + 'delete_sites', 'delete_nodes', 'delete_slices', 'keys_clean', SEP, + 'delete_leases', 'list_leases', SEP, 'populate' , SEP, - 'list_all_qemus', 'list_qemus', 'kill_qemus', SEP, - 'plcclean_sfa', 'dbclean_sfa', 'stop_sfa','uninstall_sfa', 'clean_sfi', SEP, - 'db_dump' , 'db_restore', SEP, - 'standby_1 through 20',SEP, + 'nodestate_show','nodestate_safeboot','nodestate_boot', SEP, + 'qemu_list_all', 'qemu_list_mine', 'qemu_kill_all', SEP, + 'sfa_install_core', 'sfa_install_sfatables', 'sfa_install_plc', 'sfa_install_client', SEPSFA, + 'sfa_plcclean', 'sfa_dbclean', 'sfa_stop','sfa_uninstall', 'sfi_clean', SEPSFA, + 'plc_db_dump' , 'plc_db_restore', SEP, + 'standby_1_through_20',SEP, ] @staticmethod @@ -124,7 +125,7 @@ class TestPlc: return step != SEP and step != SEPSFA # turn off the sfa-related steps when build has skipped SFA - # this is originally for centos5 as recent SFAs won't build on this platformb + # this is originally for centos5 as recent SFAs won't build on this platform @staticmethod def check_whether_build_has_sfa (rpms_url): # warning, we're now building 'sface' so let's be a bit more picky @@ -139,14 +140,10 @@ class TestPlc: def __init__ (self,plc_spec,options): self.plc_spec=plc_spec self.options=options - self.test_ssh=TestSsh(self.plc_spec['hostname'],self.options.buildname) - try: - self.vserverip=plc_spec['vserverip'] - self.vservername=plc_spec['vservername'] - self.url="https://%s:443/PLCAPI/"%plc_spec['vserverip'] - self.vserver=True - except: - raise Exception,'chroot-based myplc testing is deprecated' + self.test_ssh=TestSsh(self.plc_spec['host_box'],self.options.buildname) + self.vserverip=plc_spec['vserverip'] + self.vservername=plc_spec['vservername'] + self.url="https://%s:443/PLCAPI/"%plc_spec['vserverip'] self.apiserver=TestApiserver(self.url,options.dry_run) def name(self): @@ -154,7 +151,7 @@ class TestPlc: return "%s.%s"%(name,self.vservername) def hostname(self): - return self.plc_spec['hostname'] + return self.plc_spec['host_box'] def is_local (self): return self.test_ssh.is_local() @@ -170,24 +167,60 @@ class TestPlc: def start_guest (self): return utils.system(self.test_ssh.actual_command(self.start_guest_in_host())) + def stop_guest (self): + return utils.system(self.test_ssh.actual_command(self.stop_guest_in_host())) + def run_in_guest (self,command): return utils.system(self.actual_command_in_guest(command)) def run_in_host (self,command): return self.test_ssh.run_in_buildname(command) - #command gets run in the vserver + #command gets run in the plc's vm def host_to_guest(self,command): - return "vserver %s exec %s"%(self.vservername,command) + if self.options.plcs_use_lxc: + return "ssh -o StrictHostKeyChecking=no %s %s"%(self.vserverip,command) + else: + return "vserver %s exec %s"%(self.vservername,command) - #command gets run in the vserver + def vm_root_in_host(self): + if self.options.plcs_use_lxc: + return "/var/lib/lxc/%s/rootfs/"%(self.vservername) + else: + return "/vservers/%s"%(self.vservername) + + def vm_timestamp_path (self): + if self.options.plcs_use_lxc: + return "/var/lib/lxc/%s/%s.timestamp"%(self.vservername,self.vservername) + else: + return "/vservers/%s.timestamp"%(self.vservername) + + #start/stop the vserver def start_guest_in_host(self): - return "vserver %s start"%(self.vservername) + if self.options.plcs_use_lxc: + return "lxc-start --daemon --name=%s"%(self.vservername) + else: + return "vserver %s start"%(self.vservername) + + def stop_guest_in_host(self): + if self.options.plcs_use_lxc: + return "lxc-stop --name=%s"%(self.vservername) + else: + return "vserver %s stop"%(self.vservername) # xxx quick n dirty def run_in_guest_piped (self,local,remote): return utils.system(local+" | "+self.test_ssh.actual_command(self.host_to_guest(remote),keep_stdin=True)) + # does a yum install in the vs, ignore yum retcod, check with rpm + def yum_install (self, rpms): + if isinstance (rpms, list): + rpms=" ".join(rpms) + self.run_in_guest("yum -y install %s"%rpms) + # yum-complete-transaction comes with yum-utils, that is in vtest.pkgs + self.run_in_guest("yum-complete-transaction -y") + return self.run_in_guest("rpm -q %s"%rpms)==0 + def auth_root (self): return {'Username':self.plc_spec['PLC_ROOT_USER'], 'AuthMethod':'password', @@ -286,25 +319,25 @@ class TestPlc: return True # make this a valid step - def kill_all_qemus(self): + def qemu_kill_all(self): 'kill all qemu instances on the qemu boxes involved by this setup' # this is the brute force version, kill all qemus on that host box for (box,nodes) in self.gather_hostBoxes().iteritems(): # pass the first nodename, as we don't push template-qemu on testboxes nodedir=nodes[0].nodedir() - TestBox(box,self.options.buildname).kill_all_qemus(nodedir) + TestBoxQemu(box,self.options.buildname).qemu_kill_all(nodedir) return True # make this a valid step - def list_all_qemus(self): + def qemu_list_all(self): 'list all qemu instances on the qemu boxes involved by this setup' for (box,nodes) in self.gather_hostBoxes().iteritems(): # this is the brute force version, kill all qemus on that host box - TestBox(box,self.options.buildname).list_all_qemus() + TestBoxQemu(box,self.options.buildname).qemu_list_all() return True # kill only the right qemus - def list_qemus(self): + def qemu_list_mine(self): 'list qemu instances for our nodes' for (box,nodes) in self.gather_hostBoxes().iteritems(): # the fine-grain version @@ -313,7 +346,7 @@ class TestPlc: return True # kill only the right qemus - def kill_qemus(self): + def qemu_kill_mine(self): 'kill the qemu instances for our nodes' for (box,nodes) in self.gather_hostBoxes().iteritems(): # the fine-grain version @@ -322,12 +355,31 @@ class TestPlc: return True #################### display config - def display (self): + def show (self): "show test configuration after localization" self.display_pass (1) self.display_pass (2) return True + def export (self): + "print cut'n paste-able stuff to export env variables to your shell" + # guess local domain from hostname + domain=socket.gethostname().split('.',1)[1] + fqdn="%s.%s"%(self.plc_spec['host_box'],domain) + print "export BUILD=%s"%self.options.buildname + if self.options.plcs_use_lxc: + print "export PLCHOSTLXC=%s"%fqdn + else: + print "export PLCHOSTVS=%s"%fqdn + print "export GUESTNAME=%s"%self.plc_spec['vservername'] + vplcname=self.plc_spec['vservername'].split('-')[-1] + print "export GUESTHOSTNAME=%s.%s"%(vplcname,domain) + # find hostname of first node + (hostname,qemubox) = self.all_node_infos()[0] + print "export KVMHOST=%s.%s"%(qemubox,domain) + print "export NODE=%s"%(hostname) + return True + # entry point always_display_keys=['PLC_WWW_HOST','nodes','sites',] def display_pass (self,passno): @@ -419,7 +471,8 @@ class TestPlc: @staticmethod def display_mapping_plc (plc_spec): print '+ MyPLC',plc_spec['name'] - print '+\tvserver address = root@%s:/vservers/%s'%(plc_spec['hostname'],plc_spec['vservername']) + # WARNING this would not be right for lxc-based PLC's - should be harmless though + print '+\tvserver address = root@%s:/vservers/%s'%(plc_spec['host_box'],plc_spec['vservername']) print '+\tIP = %s/%s'%(plc_spec['PLC_API_HOST'],plc_spec['vserverip']) for site_spec in plc_spec['sites']: for node_spec in site_spec['nodes']: @@ -431,46 +484,36 @@ class TestPlc: print '+\tqemu box %s'%node_spec['host_box'] print '+\thostname=%s'%node_spec['node_fields']['hostname'] - def resources_pre (self): - "run site-dependant pre-test script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_pre(self) - - def resources_post (self): - "run site-dependant post-test script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_post(self) - - def resources_list (self): - "run site-dependant list script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_list(self) - - def resources_release (self): - "run site-dependant release script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_release(self) - - def resources_release_plc (self): - "run site-dependant release script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_release_plc(self) - - def resources_release_qemu (self): - "run site-dependant release script as defined in LocalTestResources" - from LocalTestResources import local_resources - return local_resources.step_release_qemu(self) - - def delete_vs(self): + # write a timestamp in /vservers/<>.timestamp + # cannot be inside the vserver, that causes vserver .. build to cough + def timestamp_vs (self): + now=int(time.time()) + # TODO-lxc check this one + # a first approx. is to store the timestamp close to the VM root like vs does + stamp_path=self.vm_timestamp_path () + stamp_dir = os.path.dirname (stamp_path) + utils.system(self.test_ssh.actual_command("mkdir -p %s"%stamp_dir)) + return utils.system(self.test_ssh.actual_command("echo %d > %s"%(now,stamp_path)))==0 + + # this is called inconditionnally at the beginning of the test sequence + # just in case this is a rerun, so if the vm is not running it's fine + def vs_delete(self): "vserver delete the test myplc" - self.run_in_host("vserver --silent %s delete"%self.vservername) - return True + stamp_path=self.vm_timestamp_path() + self.run_in_host("rm -f %s"%stamp_path) + if self.options.plcs_use_lxc: + self.run_in_host("lxc-stop --name %s"%self.vservername) + self.run_in_host("lxc-destroy --name %s"%self.vservername) + return True + else: + self.run_in_host("vserver --silent %s delete"%self.vservername) + return True ### install # historically the build was being fetched by the tests # now the build pushes itself as a subdir of the tests workdir # so that the tests do not have to worry about extracting the build (svn, git, or whatever) - def create_vs (self): + def vs_create (self): "vserver creation (no install done)" # push the local build/ dir to the testplc box if self.is_local(): @@ -495,7 +538,10 @@ class TestPlc: test_env_options += " -p %s"%self.options.personality test_env_options += " -d %s"%self.options.pldistro test_env_options += " -f %s"%self.options.fcdistro - script="vtest-init-vserver.sh" + if self.options.plcs_use_lxc: + script="vtest-init-lxc.sh" + else: + script="vtest-init-vserver.sh" vserver_name = self.vservername vserver_options="--netdev eth0 --interface %s"%self.vserverip try: @@ -509,7 +555,7 @@ class TestPlc: return self.run_in_host(create_vserver) == 0 ### install_rpm - def install(self): + def plc_install(self): "yum install myplc, noderepo, and the plain bootstrapfs" # workaround for getting pgsql8.2 on centos5 @@ -529,13 +575,12 @@ class TestPlc: pkgs_list.append ("slicerepo-%s"%nodefamily) pkgs_list.append ("myplc") pkgs_list.append ("noderepo-%s"%nodefamily) - pkgs_list.append ("bootstrapfs-%s-plain"%nodefamily) + pkgs_list.append ("nodeimage-%s-plain"%nodefamily) pkgs_string=" ".join(pkgs_list) - self.run_in_guest("yum -y install %s"%pkgs_string) - return self.run_in_guest("rpm -q %s"%pkgs_string)==0 + return self.yum_install (pkgs_list) ### - def configure(self): + def plc_configure(self): "run plc-config-tty" tmpname='%s.plc-config-tty'%(self.name()) fileconf=open(tmpname,'w') @@ -546,7 +591,7 @@ class TestPlc: 'PLC_MAIL_ENABLED', 'PLC_MAIL_SUPPORT_ADDRESS', 'PLC_DB_HOST', - 'PLC_DB_PASSWORD', +# 'PLC_DB_PASSWORD', # Above line was added for integrating SFA Testing 'PLC_API_HOST', 'PLC_WWW_HOST', @@ -555,6 +600,7 @@ class TestPlc: 'PLC_NET_DNS2', 'PLC_RESERVATION_GRANULARITY', 'PLC_OMF_ENABLED', + 'PLC_OMF_XMPP_SERVER', ]: fileconf.write ('e %s\n%s\n'%(var,self.plc_spec[var])) fileconf.write('w\n') @@ -565,12 +611,12 @@ class TestPlc: utils.system('rm %s'%tmpname) return True - def start(self): + def plc_start(self): "service plc start" self.run_in_guest('service plc start') return True - def stop(self): + def plc_stop(self): "service plc stop" self.run_in_guest('service plc stop') return True @@ -580,29 +626,36 @@ class TestPlc: self.start_guest() return True + def vs_stop (self): + "stop the PLC vserver" + self.stop_guest() + return True + # stores the keys from the config for further use - def store_keys(self): + def keys_store(self): "stores test users ssh keys in keys/" for key_spec in self.plc_spec['keys']: TestKey(self,key_spec).store_key() return True - def clean_keys(self): + def keys_clean(self): "removes keys cached in keys/" - utils.system("rm -rf %s/keys/"%os.path(sys.argv[0])) + utils.system("rm -rf ./keys") + return True # fetches the ssh keys in the plc's /etc/planetlab and stores them in keys/ # for later direct access to the nodes - def fetch_keys(self): + def keys_fetch(self): "gets ssh keys in /etc/planetlab/ and stores them locally in keys/" dir="./keys" if not os.path.isdir(dir): os.mkdir(dir) vservername=self.vservername + vm_root=self.vm_root_in_host() overall=True prefix = 'debug_ssh_key' for ext in [ 'pub', 'rsa' ] : - src="/vservers/%(vservername)s/etc/planetlab/%(prefix)s.%(ext)s"%locals() + src="%(vm_root)s/etc/planetlab/%(prefix)s.%(ext)s"%locals() dst="keys/%(vservername)s-debug.%(ext)s"%locals() if self.test_ssh.fetch(src,dst) != 0: overall=False return overall @@ -611,7 +664,7 @@ class TestPlc: "create sites with PLCAPI" return self.do_sites() - def clean_sites (self): + def delete_sites (self): "delete sites with PLCAPI" return self.do_sites(action="delete") @@ -630,18 +683,19 @@ class TestPlc: test_site.create_users() return True - def clean_all_sites (self): + def delete_all_sites (self): "Delete all sites in PLC, and related objects" print 'auth_root',self.auth_root() site_ids = [s['site_id'] for s in self.apiserver.GetSites(self.auth_root(), {}, ['site_id'])] for site_id in site_ids: print 'Deleting site_id',site_id self.apiserver.DeleteSite(self.auth_root(),site_id) + return True def nodes (self): "create nodes with PLCAPI" return self.do_nodes() - def clean_nodes (self): + def delete_nodes (self): "delete nodes with PLCAPI" return self.do_nodes(action="delete") @@ -665,7 +719,7 @@ class TestPlc: def nodegroups (self): "create nodegroups with PLCAPI" return self.do_nodegroups("add") - def clean_nodegroups (self): + def delete_nodegroups (self): "delete nodegroups with PLCAPI" return self.do_nodegroups("delete") @@ -712,7 +766,7 @@ class TestPlc: return ok - def clean_leases (self): + def delete_leases (self): "remove all leases in the myplc side" lease_ids= [ l['lease_id'] for l in self.apiserver.GetLeases(self.auth_root())] utils.header("Cleaning leases %r"%lease_ids) @@ -760,8 +814,7 @@ class TestPlc: tag_type_id = self.apiserver.AddTagType(auth, {'tagname':nodegroupname, 'description': 'for nodegroup %s'%nodegroupname, - 'category':'test', - 'min_role_id':10}) + 'category':'test'}) print 'located tag (type)',nodegroupname,'as',tag_type_id # create nodegroup nodegroups = self.apiserver.GetNodeGroups (auth, {'groupname':nodegroupname}) @@ -797,6 +850,15 @@ class TestPlc: overall=False return overall + # a list of TestNode objs + def all_nodes (self): + nodes=[] + for site_spec in self.plc_spec['sites']: + test_site = TestSite (self,site_spec) + for node_spec in site_spec['nodes']: + nodes.append(TestNode (self,test_site,node_spec)) + return nodes + # return a list of tuples (nodename,qemuname) def all_node_infos (self) : node_infos = [] @@ -862,7 +924,7 @@ class TestPlc: return True def nodes_booted(self): - return self.nodes_check_boot_state('boot',timeout_minutes=30,silent_minutes=20) + return self.nodes_check_boot_state('boot',timeout_minutes=30,silent_minutes=28) def check_nodes_ssh(self,debug,timeout_minutes,silent_minutes,period=15): # compute timeout @@ -909,16 +971,16 @@ class TestPlc: # only useful in empty plcs return True - def nodes_ssh_debug(self): + def ssh_node_debug(self): "Tries to ssh into nodes in debug mode with the debug ssh key" - return self.check_nodes_ssh(debug=True,timeout_minutes=10,silent_minutes=5) + return self.check_nodes_ssh(debug=True,timeout_minutes=10,silent_minutes=8) - def nodes_ssh_boot(self): + def ssh_node_boot(self): "Tries to ssh into nodes in production mode with the root ssh key" - return self.check_nodes_ssh(debug=False,timeout_minutes=40,silent_minutes=15) + return self.check_nodes_ssh(debug=False,timeout_minutes=40,silent_minutes=38) @node_mapper - def init_node (self): + def qemu_local_init (self): "all nodes : init a clean local directory for holding node-dep stuff like iso image..." pass @node_mapper @@ -926,15 +988,27 @@ class TestPlc: "all nodes: invoke GetBootMedium and store result locally" pass @node_mapper - def configure_qemu (self): + def qemu_local_config (self): "all nodes: compute qemu config qemu.conf and store it locally" pass @node_mapper - def reinstall_node (self): + def nodestate_reinstall (self): "all nodes: mark PLCAPI boot_state as reinstall" pass @node_mapper - def export_qemu (self): + def nodestate_safeboot (self): + "all nodes: mark PLCAPI boot_state as safeboot" + pass + @node_mapper + def nodestate_boot (self): + "all nodes: mark PLCAPI boot_state as boot" + pass + @node_mapper + def nodestate_show (self): + "all nodes: show PLCAPI boot_state" + pass + @node_mapper + def qemu_export (self): "all nodes: push local node-dep directory on the qemu box" pass @@ -952,9 +1026,9 @@ class TestPlc: def do_check_initscripts(self): overall = True for slice_spec in self.plc_spec['slices']: - if not slice_spec.has_key('initscriptname'): + if not slice_spec.has_key('initscriptstamp'): continue - initscript=slice_spec['initscriptname'] + stamp=slice_spec['initscriptstamp'] for nodename in slice_spec['nodenames']: (site,node) = self.locate_node (nodename) # xxx - passing the wrong site - probably harmless @@ -962,7 +1036,7 @@ class TestPlc: test_slice = TestSlice (self,test_site,slice_spec) test_node = TestNode (self,test_site,node) test_sliver = TestSliver (self, test_node, test_slice) - if not test_sliver.check_initscript(initscript): + if not test_sliver.check_initscript_stamp(stamp): overall = False return overall @@ -977,7 +1051,7 @@ class TestPlc: self.apiserver.AddInitScript(self.auth_root(),initscript['initscript_fields']) return True - def clean_initscripts (self): + def delete_initscripts (self): "delete initscripts with PLCAPI" for initscript in self.plc_spec['initscripts']: initscript_name = initscript['initscript_fields']['name'] @@ -994,7 +1068,7 @@ class TestPlc: "create slices with PLCAPI" return self.do_slices() - def clean_slices (self): + def delete_slices (self): "delete slices with PLCAPI" return self.do_slices("delete") @@ -1013,17 +1087,22 @@ class TestPlc: return True @slice_mapper - def check_slice(self): + def ssh_slice(self): "tries to ssh-enter the slice with the user key, to ensure slice creation" pass @node_mapper - def clear_known_hosts (self): + def keys_clear_known_hosts (self): "remove test nodes entries from the local known_hosts file" pass @node_mapper - def start_node (self) : + def qemu_start (self) : + "all nodes: start the qemu instance (also runs qemu-bridge-init start)" + pass + + @node_mapper + def timestamp_qemu (self) : "all nodes: start the qemu instance (also runs qemu-bridge-init start)" pass @@ -1045,11 +1124,39 @@ class TestPlc: overall=False return overall + # painfully enough, we need to allow for some time as netflow might show up last + def check_sys_slice (self): + "all nodes: check that a system slice is alive" +# would probably make more sense to check for netflow, +# but that one is currently not working in the lxc distro +# return self.check_systemslice ('netflow') + return self.check_systemslice ('drl') + + # we have the slices up already here, so it should not take too long + def check_systemslice (self, slicename, timeout_minutes=5, period=15): + timeout = datetime.datetime.now()+datetime.timedelta(minutes=timeout_minutes) + test_nodes=self.all_nodes() + while test_nodes: + for test_node in test_nodes: + if test_node.check_systemslice (slicename,dry_run=self.options.dry_run): + utils.header ("ok") + test_nodes.remove(test_node) + else: + print '.', + if not test_nodes: + return True + if datetime.datetime.now () > timeout: + for test_node in test_nodes: + utils.header ("can't find system slice %s in %s"%(slicename,test_node.name())) + return False + time.sleep(period) + return True + def plcsh_stress_test (self): "runs PLCAPI stress test, that checks Add/Update/Delete on all types - preserves contents" # install the stress-test in the plc image location = "/usr/share/plc_api/plcsh_stress_test.py" - remote="/vservers/%s/%s"%(self.vservername,location) + remote="%s/%s"%(self.vm_root_in_host(),location) self.test_ssh.copy_abs("plcsh_stress_test.py",remote) command = location command += " -- --check" @@ -1061,36 +1168,51 @@ class TestPlc: # in particular runs with --preserve (dont cleanup) and without --check # also it gets run twice, once with the --foreign option for creating fake foreign entries - ### install_sfa_rpm - def install_sfa(self): - "yum install sfa, sfa-plc and sfa-client" - # ignore yum retcod - self.run_in_guest("yum -y install sfa sfa-client sfa-plc sfa-sfatables") - return self.run_in_guest("rpm -q sfa sfa-client sfa-plc sfa-sfatables")==0 + def sfa_install_all (self): + "yum install sfa sfa-plc sfa-sfatables sfa-client" + return self.yum_install ("sfa sfa-plc sfa-sfatables sfa-client") + + def sfa_install_core(self): + "yum install sfa" + return self.yum_install ("sfa") + + def sfa_install_plc(self): + "yum install sfa-plc" + return self.yum_install("sfa-plc") + def sfa_install_client(self): + "yum install sfa-client" + return self.yum_install("sfa-client") + + def sfa_install_sfatables(self): + "yum install sfa-sfatables" + return self.yum_install ("sfa-sfatables") - def dbclean_sfa(self): + def sfa_dbclean(self): "thoroughly wipes off the SFA database" - self.run_in_guest("sfa-nuke-plc.py")==0 + self.run_in_guest("sfa-nuke.py")==0 or \ + self.run_in_guest("sfa-nuke-plc.py") or \ + self.run_in_guest("sfaadmin.py registry nuke") return True - def plcclean_sfa(self): + def sfa_plcclean(self): "cleans the PLC entries that were created as a side effect of running the script" # ignore result sfa_spec=self.plc_spec['sfa'] - slicename='%s_%s'%(sfa_spec['login_base'],sfa_spec['slicename']) - try: self.apiserver.DeleteSlice(self.auth_root(),slicename) - except: print "Slice %s already absent from PLC db"%slicename + for sfa_slice_spec in sfa_spec['sfa_slice_specs']: + slicename='%s_%s'%(sfa_slice_spec['login_base'],sfa_slice_spec['slicename']) + try: self.apiserver.DeleteSlice(self.auth_root(),slicename) + except: print "Slice %s already absent from PLC db"%slicename - username="%s@%s"%(sfa_spec['regularuser'],sfa_spec['domain']) - try: self.apiserver.DeletePerson(self.auth_root(),username) - except: print "User %s already absent from PLC db"%username + username="%s@%s"%(sfa_slice_spec['regularuser'],sfa_slice_spec['domain']) + try: self.apiserver.DeletePerson(self.auth_root(),username) + except: print "User %s already absent from PLC db"%username - print "REMEMBER TO RUN import_sfa AGAIN" + print "REMEMBER TO RUN sfa_import AGAIN" return True - def uninstall_sfa(self): + def sfa_uninstall(self): "uses rpm to uninstall sfa - ignore result" self.run_in_guest("rpm -e sfa sfa-sfatables sfa-client sfa-plc") self.run_in_guest("rm -rf /var/lib/sfa") @@ -1100,6 +1222,25 @@ class TestPlc: self.run_in_guest("rpm -e --noscripts sfa-plc") return True + ### run unit tests for SFA + # NOTE: for some reason on f14/i386, yum install sfa-tests fails for no reason + # Running Transaction + # Transaction couldn't start: + # installing package sfa-tests-1.0-21.onelab.i686 needs 204KB on the / filesystem + # [('installing package sfa-tests-1.0-21.onelab.i686 needs 204KB on the / filesystem', (9, '/', 208896L))] + # no matter how many Gbs are available on the testplc + # could not figure out what's wrong, so... + # if the yum install phase fails, consider the test is successful + # other combinations will eventually run it hopefully + def sfa_utest(self): + "yum install sfa-tests and run SFA unittests" + self.run_in_guest("yum -y install sfa-tests") + # failed to install - forget it + if self.run_in_guest("rpm -q sfa-tests")!=0: + utils.header("WARNING: SFA unit tests failed to install, ignoring") + return True + return self.run_in_guest("/usr/share/sfa/tests/testAll.py")==0 + ### def confdir(self): dirname="conf.%s"%self.plc_spec['name'] @@ -1111,13 +1252,13 @@ class TestPlc: def conffile(self,filename): return "%s/%s"%(self.confdir(),filename) - def confsubdir(self,dirname,clean): + def confsubdir(self,dirname,clean,dry_run=False): subdirname="%s/%s"%(self.confdir(),dirname) if clean: utils.system("rm -rf %s"%subdirname) if not os.path.isdir(subdirname): utils.system("mkdir -p %s"%subdirname) - if not os.path.isdir(subdirname): + if not dry_run and not os.path.isdir(subdirname): raise "Cannot create config subdir %s for plc %s"%(dirname,self.name()) return subdirname @@ -1126,26 +1267,29 @@ class TestPlc: return utils.system("rm -rf %s"%filename)==0 ### - def configure_sfa(self): + def sfa_configure(self): "run sfa-config-tty" tmpname=self.conffile("sfa-config-tty") fileconf=open(tmpname,'w') for var in [ 'SFA_REGISTRY_ROOT_AUTH', 'SFA_INTERFACE_HRN', -# 'SFA_REGISTRY_LEVEL1_AUTH', + 'SFA_REGISTRY_LEVEL1_AUTH', 'SFA_REGISTRY_HOST', 'SFA_AGGREGATE_HOST', 'SFA_SM_HOST', + 'SFA_PLC_URL', 'SFA_PLC_USER', 'SFA_PLC_PASSWORD', - 'SFA_PLC_DB_HOST', - 'SFA_PLC_DB_USER', - 'SFA_PLC_DB_PASSWORD', - 'SFA_PLC_URL', + 'SFA_DB_HOST', + 'SFA_DB_USER', + 'SFA_DB_PASSWORD', + 'SFA_DB_NAME', + 'SFA_API_LOGLEVEL', ]: - fileconf.write ('e %s\n%s\n'%(var,self.plc_spec['sfa'][var])) + if self.plc_spec['sfa'].has_key(var): + fileconf.write ('e %s\n%s\n'%(var,self.plc_spec['sfa'][var])) # the way plc_config handles booleans just sucks.. - for var in ['SFA_API_DEBUG']: + for var in []: val='false' if self.plc_spec['sfa'][var]: val='true' fileconf.write ('e %s\n%s\n'%(var,val)) @@ -1158,8 +1302,9 @@ class TestPlc: return True def aggregate_xml_line(self): - return '' % \ - (self.vserverip,self.plc_spec['sfa']['SFA_REGISTRY_ROOT_AUTH']) + port=self.plc_spec['sfa']['neighbours-port'] + return '' % \ + (self.vserverip,self.plc_spec['sfa']['SFA_REGISTRY_ROOT_AUTH'],port) def registry_xml_line(self): return '' % \ @@ -1167,7 +1312,8 @@ class TestPlc: # a cross step that takes all other plcs in argument - def cross_configure_sfa(self, other_plcs): + def cross_sfa_configure(self, other_plcs): + "writes aggregates.xml and registries.xml that point to all other PLCs in the test" # of course with a single plc, other_plcs is an empty list if not other_plcs: return True @@ -1179,134 +1325,104 @@ class TestPlc: file(reg_fname,"w").write("%s\n" % \ " ".join([ plc.registry_xml_line() for plc in other_plcs ])) utils.header ("(Over)wrote %s"%reg_fname) - return self.test_ssh.copy_abs(agg_fname,'/vservers/%s/etc/sfa/aggregates.xml'%self.vservername)==0 \ - and self.test_ssh.copy_abs(reg_fname,'/vservers/%s/etc/sfa/registries.xml'%self.vservername)==0 + return self.test_ssh.copy_abs(agg_fname,'/%s/etc/sfa/aggregates.xml'%self.vm_root_in_host())==0 \ + and self.test_ssh.copy_abs(reg_fname,'/%s/etc/sfa/registries.xml'%self.vm_root_in_host())==0 - def import_sfa(self): + def sfa_import(self): "sfa-import-plc" - auth=self.plc_spec['sfa']['SFA_REGISTRY_ROOT_AUTH'] - return self.run_in_guest('sfa-import-plc.py')==0 + auth=self.plc_spec['sfa']['SFA_REGISTRY_ROOT_AUTH'] + return self.run_in_guest('sfa-import.py')==0 or \ + self.run_in_guest('sfa-import-plc.py')==0 or \ + self.run_in_guest('sfaadmin.py registry import_registry')==0 # not needed anymore # self.run_in_guest('cp /etc/sfa/authorities/%s/%s.pkey /etc/sfa/authorities/server.key'%(auth,auth)) - def start_sfa(self): + def sfa_start(self): "service sfa start" return self.run_in_guest('service sfa start')==0 - def configure_sfi(self): + def sfi_configure(self): + "Create /root/sfi on the plc side for sfi client configuration" + if self.options.dry_run: + utils.header("DRY RUN - skipping step") + return True sfa_spec=self.plc_spec['sfa'] - "sfi client configuration" - dir_name=self.confsubdir("dot-sfi",clean=True) - file_name=dir_name + os.sep + sfa_spec['piuser'] + '.pkey' - fileconf=open(file_name,'w') - fileconf.write (self.plc_spec['keys'][0]['private']) - fileconf.close() - utils.header ("(Over)wrote %s"%file_name) - - file_name=dir_name + os.sep + 'sfi_config' - fileconf=open(file_name,'w') - SFI_AUTH="%s.%s"%(sfa_spec['SFA_REGISTRY_ROOT_AUTH'],sfa_spec['login_base']) - fileconf.write ("SFI_AUTH='%s'"%SFI_AUTH) - fileconf.write('\n') - SFI_USER=SFI_AUTH + '.' + sfa_spec['piuser'] - fileconf.write ("SFI_USER='%s'"%SFI_USER) - fileconf.write('\n') - SFI_REGISTRY='http://' + sfa_spec['SFA_PLC_DB_HOST'] + ':12345/' - fileconf.write ("SFI_REGISTRY='%s'"%SFI_REGISTRY) - fileconf.write('\n') - SFI_SM='http://' + sfa_spec['SFA_PLC_DB_HOST'] + ':12347/' - fileconf.write ("SFI_SM='%s'"%SFI_SM) - fileconf.write('\n') - fileconf.close() - utils.header ("(Over)wrote %s"%file_name) - - file_name=dir_name + os.sep + 'person.xml' - fileconf=open(file_name,'w') - for record in sfa_spec['sfa_person_xml']: - person_record=record - fileconf.write(person_record) - fileconf.write('\n') - fileconf.close() - utils.header ("(Over)wrote %s"%file_name) - - file_name=dir_name + os.sep + 'slice.xml' - fileconf=open(file_name,'w') - for record in sfa_spec['sfa_slice_xml']: - slice_record=record - #slice_record=sfa_spec['sfa_slice_xml'] - fileconf.write(slice_record) - fileconf.write('\n') - utils.header ("(Over)wrote %s"%file_name) - fileconf.close() - - file_name=dir_name + os.sep + 'slice.rspec' - fileconf=open(file_name,'w') - slice_rspec='' - for (key, value) in sfa_spec['sfa_slice_rspec'].items(): - slice_rspec +=value - fileconf.write(slice_rspec) - fileconf.write('\n') - fileconf.close() - utils.header ("(Over)wrote %s"%file_name) - - # push to the remote root's .sfi - location = "root/.sfi" - remote="/vservers/%s/%s"%(self.vservername,location) - self.test_ssh.copy_abs(dir_name, remote, recursive=True) + # cannot use sfa_slice_mapper to pass dir_name + for slice_spec in self.plc_spec['sfa']['sfa_slice_specs']: + site_spec = self.locate_site (slice_spec['sitename']) + test_site = TestSite(self,site_spec) + test_slice=TestSliceSfa(self,test_site,slice_spec) + dir_name=self.confsubdir("dot-sfi/%s"%slice_spec['slicename'],clean=True,dry_run=self.options.dry_run) + test_slice.sfi_config(dir_name) + # push into the remote /root/sfi area + location = test_slice.sfi_path() + remote="%s/%s"%(self.vm_root_in_host(),location) + self.test_ssh.mkdir(remote,abs=True) + # need to strip last level or remote otherwise we get an extra dir level + self.test_ssh.copy_abs(dir_name, os.path.dirname(remote), recursive=True) return True - def clean_sfi (self): - self.run_in_guest("rm -rf /root/.sfi") + def sfi_clean (self): + "clean up /root/sfi on the plc side" + self.run_in_guest("rm -rf /root/sfi") return True - def add_user_sfa(self): - return TestUserSfa(self).add_user() + @slice_sfa_mapper + def sfa_add_user(self): + "run sfi.py add" + pass + + @slice_sfa_mapper + def sfa_update_user(self): + "run sfi.py update" + + @slice_sfa_mapper + def sfa_add_slice(self): + "run sfi.py add (on Registry) from slice.xml" + pass @slice_sfa_mapper - def add_sfa(self): - "run sfi.py add (on Registry)" + def sfa_discover(self): + "discover resources into resouces_in.rspec" pass @slice_sfa_mapper - def create_sfa(self): - "run sfi.py create (on SM) for 1st-time creation" + def sfa_create_slice(self): + "run sfi.py create (on SM) - 1st time" pass - def update_user_sfa(self): - return TestUserSfa(self).update_user() + @slice_sfa_mapper + def sfa_check_slice_plc(self): + "check sfa_create_slice at the plcs - all local nodes should be in slice" + pass @slice_sfa_mapper - def update_sfa(self): + def sfa_update_slice(self): "run sfi.py create (on SM) on existing object" pass - def view_sfa(self): - "run sfi.py list and sfi.py show (both on Registry) and sfi.py slices and sfi.py resources (both on SM)" - sfa_spec=self.plc_spec['sfa'] - auth=sfa_spec['SFA_REGISTRY_ROOT_AUTH'] - return \ - self.run_in_guest("sfi.py -d /root/.sfi/ list %s.%s"%(auth,sfa_spec['login_base']))==0 and \ - self.run_in_guest("sfi.py -d /root/.sfi/ show %s.%s"%(auth,sfa_spec['login_base']))==0 and \ - self.run_in_guest("sfi.py -d /root/.sfi/ slices")==0 and \ - self.run_in_guest("sfi.py -d /root/.sfi/ resources -o resources")==0 + @slice_sfa_mapper + def sfa_view(self): + "various registry-related calls" + pass @slice_sfa_mapper - def check_slice_sfa(self): + def ssh_slice_sfa(self): "tries to ssh-enter the SFA slice" pass - def delete_user_sfa(self): - "run sfi.py delete (on SM) for user" - test_user_sfa=TestUserSfa(self) - return test_user_sfa.delete_user() + @slice_sfa_mapper + def sfa_delete_user(self): + "run sfi.py delete" + pass @slice_sfa_mapper - def delete_slice_sfa(self): + def sfa_delete_slice(self): "run sfi.py delete (on SM), sfi.py remove (on Registry) to clean slices" pass - def stop_sfa(self): + def sfa_stop(self): "service sfa stop" self.run_in_guest('service sfa stop')==0 return True @@ -1315,7 +1431,7 @@ class TestPlc: "creates random entries in the PLCAPI" # install the stress-test in the plc image location = "/usr/share/plc_api/plcsh_stress_test.py" - remote="/vservers/%s/%s"%(self.vservername,location) + remote="%s/%s"%(self.vm_root_in_host(),location) self.test_ssh.copy_abs("plcsh_stress_test.py",remote) command = location command += " -- --preserve --short-names" @@ -1329,6 +1445,7 @@ class TestPlc: "gets all possible logs from plc's/qemu node's/slice's for future reference" # (1.a) get the plc's /var/log/ and store it locally in logs/myplc.var-log./* # (1.b) get the plc's /var/lib/pgsql/data/pg_log/ -> logs/myplc.pgsql-log./* + # (1.c) get the plc's /root/sfi -> logs/sfi./ # (2) get all the nodes qemu log and store it as logs/node.qemu..log # (3) get the nodes /var/log and store is as logs/node.var-log./* # (4) as far as possible get the slice's /var/log as logs/sliver.var-log./* @@ -1338,6 +1455,9 @@ class TestPlc: # (1.b) print "-------------------- TestPlc.gather_logs : PLC's /var/lib/psql/data/pg_log/" self.gather_pgsql_logs () + # (1.c) + print "-------------------- TestPlc.gather_logs : PLC's /root/sfi/" + self.gather_root_sfi () # (2) print "-------------------- TestPlc.gather_logs : nodes's QEMU logs" for site_spec in self.plc_spec['sites']: @@ -1375,6 +1495,12 @@ class TestPlc: command = to_plc + "| tar -C logs/myplc.pgsql-log.%s -xf -"%self.name() utils.system(command) + def gather_root_sfi (self): + utils.system("mkdir -p logs/sfi.%s"%self.name()) + to_plc = self.actual_command_in_guest("tar -C /root/sfi/ -cf - .") + command = to_plc + "| tar -C logs/sfi.%s -xf -"%self.name() + utils.system(command) + def gather_nodes_var_logs (self): for site_spec in self.plc_spec['sites']: test_site = TestSite (self,site_spec) @@ -1400,14 +1526,14 @@ class TestPlc: name=str(d) return "/root/%s-%s.sql"%(database,name) - def db_dump(self): + def plc_db_dump(self): 'dump the planetlab5 DB in /root in the PLC - filename has time' dump=self.dbfile("planetab5") self.run_in_guest('pg_dump -U pgsqluser planetlab5 -f '+ dump) utils.header('Dumped planetlab5 database in %s'%dump) return True - def db_restore(self): + def plc_db_restore(self): 'restore the planetlab5 DB - looks broken, but run -n might help' dump=self.dbfile("planetab5") ##stop httpd service @@ -1421,6 +1547,9 @@ class TestPlc: utils.header('Database restored from ' + dump) + def standby_1_through_20(self): + """convenience function to wait for a specified number of minutes""" + pass @standby_generic def standby_1(): pass @standby_generic