sleep between polls
[sfa.git] / sfa / openstack / osaggregate.py
1
2 import os
3 import socket
4 import base64
5 import string
6 import random
7 import time    
8 from collections import defaultdict
9 from nova.exception import ImageNotFound
10 from nova.api.ec2.cloud import CloudController
11 from sfa.util.faults import SfaAPIError, SliverDoesNotExist
12 from sfa.util.sfatime import utcparse, datetime_to_string, datetime_to_epoch
13 from sfa.rspecs.rspec import RSpec
14 from sfa.rspecs.elements.hardware_type import HardwareType
15 from sfa.rspecs.elements.node import Node
16 from sfa.rspecs.elements.sliver import Sliver
17 from sfa.rspecs.elements.login import Login
18 from sfa.rspecs.elements.disk_image import DiskImage
19 from sfa.rspecs.elements.services import Services
20 from sfa.rspecs.elements.interface import Interface
21 from sfa.util.xrn import Xrn
22 from sfa.planetlab.plxrn import PlXrn 
23 from sfa.openstack.osxrn import OSXrn, hrn_to_os_slicename
24 from sfa.rspecs.version_manager import VersionManager
25 from sfa.openstack.security_group import SecurityGroup
26 from sfa.util.sfalogging import logger
27
def pubkeys_to_user_data(pubkeys):
    """Build a bash user-data script that installs ssh public keys.

    Every key has its newlines removed and is appended to
    /root/.ssh/authorized_keys, followed by an empty line.

    The key text is single-quoted on the ``echo`` command line, so shell
    metacharacters inside a key (or its trailing comment) are written
    literally instead of being interpreted by bash.

    pubkeys: iterable of public key strings.
    Returns the complete script as one string.
    """
    lines = ["#!/bin/bash", ""]
    for pubkey in pubkeys:
        pubkey = pubkey.replace('\n', '')
        # close the quote, emit an escaped quote, then reopen the quote
        quoted = "'" + pubkey.replace("'", "'\\''") + "'"
        lines.append("echo %s >> /root/.ssh/authorized_keys" % quoted)
        lines.append("echo >> /root/.ssh/authorized_keys")
    return "\n".join(lines) + "\n"
37
def instance_to_sliver(instance, xrn=None):
    """Convert an instance-type record into an rspec Sliver element.

    instance: object exposing id, name, vcpus, ram and disk attributes.
    xrn: optional slice xrn. When given, the sliver urn is derived from it
         and the instance id; otherwise 'slice_id' is left as None.
    Returns the Sliver element.
    """
    sliver_urn = None
    if xrn:
        # the original read an undefined name here and stored the result
        # under a different variable than the one used below
        sliver_urn = Xrn(xrn=xrn, type='slice', id=instance.id).get_urn()

    return Sliver({'slice_id': sliver_urn,
                   'name': instance.name,
                   'type': instance.name,
                   'cpus': str(instance.vcpus),
                   'memory': str(instance.ram),
                   'storage': str(instance.disk)})
50
def image_to_rspec_disk_image(image):
    """Return an rspec DiskImage element for an image record.

    Only image['name'] is read; it fills every descriptive field.
    """
    disk_image = DiskImage()
    for field in ('name', 'description', 'os', 'version'):
        disk_image[field] = image['name']
    return disk_image
58     
59 class OSAggregate:
60
61     def __init__(self, driver):
62         self.driver = driver
63
64     def get_availability_zones(self):
65         zones = self.driver.shell.nova_manager.dns_domains.domains()
66         if not zones:
67             zones = ['cloud']
68         else:
69             zones = [zone.name for zone in zones]
70         return zones
71
72
73     def list_resources(self, version=None, options={}):
74         version_manager = VersionManager()
75         version = version_manager.get_version(version)
76         rspec_version = version_manager._get_version(version.type, version.version, 'ad')
77         rspec = RSpec(version=version, user_options=options)
78         nodes = self.get_aggregate_nodes()
79         rspec.version.add_nodes(nodes)
80         return rspec.toxml()
81
82     def describe(self, urns, version=None, options={}):
83         # update nova connection
84         tenant_name = OSXrn(xrn=urns[0], type='slice').get_tenant_name()
85         self.driver.shell.nova_manager.connect(tenant=tenant_name)
86         instances = self.get_instances(urns)
87         if len(instances) == 0:
88             raise SliverDoesNotExist("You have not allocated any slivers here")
89
90         geni_slivers = []
91         rspec_nodes = []
92         for instance in instances:
93             rspec_nodes.append(self.instance_to_rspec_node(instance))
94             geni_slivers.append(self.instance_to_geni_sliver(instance))
95         version_manager = VersionManager()
96         version = version_manager.get_version(version)
97         rspec_version = version_manager._get_version(version.type, version.version, 'manifest')
98         rspec = RSpec(version=version, user_options=options)
99         rspec.version.add_nodes(rspec_nodes)
100         result = {'geni_urn': Xrn(urns[0]).get_urn(),
101                   'geni_rspec': rspec.toxml(), 
102                   'geni_slivers': geni_slivers}
103         
104         return result
105
106     def get_instances(self, urns):
107         # parse slice names and sliver ids
108         names = set()
109         ids = set()
110         for urn in urns:
111             xrn = OSXrn(xrn=urn)
112             names.add(xrn.get_slice_name())
113             if xrn.id:
114                 ids.add(xrn.id)
115
116         # look up instances
117         instances = []
118         for name in name:
119             servers = self.driver.shell.nova_manager.servers.findall(name=name)
120             instances.extend(servers)
121
122         # filter on id
123         if ids:
124             instances = [server in servers if server.id in ids]
125
126         return instances
127
128     def instance_to_rspec_node(self, instance):
129         # determine node urn
130         node_xrn = instance.metadata.get('component_id')
131         if not node_xrn:
132             node_xrn = OSXrn('cloud', type='node')
133         else:
134             node_xrn = OSXrn(xrn=node_xrn, type='node')
135
136         rspec_node = Node()
137         rspec_node['component_id'] = node_xrn.urn
138         rspec_node['component_name'] = node_xrn.name
139         rspec_node['component_manager_id'] = Xrn(self.driver.hrn, 'authority+cm').get_urn()
140         if instance.metadata.get('client_id'):
141             rspec_node['client_id'] = instance.metadata.get('client_id')
142         flavor = self.driver.shell.nova_manager.flavors.find(id=instance.flavor['id'])
143         rspec_node['slivers'] = [self.instance_to_sliver(flavor)]
144         image = self.driver.shell.image_manager.get_images(id=instance.image['id'])
145         if isinstance(image, list) and len(image) > 0:
146             image = image[0]
147         disk_image = image_to_rspec_disk_image(image)
148         sliver['disk_image'] = [disk_image]
149
150         # build interfaces            
151         rspec_node['services'] = []
152         rspec_node['interfaces'] = []
153         addresses = instance.addresses
154         # HACK: public ips are stored in the list of private, but 
155         # this seems wrong. Assume pub ip is the last in the list of 
156         # private ips until openstack bug is fixed.      
157         if addresses.get('private'):
158             login = Login({'authentication': 'ssh-keys',
159                            'hostname': addresses.get('private')[-1]['addr'],
160                            'port':'22', 'username': 'root'})
161             service = Services({'login': login})
162             rspec_node['services'].append(service)    
163         
164         for private_ip in addresses.get('private', []):
165             if_xrn = PlXrn(auth=self.driver.hrn, 
166                            interface='node%s:eth0' % (instance.hostId)) 
167             interface = Interface({'component_id': if_xrn.urn})
168             interface['ips'] =  [{'address': private_ip['addr'],
169                                  #'netmask': private_ip['network'],
170                                  'type': private_ip['version']}]
171             rspec_node['interfaces'].append(interface) 
172         
173         # slivers always provide the ssh service
174         for public_ip in addresses.get('public', []):
175             login = Login({'authentication': 'ssh-keys', 
176                            'hostname': public_ip['addr'], 
177                            'port':'22', 'username': 'root'})
178             service = Services({'login': login})
179             rspec_node['services'].append(service)
180         return rspec_node
181
182
183     def instance_to_sliver(self, instance, xrn=None):
184         if xrn:
185             xrn = Xrn(xrn=slice_xrn, type='slice', id=instance.id).get_urn()
186
187         sliver = Sliver({'sliver_id': xrn.get_urn(),
188                          'name': instance.name,
189                          'type': instance.name,
190                          'cpus': str(instance.vcpus),
191                          'memory': str(instance.ram),
192                          'storage':  str(instance.disk)})
193         return sliver   
194
195     def instance_to_geni_sliver(self, instance):
196         op_status = "geni_unknown"
197         state = instance.state.lower()
198         if state == 'active':
199             op_status = 'geni_ready'
200         elif state == 'building': 
201             op_status = 'geni_configuring'
202         elif state == 'failed':
203             op_status =' geni_failed'
204          
205         urn = OSXrn(name=instance.name, type='slice', id=instance.id).get_urn()
206         # required fields
207         geni_sliver = {'geni_sliver_urn': urn, 
208                        'geni_expires': None,
209                        'geni_allocation_status': 'geni_provisioned',
210                        'geni_operational_status': op_status,
211                        'geni_error': None,
212                        'plos_created_at': datetime_to_string(utcparse(instance.created)),
213                        'plos_sliver_type': self.shell.nova_manager.flavors.find(id=instance.flavor['id']).name,
214                         }
215
216
217         return geni_sliver
218                         
219     def get_aggregate_nodes(self):
220         zones = self.get_availability_zones()
221         # available sliver/instance/vm types
222         instances = self.driver.shell.nova_manager.flavors.list()
223         if isinstance(instances, dict):
224             instances = instances.values()
225         # available images
226         images = self.driver.shell.image_manager.get_images_detailed()
227         disk_images  = [image_to_rspec_disk_image(img) for img in images if img['container_format'] in ['ami', 'ovf']]
228         rspec_nodes = []
229         for zone in zones:
230             rspec_node = Node()
231             xrn = OSXrn(zone, type='node')
232             rspec_node['component_id'] = xrn.urn
233             rspec_node['component_name'] = xrn.name
234             rspec_node['component_manager_id'] = Xrn(self.driver.hrn, 'authority+cm').get_urn()
235             rspec_node['exclusive'] = 'false'
236             rspec_node['hardware_types'] = [HardwareType({'name': 'plos-pc'}),
237                                                 HardwareType({'name': 'pc'})]
238             slivers = []
239             for instance in instances:
240                 sliver = self.instance_to_sliver(instance)
241                 sliver['disk_image'] = disk_images
242                 slivers.append(sliver)
243         
244             rspec_node['slivers'] = slivers
245             rspec_nodes.append(rspec_node) 
246
247         return rspec_nodes 
248
249     def create_tenant(self, tenant_name):
250         tenants = self.driver.shell.auth_manager.tenants.findall(name=tenant_name)
251         if not tenants:
252             self.driver.shell.auth_manager.tenants.create(tenant_name, tenant_name)
253             tenant = self.driver.shell.auth_manager.tenants.find(name=tenant_name)
254         else:
255             tenant = tenants[0]
256         return tenant
257             
258     def create_instance_key(self, slice_hrn, user):
259         slice_name = Xrn(slice_hrn).leaf
260         user_name = Xrn(user['urn']).leaf
261         key_name = "%s_%s" % (slice_name, user_name)
262         pubkey = user['keys'][0]
263         key_found = False
264         existing_keys = self.driver.shell.nova_manager.keypairs.findall(name=key_name)
265         for existing_key in existing_keys:
266             if existing_key.public_key != pubkey:
267                 self.driver.shell.nova_manager.keypairs.delete(existing_key)
268             elif existing_key.public_key == pubkey:
269                 key_found = True
270
271         if not key_found:
272             self.driver.shell.nova_manager.keypairs.create(key_name, pubkey)
273         return key_name       
274         
275
276     def create_security_group(self, slicename, fw_rules=[]):
277         # use default group by default
278         group_name = 'default' 
279         if isinstance(fw_rules, list) and fw_rules:
280             # Each sliver get's its own security group.
281             # Keep security group names unique by appending some random
282             # characters on end.
283             random_name = "".join([random.choice(string.letters+string.digits)
284                                            for i in xrange(6)])
285             group_name = slicename + random_name 
286             security_group = SecurityGroup(self.driver)
287             security_group.create_security_group(group_name)
288             for rule in fw_rules:
289                 security_group.add_rule_to_group(group_name, 
290                                              protocol = rule.get('protocol'), 
291                                              cidr_ip = rule.get('cidr_ip'), 
292                                              port_range = rule.get('port_range'), 
293                                              icmp_type_code = rule.get('icmp_type_code'))
294         return group_name
295
296     def add_rule_to_security_group(self, group_name, **kwds):
297         security_group = SecurityGroup(self.driver)
298         security_group.add_rule_to_group(group_name=group_name, 
299                                          protocol=kwds.get('protocol'), 
300                                          cidr_ip =kwds.get('cidr_ip'), 
301                                          icmp_type_code = kwds.get('icmp_type_code'))
302
303  
304
305     def run_instances(self, instance_name, tenant_name, rspec, key_name, pubkeys):
306         #logger.debug('Reserving an instance: image: %s, flavor: ' \
307         #            '%s, key: %s, name: %s' % \
308         #            (image_id, flavor_id, key_name, slicename))
309
310         # make sure a tenant exists for this slice
311         tenant = self.create_tenant(tenant_name)  
312
313         # add the sfa admin user to this tenant and update our nova client connection
314         # to use these credentials for the rest of this session. This emsures that the instances
315         # we create will be assigned to the correct tenant.
316         sfa_admin_user = self.driver.shell.auth_manager.users.find(name=self.driver.shell.auth_manager.opts['OS_USERNAME'])
317         user_role = self.driver.shell.auth_manager.roles.find(name='user')
318         admin_role = self.driver.shell.auth_manager.roles.find(name='admin')
319         self.driver.shell.auth_manager.roles.add_user_role(sfa_admin_user, admin_role, tenant)
320         self.driver.shell.auth_manager.roles.add_user_role(sfa_admin_user, user_role, tenant)
321         self.driver.shell.nova_manager.connect(tenant=tenant.name)  
322
323         authorized_keys = "\n".join(pubkeys)
324         files = {'/root/.ssh/authorized_keys': authorized_keys}
325         rspec = RSpec(rspec)
326         requested_instances = defaultdict(list)
327         # iterate over clouds/zones/nodes
328         for node in rspec.version.get_nodes_with_slivers():
329             instances = node.get('slivers', [])
330             if not instances:
331                 continue
332             for instance in instances:
333                 try: 
334                     metadata = {}
335                     flavor_id = self.driver.shell.nova_manager.flavors.find(name=instance['name'])
336                     image = instance.get('disk_image')
337                     if image and isinstance(image, list):
338                         image = image[0]
339                     image_id = self.driver.shell.nova_manager.images.find(name=image['name'])
340                     fw_rules = instance.get('fw_rules', [])
341                     group_name = self.create_security_group(instance_name, fw_rules)
342                     metadata['security_groups'] = group_name
343                     if node.get('component_id'):
344                         metadata['component_id'] = node['component_id']
345                     if node.get('client_id'):
346                         metadata['client_id'] = node['client_id'] 
347                     self.driver.shell.nova_manager.servers.create(flavor=flavor_id,
348                                                             image=image_id,
349                                                             key_name = key_name,
350                                                             security_groups = [group_name],
351                                                             files=files,
352                                                             meta=metadata, 
353                                                             name=instance_name)
354                 except Exception, err:    
355                     logger.log_exc(err)                                
356                            
357
358
359     def delete_instance(self, tenant_name, instance_name, id=None):
360     
361         def _delete_security_group(instance):
362             security_group = instance.metadata.get('security_groups', '')
363             if security_group:
364                 manager = SecurityGroup(self.driver)
365                 timeout = 10.0 # wait a maximum of 10 seconds before forcing the security group delete
366                 start_time = time.time()
367                 instance_deleted = False
368                 while instance_deleted == False and (time.time() - start_time) < timeout:
369                     inst = self.driver.shell.nova_manager.servers.findall(id=instance.id)
370                     if not inst:
371                         instance_deleted = True
372                     time.sleep(.5)
373                 manager.delete_security_group(security_group)
374
375         thread_manager = ThreadManager() 
376         self.driver.shell.nova_manager.connect(tenant=tenant_name)
377         args = {'name': instance_name}
378         if id:
379             args['id'] = id
380         instances = self.driver.shell.nova_manager.servers.findall(**args)
381         security_group_manager = SecurityGroup(self.driver)
382         for instance in instances:
383             # destroy instance
384             self.driver.shell.nova_manager.servers.delete(instance)
385             # deleate this instance's security groups
386             thread_manager.run(_delete_security_group, instance)
387         return 1
388
389     def stop_instances(self, instance_name, tenant_name, id=None):
390         self.driver.shell.nova_manager.connect(tenant=tenant_name)
391         args = {'name': instance_name}
392         if id:
393             args['id'] = id
394         instances = self.driver.shell.nova_manager.servers.findall(**args)
395         for instance in instances:
396             self.driver.shell.nova_manager.servers.pause(instance)
397         return 1
398
399     def start_instances(self, instance_name, tenant_name, id=None):
400         self.driver.shell.nova_manager.connect(tenant=tenant_name)
401         args = {'name': instance_name}
402         if id:
403             args['id'] = id
404         instances = self.driver.shell.nova_manager.servers.findall(**args)
405         for instance in instances:
406             self.driver.shell.nova_manager.servers.resume(instance)
407         return 1
408
409     def restart_instances(self, instacne_name, tenant_name, id=None):
410         self.stop_instances(instance_name, tenant_name, id)
411         self.start_instances(instance_name, tenant_name, id)
412         return 1 
413
414     def update_instances(self, project_name):
415         pass