OpenStack Liberty Source Code Analysis: The Instance Launch Process, Part 3


Continuing from OpenStack Liberty Source Code Analysis: The Instance Launch Process, Part 2, a quick recap: after nova-conductor receives the host list returned by nova-scheduler, it sends an asynchronous RPC request to the nova-compute service on each target host in turn. Let's continue with how the nova-compute service handles the request:

nova-compute

Based on the route mapping, the method in nova-compute that handles the instance launch request is
nova/compute/manager.py/ComputeManager.build_and_run_instance. This method does no real work itself; it just uses eventlet to spawn a worker thread for the rest of the launch, decoupling it from the RPC worker thread. That worker thread then calls _do_build_and_run_instance to carry on. Let's take a look:

#decorator definitions omitted here
def _do_build_and_run_instance(self, context, instance, image,
        request_spec, filter_properties, admin_password,
        injected_files, requested_networks, security_groups,
        block_device_mapping, node=None, limits=None):
    #exception handling omitted here
    LOG.info(_LI('Starting instance...'), context=context,
             instance=instance)

    #instance is an InstanceV2 object; update the instance state here
    #and send a synchronous request through the conductor RPC API so
    #that conductor persists the state change
    instance.vm_state = vm_states.BUILDING
    instance.task_state = None
    instance.save(expected_task_state=
                  (task_states.SCHEDULING, None))

    # b64 decode the files to inject:
    decoded_files = self._decode_files(injected_files)

    #limits holds the node's resource limits, including memory and disk
    if limits is None:
        limits = {}

    if node is None:
        node = self.driver.get_available_nodes(refresh=True)[0]
        LOG.debug('No node specified, defaulting to %s', node,
                  instance=instance)

    #exception handling omitted; hand the request over to
    #_build_and_run_instance for the rest of the processing
    self._build_and_run_instance(context, instance, image,
                                 decoded_files, admin_password,
                                 requested_networks, security_groups,
                                 block_device_mapping, node, limits,
                                 filter_properties)
    return build_results.ACTIVE
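Stepping back for a second: the decoupling described above is just "spawn a greenthread, return immediately". Here is a minimal standalone sketch of that pattern (class and argument names are hypothetical; the real nova code goes through its own spawn utility and adds instrumentation):

import eventlet

class ComputeManagerSketch(object):
    def build_and_run_instance(self, context, instance, **kwargs):
        # hand the real work to a greenthread so the RPC worker
        # can return to the caller immediately
        eventlet.spawn_n(self._do_build_and_run_instance,
                         context, instance, **kwargs)

    def _do_build_and_run_instance(self, context, instance, **kwargs):
        pass  # the launch steps analyzed in this article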

Now let's look at the implementation of _build_and_run_instance:

def _build_and_run_instance(self, context, instance, image,
        injected_files, admin_password, requested_networks,
        security_groups, block_device_mapping, node, limits,
        filter_properties):
    """image is a dict of image metadata; 'name' is the image name.
    The image info in my example:
    {
        u'status': u'active', u'deleted': False,
        u'container_format': u'bare', u'min_ram': 0,
        u'updated_at': u'2016-03-24T06:58:33.000000',
        u'min_disk': 0,
        u'owner': u'25520b29dce346d38bc4b055c5ffbfcb',
        u'is_public': True, u'deleted_at': None,
        u'properties': {}, u'size': 1401421824,
        u'name': u'ceph-centos-65-x64-20g.qcow2',
        u'checksum': u'a97deac197e76e1f5a427484b1e5df4c',
        u'created_at': u'2016-03-24T06:57:28.000000',
        u'disk_format': u'qcow2',
        u'id': u'226bc6e5-60d7-4a2c-bf0d-a568a1e26e00'
    }
    """
    image_name = image.get('name')
    '''exception handling omitted'''

    #get/create the ResourceTracker instance, in preparation for the
    #resource claim below
    rt = self._get_resource_tracker(node)

    #limits holds the node's memory, disk and other resource quotas;
    #verify that the node can satisfy this launch request. If resources
    #are insufficient an exception is raised; otherwise an INFO log like
    #"Attempting claim: memory 2048 MB, disk 20 GB" appears in the logs
    with rt.instance_claim(context, instance, limits):
        # NOTE(russellb) It's important that this validation be done
        # *after* the resource tracker instance claim, as that
        # is where the host is set on the instance.
        self._validate_instance_group_policy(context, instance,
                                             filter_properties)
        #allocate network resources for the instance, validate and map
        #block devices, and update the instance state
        with self._build_resources(context, instance,
                requested_networks, security_groups, image,
                block_device_mapping) as resources:
            instance.vm_state = vm_states.BUILDING
            instance.task_state = task_states.SPAWNING
            # NOTE(JoshNang) This also saves the changes to the
            # instance from _allocate_network_async, as they aren't
            # saved in that function to prevent races.
            instance.save(expected_task_state=
                          task_states.BLOCK_DEVICE_MAPPING)
            block_device_info = resources['block_device_info']
            network_info = resources['network_info']
            #call the hypervisor's spawn method to start the instance.
            #I am using libvirt, so this goes to nova/virt/libvirt/
            #driver.py/LibvirtDriver.spawn; see the analysis below
            self.driver.spawn(context, instance, image,
                              injected_files, admin_password,
                              network_info=network_info,
                              block_device_info=block_device_info)
#nova/virt/libvirt/driver.py/LibvirtDriver.spawn
def spawn(self, context, instance, image_meta, injected_files,
          admin_password, network_info=None, block_device_info=None):
    """Does three main things:
    1. Download the image from glance (if it is not already in the
       local _base directory), then upload it to the storage backend
    2. Generate the libvirt XML file
    3. Call libvirt to start the instance
    """
    #build a nova/objects/image_meta.py/ImageMeta object from the
    #image dict
    image_meta = objects.ImageMeta.from_dict(image_meta)

    #based on the hypervisor type, work out the bus types for block
    #devices and the CD-ROM. The default is kvm, so block devices use
    #virtio and the CD-ROM uses ide; device mappings are set up from
    #block_device_info. Returns a dict containing
    #{disk_bus, cdrom_bus, mapping}
    disk_info = blockinfo.get_disk_info(CONF.libvirt.virt_type,
                                        instance,
                                        image_meta,
                                        block_device_info)

    #download the image from glance (if not in the local _base
    #directory), then upload it to the storage backend; see the
    #detailed analysis below
    self._create_image(context, instance,
                       disk_info['mapping'],
                       network_info=network_info,
                       block_device_info=block_device_info,
                       files=injected_files,
                       admin_pass=admin_password)

    #generate the libvirt XML file; see the detailed analysis below
    xml = self._get_guest_xml(context, instance, network_info,
                              disk_info, image_meta,
                              block_device_info=block_device_info,
                              write_to_disk=True)

    #call libvirt to start the instance; see the detailed analysis below
    self._create_domain_and_network(context, xml, instance,
                                    network_info, disk_info,
                                    block_device_info=block_device_info)
    LOG.debug("Instance is running", instance=instance)

    def _wait_for_boot():
        """Called at an interval until the VM is running."""
        state = self.get_info(instance).state
        if state == power_state.RUNNING:
            LOG.info(_LI("Instance spawned successfully."),
                     instance=instance)
            raise loopingcall.LoopingCallDone()

    #wait for the instance to come up (polling its state via libvirt)
    timer = loopingcall.FixedIntervalLoopingCall(_wait_for_boot)
    timer.start(interval=0.5).wait()

If spawn returns normally, the instance has been created successfully. You can see the new instance in the 'Running' state on the Dashboard, and the instance process on the host via the virsh list command. Let's first look at how _create_image creates the disks.
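As a quick aside, the same check that virsh list does on the host can be scripted with the libvirt Python bindings; a small sketch (the connection URI qemu:///system is assumed, as in this setup):

import libvirt

# connect read-only to the local hypervisor, like `virsh -r list`
conn = libvirt.openReadOnly('qemu:///system')
try:
    for dom in conn.listAllDomains():
        state = 'running' if dom.isActive() else 'shut off'
        print('%s: %s' % (dom.name(), state))
finally:
    conn.close()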

Creating the system disk

_create_image is a long method, so let's start with how the image-backed (system) disk is created. Only the key parts of the code are shown below; for full details please consult the source file:
nova/virt/libvirt/driver.py/LibvirtDriver._create_image

def _create_image(self, context, instance,
                  disk_mapping, suffix='',
                  disk_images=None, network_info=None,
                  block_device_info=None, files=None,
                  admin_pass=None, inject_files=True,
                  fallback_from_host=None):
    #we are booting from an image, so booted_from_volume=False
    booted_from_volume = self._is_booted_from_volume(
                                instance, disk_mapping)
    ......
    """Input parameter disk_images is None, so it gets populated from
    the instance:
    {
        'kernel_id': u'',
        'image_id': u'226bc6e5-60d7-4a2c-bf0d-a568a1e26e00',
        'ramdisk_id': u''
    }
    """
    if not disk_images:
        disk_images = {'image_id': instance.image_ref,
                       'kernel_id': instance.kernel_id,
                       'ramdisk_id': instance.ramdisk_id}
    ......
    #booted_from_volume=False
    if not booted_from_volume:
        #generate the system disk (cache) file name from a hash of
        #image_id
        root_fname = imagecache.get_cache_fname(disk_images,
                                                'image_id')
        #root_gb is the size of the system disk, 20 (GB) in my example
        size = instance.root_gb * units.Gi

        #input parameter: suffix=''
        if size == 0 or suffix == '.rescue':
            size = None

        #our storage backend is ceph, so the backend created here is
        #Rbd; the 'disk' argument becomes the device name suffix:
        #'uuid_disk'
        backend = image('disk')

        #on a normal boot, task_state is spawning at this point
        if instance.task_state == task_states.RESIZE_FINISH:
            backend.create_snap(libvirt_utils.RESIZE_SNAPSHOT_NAME)

        #Rbd supports the clone operation
        if backend.SUPPORTS_CLONE:
            def clone_fallback_to_fetch(*args, **kwargs):
                try:
                    backend.clone(context, disk_images['image_id'])
                except exception.ImageUnacceptable:
                    #if clone raises, fall back to fetch_image to
                    #download the image
                    libvirt_utils.fetch_image(*args, **kwargs)
            fetch_func = clone_fallback_to_fetch
        else:
            #with an lvm backend, for example, this branch is taken
            fetch_func = libvirt_utils.fetch_image

        #_try_fetch_image_cache directly calls the backend.cache
        #(here Rbd.cache) method to download the image from glance,
        #create the system disk and upload it to the storage backend;
        #on an ImageNotFound exception it retries the fetch from
        #fallback_from_host
        self._try_fetch_image_cache(backend, fetch_func, context,
                                    root_fname,
                                    disk_images['image_id'],
                                    instance, size,
                                    fallback_from_host)
    ......
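A note on root_fname: in Liberty, imagecache.get_cache_fname boils down to a SHA-1 hex digest of the image id, which is why the _base cache entries seen below are 40-character hex names. A standalone sketch of the idea (illustrative only):

import hashlib

def cache_fname_sketch(image_id):
    # hash the image id so cache entries get stable,
    # filesystem-safe names
    return hashlib.sha1(image_id.encode('utf-8')).hexdigest()

# prints a 40-hex-digit name, like the entries that show up under
# /opt/stack/data/nova/instances/_base/ below
print(cache_fname_sketch('226bc6e5-60d7-4a2c-bf0d-a568a1e26e00'))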

Now let's look at the implementation of nova/virt/libvirt/imagebackend.py/Rbd.cache:

def cache(self, fetch_func, filename, size=None, *args, **kwargs):
    @utils.synchronized(filename, external=True,
                        lock_path=self.lock_path)
    def fetch_func_sync(target, *args, **kwargs):
        # The image may have been fetched while a subsequent
        # call was waiting to obtain the lock.
        if not os.path.exists(target):
            fetch_func(target=target, *args, **kwargs)

    #build the local image cache path; instances_path and
    #image_cache_subdirectory_name in nova.conf control where the
    #cache lives. In my environment it is:
    #/opt/stack/data/nova/instances/_base
    #(some readers may have realized this is a spot where a fast
    #device could improve performance!)
    base_dir = os.path.join(CONF.instances_path,
                            CONF.image_cache_subdirectory_name)
    if not os.path.exists(base_dir):
        fileutils.ensure_tree(base_dir)

    #append the file name:
    #/opt/stack/data/nova/instances/_base/filename
    #in my example: /opt/stack/data/nova/instances/_base/
    #cb241933d7daa40a536db47d41376dd03a83b517
    base = os.path.join(base_dir, filename)

    #if the image does not exist yet (usually the case), download it
    #from glance (existence is checked via RBDDriver.exists)
    if not self.check_image_exists() or not os.path.exists(base):
        #fetch_func_sync is the mutex-protected version of fetch_func;
        #the analysis continues with create_image
        self.create_image(fetch_func_sync, base, size,
                          *args, **kwargs)

    #Rbd does not support fallocate
    if (size and self.preallocate and self._can_fallocate() and
            os.access(self.path, os.W_OK)):
        utils.execute('fallocate', '-n', '-l', size, self.path)

----------------------------------------------------------

#nova/virt/libvirt/imagebackend.py/Rbd.create_image
def create_image(self, prepare_template, base, size, *args, **kwargs):
    """Download the image from glance if it is not in the local cache,
    otherwise import it straight from the local cache.
    The input parameter prepare_template points to fetch_func_sync;
    the call chain (ignoring decorators) is:
    prepare_template(fetch_func_sync)
        -> fetch_func(clone_fallback_to_fetch)
            -> Rbd.clone
                -> libvirt_utils.fetch_image
                   (only if clone raised, e.g. because the image is
                    in qcow format)
    See the analysis of clone below.
    """
    if not self.check_image_exists():
        prepare_template(target=base, max_size=size, *args, **kwargs)

    # prepare_template() may have cloned the image into a new rbd
    # image already instead of downloading it locally
    #
    #after prepare_template has downloaded the image to the local
    #cache (if it was not there already), RBDDriver runs `rbd import`
    #to upload it to nova's storage backend.
    #If the image is in raw format it is never cached locally at all:
    #rbd clones it directly between rbd pools. By now you can see why,
    #with rbd as the glance and nova backend, images should be raw!
    if not self.check_image_exists():
        self.driver.import_image(base, self.rbd_name)
    self.verify_base_size(base, size)

    if size and size > self.get_disk_size(self.rbd_name):
        self.driver.resize(self.rbd_name, size)

---------------------------------------------------------

#if check_image_exists finds no image in the backend, the following
#clone call is triggered
def clone(self, context, image_id_or_uri):
    #fetch the image metadata through glanceclient
    image_meta = IMAGE_API.get(context, image_id_or_uri,
                               include_locations=True)
    """
    [
    {'url': u'rbd://1ee20ded-caae-419d-9fe3-5919f129cf55/images/226bc6e5-60d7-4a2c-bf0d-a568a1e26e00/snap',
     'metadata': {}}
    ]
    """
    locations = image_meta['locations']
    LOG.debug('Image locations are: %(locs)s' % {'locs': locations})

    #my image is in qcow2 format, so the exception below is raised.
    #If rbd is nova's storage backend, it is best to upload raw images
    #(as the later analysis shows, non-raw images get converted to
    #raw, which costs performance).
    #Remember from LibvirtDriver._create_image: if clone raises,
    #libvirt_utils.fetch_image is called instead. This is where that
    #takes effect.
    if image_meta.get('disk_format') not in ['raw', 'iso']:
        reason = _('Image is not raw format')
        raise exception.ImageUnacceptable(image_id=image_id_or_uri,
                                          reason=reason)

    #for raw images, execution continues here
    for location in locations:
        #check whether the location is cloneable (raw images are);
        #if so, clone the image directly from the source pool to the
        #destination pool
        if self.driver.is_cloneable(location, image_meta):
            return self.driver.clone(location, self.rbd_name)

    #otherwise raise
    reason = _('No image locations are accessible')
    raise exception.ImageUnacceptable(image_id=image_id_or_uri,
                                      reason=reason)

-----------------------------------------------------------

"""As noted above: for non-raw images Rbd.clone raises, and
libvirt_utils.fetch_image is called again to download the image; that
method directly calls nova/virt/images.py/fetch_to_raw. Let's take a
look:
"""
def fetch_to_raw(context, image_href, path, user_id,
                 project_id, max_size=0):
    """
    1. Download the image from glance to the local file
       'hash(image_id).part'
    2. If necessary, convert the image to raw format, saved as
       'hash(image_id).converted'
    3. Delete 'hash(image_id).part' and rename
       'hash(image_id).converted' to 'hash(image_id)'
    """
    #path is the `base` from Rbd.cache earlier; in my example:
    #/opt/stack/data/nova/instances/_base/
    #cb241933d7daa40a536db47d41376dd03a83b517
    path_tmp = "%s.part" % path

    #download the image from glance via glanceclient and store it at
    #path_tmp
    fetch(context, image_href, path_tmp, user_id, project_id,
          max_size=max_size)

    with fileutils.remove_path_on_error(path_tmp):
        #run `qemu-img info` to inspect the downloaded image file
        data = qemu_img_info(path_tmp)

        #image format
        fmt = data.file_format
        if fmt is None:
            raise exception.ImageUnacceptable(
                reason=_("'qemu-img info' parsing failed."),
                image_id=image_href)

        #backing files are not supported
        backing_file = data.backing_file
        if backing_file is not None:
            raise exception.ImageUnacceptable(image_id=image_href,
                reason=(_("fmt=%(fmt)s backed by: %(backing_file)s") %
                        {'fmt': fmt, 'backing_file': backing_file}))

        # We can't generally shrink incoming images, so disallow
        # images > size of the flavor we're booting.  Checking here
        # avoids an immediate DoS where we convert large qcow images
        # to raw (which may compress well but not be sparse).
        # TODO(p-draigbrady): loop through all flavor sizes, so that
        # we might continue here and not discard the download.
        # If we did that we'd have to do the higher level size checks
        # irrespective of whether the base image was prepared or not.
        disk_size = data.virtual_size
        if max_size and max_size < disk_size:
            LOG.error(_LE('%(base)s virtual size %(disk_size)s '
                          'larger than flavor root disk size %(size)s'),
                      {'base': path,
                       'disk_size': disk_size,
                       'size': max_size})
            raise exception.FlavorDiskSmallerThanImage(
                flavor_size=max_size, image_size=disk_size)

        #if the image is not raw, force-convert it to raw
        if fmt != "raw" and CONF.force_raw_images:
            staged = "%s.converted" % path
            LOG.debug("%s was %s, converting to raw" %
                      (image_href, fmt))
            with fileutils.remove_path_on_error(staged):
                try:
                    #run `qemu-img convert` to convert the non-raw
                    #image downloaded to path_tmp into raw format,
                    #stored in the staged file
                    convert_image(path_tmp, staged, fmt, 'raw')
                except exception.ImageUnacceptable as exp:
                    # re-raise to include image_href
                    raise exception.ImageUnacceptable(
                        image_id=image_href,
                        reason=_("Unable to convert image to "
                                 "raw: %(exp)s") % {'exp': exp})

                #delete the original non-raw download
                os.unlink(path_tmp)

                #run `qemu-img info` on the converted image file and
                #raise if it is still not raw
                data = qemu_img_info(staged)
                if data.file_format != "raw":
                    raise exception.ImageUnacceptable(
                        image_id=image_href,
                        reason=_("Converted to raw, but format is "
                                 "now %s") % data.file_format)

                #rename the converted image file
                os.rename(staged, path)
        else:
            os.rename(path_tmp, path)
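To make the flow easier to follow outside of nova, here is a simplified standalone sketch of what fetch_to_raw does, driving qemu-img directly (the download callable and paths are hypothetical; the real code adds the size checks, locking and error handling shown above):

import json
import os
import subprocess

def fetch_to_raw_sketch(download, path):
    """download: hypothetical callable that fetches the glance image
    to the given local path."""
    path_tmp = '%s.part' % path
    download(path_tmp)

    # inspect the downloaded file, like nova's qemu_img_info helper
    out = subprocess.check_output(
        ['qemu-img', 'info', '--output=json', path_tmp])
    fmt = json.loads(out)['format']

    if fmt != 'raw':
        # convert via a staging file, then rename into place
        staged = '%s.converted' % path
        subprocess.check_call(
            ['qemu-img', 'convert', '-f', fmt, '-O', 'raw',
             path_tmp, staged])
        os.unlink(path_tmp)
        os.rename(staged, path)
    else:
        os.rename(path_tmp, path)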

To summarize: the above walked through how the system disk is created with ceph rbd as the storage backend. A few key points:

  • When ceph rbd is the storage backend, prefer raw format images
  • If for some reason you must use qcow2 or a similar image format, put the _base cache directory on a fast device to speed up instance launches

Creating/configuring the non-system disks

Back to nova/virt/libvirt/driver.py/LibvirtDriver._create_image:

def _create_image(self, context, instance,
                  disk_mapping, suffix='',
                  disk_images=None, network_info=None,
                  block_device_info=None, files=None,
                  admin_pass=None, inject_files=True,
                  fallback_from_host=None):
    """First, the disk_mapping parameter, which defines three devices:
    disk_mapping: {
    'disk.config': {'bus': 'ide', 'type': 'cdrom', 'dev': 'hdd'},
    'disk': {'bus': 'virtio', 'boot_index': '1',
             'type': 'disk', 'dev': u'vda'},
    'root': {'bus': 'virtio', 'boot_index': '1',
             'type': 'disk', 'dev': u'vda'}}
    """
    #disk_mapping contains none of the disks below, and their handling
    #is similar to the system disk creation above, so the
    #`disk.local`, `disk.swap` and `ephemerals` code is skipped here
    .......

    # Config drive (used by default)
    if configdrive.required_by(instance):
        LOG.info(_LI('Using config drive'), instance=instance)
        extra_md = {}
        #admin password
        if admin_pass:
            extra_md['admin_pass'] = admin_pass

        #input parameter files=[]; network_info holds the detailed
        #network configuration; instance is an InstanceV2 object with
        #the full instance details.
        #Collect the instance's configuration into an
        #InstanceMetadata object
        inst_md = instance_metadata.InstanceMetadata(instance,
                      content=files, extra_md=extra_md,
                      network_info=network_info)
        with configdrive.ConfigDriveBuilder(instance_md=inst_md) \
                as cdb:
            #build the config drive path:
            #CONF.instances_path/instance.uuid/disk.config
            #CONF.instances_path can be set in nova.conf
            configdrive_path = \
                self._get_disk_config_path(instance, suffix)
            LOG.info(_LI('Creating config drive at %(path)s'),
                     {'path': configdrive_path},
                     instance=instance)
            try:
                #ConfigDriveBuilder.make_drive creates the config
                #drive; internally it runs the CONF.mkisofs_cmd tool
                #(genisoimage by default) to build the
                #configdrive_path file holding the instance's
                #configuration
                cdb.make_drive(configdrive_path)
            except processutils.ProcessExecutionError as e:
                with excutils.save_and_reraise_exception():
                    LOG.error(_LE('Creating config drive '
                                  'failed with error: %s'),
                              e, instance=instance)
        try:
            # Tell the storage backend about the config drive
            #create the config drive backend by type; my example uses
            #rbd, so an Rbd instance is created (otherwise Raw)
            config_drive_image = self.image_backend.image(
                instance, 'disk.config' + suffix,
                self._get_disk_config_image_type())

            #this runs `rbd import` to import the configdrive_path
            #file into ceph (disk name: instance_uuid_disk.config)
            config_drive_image.import_file(
                instance, configdrive_path,
                'disk.config' + suffix)
        finally:
            # NOTE(mikal): if the config drive was imported into RBD,
            # then we no longer need the local copy
            #delete the local config drive file
            if CONF.libvirt.images_type == 'rbd':
                os.unlink(configdrive_path)

    # File injection only if needed
    #by default inject_partition=-2, i.e. injecting the configuration
    #straight into the disk is disabled; also, injection is not
    #supported for volume-backed instances
    elif inject_files and CONF.libvirt.inject_partition != -2:
        if booted_from_volume:
            LOG.warn(_LW('File injection into a boot from '
                         'volume instance is not supported'),
                     instance=instance)
        #inject into the system disk; see the code under
        #nova/virt/disk/vfs, implemented mainly with the guestfs
        #module
        self._inject_data(
            instance, network_info, admin_pass, files, suffix)

    #usually virt_type=kvm; with uml the disk must be owned by root
    if CONF.libvirt.virt_type == 'uml':
        libvirt_utils.chown(image('disk').path, 'root')
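For completeness: the config drive produced here appears inside the guest as a volume labelled config-2, holding the metadata that InstanceMetadata packed in. A hedged usage sketch, run from inside the instance (assumes the standard OpenStack metadata layout and that label lookup is available to mount):

import json
import subprocess

# inside the guest: mount the config drive by its 'config-2' label
subprocess.check_call(['mkdir', '-p', '/mnt/config'])
subprocess.check_call(['mount', '-L', 'config-2', '/mnt/config'])

# read back the metadata that make_drive packed in
with open('/mnt/config/openstack/latest/meta_data.json') as f:
    meta = json.load(f)
print(meta.get('uuid'), meta.get('admin_pass'))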

Generating the libvirt XML configuration

With the _create_image method above, all the disk devices are configured. Now for the generation of the libvirt XML:

#nova/virt/libvirt/driver.py/LibvirtDriver._get_guest_xml
def _get_guest_xml(self, context, instance, network_info, disk_info,
                   image_meta, rescue=None,
                   block_device_info=None,
                   write_to_disk=False):
    # NOTE(danms): Stringifying a NetworkInfo will take a lock. Do
    # this ahead of time so that we don't acquire it while also
    # holding the logging lock.
    #
    #The logic is straightforward:
    #1. build the guest configuration dict from the settings
    #2. convert the configuration dict to XML
    #3. save the XML locally
    network_info_str = str(network_info)
    msg = ('Start _get_guest_xml '
           'network_info=%(network_info)s '
           'disk_info=%(disk_info)s '
           'image_meta=%(image_meta)s rescue=%(rescue)s '
           'block_device_info=%(block_device_info)s' %
           {'network_info': network_info_str,
            'disk_info': disk_info,
            'image_meta': image_meta, 'rescue': rescue,
            'block_device_info': block_device_info})
    # NOTE(mriedem): block_device_info can contain auth_password so
    # we need to sanitize the password in the message.
    LOG.debug(strutils.mask_password(msg), instance=instance)

    conf = self._get_guest_config(instance, network_info, image_meta,
                                  disk_info, rescue,
                                  block_device_info, context)
    #convert the guest configuration to XML
    xml = conf.to_xml()

    #write it to the local disk
    if write_to_disk:
        instance_dir = libvirt_utils.get_instance_path(instance)
        #save the XML to CONF.instances_path/instance_uuid/libvirt.xml
        xml_path = os.path.join(instance_dir, 'libvirt.xml')
        libvirt_utils.write_to_file(xml_path, xml)

    LOG.debug('End _get_guest_xml xml=%(xml)s',
              {'xml': xml}, instance=instance)
    return xml
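The NOTE(mriedem) about sanitizing is worth a tiny illustration: oslo_utils.strutils.mask_password scrubs password-like values from a log message before it is emitted. A minimal example (output shape approximate):

from oslo_utils import strutils

msg = "block_device_info={'auth_password': u's3cret'}"
# password-like values are replaced with '***' before logging
print(strutils.mask_password(msg))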

_get_guest_xml is fairly simple, so it is not analyzed further here; readers with questions are welcome to contact me to discuss it.

Starting the instance

The function is implemented as follows:

def _create_domain_and_network(self, context, xml, instance,
                               network_info, disk_info,
                               block_device_info=None,
                               power_on=True, reboot=False,
                               vifs_already_plugged=False):
    #the key input parameters:
    """
    disk_info:
    {
    'disk_bus': 'virtio', 'cdrom_bus': 'ide',
    'mapping': {
        'disk.config': {'bus': 'ide', 'type': 'cdrom',
                        'dev': 'hdd'},
        'disk': {'bus': 'virtio', 'boot_index': '1',
                 'type': 'disk', 'dev': u'vda'},
        'root': {'bus': 'virtio',
                 'boot_index': '1', 'type': 'disk', 'dev': u'vda'}
        }
    }

    block_device_info:
    {
        'swap': None, 'root_device_name': u'/dev/vda',
        'ephemerals': [], 'block_device_mapping': []
    }

    network_info: the instance's network configuration
    [VIF({'profile': {}, 'ovs_interfaceid': None,
    'preserve_on_delete': False,
    'network': Network({'bridge': u'brq20f5ec1b-4f', 'subnets':
    [Subnet({'ips': [FixedIP({'meta': {}, 'version': 4, 'type':
    'fixed', 'floating_ips': [], 'address':
    u'xx.xxx.xxx.xxx'})], 'version': 4, 'meta': {'dhcp_server':
    u'xx.xxx.xxx.xxx'}, 'dns': [], 'routes': [], 'cidr':
    u'xx.xxx.xxx.0/xxx', 'gateway': IP({'meta': {}, 'version':
    4, 'type': 'gateway', 'address': u'10.240.227.1'})})],
    'meta': {'injected': False, 'tenant_id':
    u'25520b29dce346d38bc4b055c5ffbfcb',
    'should_create_bridge': True}, 'id': u'20f5ec1b-4f96-41d8-
    97f3-6776db0d00a7', 'label': u'10.240.227.x'}), 'devname':
    u'tapefe77b47-fe', 'vnic_type': u'normal', 'qbh_params':
    None, 'meta': {}, 'details': {u'port_filter': True},
    'address': u'fa:16:3e:5e:64:80', 'active': False, 'type':
    u'bridge', 'id': u'efe77b47-fef8-48ff-93ee-8da753a6d2bb',
    'qbg_params': None})]
    """
    #get the block device mapping; from the input above we know
    #block_device_mapping=[]
    block_device_mapping = driver.block_device_info_get_mapping(
        block_device_info)

    #get the image metadata
    image_meta = objects.ImageMeta.from_instance(instance)

    #if disk encryption is enabled, encrypt the disks with the
    #configured algorithm; block_device_mapping=[] here, so the
    #related code is skipped
    for vol in block_device_mapping:
        .......

    #vif_plugging_timeout=300 (5 minutes by default)
    #check for neutron network events: if a vif is not yet active,
    #the plug events must be handled. In my example events is:
    #[('network-vif-plugged',
    #  u'efe77b47-fef8-48ff-93ee-8da753a6d2bb')]
    timeout = CONF.vif_plugging_timeout
    if (self._conn_supports_start_paused and
            utils.is_neutron() and not
            vifs_already_plugged and power_on and timeout):
        events = self._get_neutron_events(network_info)
    else:
        events = []

    #pause = True
    pause = bool(events)
    guest = None

    #try/except handling omitted
    #the virtual NICs must be ready before the instance starts.
    #ComputeVirtAPI.wait_for_instance_event handles the neutron
    #network events, here network-vif-plugged: it spawns an eventlet
    #thread to process the events and waits for completion; on
    #failure, self._neutron_failed_callback is invoked.
    with self.virtapi.wait_for_instance_event(
            instance, events, deadline=timeout,
            error_callback=self._neutron_failed_callback):
        #plug the virtual NICs (I am using bridge networking, so this
        #ends up in LibvirtGenericVIFDriver.plug_bridge)
        """A quick outline: plug_vifs dispatches on the vif type
        (bridge in my example), so the concrete call chain is:
        self.plug_vifs ->
        nova/virt/libvirt/vif.py/LibvirtGenericVIFDriver.plug
        -> LibvirtGenericVIFDriver.plug_bridge ->
        nova/network/linux_net.py/
        LinuxBridgeInterfaceDriver.ensure_bridge; the bridge is
        ultimately created with the brctl tool. Readers can explore
        the implementation themselves.
        """
        self.plug_vifs(instance, network_info)

        #set up the basic iptables rules
        self.firewall_driver.setup_basic_filtering(instance,
                                                   network_info)
        #set up the instance's network filtering/firewall rules
        self.firewall_driver.prepare_instance_filter(instance,
                                                     network_info)
        with self._lxc_disk_handler(instance, image_meta,
                                    block_device_info, disk_info):
            #call the libvirt library to start the VM; xml is the
            #guest XML, pause=True, power_on=True.
            #I am using qemu-kvm, so this first connects to the
            #hypervisor via qemu:///system, then defines the domain,
            #and finally starts the instance
            guest = self._create_domain(
                xml, pause=pause, power_on=power_on)

        #no-op
        self.firewall_driver.apply_instance_filter(instance,
                                                   network_info)

    # Resume only if domain has been paused
    if pause:
        guest.resume()
    return guest
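What _create_domain does with pause=True can be pictured with the raw libvirt bindings. A hedged sketch (nova actually goes through its own Guest/Host wrappers and adds error handling):

import libvirt

def create_domain_sketch(xml, pause=True):
    # keep the connection open for the lifetime of the returned domain
    conn = libvirt.open('qemu:///system')
    # persist the domain definition, like `virsh define`
    dom = conn.defineXML(xml)
    # start it, paused if vif plugging still has to complete
    flags = libvirt.VIR_DOMAIN_START_PAUSED if pause else 0
    dom.createWithFlags(flags)
    return dom

# later, once the network-vif-plugged events have arrived:
# dom.resume()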

If all goes well, control returns to LibvirtDriver.spawn, which waits for the instance to finish booting. Once the VM is up, execution returns to _build_and_run_instance, which at its end updates the instance state, writes to the database, and sends a notification so the scheduler can update its resource usage.

All in all, the interactions between the modules during instance launch are fairly complex, with many details to consider; they are well worth taking the time to digest.
