基于镜像卷启动的虚机快照代码分析
基于ocata版本进行跟踪分析
1、nova-api接受并处理请求的入口函数nova/api/openstack/compute/servers.py/ServersController._action_create_image
nova/api/openstack/compute/servers.py class ServersController(wsgi.Controller): @wsgi.action('createImage') @common.check_snapshots_enabled @validation.schema(schema_servers.create_image, '2.0', '2.0') @validation.schema(schema_servers.create_image, '2.1') def _action_create_image(self, req, id, body): """Snapshot a server instance.""" # 从req中获取请求的上下文,并验证执行权限 context = req.environ['nova.context'] context.can(server_policies.SERVERS % 'create_image') # 从body中解析出传递的参数,快照名称及属性信息 entity = body["createImage"] image_name = common.normalize_name(entity["name"]) metadata = entity.get('metadata', {}) # Starting from microversion 2.39 we don't check quotas on createImage if api_version_request.is_supported( req, max_version= api_version_request.MAX_IMAGE_META_PROXY_API_VERSION): # 检查快照属性的相关配额信息 common.check_img_metadata_properties_quota(context, metadata) #通过虚机uuid,从数据库中获取虚机实例的信息,返回的是一个实例对象 instance = self._get_server(context, req, id) #从数据库bloack_device_mapping表里面获取该虚机所有的块设备映射信息 bdms = objects.BlockDeviceMappingList.get_by_instance_uuid(context, instance.uuid) try: # 判断虚机是基于镜像启动还是基于磁盘启动 if compute_utils.is_volume_backed_instance(context, instance,bdms): context.can(server_policies.SERVERS %'create_image:allow_volume_backed') #基于磁盘启动的虚机快照入口 image = self.compute_api.snapshot_volume_backed( context, instance, image_name, extra_properties=metadata) else: #基于镜像启动的虚机快照入口 image = self.compute_api.snapshot(context, instance, image_name, extra_properties=metadata) ......... # build location of newly-created image entity image_id = str(image['id']) #根据glance配置为该镜像生成url image_ref = glance.generate_image_url(image_id) resp = webob.Response(status_int=202) resp.headers['Location'] = image_ref return resp
因此可以看到,执行基于磁盘启动虚机快照时,实际走的是“ compute_api.snapshot_volume_backed ”
nova/compute/api.py @profiler.trace_cls("compute_api") class API(base.Base): """API for interacting with the compute manager.""" def snapshot_volume_backed(self, context, instance, name, extra_properties=None): """Snapshot the given volume-backed instance. :param instance: nova.objects.instance.Instance object :param name: name of the backup or snapshot :param extra_properties: dict of extra image properties to include :returns: the new image metadata """ #获取虚机的metadata属性 image_meta = self._initialize_instance_snapshot_metadata(instance, name, extra_properties)------s1步 # the new image is simply a bucket of properties (particularly the # block device mapping, kernel and ramdisk IDs) with no image data, # hence the zero size 新镜像只是一堆属性(特别是块设备映射、内核和ramdisk id),没有映像数据,因此大小为零 image_meta['size'] = 0 for attr in ('container_format', 'disk_format'):---清除镜像metadata属性中的 container_format,disk_format 属性 image_meta.pop(attr, None) properties = image_meta['properties'] # clean properties before filling # 清除properties属性里面的'block_device_mapping', 'bdm_v2', 'root_device_name'相关属性值 for key in ('block_device_mapping', 'bdm_v2', 'root_device_name'): properties.pop(key, None) # 将实例中的‘root_device_name’属性更新到properties属性里,image_meta的最终内容如: # { # 'name': u'snapshot1', # u'min_ram': u'0', # u'min_disk': u'20', # 'is_public': False, # 'properties': { # u'base_image_ref': u'', # 'root_device_name': u'/dev/vda' # }, # 'size': 0 # } if instance.root_device_name: properties['root_device_name'] = instance.root_device_name quiesced = False if instance.vm_state == vm_states.ACTIVE: try: # 判断虚拟机的状态,如果虚拟机处于active,则通过rpc通知虚拟机进入静默状态 self.compute_rpcapi.quiesce_instance(context, instance) quiesced = True except (exception.InstanceQuiesceNotSupported, exception.QemuGuestAgentNotEnabled, exception.NovaException, NotImplementedError) as err: if strutils.bool_from_string(instance.system_metadata.get( 'image_os_require_quiesce')): raise else: LOG.info(_LI('Skipping quiescing instance: ' '%(reason)s.'), {'reason': err}, instance=instance) # 从数据库中获取该虚机所关联的所有块设备,结果会返回一个BlockDeviceMappingList对象 bdms = objects.BlockDeviceMappingList.get_by_instance_uuid(context, instance.uuid) mapping = [] #做快照的操作,虚机挂在了多少个卷设备,就要做多少次快照 for bdm in bdms:--------s2步 #映射关系中没有块设备,则忽略此条映射 if bdm.no_device: continue if bdm.is_volume:----这个读取的是block_device_mapping表里面的destination_type字段 # create snapshot based on volume_id volume = self.volume_api.get(context, bdm.volume_id)----调用cinderclient去,根据卷的volume_id从数据库获取卷的详细信息---s4步 # NOTE(yamahata): Should we wait for snapshot creation? # Linux LVM snapshot creation completes in # short time, it doesn't matter for now. name = _('snapshot for %s') % image_meta['name']----快照的名字进行组装,比如快照名称是snapshot1,则这里就是snapshot for snapshot1 LOG.debug('Creating snapshot from volume %s.', volume['id'], instance=instance) snapshot = self.volume_api.create_snapshot_force(------------s3步,调用cinderclient,给cinder发送强制创建快照的请求 context, volume['id'], name, volume['display_description']) mapping_dict = block_device.snapshot_from_bdm(snapshot['id'],bdm)-----s5步 #过滤掉已经在数据库中存在的字段 mapping_dict = mapping_dict.get_image_mapping() else: mapping_dict = bdm.get_image_mapping() mapping.append(mapping_dict)----将云主机所有的映射关系都添加到mapping中 #通过rpc.case发送异步请求给nova-compute # nova-compute接收到消息后,会等到快照完成后对文件系统进行解冻( if quiesced: self.compute_rpcapi.unquiesce_instance(context, instance, mapping) # 更新云主机metadata信息中的properties信息 if mapping: properties['block_device_mapping'] = mapping properties['bdm_v2'] = True """ #到这一步时,会到添加一条记录到glance快照(镜像)数据库条目 #(会在Dashboard的镜像面板显示一条名为snapshot1的快照记录), # 快照的大部分信息都拷贝至系统盘属性,这是因为卷快照是可以直接用来启动云主机的, # 另外'block_device_mapping'属性中包含所有的volume设备快照信息(如果有的话), # 每个volume设备快照信息作为一条记录,记录在image_properties数据表; # { 'name': u'snapshot1', 'min_ram': u'0', 'min_disk': u'20', 'is_public': False, 'properties': { 'bdm_v2': True, 'block_device_mapping': [{ 'guest_format': None, 'boot_index': 0, 'no_device': None, 'image_id': None, 'volume_id': None, 'device_name': u'/dev/vda', 'disk_bus': u'virtio', 'volume_size': 20, 'source_type': 'snapshot', 'device_type': u'disk', 'snapshot_id': u'cede2421-ea68-4a8e-937d-c27074b9024b', 'destination_type': 'volume', 'delete_on_termination': False }], 'base_image_ref': u'', 'root_device_name': u'/dev/vda' }, 'size': 0 } """ return self.image_api.create(context, image_meta)
s1步,主要作用是根据虚机的镜像元数据初始化该虚机快照的元数据
nova/compute/api.py class API(base.Base): def _initialize_instance_snapshot_metadata(self, instance, name, extra_properties=None): """Initialize new metadata for a snapshot of the given instance. :param instance: nova.objects.instance.Instance object :param name: string for name of the snapshot :param extra_properties: dict of extra metadata properties to include :returns: the new instance snapshot metadata """ image_meta = utils.get_image_from_system_metadata(instance.system_metadata)-------获取虚机的镜像源数据 image_meta.update({'name': name,'is_public': False})----把镜像元数据的中镜像的名字,更改为快照的名字 # Delete properties that are non-inheritable properties = image_meta['properties'] for key in CONF.non_inheritable_image_properties:----删除镜像数据中不能继承的属性, properties.pop(key, None) # The properties in extra_properties have precedence properties.update(extra_properties or {}) return image_meta 返回值为 { u'min_disk': u'20', 'is_public': False, 'min_ram': u'0', 'properties': { 'base_image_ref': u'' }, 'name': u'snapshot1' }
s2 步 block_device_mapping表里面的数据样例
*************************** 376. row *************************** created_at: 2019-07-18 12:35:24 updated_at: 2019-07-18 12:35:46 deleted_at: 2019-07-18 12:35:46 id: 24081 device_name: /dev/vdb delete_on_termination: 0 snapshot_id: NULL volume_id: e6f0ddca-74cf-40c9-8db6-d64f32d8ded4 volume_size: NULL no_device: NULL connection_info: null instance_uuid: f9846a41-72c2-4e67-99d3-8391fae7a3ce deleted: 24081 source_type: volume destination_type: volume guest_format: NULL device_type: NULL disk_bus: NULL boot_index: NULL image_id: NULL tag: NULL *************************** 377. row *************************** created_at: 2019-07-19 03:02:57----------基于镜像启动block_device_mapping形式 updated_at: 2019-07-19 03:02:57 deleted_at: 2019-07-19 03:10:42 id: 24084 device_name: /dev/vda delete_on_termination: 1 snapshot_id: NULL volume_id: NULL volume_size: NULL no_device: 0 connection_info: NULL instance_uuid: 99f10424-2ad3-4cdb-8ca5-ebd166d5853c deleted: 24084 source_type: image destination_type: local guest_format: NULL device_type: disk disk_bus: NULL boot_index: 0 image_id: 3006d221-72a6-4fe0-bcdc-d4ace809d8c7 tag: NULL
s5步 block_device.snapshot_from_bdm(snapshot['id'],bdm)
根据bdm信息,来构建快照的dict格式属性信息,返回一个BlockDeviceDict对象,属性如下: { 'guest_format': None, 'boot_index': 0, 'no_device': None, 'connection_info': None, 'snapshot_id': u'cede2421-ea68-4a8e-937d-c27074b9024b', 'volume_size': 20, 'device_name': u'/dev/vda', 'disk_bus': u'virtio', 'image_id': None, 'source_type': 'snapshot', 'device_type': u'disk', 'volume_id': None, 'destination_type': 'volume', 'delete_on_termination': False }
nova-api主要是 完成了以下工作:
1)如果是在线快照,则冻结/解冻结文件系统
2)创建glance数据库镜像记录(包含所有卷的快照信息)
2、cinder-api服务的相关处理
nova-api服务里面s3步的操作,调用cinder的api create_snapshot_force 创建新的卷,实为cinder api的接受请求,进行相关的处理
其详解如下, from nova.volume import cinder self.volume_api = volume_api or cinder.API() snapshot = self.volume_api.create_snapshot_force(context, volume['id'], name, volume['display_description']) nova/volume/cinder.py def create_snapshot_force(self, context, volume_id, name, description): item = cinderclient(context).volume_snapshots.create(volume_id,True,name,description) return _untranslate_snapshot_summary_view(context, item)
因此可以看出,实际调用的是cinder client的 volume_snapshots 的 create 方法,其在cinder api的入口函数为
cinder/api/v2/snapshots.py class SnapshotsController(wsgi.Controller): @wsgi.response(202) def create(self, req, body): """Creates a new snapshot.""" # 根据上下文的分析,当nova-api等其他client在发送创建卷快照的请求之后,本方法会接受到请求 # 方法接收到的参数有: # req:Request对象,包含有本次请求的上下内容,包含有用于鉴权的凭证等内容 # body:快照的属性信息,包含有如下内容: # { # u'snapshot': { # u'volume_id': u'60e16af2-0684-433c-a1b6-c1af1c2523fc', # u'force': True, # u'description': u'', # u'name': u'snapshot for snapshot1', # u'metadata': {} # } # } kwargs = {} #获取上下文的context信息和获取快照属性中的信息 context = req.environ['cinder.context'] self.assert_valid_body(body, 'snapshot') snapshot = body['snapshot'] #获取快照的metadata信息,snapshot_id kwargs['metadata'] = snapshot.get('metadata', None) try: volume_id = snapshot['volume_id'] except KeyError: msg = _("'volume_id' must be specified") raise exc.HTTPBadRequest(explanation=msg) #从数据库中获取卷信息 volume = self.volume_api.get(context, volume_id) #获取传递进来的参数中是否使用强制快照,force=True表示采取强制快照 force = snapshot.get('force', False) msg = _LI("Create snapshot from volume %s") LOG.info(msg, volume_id) #验证快照名及快照描述是否合法,长度不能超过256个字符 self.validate_name_and_description(snapshot) # NOTE(thingee): v2 API allows name instead of display_name # 用display_name代替name参数 if 'name' in snapshot: snapshot['display_name'] = snapshot.pop('name') try: #参数类型转换,如果是非True/False的值,则抛异常 force = strutils.bool_from_string(force, strict=True) except ValueError as error: err_msg = encodeutils.exception_to_unicode(error) msg = _("Invalid value for 'force': '%s'") % err_msg raise exception.InvalidParameterValue(err=msg) # 开始进行快照的操作,根据force值的不同走不通的分支 if force: new_snapshot = self.volume_api.create_snapshot_force(-----s2.1 context, volume, snapshot.get('display_name'), snapshot.get('description'), **kwargs) else: new_snapshot = self.volume_api.create_snapshot(-----s2.2 context, volume, snapshot.get('display_name'), snapshot.get('description'), **kwargs) req.cache_db_snapshot(new_snapshot) return self._view_builder.detail(req, new_snapshot) """ from cinder import volume self.volume_api = volume.API() """ cinder/volume/api.py class API(base.Base): def create_snapshot_force(self, context, volume, name, description, metadata=None): result = self._create_snapshot(context, volume, name, description, True, metadata) LOG.info(_LI("Snapshot force create request issued successfully."), resource=result) return result def create_snapshot(self, context, volume, name, description, metadata=None, cgsnapshot_id=None, group_snapshot_id=None): result = self._create_snapshot(context, volume, name, description, False, metadata, cgsnapshot_id, group_snapshot_id) LOG.info(_LI("Snapshot create request issued successfully."), resource=result) return result def _create_snapshot(self, context, volume, name, description, force=False, metadata=None, cgsnapshot_id=None, group_snapshot_id=None): #保证卷操作处于冻结状态,并且是可进行快照,检查配额是否可用 volume.assert_not_frozen() #在cinder的snapshot数据表中创建一条快照记录,即会在云硬盘快照面板显示一条名为“snapshot for snapshot1”的记录 snapshot = self.create_snapshot_in_db(----s2.3 context, volume, name, description, force, metadata, cgsnapshot_id, True, group_snapshot_id) # 调用rpc.case将create_snapshot的消息投递到消息队列该消息 self.volume_rpcapi.create_snapshot(context, volume, snapshot)---s2.4 给cinder-volume发送rpc请求信息 return snapshot
可以看到两个方法都是调用了“ _create_snapshot ”,只是在传递第5个参数 force 时不一样,同时force为False时,
需要传递其他几个参数(实际上也为空)
cinder-api的操作总结为如下两个方面:
1)卷状态条件检查及配额检查
2)创建glance数据库快照记录(记录的是单个卷快照的信息)
3、cinder-volume服务对快照的处理
s2.4步中,cinder-api通过rpc给cinder-volume服务发送创建快照的请求,cinder-volume服务接受到请求,并处理,其函数入口为manager.py文件中create_snapshot方法
cinder/volume/manager.py class VolumeManager(manager.CleanableManager, manager.SchedulerDependentManager): """Manages attachable block storage devices.""" @objects.Snapshot.set_workers def create_snapshot(self, context, snapshot): """Creates and exports the snapshot.""" # 获取请求上下文 context = context.elevated() # 通过消息队列,通知ceilometer快照发生变化 self._notify_about_snapshot_usage( context, snapshot, "create.start") try: """异常处理代码,有任何异常则退出并设置快照状态为error""" # NOTE(flaper87): Verify the driver is enabled # before going forward. The exception will be caught # and the snapshot status updated. # 确保存储驱动已经初始化,否则抛出异常 utils.require_driver_initialized(self.driver) # Pass context so that drivers that want to use it, can, # but it is not a requirement for all drivers. snapshot.context = context # 调用后端存储驱动执行快照 model_update = self.driver.create_snapshot(snapshot)---------s3.1 步 # 完成之后,更新数据库条目,若返回的是None,则不执行 if model_update: snapshot.update(model_update) snapshot.save() except Exception as error: # 若之前几步操作出现问题,则将快照的状态置为error with excutils.save_and_reraise_exception(): snapshot.status = fields.SnapshotStatus.ERROR snapshot.save() self.db.snapshot_metadata_update( context, snapshot.id, {'error': six.text_type(error)}, False) # 从cinder的数据库中获取卷的信息 vol_ref = self.db.volume_get(context, snapshot.volume_id) # 如果该卷的bootable属性为True,表示该卷是启动卷,表示云主机是通过卷启动的,即系统盘, # 如果是非启动卷,则跳过 if vol_ref.bootable: try: # 用卷的metadata信息来更新snapshot的metadata信息,需要保证系统盘的元数据与其快照的元数据一致 self.db.volume_glance_metadata_copy_to_snapshot( context, snapshot.id, snapshot.volume_id) except exception.GlanceMetadataNotFound: # 更新snapshot的元数据如果抛出GlanceMetadataNotFound, # 表示从glance中找不到卷的元数据信息,可以直接跳过 # If volume is not created from image, No glance metadata # would be available for that volume in # volume glance metadata table pass except exception.CinderException as ex: LOG.exception(_LE("Failed updating snapshot" " metadata using the provided volumes" " %(volume_id)s metadata"), {'volume_id': snapshot.volume_id}, resource=snapshot) # 如果抛出cinder方面的异常,则有可能是快照出现问题,则直接将快照的状态置为error snapshot.status = fields.SnapshotStatus.ERROR snapshot.save() self.db.snapshot_metadata_update(context, snapshot.id, {'error': six.text_type(ex)}, False) raise exception.MetadataCopyFailure(reason=six.text_type(ex)) # 若一路过来没有出现异常,则代表快照完成,将快照状态标记为可用,进度为100%,并保存状态 snapshot.status = fields.SnapshotStatus.AVAILABLE snapshot.progress = '100%' snapshot.save() # 通过消息队列,通知ceilometer快照完成 self._notify_about_snapshot_usage(context, snapshot, "create.end") LOG.info(_LI("Create snapshot completed successfully"), resource=snapshot) return snapshot.id
从上面的代码中可以找到,执行快照其实是调用底层的后端存储来做的,即s3.1 步的“driver.create_snapshot(snapshot)”,
针对不同的存储类型,会有不同的处理方式
因此cinder-volume服务快照功能很简单:调用后端存储执行快照,然后更新glance数据库快照记录
学习过程中,参考如下博客 https://www.cnblogs.com/qianyeliange/p/9713146.html