123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468 |
- # Library for manipulations with qcow2 image
- #
- # Copyright (c) 2020 Virtuozzo International GmbH.
- # Copyright (C) 2012 Red Hat, Inc.
- #
- # This program is free software; you can redistribute it and/or modify
- # it under the terms of the GNU General Public License as published by
- # the Free Software Foundation; either version 2 of the License, or
- # (at your option) any later version.
- #
- # This program is distributed in the hope that it will be useful,
- # but WITHOUT ANY WARRANTY; without even the implied warranty of
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- # GNU General Public License for more details.
- #
- # You should have received a copy of the GNU General Public License
- # along with this program. If not, see <http://www.gnu.org/licenses/>.
- #
- import struct
- import string
- import json
class ComplexEncoder(json.JSONEncoder):
    """JSON encoder that serializes objects through their to_json() method."""

    def default(self, obj):
        """Return a JSON-serializable stand-in for obj.

        Objects exposing a to_json attribute are converted by calling it;
        everything else is handed to the stock JSONEncoder, which raises
        TypeError for unsupported types.
        """
        if not hasattr(obj, 'to_json'):
            return super().default(obj)
        return obj.to_json()
class Qcow2Field:
    """Wrapper around a raw field value that controls how it is printed."""

    def __init__(self, value):
        # Raw value as unpacked from the image; subclasses interpret it.
        self.value = value

    def __str__(self):
        """Return the plain string form of the wrapped value."""
        return '{!s}'.format(self.value)
class Flags64(Qcow2Field):
    """Field printed as the list of set bit positions (bits 0..63)."""

    def __str__(self):
        """Return str() of the list of bit indices that are set in value."""
        set_bits = [pos for pos in range(64) if self.value & (1 << pos)]
        return str(set_bits)
class BitmapFlags(Qcow2Field):
    """Bitmap flags field printed as a hex value plus a list of flag names."""

    # Known flag masks and their names; other set bits print as 'bit-N'.
    flags = {
        0x1: 'in-use',
        0x2: 'auto'
    }

    def __str__(self):
        """Return '<hex value> (<list of names>)' for the bits set in value."""
        names = []
        for position in range(64):
            mask = 1 << position
            if not self.value & mask:
                continue
            names.append(self.flags.get(mask, f'bit-{position}'))
        return f'{self.value:#x} ({names})'
class Enum(Qcow2Field):
    """Field printed as its hex value followed by a symbolic name.

    Subclasses must provide a ``mapping`` dict from value to name; this class
    does not define one itself.
    """

    def __str__(self):
        """Return '<hex value> (<name>)', with '<unknown>' for unmapped values."""
        label = self.mapping.get(self.value, "<unknown>")
        return f'{self.value:#x} ({label})'
class Qcow2StructMeta(type):
    """Metaclass that derives a struct format string from a class's fields."""

    # Mapping from c types to python struct format
    ctypes = {
        'u8': 'B',
        'u16': 'H',
        'u32': 'I',
        'u64': 'Q'
    }

    def __init__(cls, name, bases, attrs):
        """Set cls.fmt when the class body itself declares ``fields``.

        The format is big-endian ('>') followed by one struct code per field,
        looked up from the c-type in the first element of each field tuple.
        Classes that do not declare ``fields`` are left untouched.
        """
        if 'fields' not in attrs:
            return
        codes = [cls.ctypes[field[0]] for field in cls.fields]
        cls.fmt = '>' + ''.join(codes)
class Qcow2Struct(metaclass=Qcow2StructMeta):
    """Qcow2Struct: base class for qcow2 data structures

    Successors should define fields class variable, which is: list of tuples,
    each of three elements:
        - c-type (one of 'u8', 'u16', 'u32', 'u64')
        - format: either a format string applied with .format() when
          dumping, or a callable whose result is printed via str()
        - field name

    The metaclass turns the c-types into the big-endian struct format stored
    in the ``fmt`` class attribute.
    """

    def __init__(self, fd=None, offset=None, data=None):
        """
        Two variants:
            1. Specify data. fd and offset must be None.
            2. Specify fd and offset, data must be None. offset may be omitted
               in this case, then current position of fd is used.

        The unpacked values replace the instance __dict__, keyed by field
        name.
        """
        if data is not None:
            assert fd is None and offset is None
        else:
            assert fd is not None
            size = struct.calcsize(self.fmt)
            if offset is not None:
                fd.seek(offset)
            data = fd.read(size)

        unpacked = struct.unpack(self.fmt, data)
        self.__dict__ = {
            name: value
            for (_ctype, _fmt, name), value in zip(self.fields, unpacked)
        }

    def dump(self, is_json=False):
        """Print the fields, either as indented JSON or one per line."""
        if is_json:
            print(json.dumps(self.to_json(), indent=4, cls=ComplexEncoder))
            return

        for _ctype, presenter, name in self.fields:
            raw = self.__dict__[name]
            if isinstance(presenter, str):
                rendered = presenter.format(raw)
            else:
                # Non-string presenters are callables (e.g. field wrapper
                # classes) whose str() gives the printable form.
                rendered = str(presenter(raw))
            print(f'{name:<25} {rendered}')

    def to_json(self):
        """Return a dict of the declared fields and their raw values."""
        return {field[2]: self.__dict__[field[2]] for field in self.fields}
class Qcow2BitmapExt(Qcow2Struct):
    """Bitmaps header extension body together with its bitmap directory."""

    fields = (
        ('u32', '{}', 'nb_bitmaps'),
        ('u32', '{}', 'reserved32'),
        ('u64', '{:#x}', 'bitmap_directory_size'),
        ('u64', '{:#x}', 'bitmap_directory_offset')
    )

    def __init__(self, fd, cluster_size):
        """Read the extension at fd's current position, then its directory.

        After the fixed fields are read, fd is advanced past any padding up
        to an 8-byte boundary. The bitmap directory is then loaded from its
        own offset and fd is moved back to the post-padding position.
        """
        super().__init__(fd=fd)
        pad = -struct.calcsize(self.fmt) % 8
        if pad:
            fd.seek(pad, 1)
        resume_at = fd.tell()
        self.cluster_size = cluster_size
        self.read_bitmap_directory(fd)
        fd.seek(resume_at)

    def read_bitmap_directory(self, fd):
        """Load nb_bitmaps directory entries from bitmap_directory_offset."""
        fd.seek(self.bitmap_directory_offset)
        directory = []
        for _ in range(self.nb_bitmaps):
            directory.append(
                Qcow2BitmapDirEntry(fd, cluster_size=self.cluster_size))
        self.bitmap_directory = directory

    def dump(self):
        """Print the extension fields, then each directory entry."""
        super().dump()
        for bitmap in self.bitmap_directory:
            print()
            bitmap.dump()

    def to_json(self):
        """Return the field dict extended with the 'bitmap_directory' list."""
        result = super().to_json()
        result['bitmap_directory'] = self.bitmap_directory
        return result
class Qcow2BitmapDirEntry(Qcow2Struct):
    """One bitmap directory entry: fixed fields, name and bitmap table."""

    fields = (
        ('u64', '{:#x}', 'bitmap_table_offset'),
        ('u32', '{}', 'bitmap_table_size'),
        ('u32', BitmapFlags, 'flags'),
        ('u8', '{}', 'type'),
        ('u8', '{}', 'granularity_bits'),
        ('u16', '{}', 'name_size'),
        ('u32', '{}', 'extra_data_size')
    )

    def __init__(self, fd, cluster_size):
        """Read one entry at fd's current position and load its bitmap table.

        fd is left at the end of the entry, including the padding that
        rounds the entry size up to a multiple of 8 bytes.
        """
        super().__init__(fd=fd)
        self.cluster_size = cluster_size

        # The extra data sits between the fixed fields and the name; skip it
        # with a seek relative to the current position.
        fd.seek(self.extra_data_size, 1)
        raw_name = fd.read(self.name_size)
        self.name = raw_name.decode('ascii')

        # Move position to the end of the entry in the directory
        raw_size = self.bitmap_dir_entry_raw_size()
        fd.seek(-raw_size % 8, 1)

        self.bitmap_table = Qcow2BitmapTable(
            fd=fd,
            offset=self.bitmap_table_offset,
            nb_entries=self.bitmap_table_size,
            cluster_size=self.cluster_size)

    def bitmap_dir_entry_raw_size(self):
        """Return the unpadded entry size: fixed fields + name + extra data."""
        fixed_size = struct.calcsize(self.fmt)
        return fixed_size + self.name_size + self.extra_data_size

    def dump(self):
        """Print the bitmap name, the entry fields and the bitmap table."""
        print(f'{"Bitmap name":<25} {self.name}')
        super().dump()
        self.bitmap_table.dump()

    def to_json(self):
        """Return the entry as a dict with 'name' first, table last."""
        # Put the name ahead of the dict
        result = {'name': self.name}
        result.update(super().to_json())
        result['bitmap_table'] = self.bitmap_table
        return result
class Qcow2BitmapTableEntry(Qcow2Struct):
    """Single 64-bit bitmap table entry, decoded into offset, flag and type."""

    fields = (
        ('u64', '{}', 'entry'),
    )

    BME_TABLE_ENTRY_RESERVED_MASK = 0xff000000000001fe
    BME_TABLE_ENTRY_OFFSET_MASK = 0x00fffffffffffe00
    BME_TABLE_ENTRY_FLAG_ALL_ONES = 1

    def __init__(self, fd):
        """Read one entry at fd's current position and classify it.

        type is 'serialized' (offset set, flag clear), 'invalid' (offset and
        flag both set), 'all-ones' (flag only) or 'all-zeroes' (neither).
        """
        super().__init__(fd=fd)
        self.reserved = self.entry & self.BME_TABLE_ENTRY_RESERVED_MASK
        self.offset = self.entry & self.BME_TABLE_ENTRY_OFFSET_MASK
        all_ones = bool(self.entry & self.BME_TABLE_ENTRY_FLAG_ALL_ONES)
        if self.offset:
            self.type = 'invalid' if all_ones else 'serialized'
        else:
            self.type = 'all-ones' if all_ones else 'all-zeroes'

    def to_json(self):
        """Return the decoded type, offset and reserved bits as a dict."""
        return {
            'type': self.type,
            'offset': self.offset,
            'reserved': self.reserved,
        }
class Qcow2BitmapTable:
    """Bitmap table: a list of table entries read from a given offset."""

    def __init__(self, fd, offset, nb_entries, cluster_size):
        """Read nb_entries entries starting at offset.

        The position fd had on entry is restored afterwards.
        """
        self.cluster_size = cluster_size
        saved_position = fd.tell()
        fd.seek(offset)
        loaded = []
        for _ in range(nb_entries):
            loaded.append(Qcow2BitmapTableEntry(fd))
        self.entries = loaded
        fd.seek(saved_position)

    def dump(self):
        """Print a header row followed by one row per table entry."""
        print(f'{"Bitmap table":<14} {"type":<15} {"size":<12} {"offset"}')
        for index, item in enumerate(self.entries):
            # Only 'serialized' entries are shown with a size (one cluster).
            size = self.cluster_size if item.type == 'serialized' else 0
            print(f'{index:<14} {item.type:<15} {size:<12} {item.offset}')

    def to_json(self):
        """Return the list of entries (serialized via their own to_json)."""
        return self.entries
# Magic of the header extension that is parsed into a Qcow2BitmapExt object
# instead of being kept as raw data.
QCOW2_EXT_MAGIC_BITMAPS = 0x23852875


class QcowHeaderExtension(Qcow2Struct):
    """A qcow2 header extension: magic, length and payload.

    Attributes set by the constructor:
        magic, length: the two header fields.
        data: payload bytes padded to a multiple of 8, or None when the
            payload was parsed into ``obj``.
        obj: parsed Qcow2BitmapExt for the bitmaps extension, otherwise None.
        data_str: printable form of the payload (only when data is not None).
    """

    class Magic(Enum):
        mapping = {
            0xe2792aca: 'Backing format',
            0x6803f857: 'Feature table',
            0x0537be77: 'Crypto header',
            QCOW2_EXT_MAGIC_BITMAPS: 'Bitmaps',
            0x44415441: 'Data file'
        }

        def to_json(self):
            """Return the extension name, or '<unknown>' for unmapped magic."""
            return self.mapping.get(self.value, "<unknown>")

    fields = (
        ('u32', Magic, 'magic'),
        ('u32', '{}', 'length')
        # length bytes of data follows
        # then padding to next multiple of 8
    )

    def __init__(self, magic=None, length=None, data=None, fd=None,
                 cluster_size=None):
        """
        Support both loading from fd and creation from user data.
        For fd-based creation current position in a file will be used to read
        the data.
        The cluster_size value may be obtained by dependent structures.

        Either pass fd (magic, length and data must then be None), or pass
        all of magic, length and data (fd must then be None).

        This should be somehow refactored and functionality should be moved to
        superclass (to allow creation of any qcow2 struct), but then, fields
        of variable length (data here) should be supported in base class
        somehow. Note also, that we probably want to parse different
        extensions. Should they be subclasses of this class, or how to do it
        better? Should it be something like QAPI union with discriminator field
        (magic here). So, it's a TODO. We'll see how to properly refactor this
        when we have more qcow2 structures.
        """
        if fd is None:
            assert all(v is not None for v in (magic, length, data))
            self.magic = magic
            self.length = length
            if length % 8 != 0:
                padding = 8 - (length % 8)
                data += b'\0' * padding
            self.data = data
            # User-supplied extensions are always raw data. Without this
            # attribute dump() and to_json() fail with AttributeError on
            # objects built through this path (e.g. via create()).
            self.obj = None
        else:
            assert all(v is None for v in (magic, length, data))
            super().__init__(fd=fd)
            if self.magic == QCOW2_EXT_MAGIC_BITMAPS:
                self.obj = Qcow2BitmapExt(fd=fd, cluster_size=cluster_size)
                self.data = None
            else:
                # The payload is stored padded to a multiple of 8 bytes.
                padded = (self.length + 7) & ~7
                self.data = fd.read(padded)
                assert self.data is not None
                self.obj = None

        if self.data is not None:
            payload = self.data[:self.length]
            # Encode the printable set once rather than once per byte.
            printable = string.printable.encode('ascii')
            if all(byte in printable for byte in payload):
                data_str = f"'{payload.decode('ascii')}'"
            else:
                data_str = '<binary>'
            self.data_str = data_str

    def dump(self):
        """Print the header fields, then the payload or the parsed object."""
        super().dump()

        if self.obj is None:
            print(f'{"data":<25} {self.data_str}')
        else:
            self.obj.dump()

    def to_json(self):
        """Return a dict with 'name' first, then fields, then the payload.

        The payload is stored under 'data' when it was parsed into an object
        and under 'data_str' otherwise.
        """
        # Put the name ahead of the dict
        res = {'name': self.Magic(self.magic), **super().to_json()}
        if self.obj is not None:
            res['data'] = self.obj
        else:
            res['data_str'] = self.data_str

        return res

    @classmethod
    def create(cls, magic, data):
        """Build an extension from a magic and payload bytes.

        The length field is taken from len(data).
        """
        return cls(magic, len(data), data)
class QcowHeader(Qcow2Struct):
    """The qcow2 image header, its header extensions and backing file name."""

    fields = (
        # Version 2 header fields
        ('u32', '{:#x}', 'magic'),
        ('u32', '{}', 'version'),
        ('u64', '{:#x}', 'backing_file_offset'),
        ('u32', '{:#x}', 'backing_file_size'),
        ('u32', '{}', 'cluster_bits'),
        ('u64', '{}', 'size'),
        ('u32', '{}', 'crypt_method'),
        ('u32', '{}', 'l1_size'),
        ('u64', '{:#x}', 'l1_table_offset'),
        ('u64', '{:#x}', 'refcount_table_offset'),
        ('u32', '{}', 'refcount_table_clusters'),
        ('u32', '{}', 'nb_snapshots'),
        ('u64', '{:#x}', 'snapshot_offset'),

        # Version 3 header fields
        ('u64', Flags64, 'incompatible_features'),
        ('u64', Flags64, 'compatible_features'),
        ('u64', Flags64, 'autoclear_features'),
        ('u32', '{}', 'refcount_order'),
        ('u32', '{}', 'header_length'),
    )

    def __init__(self, fd):
        """Read the header from offset 0, then extensions and backing file."""
        super().__init__(fd=fd, offset=0)
        self.set_defaults()
        self.cluster_size = 1 << self.cluster_bits

        # Header extensions start right after the header itself.
        fd.seek(self.header_length)
        self.load_extensions(fd)

        if self.backing_file_offset:
            fd.seek(self.backing_file_offset)
            self.backing_file = fd.read(self.backing_file_size)
        else:
            self.backing_file = None

    def set_defaults(self):
        """For version 2 images, overwrite the version 3 fields with defaults.

        All fields are always unpacked, so for version 2 the values read for
        the version 3 fields are replaced here.
        """
        if self.version == 2:
            self.incompatible_features = 0
            self.compatible_features = 0
            self.autoclear_features = 0
            self.refcount_order = 4
            self.header_length = 72

    def load_extensions(self, fd):
        """Read header extensions from fd's current position.

        Reading stops at an extension with magic 0 (not stored), or once the
        position reaches the end of the first cluster or the backing file
        name, whichever comes first.
        """
        self.extensions = []

        end = self.cluster_size
        if self.backing_file_offset != 0:
            end = min(end, self.backing_file_offset)

        while fd.tell() < end:
            ext = QcowHeaderExtension(fd=fd, cluster_size=self.cluster_size)
            if ext.magic == 0:
                break
            self.extensions.append(ext)

    def update_extensions(self, fd):
        """Write all extensions, a terminator and the backing file name.

        Writing starts at header_length. backing_file_offset is updated to
        the new location of the backing file name.

        NOTE(review): an extension whose ``data`` is None (the bitmaps
        extension loaded from a file) is passed to fd.write() as-is, which
        presumably fails; confirm before updating such images.

        Raises:
            Exception: if the written data extends past the first cluster.
                The data has already been written at that point.
        """
        fd.seek(self.header_length)

        # Build a separate list for writing: appending the terminator to
        # self.extensions would keep it in memory, so it would show up in
        # dump_extensions() and be written again on every later update.
        terminator = QcowHeaderExtension(0, 0, b'')
        for ex in [*self.extensions, terminator]:
            fd.write(struct.pack('>II', ex.magic, ex.length))
            fd.write(ex.data)

        if self.backing_file is not None:
            self.backing_file_offset = fd.tell()
            fd.write(self.backing_file)

        if fd.tell() > self.cluster_size:
            raise Exception('I think I just broke the image...')

    def update(self, fd):
        """Write extensions and then the header fields back to fd.

        At most header_length bytes of the packed header are written, so the
        extensions that follow the header are not overwritten.
        """
        header_bytes = self.header_length

        # Extensions go first: this may change backing_file_offset, which is
        # part of the header packed below.
        self.update_extensions(fd)

        fd.seek(0)
        header = tuple(self.__dict__[f] for t, p, f in QcowHeader.fields)
        buf = struct.pack(QcowHeader.fmt, *header)
        # Keep exactly header_bytes bytes. The previous slice ended at
        # header_bytes - 1 and so dropped the last byte of the header.
        buf = buf[:header_bytes]
        fd.write(buf)

    def dump_extensions(self, is_json=False):
        """Print all loaded extensions, as JSON or in text form."""
        if is_json:
            print(json.dumps(self.extensions, indent=4, cls=ComplexEncoder))
            return

        for ex in self.extensions:
            print('Header extension:')
            ex.dump()
            print()
|