# Source code for COT.helpers.api

#!/usr/bin/env python
#
# api.py - API to abstract away operations that require third-party
#          helper software not part of a standard Python distro.
#
# April 2014, Glenn F. Matthews
# Copyright (c) 2013-2015 the COT project developers.
# See the COPYRIGHT.txt file at the top-level directory of this distribution
# and at https://github.com/glennmatthews/cot/blob/master/COPYRIGHT.txt.
#
# This file is part of the Common OVF Tool (COT) project.
# It is subject to the license terms in the LICENSE.txt file found in the
# top-level directory of this distribution and at
# https://github.com/glennmatthews/cot/blob/master/LICENSE.txt. No part
# of COT, including this file, may be copied, modified, propagated, or
# distributed except according to the terms contained in the LICENSE.txt file.

"""API for abstract access to third-party helper tools.

Abstracts away operations that require third-party helper programs,
especially those that are not available through PyPI.

The actual helper programs are provided by individual classes in this package.

**Functions**

.. autosummary::
  :nosignatures:

  convert_disk_image
  create_disk_image
  get_checksum
  get_disk_capacity
  get_disk_format
"""

import hashlib
import logging
import os
import re
from distutils.version import StrictVersion

from .fatdisk import FatDisk
from .mkisofs import MkIsoFS
from .ovftool import OVFTool
from .qemu_img import QEMUImg
from .vmdktool import VmdkTool

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# One shared instance of each helper wrapper class imported above, created
# once when this module is imported. The API functions in this module
# delegate to these instances rather than constructing helpers per call.
# NOTE(review): OVFTOOL is not referenced by the functions visible in this
# module; presumably it is used by other modules -- confirm before removing.
FATDISK = FatDisk()
MKISOFS = MkIsoFS()
OVFTOOL = OVFTool()
QEMUIMG = QEMUImg()
VMDKTOOL = VmdkTool()


def get_checksum(path_or_obj, checksum_type):
    """Get the checksum of the given file.

    The data is read in fixed-size chunks, so arbitrarily large files can be
    checksummed without loading them fully into memory.

    If an already-opened file object is given, it is read from its current
    position to end-of-file and is left open for the caller to manage.
    If a path is given, the file is opened in binary mode and closed again
    before this function returns.

    :param str path_or_obj: File path to checksum OR an opened file object
      (anything providing a ``read(size)`` method).
    :param str checksum_type: Supported values are 'md5' and 'sha1'.
    :return: String containing hexadecimal file checksum
    :raise NotImplementedError: if :attr:`checksum_type` is not supported.
    """
    if checksum_type == 'md5':
        digest = hashlib.md5()
    elif checksum_type == 'sha1':
        digest = hashlib.sha1()
    else:
        raise NotImplementedError(
            "No support for generating checksum type {0}"
            .format(checksum_type))

    blocksize = 65536

    # Is it a file or do we need to open it?
    # A zero-length read is a cheap probe for a file-like object.
    try:
        path_or_obj.read(0)
    except AttributeError:
        file_obj = open(path_or_obj, 'rb')
        opened_here = True
    else:
        file_obj = path_or_obj
        opened_here = False

    try:
        while True:
            buf = file_obj.read(blocksize)
            if not buf:
                break
            digest.update(buf)
    finally:
        # Only close what we opened ourselves; track this explicitly rather
        # than comparing the objects, which could invoke arbitrary __ne__.
        if opened_here:
            file_obj.close()

    return digest.hexdigest()


def get_disk_format(file_path):
    """Get the disk image format of the given file.

    The top-level format is obtained from the ``qemu-img`` helper. For VMDK
    images, the first 1000 bytes of the file are additionally scanned for the
    ``createType="..."`` descriptor entry to determine the sub-format.

    .. warning::
      If :attr:`file_path` refers to a file which is not a disk image at all,
      this function will return ``('raw', None)``.

    :param str file_path: Path to disk image file to inspect.
    :return: ``(format, subformat)``

      * ``format`` may be ``'vmdk'``, ``'raw'``, or ``'qcow2'``
      * ``subformat`` may be ``None``, or various strings for ``'vmdk'`` files.
    :raise RuntimeError: if the file is reported as VMDK but no
      ``createType`` entry is found in the inspected part of its header.
    """
    file_format = QEMUIMG.get_disk_format(file_path)

    if file_format != 'vmdk':
        # No known/applicable sub-format
        return (file_format, None)

    # Look at the VMDK file header to determine the sub-format.
    # The header contains a fun mix of binary and ASCII, so ignore
    # any errors in decoding binary data to strings.
    with open(file_path, 'rb') as f:
        header = f.read(1000).decode('ascii', 'ignore')

    # Capture only up to the closing quote on the same line, so that any
    # later quoted value cannot be swallowed into the sub-format string.
    match = re.search(r'createType="([^"\n]*)"', header)
    if not match:
        raise RuntimeError("Could not find VMDK 'createType' in the "
                           "file header:\n{0}".format(header))
    vmdk_format = match.group(1)
    logger.info("VMDK sub-format is '{0}'".format(vmdk_format))
    return (file_format, vmdk_format)


def get_disk_capacity(file_path):
    """Get the storage capacity of the given disk image.

    This is a thin wrapper that delegates to the shared ``qemu-img`` helper
    instance.

    :param str file_path: Path to disk image file to inspect
    :return: Disk capacity, in bytes
    """
    return QEMUIMG.get_disk_capacity(file_path)


def convert_disk_image(file_path, output_dir, new_format, new_subformat=None):
    """Convert the given disk image to the requested format/subformat.

    If the disk is already in this format then it is unchanged;
    otherwise, will convert to a new disk in the specified output_dir
    and return its path.

    Current supported conversions:

    * .vmdk (any format) to .vmdk (streamOptimized)
    * .img to .vmdk (streamOptimized)

    :param str file_path: Disk image file to inspect/convert
    :param str output_dir: Directory to place converted image into, if needed
    :param str new_format: Desired final format
    :param str new_subformat: Desired final subformat
    :return:
      * :attr:`file_path`, if no conversion was required
      * or a file path in :attr:`output_dir` containing the converted image

    :raise NotImplementedError: if the :attr:`new_format` and/or
      :attr:`new_subformat` are not supported conversion targets.
    """
    curr_format, curr_subformat = get_disk_format(file_path)

    if curr_format == new_format and curr_subformat == new_subformat:
        if new_subformat:
            format_desc = new_format + "," + new_subformat
        else:
            format_desc = new_format
        logger.info("Disk image {0} is already in '{1}' format - "
                    "no conversion required."
                    .format(file_path, format_desc))
        return file_path

    if new_format != 'vmdk' or new_subformat != 'streamOptimized':
        raise NotImplementedError(
            "no support for converting disk to {0} / {1}"
            .format(new_format, new_subformat))

    # any temporary file we should delete before returning
    temp_path = None
    try:
        # QEMU only supports streamOptimized images in versions >= 2.1.0
        if QEMUIMG.version >= StrictVersion("2.1.0"):
            new_file_path = QEMUIMG.convert_disk_image(
                file_path, output_dir, new_format, new_subformat)
        else:
            # Older versions of qemu-img don't support streamOptimized VMDKs,
            # so we have to use qemu-img + vmdktool to get the desired result.

            # We have to pass through raw format on the way, even if the
            # existing image is a non-streamOptimized vmdk.
            if curr_format != 'raw':
                # Use qemu-img to convert to raw format
                temp_path = QEMUIMG.convert_disk_image(
                    file_path, output_dir, 'raw')
                file_path = temp_path

            # Use vmdktool to convert raw image to stream-optimized VMDK
            new_file_path = VMDKTOOL.convert_disk_image(
                file_path, output_dir, new_format, new_subformat)
    finally:
        # Clean up the intermediate raw image even when the second
        # conversion step fails, so it is not leaked into output_dir.
        if temp_path is not None:
            os.remove(temp_path)

    logger.info("Successfully converted from ({0},{1}) to ({2},{3})"
                .format(curr_format, curr_subformat,
                        new_format, new_subformat))

    return new_file_path


def create_disk_image(file_path, file_format=None,
                      capacity=None, contents=None):
    """Create a new disk image at the requested location.

    Either :attr:`capacity` or :attr:`contents` or both must be specified.

    Dispatch is as follows:

    * no contents: a blank disk is created via the ``qemu-img`` helper
    * contents and ``'iso'`` format: an ISO is created via the ``mkisofs``
      helper
    * contents and ``'raw'``/``'img'`` format: a raw image is created via the
      ``fatdisk`` helper

    :param str file_path: Desired location of new disk image
    :param str file_format: Desired image format (if not specified, this will
      be derived from the file extension of :attr:`file_path`, with the
      extension ``img`` treated as ``raw``)

    :param capacity: Disk capacity. A string like '16M' or '1G'.
    :param list contents: List of file paths to package into the created image.
      If not specified (``None`` or empty), the image will be left blank and
      unformatted.
    :raise RuntimeError: if neither :attr:`capacity` nor :attr:`contents` is
      given, or if no format was given and :attr:`file_path` has no file
      extension to guess it from.
    :raise NotImplementedError: if :attr:`contents` are given for a format
      other than ``'iso'``, ``'raw'``, or ``'img'``.
    """
    if not capacity and not contents:
        raise RuntimeError("Either capacity or contents must be specified!")

    if not file_format:
        # Guess format from file extension (dropping the leading '.')
        file_format = os.path.splitext(file_path)[1][1:]
        if not file_format:
            raise RuntimeError(
                "Unable to guess file format from desired filename {0}"
                .format(file_path))
        if file_format == 'img':
            file_format = 'raw'
        logger.debug("Guessed file format is {0}".format(file_format))

    if not contents:
        QEMUIMG.create_blank_disk(file_path, capacity, file_format)
    elif file_format == 'iso':
        MKISOFS.create_iso(file_path, contents)
    elif file_format in ('raw', 'img'):
        FATDISK.create_raw_image(file_path, contents, capacity)
    else:
        # We could create a raw image then convert it to the
        # desired format but there's no use case for that at present.
        raise NotImplementedError(
            "unable to create disk of format {0} with the given contents"
            .format(file_format))