Source code for pylorax.api.projects

#
# Copyright (C) 2017  Red Hat, Inc.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program.  If not, see <http://www.gnu.org/licenses/>.
#
import logging
log = logging.getLogger("lorax-composer")

from ConfigParser import ConfigParser
import fnmatch
from glob import glob
import os
import time

from yum.Errors import YumBaseError
from pylorax.api.bisect import insort_left

TIME_FORMAT = "%Y-%m-%dT%H:%M:%S"


[docs]class ProjectsError(Exception):
    pass


[docs]def api_time(t):
    """Convert time since epoch to a string

    :param t: Seconds since epoch
    :type t: int
    :returns: Time string
    :rtype: str
    """
    return time.strftime(TIME_FORMAT, time.localtime(t))


[docs]def api_changelog(changelog):
    """Convert the changelog to a string

    :param changelog: A list of time, author, string tuples.
    :type changelog: tuple
    :returns: The most recent changelog text or ""
    :rtype: str

    This returns only the most recent changelog entry.
    """
    try:
        entry = changelog[0][2]
    except IndexError:
        entry = ""
    return entry


[docs]def yaps_to_project(yaps):
    """Extract the details from a YumAvailablePackageSqlite object

    :param yaps: Yum object with package details
    :type yaps: YumAvailablePackageSqlite
    :returns: A dict with the name, summary, description, and url.
    :rtype: dict

    upstream_vcs is hard-coded to UPSTREAM_VCS
    """
    return {"name":         yaps.name,
            "summary":      yaps.summary,
            "description":  yaps.description,
            "homepage":     yaps.url,
            "upstream_vcs": "UPSTREAM_VCS"}


[docs]def yaps_to_build(yaps):
    """Extract the build details from a hawkey.Package object

    :param yaps: Yum object with package details
    :type yaps: YumAvailablePackageSqlite
    :returns: A dict with the build details, epoch, release, arch, build_time, changelog, ...
    :rtype: dict

    metadata entries are hard-coded to {}

    Note that this only returns the build dict, it does not include the name, description, etc.
    """
    return {"epoch":      int(yaps.epoch),
            "release":    yaps.release,
            "arch":       yaps.arch,
            "build_time": api_time(yaps.buildtime),
            "changelog":  api_changelog(yaps.returnChangelog()),
            "build_config_ref": "BUILD_CONFIG_REF",
            "build_env_ref":    "BUILD_ENV_REF",
            "metadata":    {},
            "source":      {"license":    yaps.license,
                            "version":    yaps.version,
                            "source_ref": "SOURCE_REF",
                            "metadata":   {}}}


[docs]def yaps_to_project_info(yaps):
    """Extract the details from a YumAvailablePackageSqlite object

    :param yaps: Yum object with package details
    :type yaps: YumAvailablePackageSqlite
    :returns: A dict with the project details, as well as epoch, release, arch, build_time, changelog, ...
    :rtype: dict

    metadata entries are hard-coded to {}
    """
    return {"name":         yaps.name,
            "summary":      yaps.summary,
            "description":  yaps.description,
            "homepage":     yaps.url,
            "upstream_vcs": "UPSTREAM_VCS",
            "builds":       [yaps_to_build(yaps)]}


[docs]def tm_to_dep(tm):
    """Extract the info from a TransactionMember object

    :param tm: A Yum transaction object
    :type tm: TransactionMember
    :returns: A dict with name, epoch, version, release, arch
    :rtype: dict
    """
    return {"name":     tm.name,
            "epoch":    int(tm.epoch),
            "version":  tm.version,
            "release":  tm.release,
            "arch":     tm.arch}


[docs]def proj_to_module(proj):
    """Extract the name from a YumAvailablePackageSqlite object

    :param proj: Project details
    :type proj: dict
    :returns: A dict with name, and group_type
    :rtype: dict

    group_type is hard-coded to "rpm"
    """
    return {"name": proj["name"],
            "group_type": "rpm"}


[docs]def dep_evra(dep):
    """Return the epoch:version-release.arch for the dep

    :param dep: dependency dict
    :type dep: dict
    :returns: epoch:version-release.arch
    :rtype: str
    """
    if dep["epoch"] == 0:
        return dep["version"]+"-"+dep["release"]+"."+dep["arch"]
    else:
        return str(dep["epoch"])+":"+dep["version"]+"-"+dep["release"]+"."+dep["arch"]

[docs]def dep_nevra(dep):
    """Return the name-epoch:version-release.arch"""
    return dep["name"]+"-"+dep_evra(dep)

[docs]def projects_list(yb):
    """Return a list of projects

    :param yb: yum base object
    :type yb: YumBase
    :returns: List of project info dicts with name, summary, description, homepage, upstream_vcs
    :rtype: list of dicts
    """
    try:
        ybl = yb.doPackageLists(pkgnarrow="available", showdups=False)
    except YumBaseError as e:
        raise ProjectsError("There was a problem listing projects: %s" % str(e))
    finally:
        yb.closeRpmDB()
    projs = _unique_dicts(map(yaps_to_project, ybl.available), key=lambda p: p["name"].lower())
    return sorted(projs, key=lambda p: p["name"].lower())

[docs]def projects_info(yb, project_names):
    """Return details about specific projects

    :param yb: yum base object
    :type yb: YumBase
    :param project_names: List of names of projects to get info about
    :type project_names: str
    :returns: List of project info dicts with yaps_to_project as well as epoch, version, release, etc.
    :rtype: list of dicts
    """
    try:
        ybl = yb.doPackageLists(pkgnarrow="available", patterns=project_names, showdups=False)
    except YumBaseError as e:
        raise ProjectsError("There was a problem with info for %s: %s" % (project_names, str(e)))
    finally:
        yb.closeRpmDB()
    return _unique_projs(ybl.available)

def _unique_projs(projs):
    """Return a sorted list of projects with builds combined into one project entry

    :param yaps: Yum object with package details
    :type yaps: YumAvailablePackageSqlite
    :returns: List of project info dicts with yaps_to_project as well as epoch, version, release, etc.
    :rtype: list of dicts
    """
    # iterate over ybl.available
    # - if ybl.name isn't in the results yet, add yaps_to_project_info in sorted position
    # - if ybl.name is already in results, get its builds. If the build for the project is different
    #   in any way (version, arch, etc.) add it to the entry's builds list. If it is the same,
    #   skip it.
    results = []
    results_names = {}
    for p in projs:
        if p.name.lower() not in results_names:
            idx = insort_left(results, yaps_to_project_info(p), key=lambda p: p["name"].lower())
            results_names[p.name.lower()] = idx
        else:
            build = yaps_to_build(p)
            if build not in results[results_names[p.name.lower()]]["builds"]:
                results[results_names[p.name.lower()]]["builds"].append(build)

    return results


[docs]def filterVersionGlob(pkgs, version):
    """Filter a list of yum package objects with a version glob

    :param pkgs: list of yum package objects
    :type pkgs: list
    :param version: version matching glob
    :type version: str

    pkgs should be a list of all the versions of the *same* package.
    Return the latest package that matches the 'version' glob.
    """
    # Pick the version(s) matching the version glob
    matches = [po for po in pkgs if fnmatch.fnmatchcase(po.version, version)]
    if not matches:
        raise RuntimeError("No package version matching %s" % version)

    # yum implements __cmd__ using verCMP so this will return the highest matching version
    return max(matches)

def _findPackageGlob(yb, pkg_name):
    """Find the package(s) that match a name glob

    :param yb: yum base object
    :type yb: YumBase
    :param pkg_name: Name or fileglob of the name to find
    :type pkg_name: str
    :returns: list of yum package objects or empty list
    """
    (exact, globbed, _unmatched) = yb.pkgSack.matchPackageNames([pkg_name])
    pkgs = exact + globbed
    if pkgs:
        return pkgs

    # Nothing matched, check rpmdb
    pkgs = yb.rpmdb.returnPackages(patterns=[pkg_name], ignore_case=False)
    if pkgs:
        return pkgs

    # Nothing matched, find a matching dep
    return yb.returnPackagesByDep(pkg_name)


def _depsolve(yb, projects, groups):
    """Find the dependencies for a list of projects and groups

    :param yb: yum base object
    :type yb: YumBase
    :param projects: The projects and version globs to find the dependencies for
    :type projects: List of tuples
    :param groups: The groups to include in dependency solving
    :type groups: List of str
    :returns: A list of errors that were encountered while depsolving the packages
    :rtype: list of strings
    :raises: ProjectsError if there was a problem installing something
    """
    # This resets the transaction
    yb.closeRpmDB()
    install_errors = []
    for name in groups:
        yb.selectGroup(name, ["mandatory", "default"])

    for name, version in projects:
        if not version:
            version = "*"
        pattern = "%s %s" % (name, version)

        # yum.install's pattern matches the whole nevra, which can result in -* matching
        # unexpected packages. So we need to implement our own version globbing.
        # First get a list of packages, then filter that by the version
        pkgs = _findPackageGlob(yb, name)
        if not pkgs:
            install_errors.append((name, "No package name matching %s" % name))
            continue

        try:
            po = filterVersionGlob(pkgs, version)
            log.debug("Chose %s as best match for %s", po.nevra, pattern)

            yb.install(po=po)
        except (YumBaseError, RuntimeError) as e:
            install_errors.append((pattern, str(e)))

    return install_errors

[docs]def projects_depsolve(yb, projects, groups):
    """Return the dependencies for a list of projects

    :param yb: yum base object
    :type yb: YumBase
    :param projects: The projects and version globs to find the dependencies for
    :type projects: List of tuples
    :param groups: The groups to include in dependency solving
    :type groups: List of str
    :returns: NEVRA's of the project and its dependencies
    :rtype: list of dicts
    :raises: ProjectsError if there was a problem installing something
    """
    try:
        install_errors = _depsolve(yb, projects, groups)

        # Were there problems installing these packages?
        if install_errors:
            raise ProjectsError("The following package(s) had problems: %s" % ",".join(["%s (%s)" % (pattern, err) for pattern, err in install_errors]))

        (rc, msg) = yb.buildTransaction()
        if rc not in [0, 1, 2]:
            raise ProjectsError("There was a problem depsolving %s: %s" % (projects, msg))
        yb.tsInfo.makelists()
        deps = sorted(map(tm_to_dep, yb.tsInfo.installed + yb.tsInfo.depinstalled), key=lambda p: p["name"].lower())
    except YumBaseError as e:
        raise ProjectsError("There was a problem depsolving %s: %s" % (projects, str(e)))
    finally:
        yb.closeRpmDB()
    return deps

[docs]def estimate_size(packages, block_size=4096):
    """Estimate the installed size of a package list

    :param packages: The packages to be installed
    :type packages: list of TransactionMember objects
    :param block_size: The block size to use for rounding up file sizes.
    :type block_size: int
    :returns: Tuple of the the estimated size needed, and the size anaconda will calculate
    :rtype: tuple(int, int)

    Estimating actual requirements is difficult without the actual file sizes, which
    yum doesn't provide access to. So use the file count and block size to estimate
    a minimum size for each package.

    Anaconda only takes into account the installedsize of each package. It then fudges
    this by 35% to make sure there is enough space.
    """
    installed_size = 0
    anaconda_size = 0
    for p in packages:
        installed_size += len(p.po.filelist) * block_size
        installed_size += p.po.installedsize
        # anaconda only takes into account installedsize
        anaconda_size += p.po.installedsize
        # also count the RPM package size (yum cache)
        installed_size += ((p.po.size / block_size) + 1) * block_size
    return (installed_size, anaconda_size)

[docs]def projects_depsolve_with_size(yb, projects, groups, with_core=True):
    """Return the dependencies and installed size for a list of projects

    :param yb: yum base object
    :type yb: YumBase
    :param projects: The projects and version globs to find the dependencies for
    :type projects: List of tuples
    :param groups: The groups to include in dependency solving
    :type groups: List of str
    :returns: installed size, size estimated by anaconda, and a list of NEVRA's of the project and its dependencies
    :rtype: tuple of (int, int, list of dicts)
    :raises: ProjectsError if there was a problem installing something

    The anaconda_size only includes the installed package size, not file block or cache estimation like
    installed_size includes.
    """
    try:
        install_errors = _depsolve(yb, projects, groups)

        # Were there problems installing these packages?
        if install_errors:
            raise ProjectsError("The following package(s) had problems: %s" % ",".join(["%s (%s)" % (pattern, err) for pattern, err in install_errors]))

        if with_core:
            yb.selectGroup("core", group_package_types=['mandatory', 'default', 'optional'])
        (rc, msg) = yb.buildTransaction()
        if rc not in [0, 1, 2]:
            raise ProjectsError("There was a problem depsolving %s: %s" % (projects, msg))
        yb.tsInfo.makelists()
        (installed_size, anaconda_size) = estimate_size(yb.tsInfo.installed + yb.tsInfo.depinstalled)
        deps = sorted(map(tm_to_dep, yb.tsInfo.installed + yb.tsInfo.depinstalled), key=lambda p: p["name"].lower())
    except YumBaseError as e:
        raise ProjectsError("There was a problem depsolving %s: %s" % (projects, str(e)))
    finally:
        yb.closeRpmDB()
    return (installed_size, anaconda_size, deps)

[docs]def modules_list(yb, module_names):
    """Return a list of modules

    :param yb: yum base object
    :type yb: YumBase
    :param offset: Number of modules to skip
    :type limit: int
    :param limit: Maximum number of modules to return
    :type limit: int
    :returns: List of module information and total count
    :rtype: tuple of a list of dicts and an Int

    Modules don't exist in RHEL7 so this only returns projects
    and sets the type to "rpm"
    """
    projs = _unique_dicts(projects_info(yb, module_names), key=lambda p: p["name"].lower())
    return list(map(proj_to_module, projs))

def _unique_dicts(lst, key):
    """Return a new list of dicts, only including one match of key(d)

    :param lst: list of dicts
    :type lst: list
    :param key: key function to match lst entries
    :type key: function
    :returns: list of the unique lst entries
    :rtype: list

    Uses key(d) to test for duplicates in the returned list, creating a
    list of unique return values.
    """
    result = []
    result_keys = []
    for d in lst:
        if key(d) not in result_keys:
            result.append(d)
            result_keys.append(key(d))
    return result

[docs]def modules_info(yb, module_names):
    """Return details about a module, including dependencies

    :param yb: yum base object
    :type yb: YumBase
    :param module_names: Names of the modules to get info about
    :type module_names: str
    :returns: List of dicts with module details and dependencies.
    :rtype: list of dicts
    """
    try:
        # Get the info about each module
        ybl = yb.doPackageLists(pkgnarrow="available", patterns=module_names, showdups=False)
    except YumBaseError as e:
        raise ProjectsError("There was a problem with info for %s: %s" % (module_names, str(e)))
    finally:
        yb.closeRpmDB()

    modules = sorted(map(yaps_to_project, ybl.available), key=lambda p: p["name"].lower())
    # Add the dependency info to each one
    for module in modules:
        module["dependencies"] = projects_depsolve(yb, [(module["name"], "*")], [])

    return modules

[docs]def yum_repo_to_file_repo(repo):
    """Return a string representation of a repo dict suitable for writing to a .repo file

    :param repo: Yum Repository represented as a dict
    :type repo: dict
    :returns: A string
    :rtype: str

    The YumRepo.dump() function does not produce a string that can be used as a
    yum .repo file. So do this manually with only the attributes we care about.
    """
    repo_str = "[%s]\n" % repo["id"]
    if repo["metalink"]:
        repo_str += "metalink = %s\n" % repo["metalink"]
    elif repo["mirrorlist"]:
        repo_str += "mirrorlist = %s\n" % repo["mirrorlist"]
    elif repo["baseurl"]:
        repo_str += "baseurl = %s\n" % repo["baseurl"][0]
    else:
        raise RuntimeError("Repo has no baseurl, metalink, or mirrorlist")

    # proxy is optional
    if "proxy" in repo:
        repo_str += "proxy = %s\n" % repo["proxy"]

    repo_str += "sslverify = %s\n" % repo["sslverify"]
    repo_str += "gpgcheck = %s\n" % repo["gpgcheck"]
    if "gpgkey" in repo:
        repo_str += "gpgkey = %s\n" % ",".join(repo["gpgkey"])

    return repo_str

[docs]def repo_to_source(repo, system_source):
    """Return a Weldr Source dict created from the YumRepository

    :param repo: Yum Repository
    :type repo: yum.yumRepo.YumRepository
    :param system_source: True if this source is an immutable system source
    :type system_source: bool
    :returns: A dict with Weldr Source fields filled in
    :rtype: dict

    Example::

        {
          "check_gpg": true,
          "check_ssl": true,
          "gpgkey_url": [
            "file:///etc/pki/rpm-gpg/RPM-GPG-KEY-fedora-28-x86_64"
          ],
          "name": "fedora",
          "proxy": "http://proxy.brianlane.com:8123",
          "system": true
          "type": "yum-metalink",
          "url": "https://mirrors.fedoraproject.org/metalink?repo=fedora-28&arch=x86_64"
        }

    """
    source = {"name": repo.id, "system": system_source}
    if repo.baseurl:
        source["url"] = repo.baseurl[0]
        source["type"] = "yum-baseurl"
    elif repo.metalink:
        source["url"] = repo.metalink
        source["type"] = "yum-metalink"
    elif repo.mirrorlist:
        source["url"] = repo.mirrorlist
        source["type"] = "yum-mirrorlist"
    else:
        raise RuntimeError("Repo has no baseurl, metalink, or mirrorlist")

    # proxy is optional
    if repo.proxy:
        source["proxy"] = repo.proxy

    if not repo.sslverify:
        source["check_ssl"] = False
    else:
        source["check_ssl"] = True

    if not repo.gpgcheck:
        source["check_gpg"] = False
    else:
        source["check_gpg"] = True

    if repo.gpgkey:
        source["gpgkey_urls"] = repo.gpgkey

    return source

[docs]def source_to_repo(source):
    """Return an add_enable_repo kwargs dict created from a source dict

    :param source: A Weldr source dict
    :type source: dict
    :returns: A yum YumRepository object
    :rtype: yum.yumRepo.YumRepository

    The dict it suitable for passing to yum's add_enable_repo function
    after popping off baseurl and mirrorlist.

    Example::

        {
          "gpgcheck": True,
          "sslverify": True,
          "gpgkey": ["file:///etc/pki/rpm-gpg/RPM-GPG-KEY-fedora-28-x86_64"],
          "id": "fedora",
          "proxy": "http://proxy.brianlane.com:8123",
          "baseurl": "https://mirrors.fedoraproject.org/metalink?repo=fedora-28&arch=x86_64",
          "metalink": None,
          "mirrorlist": None
        }

    """
    repo = {"id": source["name"]}

    # This will allow errors to be raised so we can catch them
    # without this they are logged, but the repo is silently disabled
    repo["skip_if_unavailable"] = False

    if source["type"] == "yum-baseurl":
        repo["baseurl"] = [source["url"]]
        repo["metalink"] = None
        repo["mirrorlist"] = None
    elif source["type"] == "yum-metalink":
        repo["metalink"] = source["url"]
        repo["baseurl"] = []
        repo["mirrorlist"] = None
    elif source["type"] == "yum-mirrorlist":
        repo["mirrorlist"] = source["url"]
        repo["baseurl"] = []
        repo["metalink"] = None

    if "proxy" in source:
        repo["proxy"] = source["proxy"]

    if source["check_ssl"]:
        repo["sslverify"] = True
    else:
        repo["sslverify"] = False

    if source["check_gpg"]:
        repo["gpgcheck"] = True
    else:
        repo["gpgcheck"] = False

    if "gpgkey_urls" in source:
        repo["gpgkey"] = source["gpgkey_urls"]

    return repo

[docs]def get_source_ids(source_path):
    """Return a list of the source ids in a file

    :param source_path: Full path and filename of the source (yum repo) file
    :type source_path: str
    :returns: A list of source id strings
    :rtype: list of str
    """
    if not os.path.exists(source_path):
        return []

    cfg = ConfigParser()
    cfg.read(source_path)
    return cfg.sections()

[docs]def get_repo_sources(source_glob):
    """Return a list of sources from a directory of yum repositories

    :param source_glob: A glob to use to match the source files, including full path
    :type source_glob: str
    :returns: A list of the source ids in all of the matching files
    :rtype: list of str
    """
    sources = []
    for f in glob(source_glob):
        sources.extend(get_source_ids(f))
    return sources

[docs]def delete_repo_source(source_glob, source_name):
    """Delete a source from a repo file

    :param source_glob: A glob of the repo sources to search
    :type source_glob: str
    :returns: None
    :raises: ProjectsError if there was a problem

    A repo file may have multiple sources in it, delete only the selected source.
    If it is the last one in the file, delete the file.

    WARNING: This will delete ANY source, the caller needs to ensure that a system
    source_name isn't passed to it.
    """
    found = False
    for f in glob(source_glob):
        try:
            cfg = ConfigParser()
            cfg.read(f)
            if source_name in cfg.sections():
                found = True
                cfg.remove_section(source_name)
                # If there are other sections, rewrite the file without the deleted one
                if len(cfg.sections()) > 0:
                    with open(f, "w") as cfg_file:
                        cfg.write(cfg_file)
                else:
                    # No sections left, just delete the file
                    os.unlink(f)
        except Exception as e:
            raise ProjectsError("Problem deleting repo source %s: %s" % (source_name, str(e)))
    if not found:
        raise ProjectsError("source %s not found" % source_name)
Navigation

Source code for pylorax.api.projects

Quick search

Navigation