#
# Copyright (C) 2017 Red Hat, Inc.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
#
import logging
log = logging.getLogger("lorax-composer")
from ConfigParser import ConfigParser
import fnmatch
from glob import glob
import os
import time
from yum.Errors import YumBaseError
from pylorax.api.bisect import insort_left
TIME_FORMAT = "%Y-%m-%dT%H:%M:%S"
[docs]class ProjectsError(Exception):
pass
[docs]def api_time(t):
"""Convert time since epoch to a string
:param t: Seconds since epoch
:type t: int
:returns: Time string
:rtype: str
"""
return time.strftime(TIME_FORMAT, time.localtime(t))
[docs]def api_changelog(changelog):
"""Convert the changelog to a string
:param changelog: A list of time, author, string tuples.
:type changelog: tuple
:returns: The most recent changelog text or ""
:rtype: str
This returns only the most recent changelog entry.
"""
try:
entry = changelog[0][2]
except IndexError:
entry = ""
return entry
[docs]def yaps_to_project(yaps):
"""Extract the details from a YumAvailablePackageSqlite object
:param yaps: Yum object with package details
:type yaps: YumAvailablePackageSqlite
:returns: A dict with the name, summary, description, and url.
:rtype: dict
upstream_vcs is hard-coded to UPSTREAM_VCS
"""
return {"name": yaps.name,
"summary": yaps.summary,
"description": yaps.description,
"homepage": yaps.url,
"upstream_vcs": "UPSTREAM_VCS"}
[docs]def yaps_to_build(yaps):
"""Extract the build details from a hawkey.Package object
:param yaps: Yum object with package details
:type yaps: YumAvailablePackageSqlite
:returns: A dict with the build details, epoch, release, arch, build_time, changelog, ...
:rtype: dict
metadata entries are hard-coded to {}
Note that this only returns the build dict, it does not include the name, description, etc.
"""
return {"epoch": int(yaps.epoch),
"release": yaps.release,
"arch": yaps.arch,
"build_time": api_time(yaps.buildtime),
"changelog": api_changelog(yaps.returnChangelog()),
"build_config_ref": "BUILD_CONFIG_REF",
"build_env_ref": "BUILD_ENV_REF",
"metadata": {},
"source": {"license": yaps.license,
"version": yaps.version,
"source_ref": "SOURCE_REF",
"metadata": {}}}
[docs]def yaps_to_project_info(yaps):
"""Extract the details from a YumAvailablePackageSqlite object
:param yaps: Yum object with package details
:type yaps: YumAvailablePackageSqlite
:returns: A dict with the project details, as well as epoch, release, arch, build_time, changelog, ...
:rtype: dict
metadata entries are hard-coded to {}
"""
return {"name": yaps.name,
"summary": yaps.summary,
"description": yaps.description,
"homepage": yaps.url,
"upstream_vcs": "UPSTREAM_VCS",
"builds": [yaps_to_build(yaps)]}
[docs]def tm_to_dep(tm):
"""Extract the info from a TransactionMember object
:param tm: A Yum transaction object
:type tm: TransactionMember
:returns: A dict with name, epoch, version, release, arch
:rtype: dict
"""
return {"name": tm.name,
"epoch": int(tm.epoch),
"version": tm.version,
"release": tm.release,
"arch": tm.arch}
[docs]def proj_to_module(proj):
"""Extract the name from a YumAvailablePackageSqlite object
:param proj: Project details
:type proj: dict
:returns: A dict with name, and group_type
:rtype: dict
group_type is hard-coded to "rpm"
"""
return {"name": proj["name"],
"group_type": "rpm"}
[docs]def dep_evra(dep):
"""Return the epoch:version-release.arch for the dep
:param dep: dependency dict
:type dep: dict
:returns: epoch:version-release.arch
:rtype: str
"""
if dep["epoch"] == 0:
return dep["version"]+"-"+dep["release"]+"."+dep["arch"]
else:
return str(dep["epoch"])+":"+dep["version"]+"-"+dep["release"]+"."+dep["arch"]
[docs]def dep_nevra(dep):
"""Return the name-epoch:version-release.arch"""
return dep["name"]+"-"+dep_evra(dep)
[docs]def projects_list(yb):
"""Return a list of projects
:param yb: yum base object
:type yb: YumBase
:returns: List of project info dicts with name, summary, description, homepage, upstream_vcs
:rtype: list of dicts
"""
try:
ybl = yb.doPackageLists(pkgnarrow="available", showdups=False)
except YumBaseError as e:
raise ProjectsError("There was a problem listing projects: %s" % str(e))
finally:
yb.closeRpmDB()
projs = _unique_dicts(map(yaps_to_project, ybl.available), key=lambda p: p["name"].lower())
return sorted(projs, key=lambda p: p["name"].lower())
[docs]def projects_info(yb, project_names):
"""Return details about specific projects
:param yb: yum base object
:type yb: YumBase
:param project_names: List of names of projects to get info about
:type project_names: str
:returns: List of project info dicts with yaps_to_project as well as epoch, version, release, etc.
:rtype: list of dicts
"""
try:
ybl = yb.doPackageLists(pkgnarrow="available", patterns=project_names, showdups=False)
except YumBaseError as e:
raise ProjectsError("There was a problem with info for %s: %s" % (project_names, str(e)))
finally:
yb.closeRpmDB()
return _unique_projs(ybl.available)
def _unique_projs(projs):
"""Return a sorted list of projects with builds combined into one project entry
:param yaps: Yum object with package details
:type yaps: YumAvailablePackageSqlite
:returns: List of project info dicts with yaps_to_project as well as epoch, version, release, etc.
:rtype: list of dicts
"""
# iterate over ybl.available
# - if ybl.name isn't in the results yet, add yaps_to_project_info in sorted position
# - if ybl.name is already in results, get its builds. If the build for the project is different
# in any way (version, arch, etc.) add it to the entry's builds list. If it is the same,
# skip it.
results = []
results_names = {}
for p in projs:
if p.name.lower() not in results_names:
idx = insort_left(results, yaps_to_project_info(p), key=lambda p: p["name"].lower())
results_names[p.name.lower()] = idx
else:
build = yaps_to_build(p)
if build not in results[results_names[p.name.lower()]]["builds"]:
results[results_names[p.name.lower()]]["builds"].append(build)
return results
[docs]def filterVersionGlob(pkgs, version):
"""Filter a list of yum package objects with a version glob
:param pkgs: list of yum package objects
:type pkgs: list
:param version: version matching glob
:type version: str
pkgs should be a list of all the versions of the *same* package.
Return the latest package that matches the 'version' glob.
"""
# Pick the version(s) matching the version glob
matches = [po for po in pkgs if fnmatch.fnmatchcase(po.version, version)]
if not matches:
raise RuntimeError("No package version matching %s" % version)
# yum implements __cmd__ using verCMP so this will return the highest matching version
return max(matches)
def _findPackageGlob(yb, pkg_name):
"""Find the package(s) that match a name glob
:param yb: yum base object
:type yb: YumBase
:param pkg_name: Name or fileglob of the name to find
:type pkg_name: str
:returns: list of yum package objects or empty list
"""
(exact, globbed, _unmatched) = yb.pkgSack.matchPackageNames([pkg_name])
pkgs = exact + globbed
if pkgs:
return pkgs
# Nothing matched, check rpmdb
pkgs = yb.rpmdb.returnPackages(patterns=[pkg_name], ignore_case=False)
if pkgs:
return pkgs
# Nothing matched, find a matching dep
return yb.returnPackagesByDep(pkg_name)
def _depsolve(yb, projects, groups):
"""Find the dependencies for a list of projects and groups
:param yb: yum base object
:type yb: YumBase
:param projects: The projects and version globs to find the dependencies for
:type projects: List of tuples
:param groups: The groups to include in dependency solving
:type groups: List of str
:returns: A list of errors that were encountered while depsolving the packages
:rtype: list of strings
:raises: ProjectsError if there was a problem installing something
"""
# This resets the transaction
yb.closeRpmDB()
install_errors = []
for name in groups:
yb.selectGroup(name, ["mandatory", "default"])
for name, version in projects:
if not version:
version = "*"
pattern = "%s %s" % (name, version)
# yum.install's pattern matches the whole nevra, which can result in -* matching
# unexpected packages. So we need to implement our own version globbing.
# First get a list of packages, then filter that by the version
pkgs = _findPackageGlob(yb, name)
if not pkgs:
install_errors.append((name, "No package name matching %s" % name))
continue
try:
po = filterVersionGlob(pkgs, version)
log.debug("Chose %s as best match for %s", po.nevra, pattern)
yb.install(po=po)
except (YumBaseError, RuntimeError) as e:
install_errors.append((pattern, str(e)))
return install_errors
[docs]def projects_depsolve(yb, projects, groups):
"""Return the dependencies for a list of projects
:param yb: yum base object
:type yb: YumBase
:param projects: The projects and version globs to find the dependencies for
:type projects: List of tuples
:param groups: The groups to include in dependency solving
:type groups: List of str
:returns: NEVRA's of the project and its dependencies
:rtype: list of dicts
:raises: ProjectsError if there was a problem installing something
"""
try:
install_errors = _depsolve(yb, projects, groups)
# Were there problems installing these packages?
if install_errors:
raise ProjectsError("The following package(s) had problems: %s" % ",".join(["%s (%s)" % (pattern, err) for pattern, err in install_errors]))
(rc, msg) = yb.buildTransaction()
if rc not in [0, 1, 2]:
raise ProjectsError("There was a problem depsolving %s: %s" % (projects, msg))
yb.tsInfo.makelists()
deps = sorted(map(tm_to_dep, yb.tsInfo.installed + yb.tsInfo.depinstalled), key=lambda p: p["name"].lower())
except YumBaseError as e:
raise ProjectsError("There was a problem depsolving %s: %s" % (projects, str(e)))
finally:
yb.closeRpmDB()
return deps
[docs]def estimate_size(packages, block_size=4096):
"""Estimate the installed size of a package list
:param packages: The packages to be installed
:type packages: list of TransactionMember objects
:param block_size: The block size to use for rounding up file sizes.
:type block_size: int
:returns: Tuple of the the estimated size needed, and the size anaconda will calculate
:rtype: tuple(int, int)
Estimating actual requirements is difficult without the actual file sizes, which
yum doesn't provide access to. So use the file count and block size to estimate
a minimum size for each package.
Anaconda only takes into account the installedsize of each package. It then fudges
this by 35% to make sure there is enough space.
"""
installed_size = 0
anaconda_size = 0
for p in packages:
installed_size += len(p.po.filelist) * block_size
installed_size += p.po.installedsize
# anaconda only takes into account installedsize
anaconda_size += p.po.installedsize
# also count the RPM package size (yum cache)
installed_size += ((p.po.size / block_size) + 1) * block_size
return (installed_size, anaconda_size)
[docs]def projects_depsolve_with_size(yb, projects, groups, with_core=True):
"""Return the dependencies and installed size for a list of projects
:param yb: yum base object
:type yb: YumBase
:param projects: The projects and version globs to find the dependencies for
:type projects: List of tuples
:param groups: The groups to include in dependency solving
:type groups: List of str
:returns: installed size, size estimated by anaconda, and a list of NEVRA's of the project and its dependencies
:rtype: tuple of (int, int, list of dicts)
:raises: ProjectsError if there was a problem installing something
The anaconda_size only includes the installed package size, not file block or cache estimation like
installed_size includes.
"""
try:
install_errors = _depsolve(yb, projects, groups)
# Were there problems installing these packages?
if install_errors:
raise ProjectsError("The following package(s) had problems: %s" % ",".join(["%s (%s)" % (pattern, err) for pattern, err in install_errors]))
if with_core:
yb.selectGroup("core", group_package_types=['mandatory', 'default', 'optional'])
(rc, msg) = yb.buildTransaction()
if rc not in [0, 1, 2]:
raise ProjectsError("There was a problem depsolving %s: %s" % (projects, msg))
yb.tsInfo.makelists()
(installed_size, anaconda_size) = estimate_size(yb.tsInfo.installed + yb.tsInfo.depinstalled)
deps = sorted(map(tm_to_dep, yb.tsInfo.installed + yb.tsInfo.depinstalled), key=lambda p: p["name"].lower())
except YumBaseError as e:
raise ProjectsError("There was a problem depsolving %s: %s" % (projects, str(e)))
finally:
yb.closeRpmDB()
return (installed_size, anaconda_size, deps)
[docs]def modules_list(yb, module_names):
"""Return a list of modules
:param yb: yum base object
:type yb: YumBase
:param offset: Number of modules to skip
:type limit: int
:param limit: Maximum number of modules to return
:type limit: int
:returns: List of module information and total count
:rtype: tuple of a list of dicts and an Int
Modules don't exist in RHEL7 so this only returns projects
and sets the type to "rpm"
"""
projs = _unique_dicts(projects_info(yb, module_names), key=lambda p: p["name"].lower())
return list(map(proj_to_module, projs))
def _unique_dicts(lst, key):
"""Return a new list of dicts, only including one match of key(d)
:param lst: list of dicts
:type lst: list
:param key: key function to match lst entries
:type key: function
:returns: list of the unique lst entries
:rtype: list
Uses key(d) to test for duplicates in the returned list, creating a
list of unique return values.
"""
result = []
result_keys = []
for d in lst:
if key(d) not in result_keys:
result.append(d)
result_keys.append(key(d))
return result
[docs]def modules_info(yb, module_names):
"""Return details about a module, including dependencies
:param yb: yum base object
:type yb: YumBase
:param module_names: Names of the modules to get info about
:type module_names: str
:returns: List of dicts with module details and dependencies.
:rtype: list of dicts
"""
try:
# Get the info about each module
ybl = yb.doPackageLists(pkgnarrow="available", patterns=module_names, showdups=False)
except YumBaseError as e:
raise ProjectsError("There was a problem with info for %s: %s" % (module_names, str(e)))
finally:
yb.closeRpmDB()
modules = sorted(map(yaps_to_project, ybl.available), key=lambda p: p["name"].lower())
# Add the dependency info to each one
for module in modules:
module["dependencies"] = projects_depsolve(yb, [(module["name"], "*")], [])
return modules
[docs]def yum_repo_to_file_repo(repo):
"""Return a string representation of a repo dict suitable for writing to a .repo file
:param repo: Yum Repository represented as a dict
:type repo: dict
:returns: A string
:rtype: str
The YumRepo.dump() function does not produce a string that can be used as a
yum .repo file. So do this manually with only the attributes we care about.
"""
repo_str = "[%s]\n" % repo["id"]
if repo["metalink"]:
repo_str += "metalink = %s\n" % repo["metalink"]
elif repo["mirrorlist"]:
repo_str += "mirrorlist = %s\n" % repo["mirrorlist"]
elif repo["baseurl"]:
repo_str += "baseurl = %s\n" % repo["baseurl"][0]
else:
raise RuntimeError("Repo has no baseurl, metalink, or mirrorlist")
# proxy is optional
if "proxy" in repo:
repo_str += "proxy = %s\n" % repo["proxy"]
repo_str += "sslverify = %s\n" % repo["sslverify"]
repo_str += "gpgcheck = %s\n" % repo["gpgcheck"]
if "gpgkey" in repo:
repo_str += "gpgkey = %s\n" % ",".join(repo["gpgkey"])
return repo_str
[docs]def repo_to_source(repo, system_source):
"""Return a Weldr Source dict created from the YumRepository
:param repo: Yum Repository
:type repo: yum.yumRepo.YumRepository
:param system_source: True if this source is an immutable system source
:type system_source: bool
:returns: A dict with Weldr Source fields filled in
:rtype: dict
Example::
{
"check_gpg": true,
"check_ssl": true,
"gpgkey_url": [
"file:///etc/pki/rpm-gpg/RPM-GPG-KEY-fedora-28-x86_64"
],
"name": "fedora",
"proxy": "http://proxy.brianlane.com:8123",
"system": true
"type": "yum-metalink",
"url": "https://mirrors.fedoraproject.org/metalink?repo=fedora-28&arch=x86_64"
}
"""
source = {"name": repo.id, "system": system_source}
if repo.baseurl:
source["url"] = repo.baseurl[0]
source["type"] = "yum-baseurl"
elif repo.metalink:
source["url"] = repo.metalink
source["type"] = "yum-metalink"
elif repo.mirrorlist:
source["url"] = repo.mirrorlist
source["type"] = "yum-mirrorlist"
else:
raise RuntimeError("Repo has no baseurl, metalink, or mirrorlist")
# proxy is optional
if repo.proxy:
source["proxy"] = repo.proxy
if not repo.sslverify:
source["check_ssl"] = False
else:
source["check_ssl"] = True
if not repo.gpgcheck:
source["check_gpg"] = False
else:
source["check_gpg"] = True
if repo.gpgkey:
source["gpgkey_urls"] = repo.gpgkey
return source
[docs]def source_to_repo(source):
"""Return an add_enable_repo kwargs dict created from a source dict
:param source: A Weldr source dict
:type source: dict
:returns: A yum YumRepository object
:rtype: yum.yumRepo.YumRepository
The dict it suitable for passing to yum's add_enable_repo function
after popping off baseurl and mirrorlist.
Example::
{
"gpgcheck": True,
"sslverify": True,
"gpgkey": ["file:///etc/pki/rpm-gpg/RPM-GPG-KEY-fedora-28-x86_64"],
"id": "fedora",
"proxy": "http://proxy.brianlane.com:8123",
"baseurl": "https://mirrors.fedoraproject.org/metalink?repo=fedora-28&arch=x86_64",
"metalink": None,
"mirrorlist": None
}
"""
repo = {"id": source["name"]}
# This will allow errors to be raised so we can catch them
# without this they are logged, but the repo is silently disabled
repo["skip_if_unavailable"] = False
if source["type"] == "yum-baseurl":
repo["baseurl"] = [source["url"]]
repo["metalink"] = None
repo["mirrorlist"] = None
elif source["type"] == "yum-metalink":
repo["metalink"] = source["url"]
repo["baseurl"] = []
repo["mirrorlist"] = None
elif source["type"] == "yum-mirrorlist":
repo["mirrorlist"] = source["url"]
repo["baseurl"] = []
repo["metalink"] = None
if "proxy" in source:
repo["proxy"] = source["proxy"]
if source["check_ssl"]:
repo["sslverify"] = True
else:
repo["sslverify"] = False
if source["check_gpg"]:
repo["gpgcheck"] = True
else:
repo["gpgcheck"] = False
if "gpgkey_urls" in source:
repo["gpgkey"] = source["gpgkey_urls"]
return repo
[docs]def get_source_ids(source_path):
"""Return a list of the source ids in a file
:param source_path: Full path and filename of the source (yum repo) file
:type source_path: str
:returns: A list of source id strings
:rtype: list of str
"""
if not os.path.exists(source_path):
return []
cfg = ConfigParser()
cfg.read(source_path)
return cfg.sections()
[docs]def get_repo_sources(source_glob):
"""Return a list of sources from a directory of yum repositories
:param source_glob: A glob to use to match the source files, including full path
:type source_glob: str
:returns: A list of the source ids in all of the matching files
:rtype: list of str
"""
sources = []
for f in glob(source_glob):
sources.extend(get_source_ids(f))
return sources
[docs]def delete_repo_source(source_glob, source_name):
"""Delete a source from a repo file
:param source_glob: A glob of the repo sources to search
:type source_glob: str
:returns: None
:raises: ProjectsError if there was a problem
A repo file may have multiple sources in it, delete only the selected source.
If it is the last one in the file, delete the file.
WARNING: This will delete ANY source, the caller needs to ensure that a system
source_name isn't passed to it.
"""
found = False
for f in glob(source_glob):
try:
cfg = ConfigParser()
cfg.read(f)
if source_name in cfg.sections():
found = True
cfg.remove_section(source_name)
# If there are other sections, rewrite the file without the deleted one
if len(cfg.sections()) > 0:
with open(f, "w") as cfg_file:
cfg.write(cfg_file)
else:
# No sections left, just delete the file
os.unlink(f)
except Exception as e:
raise ProjectsError("Problem deleting repo source %s: %s" % (source_name, str(e)))
if not found:
raise ProjectsError("source %s not found" % source_name)