Source code for Bcfg2.Server.Plugins.Packages.Collection

""" ``Collection`` objects represent the set of
:class:`Bcfg2.Server.Plugins.Packages.Source.Source` objects that
apply to a given client, and can be used to query all software
repositories for a client in aggregate.  In some cases this can give
faster or more accurate results.

In most cases, ``Collection`` methods have been designed to defer the
call to the Sources in the ``Collection`` and aggregate the results as
appropriate.  The simplest ``Collection`` implemention is thus often a
simple subclass that adds no additional functionality.

Overriding Methods
------------------

As noted above, the ``Collection`` object is written expressly so that
you can subclass it and override no methods or attributes, and it will
work by deferring all calls to the Source objects it contains.  There
are thus three approaches to writing a ``Collection`` subclass:

#. Keep the superclass almost entirely intact and defer to the
   ``Source`` objects inside it. For an example of this kind of
   ``Collection`` object, see
   :mod:`Bcfg2.Server.Plugins.Packages.Apt`.

#. Keep :func:`Collection.complete` intact, and override the methods
   it calls: :func:`Collection.is_package`,
   :func:`Collection.is_virtual_package`, :func:`Collection.get_deps`,
   :func:`Collection.get_provides`, :func:`Collection.get_vpkgs`, and
   :func:`Collection.setup_data`.  There are no examples of this kind
   of ``Collection`` subclass yet.

#. Provide your own implementation of :func:`Collection.complete`, in
   which case you do not have to override the above methods.  You may
   want to override :func:`Collection.packages_from_entry`,
   :func:`Collection.packages_to_entry`, and
   :func:`Collection.get_new_packages`.  For an example of this kind
   of ``Collection`` object, see
   :mod:`Bcfg2.Server.Plugins.Packages.yum`.

In either case, you may want to override
:func:`Collection.get_groups`, :func:`Collection.get_group`,
:func:`Collection.get_essential`, :func:`Collection.get_config`,
:func:`Collection.filter_unknown`, and
:func:`Collection.build_extra_structures`.

.. _pkg-objects:

Conversion Between Package Objects and XML Entries
--------------------------------------------------

Collection objects have to translate Bcfg2 entries,
:class:`lxml.etree._Element` objects, into objects suitable for use by
the backend for resolving dependencies.  This is handled by two
functions:

* :func:`Collection.packages_from_entry` is called to translate an XML
  entry into a list of packages;

* :func:`Collection.packages_to_entry` is called to translate a list
  of packages back into an XML entry.

Because of this translation layer, the return type of any functions
below that return packages (e.g., :func:`Collection.get_group`) is
actually indeterminate; they must return an object suitable for
passing to :func:`Collection.packages_to_entry`.  Similarly, functions
that take a package as an argument (e.g.,
:func:`Collection.is_package`) take the appropriate package object.
In the documentation below, the actual parameter return type (usually
.``string``) used in this base implementation is noted, as well as
this fact.

The Collection Module
---------------------
"""

import copy
import lxml.etree
import Bcfg2.Options
import Bcfg2.Server.Plugin
from Bcfg2.Logger import Debuggable
from Bcfg2.Compat import any, md5  # pylint: disable=W0622
from Bcfg2.Server.FileMonitor import get_fam
from Bcfg2.Server.Statistics import track_statistics


[docs]class Collection(list, Debuggable): """ ``Collection`` objects represent the set of :class:`Bcfg2.Server.Plugins.Packages.Source` objects that apply to a given client, and can be used to query all software repositories for a client in aggregate. In some cases this can give faster or more accurate results. """ #: Whether or not this Packages backend supports package groups __package_groups__ = False def __init__(self, metadata, sources, cachepath, basepath, debug=False): """ :param metadata: The client metadata for this collection :type metadata: Bcfg2.Server.Plugins.Metadata.ClientMetadata :param sources: A list of all sources known to the server that will be used to generate the list of sources that apply to this client :type sources: list of :class:`Bcfg2.Server.Plugins.Packages.Source.Source` objects :param cachepath: The filesystem path where cache and other temporary data will be stored :type cachepath: string :param basepath: The filesystem path to the Packages plugin directory, where more permanent data can be stored :type basepath: string :param debug: Enable debugging output :type debug: bool .. ----- .. autoattribute:: __package_groups__ """ Debuggable.__init__(self) list.__init__(self, sources) self.debug_flag = self.debug_flag or debug self.metadata = metadata self.basepath = basepath self.cachepath = cachepath self.virt_pkgs = dict() self.fam = get_fam() try: self.ptype = sources[0].ptype except IndexError: self.ptype = "unknown" @property def cachekey(self): """ A unique identifier for the set of sources contained in this ``Collection`` object. This is unique to a set of sources, **not** necessarily to the client, which lets clients with identical sources share cache data.""" return md5(self.sourcelist().encode('UTF-8')).hexdigest()
[docs] def get_config(self): """ Get the configuration for the package tool used by this source type. This should be a config appropriate for use on either the server (to resolve dependencies) or the client. Subclasses must override this method in order to be able to generate configs. By default it logs an error and returns the empty string. :returns: string """ self.logger.error("Packages: Cannot generate config for host %s with " "no sources or multiple source types" % self.metadata.hostname) return ""
[docs] def sourcelist(self): """ Get a human-readable list of sources in this collection, including some information about each source. :returns: string """ srcs = [] for source in self: for url_map in source.url_map: if url_map['arch'] not in self.metadata.groups: continue reponame = source.get_repo_name(url_map) srcs.append("Name: %s" % reponame) srcs.append(" Type: %s" % source.ptype) if url_map['url']: srcs.append(" URL: %s" % url_map['url']) elif url_map['rawurl']: srcs.append(" RAWURL: %s" % url_map['rawurl']) if source.gpgkeys: srcs.append(" GPG Key(s): %s" % ", ".join(source.gpgkeys)) else: srcs.append(" GPG Key(s): None") if len(source.blacklist): srcs.append(" Blacklist: %s" % ", ".join(source.blacklist)) if len(source.whitelist): srcs.append(" Whitelist: %s" % ", ".join(source.whitelist)) srcs.append("") return "\n".join(srcs)
[docs] def get_relevant_groups(self): """ Get all groups that might be relevant to determining which sources apply to this collection's client. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_relevant_groups` :return: list of strings - group names """ groups = [] for source in self: groups.extend(source.get_relevant_groups(self.metadata)) return sorted(list(set(groups)))
@property def cachefiles(self): """ A list of the full path to all cachefiles used by this collection. The base implementation simply aggregates :attr:`Bcfg2.Server.Plugins.Packages.Source.Source.cachefile` attributes.""" cachefiles = set() for source in self: cachefiles.add(source.cachefile) return list(cachefiles)
[docs] @track_statistics() def get_groups(self, grouplist): """ Given a list of package group names, return a dict of ``<group name>: <list of packages>``. This method is provided since some backends may be able to query multiple groups at once faster than serially. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_group`. :param grouplist: The list of groups to query :type grouplist: list of strings - group names :returns: dict of ``<group name>: <list of packages>`` In this implementation the packages will be strings, but see :ref:`pkg-objects`.""" rv = dict() for group, ptype in grouplist: rv[group] = self.get_group(group, ptype) return rv
[docs] @track_statistics() def get_group(self, group, ptype=None): """ Get the list of packages of the given type in a package group. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_group`. :param group: The name of the group to query :type group: string :param ptype: The type of packages to get, for backends that support multiple package types in package groups (e.g., "recommended," "optional," etc.) :type ptype: string :returns: list of strings - package names, but see :ref:`pkg-objects` """ if not self.__package_groups__: self.logger.error("Packages: Package groups are not supported by " "%s" % self.__class__.__name__) return [] for source in self: pkgs = source.get_group(self.metadata, group, ptype=ptype) if pkgs: return pkgs self.logger.warning("Packages: '%s' is not a valid group" % group) return []
[docs] def is_package(self, package): """ Return True if a package is a package, False otherwise. The base implementation returns True if any Source object's :func:`Bcfg2.Server.Plugins.Packages.Source.Source.is_package` returns True. :param package: The name of the package, but see :ref:`pkg-objects` :type package: string :returns: bool """ return any(source.is_package(self.metadata, package) for source in self)
[docs] def is_virtual_package(self, package): """ Return True if a name is a virtual package (i.e., is a symbol provided by a real package), False otherwise. The base implementation returns True if any Source object's :func:`Bcfg2.Server.Plugins.Packages.Source.Source.is_virtual_package` returns True. :param package: The name of the symbol, but see :ref:`pkg-objects` :type package: string :returns: bool """ return any(source.is_virtual_package(self.metadata, package) for source in self)
[docs] def get_deps(self, package, recs=None): """ Get a list of the dependencies of the given package. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_deps`. :param package: The name of the symbol, but see :ref:`pkg-objects` :type package: string :returns: list of strings, but see :ref:`pkg-objects` """ recommended = None if recs and package in recs: recommended = recs[package] for source in self: if source.is_package(self.metadata, package): return source.get_deps(self.metadata, package, recommended) return []
[docs] def get_essential(self): """ Get a list of packages that are essential to the repository. The base implementation simply aggregates :attr:`Bcfg2.Server.Plugins.Packages.Source.Source.essentialpkgs` attributes :returns: list of strings, but see :ref:`pkg-objects` """ essential = set() for source in self: essential |= source.essentialpkgs return essential
[docs] def get_provides(self, package): """ Get a list of all symbols provided by the given package. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_provides`. :param package: The name of the package, but see :ref:`pkg-objects` :type package: string :returns: list of strings, but see :ref:`pkg-objects` """ for source in self: providers = source.get_provides(self.metadata, package) if providers: return providers return []
[docs] def get_vpkgs(self): """ Get a list of all virtual packages provided by all sources. The base implementation simply aggregates the results of :func:`Bcfg2.Server.Plugins.Packages.Source.Source.get_vpkgs`. :returns: list of strings, but see :ref:`pkg-objects` """ vpkgs = dict() for source in self: s_vpkgs = source.get_vpkgs(self.metadata) for name, prov_set in list(s_vpkgs.items()): if name not in vpkgs: vpkgs[name] = set(prov_set) else: vpkgs[name].update(prov_set) return vpkgs
[docs] def filter_unknown(self, unknown): """ After :func:`complete`, filter out packages that appear in the list of unknown packages but should not be presented to the user. E.g., packages that you expect to be unknown. The base implementation filters out packages that are expected to be unknown by any source in this collection. :param unknown: A set of unknown packages. The set should be modified in place. :type unknown: set of strings, but see :ref:`pkg-objects` """ for source in self: source.filter_unknown(unknown)
[docs] def build_extra_structures(self, independent): """ Add additional entries to the ``<Independent/>`` section of the final configuration. This can be used to handle, e.g., GPG keys and other entries besides packages that need to be handled for a complete client configuration. :param independent: The XML tag to add extra entries to. This is modified in place. :type independent: lxml.etree._Element """ pass
[docs] def get_additional_data(self): """ Get additional :class:`Bcfg2.Server.Plugin.interfaces.Connector` data to be supplied to :func:`Bcfg2.Server.Plugins.Packages.Packages.get_additional_data` (and thence to client metadata objects). The base implementation simply aggregates :attr:`Bcfg2.Server.Plugins.Packages.Source.Source.url_map` attributes. :returns: list of additional Connector data """ sdata = [] for source in self: sdata.extend(copy.deepcopy(source.url_map)) return sdata
[docs] def setup_data(self, force_update=False): """ Do any collection-level data setup tasks. This is called when sources are loaded or reloaded by :class:`Bcfg2.Server.Plugins.Packages.Packages`. The base implementation is a no-op; the child :class:`Bcfg2.Server.Plugins.Packages.Source.Source` objects will handle all data setup. :param force_update: Ignore all local cache and setup data from its original upstream sources (i.e., the package repositories) :type force_update: bool """ pass
[docs] def packages_from_entry(self, entry): """ Given a Package or BoundPackage entry, get a list of the package(s) described by it in a format appropriate for passing to :func:`complete`. By default, that's just the name; only the :mod:`Bcfg2.Server.Plugins.Packages.Yum` backend supports versions or other extended data. See :ref:`pkg-objects` for more details. :param entry: The XML entry describing the package or packages. :type entry: lxml.etree._Element :returns: list of strings, but see :ref:`pkg-objects` """ return [entry.get("name")]
[docs] def packages_to_entry(self, pkglist, entry): """ Given a list of package objects as returned by :func:`packages_from_entry` or :func:`complete`, return an XML tree describing the BoundPackage entries that should be included in the client configuration. See :ref:`pkg-objects` for more details. :param pkglist: A list of packages as returned by :func:`complete` :type pkglist: list of strings, but see :ref:`pkg-objects` :param entry: The base XML entry to add all of the Package entries to. This should be modified in place. :type entry: lxml.etree._Element """ for pkg in pkglist: lxml.etree.SubElement(entry, 'BoundPackage', name=pkg, version=Bcfg2.Options.setup.packages_version, type=self.ptype, origin='Packages')
[docs] def get_new_packages(self, initial, complete): """ Compute the difference between the complete package list (as returned by :func:`complete`) and the initial package list computed from the specification. This is necessary because the format may be different between the two lists due to :func:`packages_to_entry` and :func:`packages_from_entry`. See :ref:`pkg-objects` for more details. :param initial: The initial package list :type initial: set of strings, but see :ref:`pkg-objects` :param complete: The final package list :type complete: set of strings, but see :ref:`pkg-objects` :return: set of strings, but see :ref:`pkg-objects` - the set of packages that are in ``complete`` but not in ``initial`` """ return list(complete.difference(initial))
[docs] @track_statistics() def complete(self, packagelist, # pylint: disable=R0912,R0914 recommended=None): """ Build a complete list of all packages and their dependencies. :param packagelist: Set of initial packages computed from the specification. :type packagelist: set of strings, but see :ref:`pkg-objects` :returns: tuple of sets - The first element contains a set of strings (but see :ref:`pkg-objects`) describing the complete package list, and the second element is a set of symbols whose dependencies could not be resolved. """ # setup vpkg cache pgrps = tuple(self.get_relevant_groups()) if pgrps not in self.virt_pkgs: self.virt_pkgs[pgrps] = self.get_vpkgs() vpkg_cache = self.virt_pkgs[pgrps] # unclassified is set of unsatisfied requirements (may be pkg # for vpkg) unclassified = set(packagelist) vpkgs = set() both = set() pkgs = set(packagelist) packages = set() examined = set() unknown = set() final_pass = False really_done = False # do while unclassified or vpkgs or both or pkgs while unclassified or pkgs or both or final_pass: if really_done: break if len(unclassified) + len(pkgs) + len(both) == 0: # one more pass then exit really_done = True while unclassified: current = unclassified.pop() examined.add(current) is_pkg = False if self.is_package(current): is_pkg = True is_vpkg = current in vpkg_cache if is_pkg and is_vpkg: both.add(current) elif is_pkg and not is_vpkg: pkgs.add(current) elif is_vpkg and not is_pkg: vpkgs.add(current) elif not is_vpkg and not is_pkg: unknown.add(current) while pkgs: # direct packages; current can be added, and all deps # should be resolved current = pkgs.pop() self.debug_log("Packages: handling package requirement %s" % (current,)) packages.add(current) deps = self.get_deps(current, recommended) newdeps = set(deps).difference(examined) if newdeps: self.debug_log("Packages: Package %s added requirements %s" % (current, newdeps)) unclassified.update(newdeps) satisfied_vpkgs = set() for current in vpkgs: # virtual dependencies, satisfied if one of N in the # config, or can be forced if only one provider if len(vpkg_cache[current]) == 1: self.debug_log("Packages: requirement %s satisfied by %s" % (current, vpkg_cache[current])) unclassified.update( vpkg_cache[current].difference(examined)) satisfied_vpkgs.add(current) else: satisfiers = [item for item in vpkg_cache[current] if item in packages] self.debug_log("Packages: requirement %s satisfied by %s" % (current, satisfiers)) satisfied_vpkgs.add(current) vpkgs.difference_update(satisfied_vpkgs) satisfied_both = set() for current in both: # packages that are both have virtual providers as # well as a package with that name. allow use of virt # through explicit specification, then fall back to # forcing current on last pass satisfiers = [item for item in vpkg_cache[current] if item in packages] if satisfiers: self.debug_log("Packages: requirement %s satisfied by %s" % (current, satisfiers)) satisfied_both.add(current) elif current in packagelist or final_pass: pkgs.add(current) satisfied_both.add(current) both.difference_update(satisfied_both) if len(unclassified) + len(pkgs) == 0: final_pass = True else: final_pass = False self.filter_unknown(unknown) return packages, unknown
def __repr__(self): return "%s(%s)" % (self.__class__.__name__, list.__repr__(self))
[docs]def get_collection_class(source_type): """ Given a source type, determine the class of Collection object that should be used to contain these sources. Note that ``source_type`` is *not* a :class:`Bcfg2.Server.Plugins.Packages.Source.Source` subclass; it's the name of a source type as given in ``sources.xml``. :param source_type: The type of source, e.g., "yum" or "apt" :type source_type: string :returns: type - the Collection subclass that should be used to instantiate an object to contain sources of the given type. """ for mod in Bcfg2.Options.setup.packages_backends: if mod.__name__.endswith(".%s" % source_type.title()): return getattr(mod, "%sCollection" % source_type.title()) raise Bcfg2.Server.Plugin.PluginExecutionError( "Packages: No collection class found for %s sources" % source_type)