# Source code for spack.detection.path

# Copyright 2013-2024 Lawrence Livermore National Security, LLC and other
# Spack Project Developers. See the top-level COPYRIGHT file for details.
#
# SPDX-License-Identifier: (Apache-2.0 OR MIT)
"""Detection of software installed in the system, based on paths inspections
and running executables.
"""
import collections
import concurrent.futures
import os
import os.path
import re
import sys
import warnings
from typing import Dict, List, Optional, Set, Tuple

import llnl.util.filesystem
import llnl.util.lang
import llnl.util.tty

import spack.util.elf as elf_utils
import spack.util.environment
import spack.util.environment as environment
import spack.util.ld_so_conf

from .common import (
    DetectedPackage,
    WindowsCompilerExternalPaths,
    WindowsKitExternalPaths,
    _convert_to_iterable,
    compute_windows_program_path_for_package,
    compute_windows_user_path_for_package,
    executable_prefix,
    find_win32_additional_install_paths,
    library_prefix,
    path_to_dict,
)

#: Timeout used for package detection (seconds); win32 gets twice the budget
DETECTION_TIMEOUT = 120 if sys.platform == "win32" else 60


def common_windows_package_paths(pkg_cls=None) -> List[str]:
    """Collect common Windows install locations that are outside the PATH.

    Args:
        pkg_cls: optional package class. When truthy, the results of
            ``compute_windows_user_path_for_package`` and
            ``compute_windows_program_path_for_package`` for it are appended.

    Returns:
        The collected list of paths; always ``[]`` when not running on win32.
    """
    if sys.platform != "win32":
        return []

    locations = WindowsCompilerExternalPaths.find_windows_compiler_bundled_packages()

    # Package-independent locations, queried in a fixed order
    generic_sources = (
        find_win32_additional_install_paths,
        WindowsKitExternalPaths.find_windows_kit_bin_paths,
        WindowsKitExternalPaths.find_windows_kit_reg_installed_roots_paths,
        WindowsKitExternalPaths.find_windows_kit_reg_sdk_paths,
    )
    for source in generic_sources:
        locations.extend(source())

    # Package-specific locations
    if pkg_cls:
        for per_package_source in (
            compute_windows_user_path_for_package,
            compute_windows_program_path_for_package,
        ):
            locations.extend(per_package_source(pkg_cls))

    return locations
def file_identifier(path):
    """Return the ``(st_dev, st_ino)`` pair that ``os.stat`` reports for ``path``."""
    info = os.stat(path)
    return info.st_dev, info.st_ino
def executables_in_path(path_hints: List[str]) -> Dict[str, str]:
    """Get the paths of all executables found under the given path hints.

    For convenience, this is constructed as a dictionary where the keys are
    the executable paths and the values are the names of the executables
    (i.e. the basename of the executable path).

    There may be multiple paths with the same basename. In this case it is
    assumed there are two different instances of the executable.

    Args:
        path_hints: list of paths to be searched. The list is unpacked as-is,
            so ``None`` is not accepted and the PATH environment variable is
            not consulted here; callers that want a PATH-based default must
            resolve it first (``ExecutablesFinder.default_path_hints`` does).

    Returns:
        The dictionary built by ``path_to_dict`` from the expanded search paths.
    """
    search_paths = llnl.util.filesystem.search_paths_for_executables(*path_hints)
    return path_to_dict(search_paths)
def get_elf_compat(path):
    """Read the ELF header of ``path`` and return its compatibility triplet.

    The triplet is ``(is_64_bit, is_little_endian, e_machine)``, i.e. the
    (EI_CLASS, EI_DATA, e_machine) information that callers compare against
    the host's own triplet.
    """
    # On ELF platforms we try to be a bit smarter when it comes to shared
    # libraries, by dropping those that are not host compatible. Only the
    # header is parsed.
    with open(path, "rb") as stream:
        parsed = elf_utils.parse_elf(stream, only_header=True)
        machine = parsed.elf_hdr.e_machine
        return (parsed.is_64_bit, parsed.is_little_endian, machine)
def accept_elf(path, host_compat):
    """Decide whether ``path`` should be accepted as a library candidate.

    A file whose ELF header can be parsed is accepted only when its triplet
    equals ``host_compat`` (as obtained with :py:func:`get_elf_compat`).
    Anything else (e.g. a static library, or some arbitrary file) falls back
    to a plain ``is_readable_file`` check.
    """
    # Fast path: assume libraries at least have .so in their basename.
    # Note: don't replace with splitext, because of libsmth.so.1.2.3 file names.
    may_be_shared_library = ".so" in os.path.basename(path)
    if may_be_shared_library:
        try:
            return get_elf_compat(path) == host_compat
        except (OSError, elf_utils.ElfParsingError):
            # Not parseable as ELF: use the readability fallback below
            pass
    return llnl.util.filesystem.is_readable_file(path)
def libraries_in_ld_and_system_library_path(
    path_hints: Optional[List[str]] = None,
) -> Dict[str, str]:
    """Get the paths of all libraries available from ``path_hints`` or the following defaults:

    - Environment variables (Linux: ``LD_LIBRARY_PATH``, Darwin: ``DYLD_LIBRARY_PATH``, and
      ``DYLD_FALLBACK_LIBRARY_PATH``)
    - Dynamic linker search paths reported by
      ``spack.util.ld_so_conf.host_dynamic_linker_search_paths()``
      (glibc: ld.so.conf, musl: ld-musl-<arch>.path)

    For convenience, this is constructed as a dictionary where the keys are
    the library paths and the values are the names of the libraries
    (i.e. the basename of the library path).

    There may be multiple paths with the same basename. In this case it is
    assumed there are two different instances of the library.

    Args:
        path_hints: list of paths to be searched. If ``None`` or empty, the defaults
            listed above are used instead.

    Returns:
        Mapping from the full path of every accepted directory entry to its basename.
        Directories that cannot be listed are skipped with a debug message.
    """
    if path_hints:
        search_paths = llnl.util.filesystem.search_paths_for_libraries(*path_hints)
    else:
        search_paths = []

        # Environment variables
        if sys.platform == "darwin":
            search_paths.extend(environment.get_path("DYLD_LIBRARY_PATH"))
            search_paths.extend(environment.get_path("DYLD_FALLBACK_LIBRARY_PATH"))
        elif sys.platform.startswith("linux"):
            search_paths.extend(environment.get_path("LD_LIBRARY_PATH"))

        # Dynamic linker paths
        search_paths.extend(spack.util.ld_so_conf.host_dynamic_linker_search_paths())

    # Drop anything that is not a directory: file_identifier() needs to stat the
    # entry and the scan below needs to list it
    search_paths = [path for path in search_paths if os.path.isdir(path)]

    # Make sure we don't doubly list /usr/lib and /lib etc
    search_paths = list(llnl.util.lang.dedupe(search_paths, key=file_identifier))

    try:
        host_compat = get_elf_compat(sys.executable)
    except (OSError, elf_utils.ElfParsingError):
        # The interpreter could not be parsed as ELF: only require readability
        accept = llnl.util.filesystem.is_readable_file
    else:
        accept = lambda path: accept_elf(path, host_compat)  # noqa: E731

    path_to_lib = {}
    # Walk the search directories in reverse order, so that entries from the
    # first search path are inserted last
    for search_path in reversed(search_paths):
        try:
            entries = os.listdir(search_path)
        except OSError as e:
            # An unreadable or vanished directory must not abort the whole scan
            llnl.util.tty.debug(f"cannot scan '{search_path}' for external software: {e}")
            continue

        for lib in entries:
            lib_path = os.path.join(search_path, lib)
            if accept(lib_path):
                path_to_lib[lib_path] = lib

    return path_to_lib
def libraries_in_windows_paths(path_hints: Optional[List[str]] = None) -> Dict[str, str]:
    """Get the paths of all libraries reachable from the given hints, or from PATH.

    For more details, see `libraries_in_ld_and_system_library_path` regarding
    return type and contents.

    Args:
        path_hints: list of paths to be searched. If None, the entries of the PATH
            environment variable are used, and the Windows kit library paths and
            Windows driver development kit paths are added to the search.
    """
    use_defaults = path_hints is None
    roots = spack.util.environment.get_path("PATH") if use_defaults else path_hints

    dirs = llnl.util.filesystem.search_paths_for_libraries(*roots)
    # on Windows, some libraries (.dlls) are found in the bin directory or sometimes
    # at the search root. Add both of those options to the search scheme
    dirs.extend(llnl.util.filesystem.search_paths_for_executables(*roots))

    if use_defaults:
        # if no user provided path was given, add defaults to the search
        dirs.extend(WindowsKitExternalPaths.find_windows_kit_lib_paths())
        # SDK and WGL should be handled by above, however on occasion the WDK is in an
        # atypical location, so we handle that case specifically.
        dirs.extend(WindowsKitExternalPaths.find_windows_driver_development_kit_paths())

    return path_to_dict(dirs)
def _group_by_prefix(paths: Set[str]) -> Dict[str, Set[str]]:
    """Bucket ``paths`` by their parent directory (``os.path.dirname``)."""
    by_parent = collections.defaultdict(set)
    for entry in paths:
        parent = os.path.dirname(entry)
        by_parent[parent].add(entry)
    return by_parent
class Finder:
    """Inspects the file-system looking for packages. Guesses places where to look using PATH."""

    def default_path_hints(self) -> List[str]:
        """Return the paths searched by ``find`` when no initial guess is given."""
        return []

    def search_patterns(self, *, pkg: "spack.package_base.PackageBase") -> List[str]:
        """Returns the list of patterns used to match candidate files.

        Args:
            pkg: package being detected
        """
        raise NotImplementedError("must be implemented by derived classes")

    def candidate_files(self, *, patterns: List[str], paths: List[str]) -> List[str]:
        """Returns a list of candidate files found on the system.

        Args:
            patterns: search patterns to be used for matching files
            paths: paths where to search for files
        """
        raise NotImplementedError("must be implemented by derived classes")

    def prefix_from_path(self, *, path: str) -> str:
        """Given a path where a file was found, returns the corresponding prefix.

        Args:
            path: path of a detected file
        """
        raise NotImplementedError("must be implemented by derived classes")

    def detect_specs(
        self, *, pkg: "spack.package_base.PackageBase", paths: List[str]
    ) -> List[DetectedPackage]:
        """Given a list of files matching the search patterns, returns a list of detected specs.

        Files are grouped by parent directory and ``pkg.determine_spec_details`` is called
        once per directory. Errors raised while determining or validating specs are turned
        into warnings, and the offending directory or spec is skipped.

        Args:
            pkg: package being detected
            paths: files matching the package search patterns

        Returns:
            One ``DetectedPackage`` per accepted spec; ``[]`` (after a warning) if ``pkg``
            does not define ``determine_spec_details``.
        """
        if not hasattr(pkg, "determine_spec_details"):
            warnings.warn(
                f"{pkg.name} must define 'determine_spec_details' in order"
                f" for Spack to detect externally-provided instances"
                f" of the package."
            )
            return []

        result = []
        for candidate_path, items_in_prefix in sorted(_group_by_prefix(set(paths)).items()):
            # TODO: multiple instances of a package can live in the same
            # prefix, and a package implementation can return multiple specs
            # for one prefix, but without additional details (e.g. about the
            # naming scheme which differentiates them), the spec won't be
            # usable.
            try:
                specs = _convert_to_iterable(
                    pkg.determine_spec_details(candidate_path, items_in_prefix)
                )
            except Exception as e:
                specs = []
                warnings.warn(f'error detecting "{pkg.name}" from prefix {candidate_path} [{e}]')

            if not specs:
                files = ", ".join(_convert_to_iterable(items_in_prefix))
                llnl.util.tty.debug(
                    f"The following files in {candidate_path} were decidedly not "
                    f"part of the package {pkg.name}: {files}"
                )
                continue

            # The prefix depends only on the directory, so compute it once per
            # directory instead of once per spec
            prefix = self.prefix_from_path(path=candidate_path)
            if not prefix:
                continue

            # NOTE(review): this mapping is reset for every directory, so the check
            # below only catches duplicates within one directory - confirm whether
            # de-duplication across directories was intended.
            resolved_specs: Dict[spack.spec.Spec, str] = {}  # spec -> exe found for the spec
            for spec in specs:
                if spec in resolved_specs:
                    prior_prefix = ", ".join(_convert_to_iterable(resolved_specs[spec]))
                    llnl.util.tty.debug(
                        f"Files in {candidate_path} and {prior_prefix} are both associated"
                        f" with the same spec {spec}"
                    )
                    continue

                resolved_specs[spec] = candidate_path
                try:
                    spec.validate_detection()
                except Exception as e:
                    msg = (
                        f'"{spec}" has been detected on the system but will '
                        f"not be added to packages.yaml [reason={e}]"
                    )
                    warnings.warn(msg)
                    continue

                # A prefix recorded on the spec itself wins over the computed one
                result.append(DetectedPackage(spec=spec, prefix=spec.external_path or prefix))

        return result

    def find(
        self, *, pkg_name: str, initial_guess: Optional[List[str]] = None
    ) -> List[DetectedPackage]:
        """For a given package, returns a list of detected specs.

        Args:
            pkg_name: package being detected
            initial_guess: initial list of paths to search from the caller if None, default paths
                are searched. If this is an empty list, nothing will be searched.
        """
        import spack.repo

        pkg_cls = spack.repo.PATH.get_pkg_class(pkg_name)
        patterns = self.search_patterns(pkg=pkg_cls)
        if not patterns:
            return []

        if initial_guess is None:
            # Build a new list rather than extending the object handed back by
            # default_path_hints(), which a subclass may share between calls
            initial_guess = [
                *self.default_path_hints(),
                *common_windows_package_paths(pkg_cls),
            ]

        candidates = self.candidate_files(patterns=patterns, paths=initial_guess)
        return self.detect_specs(pkg=pkg_cls, paths=candidates)
class ExecutablesFinder(Finder):
    """Finder that matches package patterns against the names of executables."""

    def default_path_hints(self) -> List[str]:
        """Return the entries of the ``PATH`` environment variable."""
        return spack.util.environment.get_path("PATH")

    def search_patterns(self, *, pkg: "spack.package_base.PackageBase") -> List[str]:
        """Return ``pkg.platform_executables()``, or ``[]`` if ``pkg`` lacks either the
        ``executables`` or the ``platform_executables`` attribute.
        """
        declares_executables = hasattr(pkg, "executables") and hasattr(
            pkg, "platform_executables"
        )
        if not declares_executables:
            return []
        return pkg.platform_executables()

    def candidate_files(self, *, patterns: List[str], paths: List[str]) -> List[str]:
        """Return the sorted, unique paths of executables whose name matches any pattern."""
        executables_by_path = executables_in_path(path_hints=paths)
        compiled_patterns = [re.compile(x) for x in patterns]
        matching_paths = {
            path
            for path, exe in executables_by_path.items()
            if any(compiled_re.search(exe) for compiled_re in compiled_patterns)
        }
        return sorted(matching_paths)

    def prefix_from_path(self, *, path: str) -> str:
        """Return ``executable_prefix(path)``; a falsy result is also logged at debug level."""
        prefix = executable_prefix(path)
        if prefix:
            return prefix
        llnl.util.tty.debug(f"no bin/ dir found in {path}. Cannot add it as a Spack package")
        return prefix
class LibrariesFinder(Finder):
    """Finds libraries on the system.

    Candidates are collected by ``libraries_in_ld_and_system_library_path`` (or by
    ``libraries_in_windows_paths`` on win32); when no search paths are given the former
    falls back to LD_LIBRARY_PATH, DYLD_LIBRARY_PATH, DYLD_FALLBACK_LIBRARY_PATH, and the
    dynamic linker search paths.
    """

    def search_patterns(self, *, pkg: "spack.package_base.PackageBase") -> List[str]:
        """Return ``pkg.libraries`` when the package defines it, otherwise ``[]``."""
        result = []
        if hasattr(pkg, "libraries"):
            result = pkg.libraries
        return result

    def candidate_files(self, *, patterns: List[str], paths: List[str]) -> List[str]:
        """Return the sorted, unique paths of libraries whose name matches any pattern.

        Args:
            patterns: regular expressions searched in each library's basename
            paths: paths where to search for libraries
        """
        if sys.platform == "win32":
            libraries_by_path = libraries_in_windows_paths(path_hints=paths)
        else:
            libraries_by_path = libraries_in_ld_and_system_library_path(path_hints=paths)

        compiled_patterns = [re.compile(x) for x in patterns]
        # A set keeps a file matched by several patterns from being listed twice;
        # sorting mirrors ExecutablesFinder.candidate_files and makes the order stable
        matching_paths = {
            path
            for path, lib in libraries_by_path.items()
            if any(compiled_re.search(lib) for compiled_re in compiled_patterns)
        }
        return sorted(matching_paths)

    def prefix_from_path(self, *, path: str) -> str:
        """Return ``library_prefix(path)``; a falsy result is also logged at debug level."""
        result = library_prefix(path)
        if not result:
            msg = f"no lib/ or lib64/ dir found in {path}. Cannot add it as a Spack package"
            llnl.util.tty.debug(msg)
        return result
def by_path(
    packages_to_search: List[str],
    *,
    path_hints: Optional[List[str]] = None,
    max_workers: Optional[int] = None,
) -> Dict[str, List[DetectedPackage]]:
    """Return the list of packages that have been detected on the system, keyed by
    unqualified package name.

    An executables search and a libraries search are submitted to a process pool for each
    package. A search that times out (``DETECTION_TIMEOUT`` seconds) or raises is logged at
    debug level and skipped.

    Args:
        packages_to_search: list of packages to be detected. Each package can be either unqualified
            or fully qualified
        path_hints: initial list of paths to be searched
        max_workers: maximum number of workers to search for packages in parallel
    """
    # Imported locally, as Finder.find does. Without it, the partition_package_name lookup
    # below only works if some other module has already loaded spack.repo; otherwise the
    # AttributeError would be swallowed by the generic handler and every package skipped.
    import spack.repo

    # TODO: Packages should be able to define both .libraries and .executables in the future
    # TODO: determine_spec_details should get all relevant libraries and executables in one call
    executables_finder, libraries_finder = ExecutablesFinder(), LibrariesFinder()
    detected_specs_by_package: Dict[str, Tuple[concurrent.futures.Future, ...]] = {}

    result = collections.defaultdict(list)
    with concurrent.futures.ProcessPoolExecutor(max_workers=max_workers) as executor:
        for pkg in packages_to_search:
            executable_future = executor.submit(
                executables_finder.find, pkg_name=pkg, initial_guess=path_hints
            )
            library_future = executor.submit(
                libraries_finder.find, pkg_name=pkg, initial_guess=path_hints
            )
            detected_specs_by_package[pkg] = executable_future, library_future

        for pkg_name, futures in detected_specs_by_package.items():
            for future in futures:
                try:
                    detected = future.result(timeout=DETECTION_TIMEOUT)
                    if detected:
                        _, unqualified_name = spack.repo.partition_package_name(pkg_name)
                        result[unqualified_name].extend(detected)
                except concurrent.futures.TimeoutError:
                    llnl.util.tty.debug(
                        f"[EXTERNAL DETECTION] Skipping {pkg_name}: timeout reached"
                    )
                except Exception as e:
                    llnl.util.tty.debug(
                        f"[EXTERNAL DETECTION] Skipping {pkg_name}: exception occured {e}"
                    )

    return result