Source code for mirgecom.array_context

"""Provide some utilities for handling ArrayContexts.

.. autofunction:: get_reasonable_array_context_class
.. autofunction:: actx_class_is_lazy
.. autofunction:: actx_class_is_eager
.. autofunction:: actx_class_is_profiling
.. autofunction:: actx_class_is_numpy
.. autofunction:: actx_class_is_distributed
.. autofunction:: initialize_actx
"""

__copyright__ = """
Copyright (C) 2023 University of Illinois Board of Trustees
"""

__license__ = """
Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in
all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
THE SOFTWARE.
"""

from typing import Type, Dict, Any, Tuple
import os
import logging

import pyopencl as cl
from arraycontext import (ArrayContext, PyOpenCLArrayContext,
                          PytatoPyOpenCLArrayContext)

logger = logging.getLogger(__name__)



[docs]
def get_reasonable_array_context_class(*, lazy: bool, distributed: bool,
                        profiling: bool, numpy: bool = False) -> Type[ArrayContext]:
    """Return a :class:`~arraycontext.ArrayContext` with the given constraints."""
    if lazy and profiling:
        raise ValueError("Can't specify both lazy and profiling")

    if numpy:
        if profiling:
            raise ValueError("Can't specify both numpy and profiling")
        if lazy:
            raise ValueError("Can't specify both numpy and lazy")

        if distributed:
            from grudge.array_context import MPINumpyArrayContext
            return MPINumpyArrayContext
        else:
            from grudge.array_context import NumpyArrayContext
            return NumpyArrayContext

    if profiling:
        from mirgecom.profiling import PyOpenCLProfilingArrayContext
        return PyOpenCLProfilingArrayContext

    from grudge.array_context import \
        get_reasonable_array_context_class as grudge_get_reasonable_actx_class

    return grudge_get_reasonable_actx_class(lazy=lazy, distributed=distributed)




[docs]
def actx_class_is_lazy(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* is lazy."""
    return issubclass(actx_class, PytatoPyOpenCLArrayContext)




[docs]
def actx_class_is_eager(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* is eager."""
    return issubclass(actx_class, PyOpenCLArrayContext)




[docs]
def actx_class_is_profiling(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* has profiling enabled."""
    from mirgecom.profiling import PyOpenCLProfilingArrayContext
    return issubclass(actx_class, PyOpenCLProfilingArrayContext)



def actx_class_is_pyopencl(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* is PyOpenCL-based."""
    return actx_class_is_lazy(actx_class) or actx_class_is_eager(actx_class)



[docs]
def actx_class_is_numpy(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* is numpy-based."""
    from grudge.array_context import NumpyArrayContext
    return issubclass(actx_class, NumpyArrayContext)




[docs]
def actx_class_is_distributed(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* is distributed."""
    from grudge.array_context import MPIBasedArrayContext
    return issubclass(actx_class, MPIBasedArrayContext)



def actx_class_has_fallback_args(actx_class: Type[ArrayContext]) -> bool:
    """Return True if *actx_class* has fallback arguments."""
    import inspect
    spec = inspect.getfullargspec(actx_class.__init__)
    return "use_axis_tag_inference_fallback" in spec.args


def _check_cache_dirs_node(actx: ArrayContext) -> None:
    """Check whether multiple ranks share cache directories on the same node."""
    if not actx_class_is_distributed(type(actx)):
        return

    from mpi4py import MPI

    size = MPI.COMM_WORLD.Get_size()

    if size <= 1:
        return

    from mirgecom.mpi import shared_split_comm_world

    with shared_split_comm_world() as node_comm:
        node_rank = node_comm.Get_rank()

        def _check_var(var: str) -> None:
            from warnings import warn

            try:
                my_path = os.environ[var]
            except KeyError:
                warn(f"Please set the '{var}' variable in your job script to "
                    "avoid file system overheads when running on large numbers of "
                    "ranks. See https://mirgecom.readthedocs.io/en/latest/running/large-systems.html "  # noqa: E501
                    "for more information.")
                # Create a fake path so there will not be a second warning below.
                my_path = f"no/such/path/rank{node_rank}"

            all_paths = node_comm.gather(my_path, root=0)

            if node_rank == 0:
                assert all_paths
                if len(all_paths) != len(set(all_paths)):
                    hostname = MPI.Get_processor_name()
                    dup = [path for path in set(all_paths)
                                if all_paths.count(path) > 1]

                    from warnings import warn
                    warn(f"Multiple ranks are sharing '{var}' on node '{hostname}'. "
                        f"Duplicate '{var}'s: {dup}.")

        _check_var("XDG_CACHE_HOME")

        if os.environ.get("XDG_CACHE_HOME") is None:
            # When XDG_CACHE_HOME is set but POCL_CACHE_DIR is not, pocl
            # will use XDG_CACHE_HOME as the cache directory.
            _check_var("POCL_CACHE_DIR")

        # We haven't observed an issue yet that 'CUDA_CACHE_PATH' fixes,
        # so disable this check for now.
        # _check_var("CUDA_CACHE_PATH")


def _check_gpu_oversubscription(actx: ArrayContext) -> None:
    """
    Check whether multiple ranks are running on the same GPU on each node.

    Only works with CUDA or AMD devices currently.
    """
    if not actx_class_is_distributed(type(actx)):
        return

    from mpi4py import MPI
    import pyopencl as cl

    assert isinstance(actx, (PyOpenCLArrayContext, PytatoPyOpenCLArrayContext))

    size = MPI.COMM_WORLD.Get_size()

    if size <= 1:
        return

    dev = actx.queue.device

    # Only check GPU devices
    if not (dev.type & cl.device_type.GPU):
        return

    from pyopencl.characterize import nv_compute_capability
    if nv_compute_capability(dev) is not None:
        try:
            domain_id = hex(dev.pci_domain_id_nv)
        except (cl._cl.LogicError, AttributeError):
            from warnings import warn
            warn("Cannot detect whether multiple ranks are running on the"
                 " same GPU because it requires Nvidia GPUs running with"
                 " pyopencl>2021.1.1 and (Nvidia CL or pocl>1.6).")
            raise

        bus_id = hex(dev.pci_bus_id_nv)
        slot_id = hex(dev.pci_slot_id_nv)
        dev_id: Tuple[Any, ...] = (domain_id, bus_id, slot_id)

    elif dev.platform.vendor.startswith("Advanced Micro") \
            and "MI300A" not in dev.board_name_amd:
        # FIXME: Can't detect GPU ID on MI300A (and perhaps other AMD GPUs), since
        # the values for dev.topology_amd are identical on the APUs, and pyopencl
        # does not support the cl_amd_copy_buffer_p2p extension, which is
        # the only way to distinguish APUs from each other.
        dev_id = (dev.topology_amd.bus,)
    else:
        from warnings import warn
        warn("Cannot detect whether multiple ranks are running on the"
             " same GPU.")
        return

    from mirgecom.mpi import shared_split_comm_world

    with shared_split_comm_world() as node_comm:
        node_rank = node_comm.Get_rank()

        dev_ids = node_comm.gather(dev_id, root=0)

        if node_rank == 0:
            assert dev_ids
            if len(dev_ids) != len(set(dev_ids)):
                hostname = MPI.Get_processor_name()
                dup = [item for item in dev_ids if dev_ids.count(item) > 1]

                from warnings import warn
                warn(f"Multiple ranks are sharing GPUs on node '{hostname}'. "
                     f"Duplicate PCIe IDs: {dup}.")


def _check_pocl_svm_issue(actx: ArrayContext) -> None:
    """Check for pocl version >= 6 and warn about SVM performance issue."""
    assert isinstance(actx, (PyOpenCLArrayContext, PytatoPyOpenCLArrayContext))

    dev = actx.queue.device

    # Only check if running on an NVIDIA device, where SVM is required. Otherwise,
    # just disable SVM in simutil.get_reasonable_memory_pool
    from pyopencl.characterize import nv_compute_capability
    if nv_compute_capability(dev) is None:
        return

    # TODO: Check if this is still an issue in pocl7
    from pyopencl.characterize import get_pocl_version
    pocl_version = get_pocl_version(dev.platform)
    if pocl_version is not None and pocl_version[0] >= 6:
        from warnings import warn
        warn(
            "Performance may be degraded on this device due to an issue with "
            "shared virtual memory (SVM) in pocl version >= 6. If running "
            "performance-critical simulations, consider "
            "downgrading to version 5. See "
            "https://github.com/illinois-ceesd/mirgecom/pull/1055 for more details.")


def log_disk_cache_config(actx: ArrayContext) -> None:
    """Log the disk cache configuration."""
    assert isinstance(actx, (PyOpenCLArrayContext, PytatoPyOpenCLArrayContext))

    if actx_class_is_distributed(type(actx)):
        from grudge.array_context import MPIBasedArrayContext
        assert isinstance(actx, MPIBasedArrayContext)
        rank = actx.mpi_communicator.Get_rank()
    else:
        rank = 0

    res = f"Rank {rank} disk cache config: "

    from pyopencl.characterize import nv_compute_capability, get_pocl_version
    dev = actx.queue.device

    # Variables set to a 'True' value => cache is disabled
    from pytools import strtobool
    loopy_cache_enabled = not strtobool(os.getenv("LOOPY_NO_CACHE", "False"))
    pyopencl_cache_enabled = not strtobool(os.getenv("PYOPENCL_NO_CACHE", "False"))

    loopy_cache_dir = ("(" + os.getenv("XDG_CACHE_HOME", "default dir") + ")"
                       if loopy_cache_enabled else "")
    pyopencl_cache_dir = ("(" + os.getenv("XDG_CACHE_HOME", "default dir") + ")"
                          if pyopencl_cache_enabled else "")

    res += f"loopy: {loopy_cache_enabled} {loopy_cache_dir}; "
    res += f"pyopencl: {pyopencl_cache_enabled} {pyopencl_cache_dir}; "

    if get_pocl_version(dev.platform) is not None:
        # Variable set to '0' => cache is disabled
        pocl_cache_enabled = os.getenv("POCL_KERNEL_CACHE", "1") != "0"

        # If POCL_CACHE_DIR is set, pocl uses it. Otherwise, it uses XDG_CACHE_HOME.
        pocl_cache_dir = ("("
                          + os.getenv("POCL_CACHE_DIR",
                                    os.getenv("XDG_CACHE_HOME", "default dir")) + ")"
                        if pocl_cache_enabled else "")

        res += f"pocl: {pocl_cache_enabled} {pocl_cache_dir}; "

    if nv_compute_capability(dev) is not None:
        # Variable set to '1' => cache is disabled
        cuda_cache_enabled = os.getenv("CUDA_CACHE_DISABLE", "0") != "1"
        cuda_cache_dir = ("(" + os.getenv("CUDA_CACHE_PATH", "default dir") + ")"
                          if cuda_cache_enabled else "")
        res += f"cuda: {cuda_cache_enabled} {cuda_cache_dir};"

    res += "\n"
    logger.info(res)



[docs]
def initialize_actx(
        actx_class: Type[ArrayContext],
        comm=None, *,
        use_axis_tag_inference_fallback: bool = False,
        use_einsum_inference_fallback: bool = False) -> ArrayContext:
    """Initialize a new :class:`~arraycontext.ArrayContext` based on *actx_class*."""
    from grudge.array_context import (MPIPyOpenCLArrayContext,
                                      MPIPytatoArrayContext
                                      )

    actx_kwargs: Dict[str, Any] = {}

    if comm:
        actx_kwargs["mpi_communicator"] = comm

    if actx_class_is_numpy(actx_class):
        from grudge.array_context import MPINumpyArrayContext
        if comm:
            assert issubclass(actx_class, MPINumpyArrayContext)
        else:
            assert not issubclass(actx_class, MPINumpyArrayContext)
    else:
        cl_ctx = cl.create_some_context()
        if actx_class_is_profiling(actx_class):
            queue = cl.CommandQueue(cl_ctx,
                properties=cl.command_queue_properties.PROFILING_ENABLE)
        else:
            queue = cl.CommandQueue(cl_ctx)
        actx_kwargs["queue"] = queue

        from mirgecom.simutil import get_reasonable_memory_pool
        alloc = get_reasonable_memory_pool(cl_ctx, queue)
        actx_kwargs["allocator"] = alloc

        if actx_class_is_lazy(actx_class):
            assert issubclass(actx_class, PytatoPyOpenCLArrayContext)

            if actx_class_has_fallback_args(actx_class):
                actx_kwargs["use_axis_tag_inference_fallback"] = \
                    use_axis_tag_inference_fallback
                actx_kwargs["use_einsum_inference_fallback"] = \
                    use_einsum_inference_fallback
            if comm:
                assert issubclass(actx_class, MPIPytatoArrayContext)
                actx_kwargs["mpi_base_tag"] = 12000
            else:
                assert not issubclass(actx_class, MPIPytatoArrayContext)
        else:
            assert issubclass(actx_class, PyOpenCLArrayContext)
            actx_kwargs["force_device_scalars"] = True
            if comm:
                assert issubclass(actx_class, MPIPyOpenCLArrayContext)
            else:
                assert not issubclass(actx_class, MPIPyOpenCLArrayContext)

    actx = actx_class(**actx_kwargs)

    # Check cache directories and log disk cache configuration for
    # PyOpenCL-based actx (Non-PyOpenCL actx classes don't use loopy, pyopencl,
    # or pocl, and therefore we don't need to examine their caching).
    if actx_class_is_pyopencl(actx_class):
        _check_gpu_oversubscription(actx)
        _check_cache_dirs_node(actx)
        _check_pocl_svm_issue(actx)
        log_disk_cache_config(actx)

    return actx