Source code for pygmt.src.grdhisteq

"""
grdhisteq - Perform histogram equalization for a grid.
"""

import pandas as pd
from pygmt.clib import Session
from pygmt.exceptions import GMTInvalidInput
from pygmt.helpers import (
    GMTTempFile,
    args_in_kwargs,
    build_arg_string,
    fmt_docstring,
    kwargs_to_strings,
    use_alias,
)
from pygmt.io import load_dataarray


[docs]@fmt_docstring
@use_alias(
    C="divisions",
    D="outfile",
    G="outgrid",
    R="region",
    N="gaussian",
    Q="quadratic",
    V="verbose",
)
@kwargs_to_strings(R="sequence")
def grdhisteq(grid, **kwargs):
    r"""
    Perform histogram equalization for a grid.

    Two common use cases of :meth:`pygmt.grdhisteq` are to find data values
    that divide a grid into patches of equal area or to write a grid with
    statistics based on some kind of cumulative distribution function.

    Histogram equalization provides a way to highlight data that has most
    values clustered in a small portion of the dynamic range, such as a grid
    of flat topography with a mountain in the middle. Ordinary gray shading of
    this grid (using :meth:`pygmt.Figure.grdimage` or
    :meth:`pygmt.Figure.grdview`) with a linear mapping from topography to
    graytone will result in most of the image being very dark gray, with the
    mountain being almost white. :meth:`pygmt.grdhisteq` can provide a list of
    data values that divide the data range into divisions which have an equal
    area in the image [Default is 16 if ``divisions`` is not set]. The
    :class:`pandas.DataFrame` or ASCII file output can be used to make a
    colormap with :meth:`pygmt.makecpt` and an image with
    :meth:`pygmt.Figure.grdimage` that has all levels of gray occuring equally.

    :meth:`pygmt.grdhisteq` also provides a way to write a grid with statistics
    based on a cumulative distribution function. In this application, the
    ``outgrid`` has relative highs and lows in the same (x,y) locations as the
    ``grid``, but the values are changed to reflect their place in the
    cumulative distribution.

    Must provide ``outfile`` or ``outgrid``.

    Full option list at :gmt-docs:`grdhisteq.html`

    {aliases}

    Parameters
    ----------
    grid : str or xarray.DataArray
        The file name of the input grid or the grid loaded as a DataArray.
    outgrid : str or bool or None
        The name of the output netCDF file with extension .nc to store the grid
        in.
    outfile : str or bool or None
        The name of the output ASCII file to store the results of the
        histogram equalization in. Not allowed if ``outgrid`` is used.
    divisions : int
        Set the number of divisions of the data range.

    {R}
    {V}

    Returns
    -------
    ret: pandas.DataFrame or xarray.DataArray or None
        Return type depends on whether the ``outgrid`` parameter is set:

        - pandas.DataFrame if ``outfile`` is True
        - xarray.DataArray if ``outgrid`` is True
        - None if ``outgrid`` is a str (grid output is stored in ``outgrid``)
        - None if ``outfile`` is a str (file output is stored in ``outfile``)

    See Also
    -------
    :meth:`pygmt.grd2cpt`
    """
    if "D" in kwargs and "G" in kwargs:
        raise GMTInvalidInput("Cannot use both ``outfile`` and ``outgrid``.")
    if not args_in_kwargs(["D", "G"], kwargs):
        raise GMTInvalidInput("Must set ``outgrid`` or ``outfile``.")
    with GMTTempFile(suffix=".nc") as tmpfile:
        with Session() as lib:
            file_context = lib.virtualfile_from_data(check_kind="raster", data=grid)
            with file_context as infile:
                # Return table data if outgrid is not set
                if "G" not in kwargs or kwargs["G"] is None:
                    # Return pd.Dataframe if filename not provided
                    if "D" not in kwargs or kwargs["D"] is True:
                        outfile = tmpfile.name
                    else:  # Return set output to file Name
                        outfile = kwargs["D"]
                    # Temporary workaround to GMT bug, see GitHub issue 5785
                    kwargs.update({"D": True})
                    kwargs.update({">": outfile})
                else:  # NetCDF or xarray.DataArray output if outgrid is set
                    if kwargs["G"] is True:
                        kwargs.update({"G": tmpfile.name})
                    outgrid = kwargs["G"]
                arg_str = " ".join([infile, build_arg_string(kwargs)])
                lib.call_module("grdhisteq", arg_str)

        try:  # Try returning a xr.DataArray
            result = load_dataarray(outgrid) if outgrid == tmpfile.name else None
        except UnboundLocalError:  # if outgrid unset, return pd.DataFrame or text file
            result = (
                pd.read_csv(outfile, sep="\t", header=None)
                if outfile == tmpfile.name
                else None
            )
    return result