Source code for gridkit._statistical_functions

import numpy

from gridkit.bounded_grid import BoundedGrid
from gridkit.errors import AlignmentError
from gridkit.index import GridIndex
from gridkit.tile import Tile, average_data_tiles, count_tiles, sum_data_tiles


def _total_bounds(left_bounds, right_bounds):
    return (
        min(left_bounds[0], right_bounds[0]),
        min(left_bounds[1], right_bounds[1]),
        max(left_bounds[2], right_bounds[2]),
        max(left_bounds[3], right_bounds[3]),
    )



[docs]
def total_bounds(grids):
    if len(grids) == 1:
        return grids[0].bounds

    combined_bounds = grids[0].bounds
    for grid in grids[1:]:
        combined_bounds = _total_bounds(combined_bounds, grid.bounds)
    return combined_bounds



def _empty_combined_grid(grids, value=numpy.nan):
    reference = grids[0]
    if not all([grid.is_aligned_with(reference)[0] for grid in grids[1:]]):
        raise AlignmentError(
            "Not all grids are aligned. Please `resample` all grids on the same grid."
        )

    combined_bounds = total_bounds(grids)
    _, shape = grids[0].cells_in_bounds(
        combined_bounds, return_cell_count=True
    )  # TODO: split ids and shape outputs into different methods
    combined_data = numpy.full(  # data shape is y,x
        shape,
        value,
        dtype=float,  # Fixme: don't hardcode dtype. This if workaround for working with NaNs
    )

    return reference.update(combined_data, bounds=combined_bounds, crs=reference.crs)



[docs]
def count_bounded_grids(grids):
    empty_grid = _empty_combined_grid(grids, value=0)
    combined_grid = empty_grid.copy()
    for grid in grids:
        if grid.nodata_value is None:
            value_ids = combined_grid.cells_in_bounds(grid.bounds)
        else:
            value_ids = grid != grid.nodata_value
        numpy_ids = combined_grid.grid_id_to_numpy_id(value_ids.ravel())
        combined_grid._data[numpy_ids] += 1
    return combined_grid




[docs]
def count(grids_or_tiles):
    """See :func:`gridkit.tile.count_tiles`"""
    if all([isinstance(obj, BoundedGrid) for obj in grids_or_tiles]):
        return count_bounded_grids(grids_or_tiles)
    if all([isinstance(obj, Tile) for obj in grids_or_tiles]):
        return count_tiles(grids_or_tiles)
    raise TypeError(
        "Either not all types are the same or the tiles are not of type gridkit.BoundedGrid or gridkit.Tile"
    )




[docs]
def sum_bounded_grids(grids):
    empty_grid = _empty_combined_grid(grids, value=numpy.nan)
    combined_grid = empty_grid.copy()
    for (
        grid
    ) in grids:  # add zero instead of NaN where there is coverage to allow adding
        combined_grid.assign(0, bounds=grid.bounds, in_place=True)
    empty_grid = _empty_combined_grid(grids, value=0)  # TODO: add `replace` function
    for grid in grids:  # add the values
        combined_grid += empty_grid.assign(
            grid.data, bounds=grid.bounds, in_place=False
        )
    return combined_grid




[docs]
def sum(grids_or_tiles):
    """See :func:`gridkit.tile.sum_data_tiles`"""
    if all([isinstance(obj, BoundedGrid) for obj in grids_or_tiles]):
        return sum_bounded_grids(grids_or_tiles)
    if all([isinstance(obj, Tile) for obj in grids_or_tiles]):
        return sum_data_tiles(grids_or_tiles)
    raise TypeError(
        "Either not all types are the same or the tiles are not of type gridkit.BoundedGrid or gridkit.Tile"
    )




[docs]
def mean_bounded_grids(grids):
    return sum(grids) / count(grids)




[docs]
def mean(grids_or_tiles):
    """See :func:`gridkit.tile.average_data_tiles`"""
    if all([isinstance(obj, BoundedGrid) for obj in grids_or_tiles]):
        return mean_bounded_grids(grids_or_tiles)
    if all([isinstance(obj, Tile) for obj in grids_or_tiles]):
        return average_data_tiles(grids_or_tiles)
    raise TypeError(
        "Either not all types are the same or the tiles are not of type gridkit.BoundedGrid or gridkit.Tile"
    )