Source code for skyborn.interp.rcm2rgrid

from __future__ import annotations

import typing

import numpy as np
import xarray as xr

from .errors import ChunkError, CoordinateError
from .fortran.rcm2rgrid import drcm2rgrid, drgrid2rcm
from .missing_values import fort2py_msg, py2fort_msg

supported_types = typing.Union[xr.DataArray, np.ndarray]

# Fortran Wrappers _<funcname>()
# These wrappers are executed within dask processes (if any), and could/should
# do anything that can benefit from parallel execution.


def _rcm2rgrid(lat2d, lon2d, fi, lat1d, lon1d, msg_py):

    fi = np.transpose(fi, axes=(2, 1, 0))
    lat2d = np.transpose(lat2d, axes=(1, 0))
    lon2d = np.transpose(lon2d, axes=(1, 0))

    fi, msg_py, msg_fort = py2fort_msg(fi, msg_py=msg_py)

    fo = drcm2rgrid(lat2d, lon2d, fi, lat1d, lon1d, xmsg=msg_fort)
    fo = np.asarray(fo)
    fo = np.transpose(fo, axes=(2, 1, 0))

    fort2py_msg(fo, msg_fort=msg_fort, msg_py=msg_py)

    return fo


def _rgrid2rcm(lat1d, lon1d, fi, lat2d, lon2d, msg_py):

    fi = np.transpose(fi, axes=(2, 1, 0))
    lat2d = np.transpose(lat2d, axes=(1, 0))
    lon2d = np.transpose(lon2d, axes=(1, 0))

    fi, msg_py, msg_fort = py2fort_msg(fi, msg_py=msg_py)

    fo = drgrid2rcm(lat1d, lon1d, fi, lat2d, lon2d, xmsg=msg_fort)
    fo = np.asarray(fo)
    fo = np.transpose(fo, axes=(2, 1, 0))

    fort2py_msg(fo, msg_fort=msg_fort, msg_py=msg_py)

    return fo


def _regridded_rectilinear_coords(
    fi: xr.DataArray, lat1d: xr.DataArray, lon1d: xr.DataArray
) -> dict[str, xr.DataArray | np.ndarray]:
    """Preserve only coordinates that remain shape-compatible after regridding."""

    lat_dim = fi.dims[-2]
    lon_dim = fi.dims[-1]
    remapped_dims = {lat_dim, lon_dim}
    coords: dict[str, xr.DataArray | np.ndarray] = {}

    for name, coord in fi.coords.items():
        if name in remapped_dims:
            continue
        if any(dim in remapped_dims for dim in coord.dims):
            continue
        coords[name] = coord

    coords[lat_dim] = lat1d.data
    coords[lon_dim] = lon1d.data
    return coords


# Outer Wrappers <funcname>()
# These wrappers are executed in the __main__ python process, and should be
# used for any tasks which would not benefit from parallel execution.


# TODO: Even though this function is advertised to work on multi-dimensional arrays,
# it is currently only applicable to 3D-arrays due to the implementation of `_rcm2rgrid`
[docs] def rcm2rgrid( lat2d: supported_types, lon2d: supported_types, fi: supported_types, lat1d: supported_types, lon1d: supported_types, msg: np.number = None, meta: bool = False, ) -> supported_types: """Interpolates data on a curvilinear grid (i.e. RCM, WRF, NARR) to a rectilinear grid. Interpolates RCM (Regional Climate Model), WRF (Weather Research and Forecasting) and NARR (North American Regional Reanalysis) grids to a rectilinear grid. Actually, this function will interpolate most grids that use curvilinear latitude/longitude grids. No extrapolation is performed beyond the range of the input coordinates. Missing values are allowed but ignored. The weighting method used is simple inverse distance squared. Missing values are allowed but ignored. The code searches the input curvilinear grid latitudes and longitudes for the four grid points that surround a specified output grid coordinate. Because one or more of these input points could contain missing values, fewer than four points could be used in the interpolation. Curvilinear grids which have two-dimensional latitude and longitude coordinate axes present some issues because the coordinates are not necessarily monotonically increasing. The simple search algorithm used by ``rcm2rgrid`` is not capable of handling all cases. The result is that, sometimes, there are small gaps in the interpolated grids. Any interior points not interpolated in the initial interpolation pass will be filled using linear interpolation. In some cases, edge points may not be filled. Parameters ---------- lat2d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A two-dimensional array that specifies the latitudes locations of the input (``fi``). Because this array is two-dimensional, it is not an associated coordinate variable of ``fi``; therefore, it always needs to be explicitly provided. The latitude order must be south-to-north. lon2d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A two-dimensional array that specifies the longitudes locations of the input (``fi``). Because this array is two-dimensional, it is not an associated coordinate variable of ``fi``; therefore, it always needs to be explicitly provided. The latitude order must be west-to-east. fi : :class:`xarray.DataArray`, :class:`numpy.ndarray` A multi-dimensional array to be interpolated. The rightmost two dimensions (latitude, longitude) are the dimensions to be interpolated. lat1d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A one-dimensional array that specifies the latitude coordinates of the regular grid. Must be monotonically increasing. lon1d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A one-dimensional array that specifies the longitude coordinates of the regular grid. Must be monotonically increasing. msg : :obj:`numpy.number` A numpy scalar value that represent a missing value in ``fi``. This argument allows a user to use a missing value scheme other than NaN or masked arrays, similar to what NCL allows. meta : :obj:`bool` If set to True and the input array is an Xarray, the metadata from the input array will be copied to the output array; default is False. Warning: This option is not currently supported. Returns ------- fo : :class:`xarray.DataArray`, :class:`numpy.ndarray` The interpolated grid. A multi-dimensional array of the same size as ``fi`` except that the rightmost dimension sizes have been replaced by the sizes of ``lat1d`` and ``lon1d``, respectively. Examples -------- Example 1: Using rcm2rgrid with :class:`xarray.DataArray` input .. code-block:: python import numpy as np import xarray as xr from skyborn.interp import rcm2rgrid # Open a netCDF data file using xarray default engine and load the data stream ds = xr.open_dataset("./ruc.nc") # [INPUT] Grid & data info on the source curvilinear ht_curv=ds.DIST_236_CBL[:] lat2D_curv=ds.gridlat_236[:] lon2D_curv=ds.gridlon_236[:] # [OUTPUT] Grid on destination rectilinear grid (or read the 1D lat and lon from # an other .nc file. newlat1D_rect=np.linspace(lat2D_curv.min(), lat2D_curv.max(), 100) newlon1D_rect=np.linspace(lon2D_curv.min(), lon2D_curv.max(), 100) ht_rect = rcm2rgrid(lat2D_curv, lon2D_curv, ht_curv, newlat1D_rect, newlon1D_rect) """ if (lon2d is None) | (lat2d is None): raise CoordinateError("rcm2rgrid: lon2d and lat2d should always be provided!") # ''' Start of boilerplate is_input_xr = True # If the input is numpy.ndarray, convert it to xarray.DataArray if not isinstance(fi, xr.DataArray): is_input_xr = False fi = xr.DataArray(fi) # Convert 2d arrays to Xarray for inner wrapper call below if they are numpy lon2d = xr.DataArray(lon2d) lat2d = xr.DataArray(lat2d) lon1d = xr.DataArray(lon1d) lat1d = xr.DataArray(lat1d) # Ensure last two dimensions of `fi` are not chunked if fi.chunks is not None: if list(fi.chunks)[-2:] != [(lat2d.shape[0],), (lat2d.shape[1],)]: raise ChunkError( "rcm2rgrid: `fi` must be unchunked along the rightmost two dimensions!" ) # ''' end of boilerplate # Inner Fortran wrapper call fo = _rcm2rgrid(lat2d.data, lon2d.data, fi.data, lat1d.data, lon1d.data, msg) # If input was xarray.DataArray, convert output to xarray.DataArray as well if is_input_xr: fo = xr.DataArray( fo, attrs=fi.attrs, dims=fi.dims, coords=_regridded_rectilinear_coords(fi, lat1d, lon1d), ) return fo
# TODO: Even though this function is advertised to work on multi-dimensional arrays, # it is currently only applicable to 3D-arrays due to the implementation of `_rcm2rgrid` # TODO: This function requires the input to have the coordinates in the rightmost two dimensions, # but xarray.DataArrray inputs with coordinates anywhere could/should actually be fine
[docs] def rgrid2rcm( lat1d: supported_types, lon1d: supported_types, fi: supported_types, lat2d: supported_types, lon2d: supported_types, msg: np.number = None, meta: bool = False, ) -> supported_types: """Interpolates data on a rectilinear lat/lon grid to a curvilinear grid like those used by the RCM, WRF and NARR models/datasets. Interpolates data on a rectilinear lat/lon grid to a curvilinear grid, such as those used by the RCM (Regional Climate Model), WRF (Weather Research and Forecasting) and NARR (North American Regional Reanalysis) models/datasets. No extrapolation is performed beyond the range of the input coordinates. The method used is simple inverse distance weighting. Missing values are allowed but ignored. Parameters ---------- lat1d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A one-dimensional array that specifies the latitude coordinates of the regular grid. Must be monotonically increasing. Note: It should only be explicitly provided when the input (``fi``) is ``numpy.ndarray``; otherwise, it should come from ``fi.coords``. lon1d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A one-dimensional array that specifies the longitude coordinates of the regular grid. Must be monotonically increasing. Note: It should only be explicitly provided when the input (``fi``) is ``numpy.ndarray``; otherwise, it should come from ``fi.coords``. fi : :class:`xarray.DataArray`, :class:`numpy.ndarray` A multi-dimensional array to be interpolated. The rightmost two dimensions (latitude, longitude) are the dimensions to be interpolated. lat2d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A two-dimensional array that specifies the latitude locations of the input (``fi``). Because this array is two-dimensional it is not an associated coordinate variable of ``fi``. lon2d : :class:`xarray.DataArray`, :class:`numpy.ndarray` A two-dimensional array that specifies the longitude locations of the input (``fi``). Because this array is two-dimensional it is not an associated coordinate variable of ``fi``. msg : :obj:`numpy.number` A numpy scalar value that represents a missing value in ``fi``. This argument allows a user to use a missing value scheme other than NaN or masked arrays, similar to what NCL allows. meta : :obj:`bool` If set to True and the input array is an Xarray, the metadata from the input array will be copied to the output array; default is False. Warning: this option is not currently supported. Returns ------- fo : :class:`xarray.DataArray`, :class:`numpy.ndarray` The interpolated grid. A multi-dimensional array of the same size as ``fi`` except that the rightmost dimension sizes have been replaced by the sizes of ``lat2d`` (or ``lon2d``). Examples -------- Example 1: Using rgrid2rcm with :class:`xarray.DataArray` input .. code-block:: python import numpy as np import xarray as xr from skyborn.interp import rgrid2rcm # Open a netCDF data file using xarray default engine and load the data stream # input grid and data ds_rect = xr.open_dataset("./DATAFILE_RECT.nc") # [INPUT] Grid & data info on the source rectilinear ht_rect =ds_rect.SOME_FIELD[:] lat1D_rect=ds_rect.gridlat_[:] lon1D_rect=ds_rect.gridlon_[:] # Open a netCDF data file using xarray default engine and load the data stream # for output grid ds_curv = xr.open_dataset("./DATAFILE_CURV.nc") # [OUTPUT] Grid on destination curvilinear grid (or read the 2D lat and lon from # an other .nc file newlat2D_rect=ds_curv.gridlat2D_[:] newlon2D_rect=ds_curv.gridlat2D_[:] ht_curv = rgrid2rcm(lat1D_rect, lon1D_rect, ht_rect, newlat2D_curv, newlon2D_curv) """ # ''' Start of boilerplate is_input_xr = True # If the input is numpy.ndarray, convert it to xarray.DataArray if not isinstance(fi, xr.DataArray): if (lon1d is None) | (lat1d is None): raise CoordinateError( "rgrid2rcm: Arguments `lon1d` and `lat1d` must be provided " "explicitly unless `fi` is an xarray.DataArray." ) is_input_xr = False fi = xr.DataArray(fi) fi = fi.assign_coords({fi.dims[-1]: lon1d, fi.dims[-2]: lat1d}) # lon1d and lat1d should be coming from xarray input coords or assigned # as coords while xarray being initiated from numpy input above lon1d = fi.coords[fi.dims[-1]] lat1d = fi.coords[fi.dims[-2]] # Convert 2d arrays to Xarray for inner wrapper call below if they are numpy lat2d = xr.DataArray(lat2d) lon2d = xr.DataArray(lon2d) # If input data is already chunked if fi.chunks is not None: # Ensure last two dimensions of `fi` are not chunked if list(fi.chunks)[-2:] != [lat1d.shape, lon1d.shape]: raise Exception( "rgrid2rcm: `fi` must be unchunked along the last two dimensions" ) # ''' end of boilerplate # Inner Fortran wrapper call fo = _rgrid2rcm(lat1d.data, lon1d.data, fi.data, lat2d.data, lon2d.data, msg) # If input was xarray.DataArray, convert output to xarray.DataArray as well if is_input_xr: fo = xr.DataArray(fo, attrs=fi.attrs, dims=fi.dims) return fo