Source code for fluxfootprints.ffp_xr

import logging
from typing import Optional, Tuple, Union
import numpy as np
import pandas as pd
from scipy.ndimage import gaussian_filter
import xarray as xr

from .base_footprint_model import BaseFootprintModel


[docs]
class ffp_climatology_new(BaseFootprintModel):
    r"""
    Create a footprint‑climatology from a series of individual flux‑footprint
    estimates using the simple 2‑D parameterisation of Kljun et al. (2015).

    The routine

    1. computes a footprint for every time step,
    2. rotates each footprint into its observed wind direction,
    3. aggregates all footprints onto a common grid, and
    4. derives user‑requested source‑area contours (``rs``).

    The implementation is based on:

        Kljun, N., Calanca, P., Rotach, M. W., & Schmid, H. P. (2015).
        *A simple two‑dimensional parameterisation for flux‑footprint
        predictions (FFP)*. **Geoscientific Model Development, 8**, 3695‑3713.
        https://doi.org/10.5194/gmd‑8‑3695‑2015

    Parameters
    ----------
    zm : float or 1‑D array_like
        Measurement height above displacement height (i.e.\ ``z – d``) [m].
    z0 : float or 1‑D array_like or None
        Surface roughness length [m].  Either `z0` **or** `umean` must be
        provided; if both are given, `z0` takes precedence.
    umean : float or 1‑D array_like or None
        Mean wind speed at `zm` [m s⁻¹].
    h : 1‑D array_like
        Boundary‑layer height [m].
    ol : 1‑D array_like
        Obukhov length [m].
    sigmav : 1‑D array_like
        Standard deviation of lateral velocity fluctuations [m s⁻¹].
    ustar : 1‑D array_like
        Friction velocity [m s⁻¹].
    wind_dir : 1‑D array_like
        Wind direction in degrees (0–360°, meteorological convention).

    Other Parameters
    ----------------
    domain : array_like of float, optional
        Domain limits ``[xmin, xmax, ymin, ymax]`` [m].
        Default is the smaller of

        * the minimal rectangle that contains the *r* % footprint, or
        * ``[-1000, 1000, -1000, 1000]``.
    dx, dy : float, optional
        Grid‑cell size in x and y [m].  Each defaults to 10 m; `dy` is not
        derived from `dx`, so pass both to change the resolution.
    nx, ny : int, optional
        Number of grid cells in x and y.  Defaults to 1000×1000.  Used only
        when `dx` is ``None``; otherwise the cell size (`dx`/`dy`) wins.
    rs : float or sequence of float, optional
        Source‑area percentages for which contour lines are returned,
        e.g.\ ``80`` or ``[10, 30, 80]``.  Values may be expressed as
        percentages (``80``) or fractions (``0.8``).  Must be 10–90 %.
        Default is ``[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8]``.  Use
        ``None`` to skip contour calculations.
    rslayer : {0, 1}, optional
        If 1, allow calculations when `zm` lies in the roughness sub‑layer
        (RS).  **Warning:** the model is formally **invalid** within the RS,
        so results are only indicative.  Requires `z0`.  Default is 0.
    smooth_data : {0, 1}, optional
        Apply a convolution filter to smooth the footprint climatology.
        Default is 1 (smooth).
    crop : {0, 1}, optional
        Crop the output grid to the extent of the largest requested
        contour (`rs`) or, if `rs` is *None*, the 80 % contour.  Default 0.
    pulse : int, optional
        Print progress every *pulse* footprints.  Default is no output.
    verbosity : {0, 1, 2}, optional
        Verbosity level: 0 = silent, 1 = only fatal messages, 2 = chatty.
        Default 2.
    fig : {0, 1}, optional
        Plot an example footprint on screen when set to 1.  Default 0.

    Returns
    -------
    FFP : dict
        Dictionary with keys (see below) carrying the climatology results.
    x_2d, y_2d : ndarray
        2‑D grids (mesh‑grids) of x and y coordinates [m].
    fclim_2d : ndarray
        Normalised footprint‑climatology values [m⁻²].
    rs : ndarray or None
        Echo of input `rs` in percent, or *None* when `rs` was *None*.
    fr : ndarray or None
        Footprint value at each `rs` contour.
    xr, yr : list[ndarray] or None
        x‑ and y‑coordinates of every `rs` contour line.
    n : int
        Number of individual footprints used in the aggregation.
    flag_err : {0, 1, 2, 3}
        Error/status flag:
        *0* no error, *1* fatal error, *2* some contours outside domain,
        *3* invalid input rows removed.

    Notes
    -----
    *Implemented by* N. Kljun & G. Fratini, originally in MATLAB,
    ported to Python 3.x (v 1.4, 11 Dec 2019).

    Examples
    --------
    >>> from fluxfootprints.ffp_xr import ffp_climatology_new
    >>> # df: time-indexed DataFrame with the columns USTAR, V_SIGMA,
    >>> # MO_LENGTH, wd and ws
    >>> model = ffp_climatology_new(df, inst_height=2.5, crop_height=0.2)
    >>> result = model.run()
    >>> result["footprint_climatology"].shape
    (201, 201)
    """

    def __init__(
        self,
        df: pd.DataFrame,
        domain: Union[list, np.ndarray] = [-1000.0, 1000.0, -1000.0, 1000.0],
        dx: Optional[float] = 10.0,
        dy: Optional[float] = 10.0,
        nx: int = 1000,
        ny: int = 1000,
        rs: Union[list, np.ndarray] = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8],
        crop_height: float = 0.2,
        atm_bound_height: float = 2000.0,
        inst_height: float = 2.0,
        rslayer: bool = False,
        smooth_data: bool = True,
        crop: bool = False,
        verbosity: int = 2,
        fig: bool = False,
        logger: Optional[logging.Logger] = None,
        time=None,
        crs: Optional[int] = None,
        station_x: Optional[float] = None,
        station_y: Optional[float] = None,
        **kwargs,
    ):
        """Set up the grid, model constants and input table, then prepare the data.

        After storing its arguments the constructor calls, in this order,
        ``prep_df_fields``, ``define_domain`` and ``create_xr_dataset``.

        Parameters
        ----------
        df : pandas.DataFrame
            Input table, stored as ``self.df``.  When it has a column named
            ``crop_height``, ``atm_bound_height`` or ``inst_height`` that
            column is used instead of the scalar argument of the same name.
        domain : sequence of four floats
            ``[xmin, xmax, ymin, ymax]``; unpacked into ``self.xmin`` etc.
        dx, dy : float or None
            Grid spacing used to build ``self.x`` / ``self.y`` with
            ``np.arange``.  When ``dx`` is ``None`` and ``nx`` is not, the
            axes are built with ``np.linspace`` instead.
        nx, ny : int
            Number of cells per axis; only read in the ``np.linspace`` branch
            (``nx + 1`` / ``ny + 1`` points).
        rs : list or numpy.ndarray
            Contour levels, stored as ``self.rs``.
        crop_height, atm_bound_height, inst_height : float
            Scalar fall-backs forwarded to ``prep_df_fields`` as ``h_c``,
            ``h_s`` and ``zm_s``.
        rslayer, smooth_data, crop, fig : bool
            Stored unchanged on the instance.
        verbosity : int
            Stored on the instance and used to pick the logger level.
        logger : logging.Logger or None
            Logger to use; anything that is not a ``logging.Logger`` is
            replaced by the fallback from ``_ensure_logger``.
        time, crs, station_x, station_y
            Accepted but not used anywhere in this constructor.
        **kwargs
            Only ``show_heatmap`` (default ``True``) is read.
        """
        # NOTE(review): `domain` and `rs` are mutable default arguments and
        # `self.rs` keeps a reference to the shared default list.
        super().__init__(
            df=df,
            domain=domain,
            dx=dx,
            dy=dy,
            rs=rs,
            crop_height=crop_height,
            atm_bound_height=atm_bound_height,
            inst_height=inst_height,
            smooth_data=smooth_data,
            verbosity=verbosity,
            logger=logger,
        )


        # The attributes below are (re)assigned after the base-class
        # constructor has run, so these values are the ones that stick.
        self.fclim_2d = None
        # NOTE(review): this is the caller's object, not a copy;
        # prep_df_fields() assigns new columns onto self.df.
        self.df = df

        # Model parameters
        self.xmin, self.xmax, self.ymin, self.ymax = domain

        # Grid axes: point count (linspace) when no cell size is given,
        # otherwise fixed cell size (arange, upper bound pushed out by one step).
        # NOTE(review): dx given with dy=None, or dx=None with nx=None, ends in
        # the arange branch with a None operand -- confirm that is never passed.
        if dx is None and nx is not None:
            self.x = np.linspace(self.xmin, self.xmax, nx + 1)
            self.y = np.linspace(self.ymin, self.ymax, ny + 1)
        else:
            self.x = np.arange(self.xmin, self.xmax + dx, dx)
            self.y = np.arange(self.ymin, self.ymax + dy, dy)

        self.rotated_theta = None

        # Numeric constants read by calc_xr_footprint(): a, b, c, d in the
        # along-wind footprint function, ac, bc, cc in the crosswind spread.
        self.a = 1.4524
        self.b = -1.9914
        self.c = 1.4622
        self.d = 0.1359
        self.ac = 2.17
        self.bc = 1.66
        self.cc = 20.0
        self.oln = 5000.0  # limit to L for neutral scaling
        self.k = 0.4  # von Karman
        # ===========================================================================
        # Get kwargs
        self.show_heatmap = kwargs.get("show_heatmap", True)

        # ===========================================================================
        # Input check
        self.flag_err = 0

        self.dx = dx
        self.dy = dy

        self.rs = rs
        self.rslayer = rslayer
        self.smooth_data = smooth_data
        self.crop = crop
        self.verbosity = verbosity
        self.fig = fig

        # The `time` argument is not consulted here.
        self.time = None  # defined later after dropping na values
        self.ts_len = None  # defined by len of dropped df

        self.f_2d = None

        self.logger = self._ensure_logger(logger)

        # NOTE(review): this mapping gives INFO for verbosity 0-1, WARNING for
        # 2 and DEBUG only for 3 and above, so the default (2) logs less than
        # 0 or 1 do.  That looks unintended -- confirm the desired levels.
        # The level is also changed on a logger supplied by the caller.
        if self.verbosity < 2:
            self.logger.setLevel(logging.INFO)
        elif self.verbosity < 3:
            self.logger.setLevel(logging.WARNING)
        else:
            self.logger.setLevel(logging.DEBUG)

        # Per-row columns in df take precedence over the scalar arguments.
        if "crop_height" in df.columns:
            h_c = df["crop_height"]
        else:
            h_c = crop_height

        if "atm_bound_height" in df.columns:
            h_s = df["atm_bound_height"]
        else:
            h_s = atm_bound_height

        if "inst_height" in df.columns:
            zm_s = df["inst_height"]
        else:
            zm_s = inst_height

        # d_h=None makes prep_df_fields() derive the displacement height
        # from the canopy height.
        self.prep_df_fields(
            h_c=h_c,
            d_h=None,
            zm_s=zm_s,
            h_s=h_s,
        )
        self.define_domain()
        self.create_xr_dataset()

    def _ensure_logger(self, logger: Optional[logging.Logger]) -> logging.Logger:
        if isinstance(logger, logging.Logger):
            return logger
        lg = logging.getLogger("footprint_daily_summary")
        if not lg.handlers:
            lg.addHandler(logging.StreamHandler())
        lg.setLevel(logging.WARNING)
        return lg

    def _validate_input_df(self,df, config=None, required_vars=None):
        """
        Validate input DataFrame for FFP climatology calculations.
        
        Parameters
        ----------
        df : pd.DataFrame
            Input DataFrame containing flux tower measurements
        config : dict, optional
            Configuration dictionary mapping standard variable names to column names
            Expected keys: 'zm', 'u_mean', 'ustar', 'L', 'sigma_v', 'h', 'z0', 'wind_dir'
        required_vars : list, optional
            List of required variables. If None, uses default set.
            
        Returns
        -------
        pd.DataFrame
            Validated DataFrame with standardized column names
            
        Raises
        ------
        ValueError
            If required columns are missing or data is invalid
        """
        import pandas as pd
        import numpy as np
        
        # Default configuration mapping
        default_config = {
            'zm': 'zm',              # Measurement height [m]
            'u_mean': 'WS',          # Mean wind speed [m/s]
            'ustar': 'USTAR',        # Friction velocity [m/s]
            'L': 'MO_LENGTH',        # Obukhov length [m]
            'sigma_v': 'V_SIGMA',    # Std dev of lateral velocity [m/s]
            'h': 'PBLH_F',           # Boundary layer height [m]
            'z0': 'z0',              # Roughness length [m]
            'wind_dir': 'WD'         # Wind direction [degrees]
        }
        
        # Check if DataFrame is empty
        if df.empty:
            raise ValueError("Input DataFrame is empty")
        
        return df


[docs]
    def prep_df_fields(
        self,
        h_c=0.2,
        d_h=None,
        zm_s=2.0,
        h_s=2000.0,
    ):
        # h_c Height of canopy [m]
        # Estimated displacement height [m]
        # zm_s Measurement height [m] from AMF metadata
        # h_s Height of atmos. boundary layer [m] - assumed

        if d_h is None:
            d_h = 10 ** (0.979 * np.log10(h_c) - 0.154)

        self.df["zm"] = zm_s - d_h
        self.df["h_c"] = h_c
        self.df["z0"] = h_c * 0.123
        self.df["h"] = h_s

        self.df = self.df.rename(
            columns={
                "V_SIGMA": "sigmav",
                "USTAR": "ustar",
                "wd": "wind_dir",
                "MO_LENGTH": "ol",
                "ws": "umean",
            }
        )

        # Check if all required fields are in the DataFrame
        all_present = np.all(
            np.isin(["ol", "sigmav", "ustar", "wind_dir"], self.df.columns)
        )
        if all_present:
            self.logger.debug("All required fields are present")
        else:
            self.raise_ffp_exception(1)

        self.df["zm"] = np.where(self.df["zm"] <= 0.0, np.nan, self.df["zm"])
        self.df["h"] = np.where(self.df["h"] <= 10.0, np.nan, self.df["h"])
        self.df["zm"] = np.where(self.df["zm"] > self.df["h"], np.nan, self.df["zm"])
        self.df["sigmav"] = np.where(self.df["sigmav"] < 0.0, np.nan, self.df["sigmav"])
        self.df["ustar"] = np.where(self.df["ustar"] <= 0.05, np.nan, self.df["ustar"])

        self.df["wind_dir"] = np.where(
            self.df["wind_dir"] > 360.0, np.nan, self.df["wind_dir"]
        )
        self.df["wind_dir"] = np.where(
            self.df["wind_dir"] < 0.0, np.nan, self.df["wind_dir"]
        )

        self.df = self.df.dropna(
            subset=["sigmav", "wind_dir", "h", "ol", "ustar"], how="any"
        )
        self.ts_len = len(self.df)
        self.logger.debug(f"input len is {self.ts_len}")



[docs]
    def raise_ffp_exception(self, code):
        exceptions = {
            1: "At least one required parameter is missing. Check the inputs.",
            2: "zm (measurement height) must be larger than zero.",
            3: "z0 (roughness length) must be larger than zero.",
            4: "h (boundary layer height) must be larger than 10 m.",
            5: "zm (measurement height) must be smaller than h (boundary layer height).",
            6: "zm (measurement height) should be above the roughness sub-layer.",
            7: "zm/ol (measurement height to Obukhov length ratio) must be >= -15.5.",
            8: "sigmav (standard deviation of crosswind) must be larger than zero.",
            9: "ustar (friction velocity) must be >= 0.1.",
            10: "wind_dir (wind direction) must be in the range [0, 360].",
        }

        message = exceptions.get(code, "Unknown error code.")

        if self.verbosity > 0:
            print(f"Error {code}: {message}")
            self.logger.info(f"Error {code}: {message}")

        if code in [1, 4, 5, 7, 9, 10]:  # Fatal errors
            self.logger.error(f"Error {code}: {message}")
            raise ValueError(f"FFP Exception {code}: {message}")



[docs]
    def define_domain(self):
        """Build the 2-D grid, its polar form and an empty climatology raster.

        Sets ``self.xv`` / ``self.yv`` (mesh-grids with ``"ij"`` indexing),
        ``self.rho`` and ``self.theta`` (``xarray.DataArray`` objects on the
        ``("x", "y")`` grid) and ``self.fclim_2d`` (zeros with the same
        shape and coordinates as ``self.rho``).
        """
        grid_x, grid_y = np.meshgrid(self.x, self.y, indexing="ij")
        self.xv = grid_x
        self.yv = grid_y

        self.logger.debug(f"x: {self.x}, y: {self.y}")

        def on_grid(values):
            # Wrap a raw 2-D array with the shared x/y coordinates.
            return xr.DataArray(
                values,
                dims=("x", "y"),
                coords={"x": self.x, "y": self.y},
            )

        # Distance of every cell from the origin.
        self.rho = on_grid(np.sqrt(grid_x**2 + grid_y**2))
        # arctan2(x, y) measures the angle from the +y axis, so North points
        # upwards and angles increase clockwise.
        self.theta = on_grid(np.arctan2(grid_x, grid_y))
        self.logger.debug(f"rho: {self.rho}, theta: {self.theta}")

        # Empty raster that later receives the footprint climatology.
        self.fclim_2d = xr.zeros_like(self.rho)


        # ===========================================================================


[docs]
    def create_xr_dataset(self):
        """Convert ``self.df`` into ``self.ds``, an ``xarray.Dataset``.

        The DataFrame index is named ``"time"`` first, so that name becomes
        the dataset dimension.
        """
        frame = self.df
        frame.index.name = "time"
        self.ds = xr.Dataset.from_dataframe(frame)



[docs]
    def calc_xr_footprint(self):
        """Compute one footprint per time step and average them on the grid.

        Reads ``zm``, ``h``, ``z0``, ``ol``, ``ustar``, ``sigmav`` and
        ``wind_dir`` (and ``umean`` when present) from ``self.ds`` and
        broadcasts them against the ``("x", "y")`` grid in ``self.rho`` /
        ``self.theta``.

        Results
        -------
        self.rotated_theta
            Grid angle relative to each time step's wind direction.
        self.f_2d
            Per-time-step footprints, each divided by its own sum over the
            grid.
        self.fclim_2d
            Sum of ``self.f_2d`` over ``time`` divided by ``self.ts_len``.

        When ``self.smooth_data`` is true both results are passed through a
        Gaussian filter (sigma 1 cell) in the x/y plane only.  ``self.ds`` is
        not modified.
        """
        ds = self.ds
        zm, h, z0 = ds["zm"], ds["h"], ds["z0"]
        ol, ustar = ds["ol"], ds["ustar"]

        # Rotate coordinates into wind direction
        self.rotated_theta = self.theta - (ds["wind_dir"] * np.pi / 180.0)

        # Stability function: linear form for 0 < L < oln, otherwise the
        # expression built from xx.
        psi_cond = np.logical_and(self.oln > ol, ol > 0)
        xx = (1.0 - 19.0 * zm / ol) ** 0.25
        psi_f = xr.where(
            psi_cond,
            -5.3 * zm / ol,
            np.log((1.0 + xx**2) / 2.0)
            + 2.0 * np.log((1.0 + xx) / 2.0)
            - 2.0 * np.arctan(xx)
            + np.pi / 2.0,
        )

        # Denominator of the scaled distance: log-profile term when z0 is
        # known, otherwise umean / ustar * k.  `umean` is optional, so it is
        # only read when the dataset actually carries it.
        log_term = np.log(zm / z0) - psi_f
        if "umean" in ds:
            xstar_bottom = xr.where(
                z0.isnull(),
                (ds["umean"] / ustar * self.k),
                log_term,
            )
        else:
            xstar_bottom = log_term

        # Test the denominator that is actually used, so the umean fallback
        # is not discarded just because the z0 term is NaN.
        xstar_ci_dummy = xr.where(
            xstar_bottom > 0,
            self.rho
            * np.cos(self.rotated_theta)
            / zm
            * (1.0 - (zm / h))
            / xstar_bottom,
            0.0,
        )
        xstar_ci_dummy = xstar_ci_dummy.astype(float)

        # Only cells beyond the offset d contribute to the footprint.
        px = xstar_ci_dummy > self.d

        # Scaled and real-scale crosswind-integrated footprint
        fstar_ci_dummy = xr.where(
            px,
            self.a
            * (xstar_ci_dummy - self.d) ** self.b
            * np.exp(-self.c / (xstar_ci_dummy - self.d)),
            0.0,
        )
        f_ci_dummy = xr.where(
            px,
            fstar_ci_dummy / zm * (1.0 - (zm / h)) / xstar_bottom,
            0.0,
        )

        # Scaled crosswind spread
        sigystar_dummy = xr.where(
            px,
            self.ac
            * np.sqrt(
                self.bc
                * np.abs(xstar_ci_dummy) ** 2
                / (1.0 + self.cc * np.abs(xstar_ci_dummy))
            ),
            0.0,
        )

        # |L| beyond the neutral limit is treated as -1e6 for the spread
        # scaling.  A local copy is used so the stored inputs stay as given
        # and repeated calls see identical data.
        ol_scaled = xr.where(np.abs(ol) > self.oln, -1e6, ol)
        scale_const = xr.where(
            ol_scaled <= 0,
            1e-5 * np.abs(zm / ol_scaled) ** (-1) + 0.80,
            1e-5 * np.abs(zm / ol_scaled) ** (-1) + 0.55,
        )
        scale_const = xr.where(scale_const > 1.0, 1.0, scale_const)

        # Real-scale crosswind spread
        sigy_dummy = xr.where(
            px,
            sigystar_dummy / scale_const * zm * ds["sigmav"] / ustar,
            0.0,
        )
        # Non-positive spread (which includes every cell outside px) is
        # marked NaN and yields a zero footprint below.
        sigy_dummy = xr.where(sigy_dummy <= 0.0, np.nan, sigy_dummy)

        # Calculate the footprint in real scale
        crosswind = self.rho * np.sin(self.rotated_theta)
        self.f_2d = xr.where(
            sigy_dummy.isnull(),
            0.0,
            f_ci_dummy
            / (np.sqrt(2 * np.pi) * sigy_dummy)
            * np.exp(-(crosswind**2) / (2.0 * sigy_dummy**2)),
        )

        # Normalise every time step to unit sum over the grid.
        self.f_2d = self.f_2d / self.f_2d.sum(dim=("x", "y"))

        # Accumulate into footprint climatology raster
        self.fclim_2d = self.f_2d.sum(dim="time") / self.ts_len

        # Apply smoothing if requested
        if self.smooth_data:

            def _smooth(field, per_slice):
                # gaussian_filter with a scalar sigma filters along every axis
                # of the array it receives.  For stacked footprints it must
                # therefore be called once per x/y slice (vectorize=True) so
                # neighbouring time steps are not blended.
                return xr.apply_ufunc(
                    gaussian_filter,
                    field,
                    kwargs={"sigma": 1.0},
                    input_core_dims=[["x", "y"]],
                    output_core_dims=[["x", "y"]],
                    vectorize=per_slice,
                )

            self.f_2d = _smooth(self.f_2d, True)
            self.fclim_2d = _smooth(self.fclim_2d, False)



[docs]
    def smooth_and_contour(self, rs=None):
        """
        Normalise (and optionally smooth) the climatology and threshold its
        running cumulative sum at each requested level.

        Parameters:
            rs (float or sequence of float, optional): Levels to evaluate,
                as fractions (e.g. ``0.8``).  When omitted, the levels given
                to the constructor (``self.rs``) are used.

        Returns:
            xr.Dataset: One variable ``contour_<percent>`` per level.  Each
            holds the 2-D running cumulative sum of the footprint (along
            ``x``, then ``y``) where it is at least the level, and 0
            elsewhere.  The dataset is empty when no levels are available.

        Side effects:
            Stores the normalised (and, when ``self.smooth_data`` is true,
            Gaussian-smoothed) footprint as ``self.ds["footprint"]``.
        """
        levels = self.rs if rs is None else rs

        # Ensure the footprint data is normalized
        footprint = self.fclim_2d / self.fclim_2d.sum(dim=("x", "y"))

        # Apply smoothing if requested
        if self.smooth_data:
            footprint = xr.apply_ufunc(
                gaussian_filter,
                footprint,
                kwargs={"sigma": 1.0},
                input_core_dims=[["x", "y"]],
                output_core_dims=[["x", "y"]],
            )
        self.ds["footprint"] = footprint

        # Nothing to threshold when the caller asked for no levels at all.
        if levels is None:
            return xr.Dataset()

        # Calculate cumulative footprint and extract contours
        cumulative = self.ds["footprint"].cumsum(dim="x").cumsum(dim="y")

        contours = {}
        for level in np.atleast_1d(levels):
            level = float(level)
            # round() instead of plain int(): 0.29 * 100 is 28.999... in
            # floating point and would otherwise be labelled "contour_28".
            label = f"contour_{int(round(level * 100))}"
            contours[label] = cumulative.where(cumulative >= level).fillna(0)

        # Combine results into a dataset
        return xr.Dataset(contours)



[docs]
    def run(self, return_result: bool = True):
        """Run the footprint calculation and optionally return the result.

        Calls ``calc_xr_footprint()``.  When ``return_result`` is true an
        ``xarray.Dataset`` is returned holding ``footprint_climatology``
        (``self.fclim_2d``) plus the grid axes as ``domain_x`` and
        ``domain_y``; otherwise ``None`` is returned.  Contours are not
        computed here; ``smooth_and_contour()`` is a separate step.
        """
        self.calc_xr_footprint()

        if not return_result:
            return None

        data_vars = {
            "footprint_climatology": self.fclim_2d,  # DataArray used as-is
            "domain_x": ("x", self.x),
            "domain_y": ("y", self.y),
        }
        return xr.Dataset(data_vars)