# Source code for pyco2stats.stats

from scipy.optimize import minimize
from scipy.optimize import  brentq # brentq for uniroot
from scipy.integrate import quad 
from scipy.optimize import minimize_scalar, root_scalar

import numpy as np
import scipy.special as sp
import scipy.stats as stats
import statsmodels.api as sm
import warnings
import math

from scipy.interpolate import RegularGridInterpolator

from scipy.stats.mstats import trim as scipy_trim
from scipy.stats import trimboth as scipy_trimboth
from scipy.stats.mstats import trimtail as scipy_trimtail
from scipy.stats import tmean as scipy_tmean
from scipy.stats.mstats import trimmed_std as scipy_trimmed_std 
from scipy.stats.mstats import winsorize as scipy_winsorize
from scipy.special import hyp0f1
import scipy.interpolate
from scipy.stats import norm, t, chi2, nct

from astropy.stats import biweight_location as astropy_biweight_location
from astropy.stats import biweight_scale as astropy_biweight_scale
from astropy.stats import median_absolute_deviation as astropy_median_absolute_deviation
from astropy.stats import mad_std as astropy_mad_std
from astropy.stats import sigma_clip as astropy_sigma_clip
from astropy.stats import sigma_clipped_stats as astropy_sigma_clipped_stats

from typing import List, Union, Dict, Any, Optional, Sequence
from scipy.stats import t as t_distribution # TODO: clean up - `t` is imported twice under different names
from scipy.stats import norm as norm_distribution # TODO: clean up - `norm` is imported twice under different names

import functools


"""
The Stats class includes a variety of statistical methodologies to analyze CO2 flux data and geochemical samplings in environmental and volcanic systems.
Stats comprises robust statistics (i.e. biweight estimators, sigma-clipping, data-trimming, winsorizing procedures) and specific tools to estimate the
central tendency and confidence intervals of log-normally distributed data.
"""

def deprecated(reason):
    """
    Build a decorator that flags a callable as deprecated.

    Every call to the decorated callable emits a ``DeprecationWarning`` whose
    message is ``"<name>() is deprecated: <reason>"`` and then forwards the
    call unchanged to the wrapped callable.

    Parameters
    ----------
    reason : str
        Text appended to the warning message.

    Returns
    -------
    callable
        A decorator preserving the wrapped callable's metadata
        (via ``functools.wraps``).
    """
    def decorator(func):
        def wrapper(*args, **kwargs):
            message = f"{func.__name__}() is deprecated: {reason}"
            # stacklevel=2 attributes the warning to the caller of the
            # deprecated function rather than to this wrapper.
            warnings.warn(message, category=DeprecationWarning, stacklevel=2)
            return func(*args, **kwargs)

        return functools.wraps(func)(wrapper)

    return decorator



# [docs]
class Stats:

# [docs]
    @staticmethod
    def lognormal_median_ci(data, confidence_level=0.95):
        """
        Estimates the median and its confidence interval for data assumed
        to be log-normally distributed.

        Args:
            data (array-like): A list, numpy array, or pandas Series of
                               positive numerical data points.
            confidence_level (float): The desired confidence level (e.g., 0.95 for 95%).
                                     Must be between 0 and 1.

        Returns:
            dict: A dictionary containing:
                  'median_estimate': The point estimate of the median.
                  'confidence_interval': A tuple (lower_bound, upper_bound)
                                         for the median.
                  Returns None if input data is invalid (e.g., non-positive values,
                  not enough data points).
        """
        # --- Input Validation ---
        try:
            # Convert to numpy array for easier handling
            data = np.asarray(data)

            # Check for non-positive values (logarithm is undefined)
            if np.any(data <= 0):
                print("Error: Data contains non-positive values. Log-normal "
                      "distribution is only defined for positive values.")
                return None

            # Check for sufficient data
            n = len(data)
            if n < 2:
                print("Error: Need at least two data points to estimate variance.")
                return None

            # Check confidence level validity
            if not (0 < confidence_level < 1):
                print("Error: Confidence level must be between 0 and 1.")
                return None

        except Exception as e:
            print(f"Error processing input data: {e}")
            return None

        # --- Calculations ---
        # 1. Log-transform the data
        log_data = np.log(data)

        # 2. Calculate mean and standard deviation of log-transformed data
        mu_hat = np.mean(log_data)
        sigma_hat = np.std(log_data, ddof=1)  # Use ddof=1 for sample standard deviation

        # 3. Point estimate of the median
        median_estimate = np.exp(mu_hat)

        # 4. Calculate confidence interval for the median
        alpha = 1 - confidence_level
        # Degrees of freedom
        dof = n - 1
        # Critical t-value for two-tailed test
        t_critical = stats.t.ppf(1 - alpha / 2, dof)
        # Standard error of the mean of log-transformed data
        se_mu_hat = sigma_hat / np.sqrt(n)

        # Confidence interval for mu (mean of log-data)
        lower_bound_mu = mu_hat - t_critical * se_mu_hat
        upper_bound_mu = mu_hat + t_critical * se_mu_hat

        # Confidence interval for the median (exponentiate the bounds for mu)
        lower_ci_median = np.exp(lower_bound_mu)
        upper_ci_median = np.exp(upper_bound_mu)

        return  median_estimate, lower_ci_median, upper_ci_median



# [docs]
    @staticmethod
    def bootstrap_mean_ci(data, n_bootstraps=1000, confidence_level=0.95):
        """
        Estimates the mean and confidence interval for a log-normal distribution
        using the bootstrapping method.

        Args:
            data (array-like): A 1D array or list containing the log-normally
                               distributed data.
            n_bootstraps (int): The number of bootstrap samples to generate.
                               Defaults to 1000.
            confidence_level (float): The desired confidence level for the interval.
                                     Must be between 0 and 1. Defaults to 0.95.

        Returns:
            tuple: A tuple containing:
                   - estimated_mean (float): The estimated mean of the log-normal
                                             distribution (mean of bootstrap means).
                   - ci_lower (float): The lower bound of the confidence interval.
                   - ci_upper (float): The upper bound of the confidence interval.
        """
        if not 0 < confidence_level < 1:
            raise ValueError("confidence_level must be between 0 and 1")

        n_samples = len(data)
        if n_samples == 0:
            return np.nan, np.nan, np.nan

        bootstrap_means = []
        for _ in range(n_bootstraps):
            # Resample with replacement
            bootstrap_sample = np.random.choice(data, size=n_samples, replace=True)
            # Calculate the mean of the resample
            bootstrap_means.append(np.mean(bootstrap_sample))

        # Calculate the estimated mean as the mean of the bootstrap means
        estimated_mean = np.mean(bootstrap_means)

        # Calculate the confidence interval using the percentile method
        alpha = 1.0 - confidence_level
        lower_percentile = alpha / 2.0 * 100
        upper_percentile = (1.0 - alpha / 2.0) * 100
        ci_lower, ci_upper = np.percentile(bootstrap_means, [lower_percentile, upper_percentile])

        return estimated_mean, ci_lower, ci_upper





# [docs]
    @staticmethod
    def median(a, axis=None, out=None, overwrite_input=False, keepdims=False):
        """
        Compute the median along the specified axis. Mutuated from numpy.

        Returns the median of the array elements.

        Parameters
        ----------
        a : array_like
            Input array or object that can be converted to an array.
        axis : {int, sequence of int, None}, optional
            Axis or axes along which the medians are computed. The default,
            axis=None, will compute the median along a flattened version of
            the array.
        out : ndarray, optional
            Alternative output array in which to place the result. It must
            have the same shape and buffer length as the expected output,
            but the type (of the output) will be cast if necessary.
        overwrite_input : bool, optional
           If True, then allow use of memory of input array `a` for
           calculations. The input array will be modified by the call to
           `median`. This will save memory when you do not need to preserve
           the contents of the input array. Treat the input as undefined,
           but it will probably be fully or partially sorted. Default is
           False. If `overwrite_input` is ``True`` and `a` is not already an
           `ndarray`, an error will be raised.
        keepdims : bool, optional
            If this is set to True, the axes which are reduced are left
            in the result as dimensions with size one. With this option,
            the result will broadcast correctly against the original `arr`.

        Returns
        -------
        median : ndarray
            A new array holding the result. If the input contains integers
            or floats smaller than ``float64``, then the output data-type is
            ``np.float64``.  Otherwise, the data-type of the output is the
            same as that of the input. If `out` is specified, that array is
            returned instead.
        """
        return np.median(a, axis, out, overwrite_input, keepdims)



# [docs]
    @staticmethod
    def mad(data, axis=None, func=None, ignore_nan=False):
        """
        Compute the median absolute deviation (MAD).

        Thin wrapper that forwards every argument to
        ``astropy.stats.median_absolute_deviation``.

        The MAD is defined as :math:`median(|a - median(a)|)`.

        Parameters
        ----------
        data : array-like
            Input array or object that can be converted to an array.
        axis : None, int, or tuple of int, optional
            The axis or axes along which the MADs are computed. With the
            default ``None`` the MAD of the flattened array is computed.
        func : callable, optional
            The function used to compute the median. Defaults to
            ``numpy.ma.median`` for masked arrays, otherwise to
            ``numpy.median``.
        ignore_nan : bool
            If True, NaN values are treated as if they were not in the
            array when computing the median (astropy then uses
            ``numpy.ma.median`` when ``axis`` is given, or
            ``numpy.nanmedian`` when ``axis`` is ``None``).

        Returns
        -------
        mad : float or `~numpy.ndarray`
            The median absolute deviation of the input array: a scalar if
            ``axis`` is ``None``, otherwise an array.
        """
        return astropy_median_absolute_deviation(
            data,
            axis=axis,
            func=func,
            ignore_nan=ignore_nan,
        )



# [docs]
    @staticmethod
    def mad_std(data, axis=None, func=None, ignore_nan=False):
        r"""
        Compute a robust standard deviation from the median absolute
        deviation (MAD).

        Thin wrapper that forwards every argument to
        ``astropy.stats.mad_std``.

        The estimator is:

        .. math::

            \sigma \approx \frac{\textrm{MAD}}{\Phi^{-1}(3/4)} \approx 1.4826 \cdot \textrm{MAD}

        where :math:`\Phi^{-1}(P)` is the inverse cumulative distribution
        function of the normal distribution evaluated at probability
        :math:`P = 3/4`.

        Parameters
        ----------
        data : array-like
            Data array or object that can be converted to an array.
        axis : None, int, or tuple of int, optional
            The axis or axes along which the robust standard deviations
            are computed. With the default ``None`` the flattened array is
            used.
        func : callable, optional
            The function used to compute the median. Defaults to
            ``numpy.ma.median`` for masked arrays, otherwise to
            ``numpy.median``.
        ignore_nan : bool
            If True, NaN values are treated as if they were not in the
            array when computing the median (astropy then uses
            ``numpy.ma.median`` when ``axis`` is given, or
            ``numpy.nanmedian`` when ``axis`` is ``None``).

        Returns
        -------
        mad_std : float or `~numpy.ndarray`
            The robust standard deviation of the input data: a scalar if
            ``axis`` is ``None``, otherwise an array.
        """
        return astropy_mad_std(
            data,
            axis=axis,
            func=func,
            ignore_nan=ignore_nan,
        )



# [docs]
    @staticmethod
    def sigma_clip(data,sigma=3,sigma_lower=None,sigma_upper=None,maxiters=5, cenfunc="median", stdfunc="std", axis=None, masked=True, return_bounds=False, copy=True, grow=False):
        r"""
        Perform sigma-clipping on the provided data.

        Thin wrapper that forwards every argument to
        ``astropy.stats.sigma_clip``.

        The data are iterated over, each time rejecting values that are
        less or more than a specified number of standard deviations from a
        center value.

        Clipped (rejected) values are those where:

        .. math::

            data < center - (\sigma_{lower} * std)

            data > center + (\sigma_{upper} * std)

        where::

            center = cenfunc(data [, axis=])
            std = stdfunc(data [, axis=])

        Invalid data values (i.e., NaN or inf) are automatically clipped.

        Parameters
        ----------
        data : array-like or `~numpy.ma.MaskedArray`
            The data to be sigma clipped.

        sigma : float, optional
            The number of standard deviations to use for both the lower
            and upper clipping limit. These limits are overridden by
            ``sigma_lower`` and ``sigma_upper``, if given. The default is 3.

        sigma_lower : float or None, optional
            The number of standard deviations to use as the lower bound for
            the clipping limit. If `None` then the value of ``sigma`` is
            used. The default is `None`.

        sigma_upper : float or None, optional
            The number of standard deviations to use as the upper bound for
            the clipping limit. If `None` then the value of ``sigma`` is
            used. The default is `None`.

        maxiters : int or None, optional
            The maximum number of sigma-clipping iterations to perform, or
            `None` to clip until convergence is achieved (i.e., iterate
            until the last iteration clips nothing). If convergence is
            achieved before ``maxiters`` iterations, the iterations stop.
            The default is 5.

        cenfunc : {'median', 'mean'} or callable, optional
            The statistic or callable used to compute the center value for
            the clipping. If a callable is used together with ``axis``, it
            must be able to ignore NaNs (e.g., `numpy.nanmean`) and must
            accept an ``axis`` keyword, returning an array with the axis
            dimension(s) removed. The default is ``'median'``.

        stdfunc : {'std', 'mad_std'} or callable, optional
            The statistic or callable used to compute the standard
            deviation about the center value. If a callable is used
            together with ``axis``, it must be able to ignore NaNs (e.g.,
            `numpy.nanstd`) and must accept an ``axis`` keyword, returning
            an array with the axis dimension(s) removed. The default is
            ``'std'``.

        axis : None or int or tuple of int, optional
            The axis or axes along which to sigma clip the data. If `None`,
            the flattened data are used. ``axis`` is passed to ``cenfunc``
            and ``stdfunc``. The default is `None`.

        masked : bool, optional
            If `True`, a `~numpy.ma.MaskedArray` is returned, where the
            mask is `True` for clipped values. If `False`, a
            `~numpy.ndarray` is returned. The default is `True`.

        return_bounds : bool, optional
            If `True`, the minimum and maximum clipping bounds are also
            returned.

        copy : bool, optional
            If `True`, the ``data`` array is copied. If `False` and
            ``masked=True``, the returned masked array contains the same
            array as the input ``data`` (if ``data`` is a `~numpy.ndarray`
            or `~numpy.ma.MaskedArray`). If `False` and ``masked=False``,
            the input data are modified in-place. The default is `True`.

        grow : float or `False`, optional
            Radius within which to mask the neighbouring values of those
            that fall outside the clipping limits (only applied along
            ``axis``, if specified). For a 2D image, a value of 1 masks the
            nearest pixels in a cross pattern around each deviant pixel,
            while 1.5 also rejects the nearest diagonal neighbours, and so
            on.

        Returns
        -------
        result : array-like
            If ``masked=True``, a `~numpy.ma.MaskedArray` is returned,
            where the mask is `True` for clipped values and where the input
            mask was `True`.

            If ``masked=False``, a `~numpy.ndarray` is returned.

            If ``return_bounds=True``, the minimum and maximum clipping
            bounds are returned in addition to the array above.

            If ``masked=False`` and ``axis=None``, the output is a
            flattened 1D `~numpy.ndarray` from which the clipped values
            have been removed. If ``return_bounds=True`` the returned
            minimum and maximum thresholds are scalars.

            If ``masked=False`` and ``axis`` is specified, the output
            `~numpy.ndarray` has the same shape as the input ``data`` and
            contains ``np.nan`` where values were clipped. If the input
            ``data`` was a masked array, the output also contains
            ``np.nan`` where the input mask was `True`. If
            ``return_bounds=True`` the returned minimum and maximum
            clipping thresholds are `~numpy.ndarray`\s.
        """
        # Forward by keyword so the call does not depend on the positional
        # order of the astropy signature.
        return astropy_sigma_clip(
            data,
            sigma=sigma,
            sigma_lower=sigma_lower,
            sigma_upper=sigma_upper,
            maxiters=maxiters,
            cenfunc=cenfunc,
            stdfunc=stdfunc,
            axis=axis,
            masked=masked,
            return_bounds=return_bounds,
            copy=copy,
            grow=grow,
        )



# [docs]
    @staticmethod
    def sigma_clipped_stats(
            data,
            mask=None,
            mask_value=None,
            sigma=3.0,
            sigma_lower=None,
            sigma_upper=None,
            maxiters=5,
            cenfunc="median",
            stdfunc="std",
            std_ddof=0,
            axis=None,
            grow=False,
        ):
        """
        Compute the mean, median and standard deviation of sigma-clipped data.

        Thin wrapper that forwards every argument to
        ``astropy.stats.sigma_clipped_stats``.

        Parameters
        ----------
        data : array-like or `~numpy.ma.MaskedArray`
            Data array or object that can be converted to an array.

        mask : `numpy.ndarray` (bool), optional
            A boolean mask with the same shape as ``data``, where `True`
            marks an element of ``data`` as masked. Masked values are
            excluded when computing the statistics.

        mask_value : float, optional
            A data value (e.g., ``0.0``) that is ignored when computing the
            statistics. It is masked in addition to any input ``mask``.

        sigma : float, optional
            The number of standard deviations to use for both the lower
            and upper clipping limit. These limits are overridden by
            ``sigma_lower`` and ``sigma_upper``, if given. The default is 3.

        sigma_lower : float or None, optional
            The number of standard deviations to use as the lower bound for
            the clipping limit. If `None` then the value of ``sigma`` is
            used. The default is `None`.

        sigma_upper : float or None, optional
            The number of standard deviations to use as the upper bound for
            the clipping limit. If `None` then the value of ``sigma`` is
            used. The default is `None`.

        maxiters : int or None, optional
            The maximum number of sigma-clipping iterations to perform, or
            `None` to clip until convergence is achieved (i.e., iterate
            until the last iteration clips nothing). If convergence is
            achieved before ``maxiters`` iterations, the iterations stop.
            The default is 5.

        cenfunc : {'median', 'mean'} or callable, optional
            The statistic or callable used to compute the center value for
            the clipping. If a callable is used together with ``axis``, it
            must be able to ignore NaNs (e.g., `numpy.nanmean`) and must
            accept an ``axis`` keyword, returning an array with the axis
            dimension(s) removed. The default is ``'median'``.

        stdfunc : {'std', 'mad_std'} or callable, optional
            The statistic or callable used to compute the standard
            deviation about the center value. If a callable is used
            together with ``axis``, it must be able to ignore NaNs (e.g.,
            `numpy.nanstd`) and must accept an ``axis`` keyword, returning
            an array with the axis dimension(s) removed. The default is
            ``'std'``.

        std_ddof : int, optional
            The delta degrees of freedom for the standard deviation
            calculation. The divisor used is ``N - std_ddof``, where ``N``
            is the number of elements. The default is 0.

        axis : None or int or tuple of int, optional
            The axis or axes along which to sigma clip the data. If `None`,
            the flattened data are used. ``axis`` is passed to ``cenfunc``
            and ``stdfunc``. The default is `None`.

        grow : float or `False`, optional
            Radius within which to mask the neighbouring values of those
            that fall outside the clipping limits (only applied along
            ``axis``, if specified). For a 2D image, a value of 1 masks the
            nearest pixels in a cross pattern around each deviant pixel,
            while 1.5 also rejects the nearest diagonal neighbours, and so
            on.

        Notes
        -----
        The best performance is typically obtained by setting ``cenfunc``
        and ``stdfunc`` to one of the built-in functions specified as a
        string. If one of the options is a string while the other is a
        custom callable, performance may in some cases improve when the
        `bottleneck`_ package is installed.

        .. _bottleneck:  https://github.com/pydata/bottleneck

        Returns
        -------
        mean, median, stddev : float
            The mean, median, and standard deviation of the sigma-clipped
            data.
        """
        return astropy_sigma_clipped_stats(
            data,
            mask=mask,
            mask_value=mask_value,
            sigma=sigma,
            sigma_lower=sigma_lower,
            sigma_upper=sigma_upper,
            maxiters=maxiters,
            cenfunc=cenfunc,
            stdfunc=stdfunc,
            std_ddof=std_ddof,
            axis=axis,
            grow=grow,
        )

   

# [docs]
    @staticmethod
    def biweight_location(data, c=6.0, M=None, axis=None, ignore_nan=False):
        r"""
        Compute the biweight location, a robust estimate of the central
        location of a distribution.

        The computation is delegated to
        ``astropy.stats.biweight_location``. The estimator is:

        .. math::

            \zeta_{biloc}= M + \frac{\sum_{|u_i|<1}(x_i - M) (1 - u_i^2)^2}{\sum_{|u_i|<1}(1 - u_i^2)^2}

        where :math:`x` is the input data, :math:`M` is the sample median
        (or the supplied initial location guess) and

        .. math::

            u_{i} = \frac{(x_i - M)}{c \cdot MAD}

        with :math:`c` the tuning constant and :math:`MAD` the
        `median absolute deviation
        <https://en.wikipedia.org/wiki/Median_absolute_deviation>`_.
        The tuning constant ``c`` is typically 6.0 (the default).

        If :math:`MAD` is zero, the median is returned.

        Parameters
        ----------
        data : array-like
            Input array or object that can be converted to an array.
            ``data`` can be a `~numpy.ma.MaskedArray`.
        c : float, optional
            Tuning constant for the biweight estimator (default = 6.0).
        M : float or array-like, optional
            Initial guess for the location. A scalar is used for the
            entire array (or along each ``axis``, if specified). An array
            must contain the initial location estimate along each ``axis``
            of the input array. If `None` (default), the median of the
            input array is used (or along each ``axis``, if specified).
        axis : None, int, or tuple of int, optional
            The axis or axes along which the biweight locations are
            computed. If `None` (default), the biweight location of the
            flattened input array is computed.
        ignore_nan : bool, optional
            If True, invalid entries of ``data`` are masked with
            ``numpy.ma.masked_invalid`` before the estimator is computed.

        Returns
        -------
        biweight_location : float or `~numpy.ndarray`
            The biweight location of the input data: a scalar if ``axis``
            is `None`, otherwise an array.
        """
        # Masking replaces the input only when the caller asked for it.
        sample = np.ma.masked_invalid(data) if ignore_nan else data
        return astropy_biweight_location(sample, c=c, M=M, axis=axis)

    

# [docs]
    @staticmethod
    def biweight_scale(data, c=9.0, M=None, axis=None, modify_sample_size=False, ignore_nan=False):
        r"""
        Compute the biweight scale, a robust estimate of the standard
        deviation of a distribution.

        The biweight scale is the square root of the biweight midvariance.
        The computation is delegated to ``astropy.stats.biweight_scale``.
        The estimator is:

        .. math::

            \zeta_{biscl} = \sqrt{n}\frac{\sqrt{\sum_{|u_i| < 1}(x_i - M)^2 (1 - u_i^2)^4}} {|(\sum_{|u_i| < 1}(1 - u_i^2) (1 - 5u_i^2))|}

        where :math:`x` is the input data, :math:`M` is the sample median
        (or the supplied location) and

        .. math::

            u_{i} = \frac{x_i - M}{c * MAD}

        with :math:`c` the tuning constant and :math:`MAD` the
        `median absolute deviation
        <https://en.wikipedia.org/wiki/Median_absolute_deviation>`_.
        The tuning constant ``c`` is typically 9.0 (the default).

        If :math:`MAD` is zero, zero is returned.

        In the standard definition, used when ``modify_sample_size`` is
        `False` (the default), :math:`n` is the total number of points in
        the array (or along the input ``axis``, if specified).

        If ``modify_sample_size = True``, :math:`n` is instead the number
        of points for which :math:`|u_i| < 1` (i.e. the number of
        non-rejected values):

        .. math::

            n = \sum_{|u_i| < 1} 1

        which gives a value closer to the true standard deviation for
        small sample sizes or for a large number of rejected values.

        Parameters
        ----------
        data : array-like
            Input array or object that can be converted to an array.
            ``data`` can be a `~numpy.ma.MaskedArray`.
        c : float, optional
            Tuning constant for the biweight estimator (default = 9.0).
        M : float or array-like, optional
            The location estimate. A scalar is used for the entire array
            (or along each ``axis``, if specified). An array must contain
            the location estimate along each ``axis`` of the input array.
            If `None` (default), the median of the input array is used
            (or along each ``axis``, if specified).
        axis : None, int, or tuple of int, optional
            The axis or axes along which the biweight scales are computed.
            If `None` (default), the biweight scale of the flattened input
            array is computed.
        modify_sample_size : bool, optional
            If `False` (default), the sample size is the total number of
            elements in the array (or along the input ``axis``, if
            specified), following the standard definition. If `True`, the
            sample size counts only the non-rejected values.
        ignore_nan : bool, optional
            If True, invalid entries of ``data`` are masked with
            ``numpy.ma.masked_invalid`` before the estimator is computed.

        Returns
        -------
        biweight_scale : float or `~numpy.ndarray`
            The biweight scale of the input data: a scalar if ``axis`` is
            `None`, otherwise an array.
        """
        # Masking replaces the input only when the caller asked for it.
        sample = np.ma.masked_invalid(data) if ignore_nan else data
        return astropy_biweight_scale(
            sample,
            c=c,
            M=M,
            axis=axis,
            modify_sample_size=modify_sample_size,
        )



# [docs]
    @staticmethod
    def trim(a, limits=None, inclusive=(True, True), axis=None):
        """
        Trims an array by masking the data outside some given limits. Mutuated for scipy.

        Returns a masked version of the input array.

        Parameters
        ----------
        a : array_like
            Input array.
        limits : {None, tuple of float}, optional
            Tuple of the percentages to cut on each side of the array, with respect
            to the number of unmasked data, as floats between 0. and 1.
            Noting n the number of unmasked data before trimming, the
            (n*limits[0])th smallest data and the (n*limits[1])th largest data are
            masked, and the total number of unmasked data after trimming
            is n*(1.-sum(limits)). The value of one limit can be set to None to
            indicate an open interval.
        inclusive : {(True, True) tuple}, optional
            Tuple indicating whether the number of data being masked on each side
            should be truncated (True) or rounded (False).
        axis : {None, int}, optional
            Axis along which to trim. If None, the whole array is trimmed, but its
            shape is maintained.
        """
        return scipy_trim(a, limits, inclusive, axis)



# [docs]
    @staticmethod
    def trimmed_mean(a, limits=None, inclusive=(True, True), axis=None):
        """
        Arithmetic mean of the values lying inside ``limits``.

        Delegates to :func:`scipy.stats.tmean`: observations outside the
        requested value range are ignored before averaging.

        Parameters
        ----------
        a : array_like
            Array of values.
        limits : None or (lower limit, upper limit), optional
            Values smaller than the lower limit or larger than the upper limit
            are discarded. ``None`` (default) keeps every value. Either entry
            of the tuple may itself be ``None`` for a half-open interval.
        inclusive : (bool, bool), optional
            ``(lower flag, upper flag)`` telling whether values exactly equal
            to the corresponding limit are kept. Default is ``(True, True)``.
        axis : int or None, optional
            Axis along which the mean is computed. Default is None.

        Returns
        -------
        tmean : ndarray
            Trimmed mean.
        """
        trimmed_average = scipy_tmean(
            a, limits=limits, inclusive=inclusive, axis=axis
        )
        return trimmed_average

    

[docs]
    @staticmethod
    def trimmed_std(a, limits=(0.1,0.1), inclusive=(1,1), relative=True, axis=None, ddof=0):
        """
        Standard deviation of the data after trimming both tails.

        Delegates to :func:`scipy.stats.mstats.trimmed_std`.

        Parameters
        ----------
        a : array_like
            Input array.
        limits : tuple of float, optional
            Lower and upper fraction of elements to trim; each fraction
            should lie between 0 and 1.
        inclusive : tuple of {0, 1}, optional
            Whether the number of data masked on each side is truncated (1)
            or rounded (0).
        relative : bool, optional
            Whether ``limits`` are treated as relative or absolute positions.
        axis : int, optional
            Axis along which the trimming is performed.
        ddof : int, optional
            Delta Degrees of Freedom: the divisor used in the calculation is
            ``n - ddof``, with ``n`` the number of elements.

        Returns
        -------
        trimmed_std : float or ndarray
            Trimmed standard deviation as returned by SciPy.
        """
        spread = scipy_trimmed_std(
            a,
            limits=limits,
            inclusive=inclusive,
            relative=relative,
            axis=axis,
            ddof=ddof,
        )
        return spread



[docs]
    @staticmethod
    def trimboth(a, proportiontocut=0.2, axis=0):
        """
        Remove a proportion of the smallest and of the largest items.

        Delegates to :func:`scipy.stats.trimboth`. With
        ``proportiontocut = 0.1`` the lowest 10% **and** the highest 10% of
        the values are dropped. When the proportion does not correspond to a
        whole number of items, fewer items are removed (the cut is
        conservative).

        Parameters
        ----------
        a : array_like
            Data to trim.
        proportiontocut : float
            Proportion (in range 0-1) of the data set removed from each end.
        axis : int or None, optional
            Axis along which to trim data. Default is 0. If None, the whole
            array `a` is used.

        Returns
        -------
        out : ndarray
            Trimmed version of array `a`. The order of the trimmed content
            is undefined.

        Examples
        --------
        Trimming 25% from each end of ten values keeps six of them, because
        the number of items to cut is rounded down:

        >>> import numpy as np
        >>> Stats.trimboth(np.arange(10), 1/4).shape
        (6,)

        Multidimensional input can be trimmed along any axis or as a whole:

        >>> d = np.arange(30).reshape(3, 10)
        >>> Stats.trimboth(d, 0.4, axis=0).shape
        (1, 10)
        >>> Stats.trimboth(d, 0.4, axis=1).shape
        (3, 2)
        >>> Stats.trimboth(d, 0.4, axis=None).shape
        (6,)
        """
        kept = scipy_trimboth(a, proportiontocut=proportiontocut, axis=axis)
        return kept



[docs]
    @staticmethod
    def trimtail(data, proportiontocut=0.2, tail='left', inclusive=(True, True), axis=None):
        """
        Mask a proportion of the values in one tail of the data.

        Delegates to :func:`scipy.stats.mstats.trimtail`.

        Parameters
        ----------
        data : array_like
            Data to trim.
        proportiontocut : float, optional
            Proportion of values to mask. With ``n`` unmasked values before
            trimming, ``(1 - proportiontocut) * n`` values remain afterwards.
            Default is 0.2.
        tail : {'left', 'right'}, optional
            ``'left'`` masks the lowest values, ``'right'`` masks the highest
            values. Default is ``'left'``.
        inclusive : {(bool, bool) tuple}, optional
            Flags forwarded to SciPy that control how the number of masked
            values on each side is converted to an integer. Default is
            ``(True, True)``.
        axis : int, optional
            Axis along which to perform the trimming. If None (default), the
            whole array is trimmed.

        Returns
        -------
        trimtail : ndarray
            Array of the same shape as `data` with the tail values masked.
        """
        masked_tail = scipy_trimtail(
            data,
            proportiontocut=proportiontocut,
            tail=tail,
            inclusive=inclusive,
            axis=axis,
        )
        return masked_tail



[docs]
    @staticmethod
    def winsorize(a, limits=None, inclusive=(True, True), inplace=False, axis=None, nan_policy='propagate'):
        """
        Returns a Winsorized version of the input array. Mutuated from Scipy

        The (limits[0])th lowest values are set to the (limits[0])th percentile,
        and the (limits[1])th highest values are set to the (1 - limits[1])th
        percentile.
        Masked values are skipped.

        Parameters
        ----------
        a : sequence
            Input array.
        limits : {None, tuple of float}, optional
            Tuple of the percentages to cut on each side of the array, with respect
            to the number of unmasked data, as floats between 0. and 1.
            Noting n the number of unmasked data before trimming, the
            (n*limits[0])th smallest data and the (n*limits[1])th largest data are
            masked, and the total number of unmasked data after trimming
            is n*(1.-sum(limits)) The value of one limit can be set to None to
            indicate an open interval.
        inclusive : {(True, True) tuple}, optional
            Tuple indicating whether the number of data being masked on each side
            should be truncated (True) or rounded (False).
        inplace : {False, True}, optional
            Whether to winsorize in place (True) or to use a copy (False)
        axis : {None, int}, optional
            Axis along which to trim. If None, the whole array is trimmed, but its
            shape is maintained.
        nan_policy : {'propagate', 'raise', 'omit'}, optional
            Defines how to handle when input contains nan.
            The following options are available (default is 'propagate'):

              * 'propagate': allows nan values and may overwrite or propagate them
              * 'raise': throws an error
              * 'omit': performs the calculations ignoring nan values

        Notes
        -----
        This function is applied to reduce the effect of possibly spurious outliers
        by limiting the extreme values.

        Returns
        -------
        winsorized : ndarray
            Winsorized array.
        """
        return scipy_winsorize(a, limits, inclusive, inplace, axis, nan_policy)



[docs]
    @staticmethod
    def winsorized_mean(a, limits=None, inclusive=(True, True), inplace=False, axis=None, nan_policy='propagate'):
        """
        Returns a Winsorized mean of the input array.

        The (limits[0])th lowest values are set to the (limits[0])th percentile,
        and the (limits[1])th highest values are set to the (1 - limits[1])th
        percentile.
        Masked values are skipped.

        Parameters
        ----------
        a : sequence
            Input array.
        limits : {None, tuple of float}, optional
            Tuple of the percentages to cut on each side of the array, with respect
            to the number of unmasked data, as floats between 0. and 1.
            Noting n the number of unmasked data before trimming, the
            (n*limits[0])th smallest data and the (n*limits[1])th largest data are
            masked, and the total number of unmasked data after trimming
            is n*(1.-sum(limits)) The value of one limit can be set to None to
            indicate an open interval.
        inclusive : {(True, True) tuple}, optional
            Tuple indicating whether the number of data being masked on each side
            should be truncated (True) or rounded (False).
        inplace : {False, True}, optional
            Whether to winsorize in place (True) or to use a copy (False)
        axis : {None, int}, optional
            Axis along which to trim. If None, the whole array is trimmed, but its
            shape is maintained.
        nan_policy : {'propagate', 'raise', 'omit'}, optional
            Defines how to handle when input contains nan.
            The following options are available (default is 'propagate'):

              * 'propagate': allows nan values and may overwrite or propagate them
              * 'raise': throws an error
              * 'omit': performs the calculations ignoring nan values

        Notes
        -----
        This function is applied to reduce the effect of possibly spurious outliers
        by limiting the extreme values.

        Returns
        -------
        winsorized_mean : float
            Winsorized mean of the array.
        """
        return np.mean(scipy_winsorize(a, limits, inclusive, inplace, axis, nan_policy))



[docs]
    @staticmethod
    def winsorized_std(a, ddof=1, limits=None, inclusive=(True, True), inplace=False, axis=None, nan_policy='propagate'):
        """
        Returns a Winsorized Standard Deviation of the input array.

        The (limits[0])th lowest values are set to the (limits[0])th percentile,
        and the (limits[1])th highest values are set to the (1 - limits[1])th
        percentile.
        Masked values are skipped.

        Parameters
        ----------
        a : sequence
            Input array.
        ddof : int, optional
            Delta Degrees of Freedom. The denominator used in calculations is `N - ddof`, 
            where `N` represents the number of elements. By default ddof is one.
        limits : {None, tuple of float}, optional
            Tuple of the percentages to cut on each side of the array, with respect
            to the number of unmasked data, as floats between 0. and 1.
            Noting n the number of unmasked data before trimming, the
            (n*limits[0])th smallest data and the (n*limits[1])th largest data are
            masked, and the total number of unmasked data after trimming
            is n*(1.-sum(limits)) The value of one limit can be set to None to
            indicate an open interval.
        inclusive : {(True, True) tuple}, optional
            Tuple indicating whether the number of data being masked on each side
            should be truncated (True) or rounded (False).
        inplace : {False, True}, optional
            Whether to winsorize in place (True) or to use a copy (False).
        axis : {None, int}, optional
            Axis along which to trim. If None, the whole array is trimmed, but its
            shape is maintained.
        nan_policy : {'propagate', 'raise', 'omit'}, optional
            Defines how to handle when input contains nan.
            The following options are available (default is 'propagate'):

              * 'propagate': allows nan values and may overwrite or propagate them
              * 'raise': throws an error
              * 'omit': performs the calculations ignoring nan values

        Returns
        -------
        winsorized_std : float
            Winsorized standard deviation of the array.
        """
        return np.std(scipy_winsorize(a, limits, inclusive, inplace, axis, nan_policy), ddof=ddof)



[docs]
    @staticmethod
    def Huber(data, c=1.5, tol=1e-08, maxiter=30, norm=None):
        r"""
        Huber's proposal 2 for estimating location and scale jointly.

        Builds a ``statsmodels.robust.Huber`` estimator with the given
        settings and applies it to ``data``.

        Parameters
        ----------
        data : array_like
            Observations passed to the estimator.
        c : float, optional
            Threshold used in :math:`\chi = \psi^2`. Default value is 1.5.
        tol : float, optional
            Tolerance for convergence. Default value is 1e-08.
        maxiter : int, optional
            Maximum number of iterations. Default value is 30.
        norm : statsmodels.robust.norms.RobustNorm, optional
            A robust norm used in M estimator of location. If None,
            the location estimator defaults to a one-step
            fixed point version of the M-estimator using Huber's T.

        Returns
        -------
        huber : tuple
            Returns a tuple (location, scale) of the joint estimates.
        """
        # The docstring is a raw string so that the LaTeX backslashes are not
        # parsed as (invalid) escape sequences.
        huber_proposal_2 = sm.robust.Huber(c, tol, maxiter, norm)
        return huber_proposal_2(data)



    # Log-normal estimators start here


[docs]
    @staticmethod
    def lognormal_estimator(
        X_lognorm_data,
        method="umvue",
        ci=False,
        ci_method="zou",
        ci_type="two-sided",
        conf_level=0.95,
        parkin_list=None
    ):
        """
        Estimate the mean and its uncertainty for log-normally distributed data.

        Several estimators of the arithmetic mean of a log-normal population
        are available. Optionally, a confidence interval can also be computed
        using one of the supported methods.

        Parameters
        ----------
        X_lognorm_data : array-like
            Array containing at least two strictly positive observations
            assumed to follow a log-normal distribution.
        method : {'umvue', 'umvue_sichel', 'qmle', 'mle', 'mme', 'mmue'}, optional
            Method used to estimate the population mean:

            * ``'umvue'`` uses Finney's uniformly minimum-variance unbiased
              estimator.
            * ``'umvue_sichel'`` uses Sichel's estimator.
            * ``'qmle'`` uses the quasi-maximum-likelihood estimator.
            * ``'mle'`` uses the maximum-likelihood estimator.
            * ``'mme'`` uses the method-of-moments estimator.
            * ``'mmue'`` uses the unbiased method-of-moments estimator.

            The default is ``'umvue'``.
        ci : bool, optional
            If `True`, compute a confidence interval for the estimated mean.
            The default is `False`.
        ci_method : {'land', 'normal_approx', 'zou', 'cox', 'sichel'}, optional
            Method used to calculate the confidence interval. The default is
            ``'zou'``. ``'normal_approx'`` is not available together with
            ``method='umvue_sichel'`` because no standard-error formula is
            implemented for that estimator.
        ci_type : {'two-sided', 'lower', 'upper'}, optional
            Type of confidence interval. The default is ``'two-sided'``.
        conf_level : float, optional
            Confidence level, expressed as a value between 0 and 1. The
            default is 0.95.
        parkin_list : optional
            Reserved parameter retained for compatibility. It is currently
            not used by the calculation.

        Returns
        -------
        result : dict
            Dictionary containing:

            * ``'sample_size'``: number of observations.
            * ``'method'``: point-estimation method.
            * ``'mean_estimate'``: estimated arithmetic mean.
            * ``'sd_estimate'``: square root of the variance estimate
              associated with the selected method (NaN when unavailable).

            If ``ci=True``, the dictionary is extended with the confidence
            interval information returned by the selected ``ci_method``,
            including ``'LCL'`` and ``'UCL'``.

        Raises
        ------
        ValueError
            If fewer than two observations are provided, if any observation
            is non-positive, if an unsupported estimation or confidence
            interval method is selected, or if ``ci_method='normal_approx'``
            is requested with ``method='umvue_sichel'``.

        Warns
        -----
        UserWarning
            If the variance or standard-deviation estimate is not available
            for the selected method.
        """
        X_lognorm_data = np.asarray(X_lognorm_data, dtype=float)
        if X_lognorm_data.size < 2 or np.any(X_lognorm_data <= 0):
            raise ValueError("`data` must contain at least two positive values.")

        n = X_lognorm_data.size
        Y_norm_data = np.log(X_lognorm_data)
        Y_mu_hat = float(np.mean(Y_norm_data))
        Y_sigma2_hat = float(np.var(Y_norm_data, ddof=1))
        Y_sigma2_mle = Y_sigma2_hat * (n - 1) / n
        df = n - 1

        # Point estimation
        if method == "umvue":
            X_theta_hat, X_var_hat = Stats.umvue_finney_lognormal_estimator(X_lognorm_data)
        elif method == "umvue_sichel":
            X_theta_hat, X_var_hat = Stats.umvue_sichel_lognormal_estimator(X_lognorm_data)
        elif method == "qmle":
            X_theta_hat = math.exp(Y_mu_hat + 0.5 * Y_sigma2_hat)
            se2 = (np.exp(Y_sigma2_hat) - 1) * np.exp(2 * Y_mu_hat + Y_sigma2_hat)
            X_var_hat = se2 / n
        elif method == "mle":
            X_theta_hat = np.exp(Y_mu_hat + 0.5 * Y_sigma2_mle)
            se2 = (np.exp(Y_sigma2_mle) - 1) * np.exp(2 * Y_mu_hat + Y_sigma2_mle)
            X_var_hat = se2 / n
        elif method == "mme":
            X_theta_hat = float(np.mean(X_lognorm_data))
            X_var_hat = float(np.var(X_lognorm_data, ddof=0) / n)
        elif method == "mmue":
            X_theta_hat = float(np.mean(X_lognorm_data))
            X_var_hat = float(np.var(X_lognorm_data, ddof=1) / n)
        else:
            raise ValueError(f"Unknown method '{method}'")

        def _normal_approx_se():
            # Standard error of the point estimator for the normal-approximation
            # interval. Evaluated lazily so that a plain point estimate does not
            # trigger extra series evaluations (and their warnings).
            if method == "umvue":
                return np.sqrt(np.exp(2 * Y_mu_hat) * (
                    (Stats.finneys_g(n - 1, Y_sigma2_hat / 2) ** 2)
                    - Stats.finneys_g(n - 1, (Y_sigma2_hat * (n - 2)) / (n - 1))
                ))
            if method == "qmle":
                return np.sqrt(np.exp(2 * Y_mu_hat + Y_sigma2_hat / n) * (
                    np.exp(Y_sigma2_hat / n) * ((1 - (2 * Y_sigma2_hat) / df) ** (-df / 2))
                    - ((1 - Y_sigma2_hat / df) ** (-df))
                ))
            if method == "mle":
                return np.sqrt(np.exp(2 * Y_mu_hat + Y_sigma2_hat / n) * (
                    np.exp(Y_sigma2_hat / n) * ((1 - (2 * Y_sigma2_hat) / n) ** (-df / 2))
                    - ((1 - Y_sigma2_hat / n) ** (-df))
                ))
            if method in ("mme", "mmue"):
                # X_var_hat is already the sample variance divided by n, so its
                # square root is the standard error of the sample mean; it must
                # not be divided by sqrt(n) a second time.
                return np.sqrt(X_var_hat)
            raise ValueError(
                f"ci_method 'normal_approx' is not available for method='{method}'"
            )

        # Always compute SE
        if np.isnan(X_var_hat) or X_var_hat < 0:
            X_sd_hat = float("nan")
            warnings.warn(f"Standard deviation estimate not available for method='{method}'.", UserWarning)
        else:
            X_sd_hat = math.sqrt(X_var_hat)

        result = {
            "sample_size": n,
            "method": method,
            "mean_estimate": X_theta_hat,
            "sd_estimate": X_sd_hat
        }

        # Confidence intervals
        if ci:
            # Arguments shared by every interval built from log-scale moments.
            log_scale_args = {
                "mu_hat": Y_mu_hat,
                "sigma2_hat": Y_sigma2_hat,
                "n": n,
                "ci_type": ci_type,
                "conf_level": conf_level,
            }
            if ci_method == "land":
                ci_limits = Stats.ci_lnorm_land(**log_scale_args)
            elif ci_method == "normal_approx":
                sd_muhat_ci_normal = _normal_approx_se()
                ci_limits = Stats.ci_standard_approx(
                    mu_hat=X_theta_hat,
                    sigma2_hat=sd_muhat_ci_normal**2,
                    n=n,
                    test_statistic="z",
                    ci_type=ci_type,
                    conf_level=conf_level
                )
            elif ci_method == "zou":
                ci_limits = Stats.ci_lnorm_zou(**log_scale_args)
            elif ci_method == "cox":
                ci_limits = Stats.ci_cox(**log_scale_args)
            elif ci_method == "sichel":
                ci_limits = Stats.ci_sichel(**log_scale_args)
            else:
                raise ValueError(f"Unknown ci_method '{ci_method}'")

            result.update(ci_limits)

        return result




[docs]
    @staticmethod
    def umvue_finney_lognormal_estimator(data):
        """
        UMVUE of the log-normal mean and variance (Finney's formula).

        Parameters
        ----------
        data : array-like
            Observations assumed to follow a log-normal distribution.

        Returns
        -------
        umvu_mean : float
            Estimate of the mean. NaN for empty input or when the data
            contain non-positive values; the single observation itself when
            only one value is supplied.
        umvu_variance : float
            Estimate of the variance. It is only defined for more than two
            observations and is NaN otherwise.

        Warns
        -----
        UserWarning
            If the data contain non-positive values.
        """
        data = np.asarray(data)
        n = data.size

        if n == 0:
            return np.nan, np.nan
        if np.any(data <= 0):
            warnings.warn(
                "Data contains non‐positive values; lognormal requires positive data.",
                UserWarning
            )
            return np.nan, np.nan
        if n == 1:
            # ravel() so that a 0-d (scalar) input is handled as well.
            return float(data.ravel()[0]), np.nan

        # Log-space moments
        log_data = np.log(data)
        y_bar = log_data.mean()
        s_sq = log_data.var(ddof=1)

        # Finney's UMVUE for the mean: exp(y_bar) * g_{n-1}(s^2 / 2)
        umvu_mean = np.exp(y_bar) * Stats.finneys_g(n - 1, s_sq / 2)

        # Finney's UMVUE for the variance (only defined for n > 2)
        if n > 2:
            umvu_variance = np.exp(2 * y_bar) * (
                Stats.finneys_g(n - 1, 2 * s_sq)
                - Stats.finneys_g(n - 1, (s_sq * (n - 2)) / (n - 1))
            )
        else:
            umvu_variance = np.nan

        return umvu_mean, umvu_variance





[docs]
    @staticmethod
    def umvue_sichel_lognormal_estimator(X_lognorm_data):
        """
        Sichel-type estimate of the mean and variance of a log-normal
        population.

        The observations are log-transformed; the mean estimate is the
        exponential of the log-mean multiplied by a correction factor obtained
        from the confluent hypergeometric limit function ``hyp0f1``.

        Parameters
        ----------
        X_lognorm_data : array-like
            Strictly positive observations assumed to follow a log-normal
            distribution.

        Returns
        -------
        mean_est : float
            Estimated arithmetic mean of the log-normal population.
        variance_est : float
            Estimated variance of the log-normal population.

        Raises
        ------
        ValueError
            If one or more observations are non-positive.

        Warns
        -----
        RuntimeWarning
            If evaluation of the hypergeometric function fails. In that
            case, ``(np.nan, np.nan)`` is returned.
        """
        samples = np.asarray(X_lognorm_data, dtype=float)
        if (samples <= 0).any():
            raise ValueError("All observations must be positive.")

        logs = np.log(samples)
        count = len(logs)
        mu_log = np.mean(logs)
        var_log = np.var(logs, ddof=1)

        # Arguments of the hypergeometric correction factor.
        shape_arg = (count - 1) / 2
        series_arg = var_log * (count - 1) / 4
        try:
            correction = hyp0f1(shape_arg, series_arg)
        except Exception as e:
            warnings.warn(f"Sichel estimator hyp0f1 failed: {e}", RuntimeWarning)
            return np.nan, np.nan

        mean_est = math.exp(mu_log) * correction
        variance_factor = math.exp(var_log) - 1
        variance_est = variance_factor * math.exp(2 * mu_log + var_log)

        return mean_est, variance_est




[docs]
    @staticmethod
    def finneys_g(m, z, n_terms_inc=10, max_iter=100, tol=None):
        """
        Evaluate Finney's correction function for log-normal estimation.

        The function evaluates the correction series used in Finney's
        uniformly minimum-variance unbiased estimator of the arithmetic
        mean of a log-normal population. The series is expanded in blocks
        until the last term is smaller than the specified tolerance.

        Parameters
        ----------
        m : int or array-like of int
            Degrees-of-freedom parameter of Finney's correction function.
        z : float or array-like of float
            Argument of Finney's correction function. If negative values are
            supplied, alternating signs are applied to the series terms.
            ``m`` and ``z`` are broadcast against each other, so a scalar can
            be combined with an array.
        n_terms_inc : int, optional
            Number of additional series terms evaluated at each iteration.
            The default is 10.
        max_iter : int, optional
            Maximum number of series-expansion iterations. The default is
            100.
        tol : float or None, optional
            Convergence tolerance applied to the final series term. If
            `None`, machine precision for floating-point values is used.

        Returns
        -------
        result : float or numpy.ndarray
            Value of Finney's correction function. A float is returned when
            the (broadcast) input holds a single value; otherwise, an array
            is returned. Values for which the calculation fails or does not
            converge are returned as ``np.nan``.

        Raises
        ------
        ValueError
            If ``m`` and ``z`` cannot be broadcast to a common shape.

        Warns
        -----
        RuntimeWarning
            If non-finite terms are generated, the series evaluation fails,
            or convergence is not reached within ``max_iter`` iterations.
        """
        tol = np.finfo(float).eps if tol is None else tol
        # Broadcast so that a scalar m can be paired with an array z (and
        # vice versa) instead of silently evaluating only the first element.
        m_arr, z_arr = np.broadcast_arrays(
            np.atleast_1d(m).astype(int),
            np.atleast_1d(z).astype(float),
        )
        result = np.full(z_arr.shape, np.nan, dtype=float)

        def _terms(m_i, z_i, n_terms):
            # Series terms 0 .. n_terms-1, assembled in log space to avoid
            # overflow of the individual factors.
            log_m = math.log(m_i)
            log_abs_z = math.log(abs(z_i))
            p = np.arange(2, n_terms)
            num = np.concatenate(([0], [log_m + log_abs_z],
                                  2*p*log_m + np.log(m_i + 2*p) + p*log_abs_z))
            cumsum_m2p = np.cumsum(np.log(m_i + 2*p))
            cumsum_p = np.cumsum(np.log(p))
            denom = np.concatenate(([0], [math.log(m_i + 1)],
                                    log_m + math.log(m_i + 2) + cumsum_m2p
                                    + p*math.log(m_i + 1) + cumsum_p))
            terms = np.exp(num - denom)
            if z_i < 0:
                terms *= (-1)**np.arange(len(terms))
            return terms

        for idx, (m_i, z_i) in enumerate(zip(m_arr.flat, z_arr.flat)):
            if z_i == 0 and m_i > 0:
                # Every term beyond the leading 1 vanishes at z = 0; the
                # log-space evaluation cannot represent log(0).
                result.flat[idx] = 1.0
                continue
            try:
                for block in range(1, max_iter + 1):
                    terms = _terms(m_i, z_i, n_terms_inc * block)
                    if not np.isfinite(terms).all():
                        raise ValueError("Non-finite terms in series.")
                    if abs(terms[-1]) <= tol:
                        result.flat[idx] = terms.sum()
                        break
                else:
                    msg = f"finneys_g did not converge at index {idx}: m={m_i}, z={z_i}"
                    warnings.warn(msg, RuntimeWarning)
            except (ValueError, ArithmeticError) as e:
                msg = f"finneys_g failed at index {idx}: m={m_i}, z={z_i}, reason: {e}"
                warnings.warn(msg, RuntimeWarning)

        # Index explicitly: float() on a 1-element array with ndim > 0 is
        # deprecated in recent NumPy releases.
        return float(result.flat[0]) if result.size == 1 else result


    # Example Psi-factor table; extend as needed.
    # Each row is (sample_size, V, lower_psi, upper_psi): lookup_psi matches
    # the first column against the requested sample size and the second
    # column against V, then returns the third or fourth column.
    # This list is also the default value of lookup_psi's `psi_table` argument.
    psi_table = [
        (3, 0.20, 0.58, 1.87),
        (3, 0.40, 0.49, 2.29),
        (5, 0.20, 0.67, 1.73),
        (5, 0.40, 0.55, 2.08),
        (10,0.20, 0.75, 1.59),
        (10,0.40, 0.64, 1.82),
    ]


[docs]
    @staticmethod
    def lookup_psi(p, V, n, psi_table=psi_table):
        """
        Look up the lower or upper Psi factor for a sample size and ``V``.

        Only table rows whose sample size equals ``n`` are considered. A row
        whose tabulated ``V`` is (numerically) equal to the requested one is
        preferred; otherwise the row with the closest tabulated ``V`` is used.

        Parameters
        ----------
        p : float
            Probability used to select the lower or upper Psi factor.
            Values below 0.5 select the lower factor; values greater than or
            equal to 0.5 select the upper factor.
        V : float
            Variance-related value used to select the corresponding table
            entry.
        n : int
            Sample size for which the Psi factors are required.
        psi_table : sequence of tuple, optional
            Lookup table whose entries have the form
            ``(sample_size, V, lower_psi, upper_psi)``.

        Returns
        -------
        psi : float
            Selected lower or upper Psi factor.

        Raises
        ------
        ValueError
            If the lookup table contains no entries for the requested
            sample size.
        """
        candidates = [row for row in psi_table if row[0] == n]
        if len(candidates) == 0:
            raise ValueError(f"No Psi-factors for n={n}")

        # First row with a matching V, if any; otherwise the nearest one.
        chosen = next(
            (row for row in candidates if math.isclose(row[1], V)),
            None,
        )
        if chosen is None:
            chosen = min(candidates, key=lambda row: abs(row[1] - V))

        _, _, lower_psi, upper_psi = chosen
        if p < 0.5:
            return lower_psi
        return upper_psi




[docs]
    @staticmethod
    def ci_standard_approx(
        mu_hat, sigma2_hat, n,
        df=None, ci_type="two-sided", conf_level=0.95,
        lb=-math.inf, ub=math.inf, test_statistic="z"):
        """
        Compute a normal- or Student's t-based approximate confidence interval.

        The interval is constructed around ``mu_hat`` using the square root
        of ``sigma2_hat`` as its standard-error estimate. Optional lower and
        upper bounds can be used to truncate the resulting interval.

        Parameters
        ----------
        mu_hat : float
            Point estimate around which the confidence interval is
            constructed.
        sigma2_hat : float
            Estimated variance of ``mu_hat``.
        n : int
            Sample size. When a t interval is requested and ``df`` is not
            provided, the degrees of freedom are set to ``n - 1``.
        df : int or None, optional
            Degrees of freedom for the Student's t distribution. The default
            is `None`.
        ci_type : {'two-sided', 'lower', 'upper'}, optional
            Type of confidence interval. The default is ``'two-sided'``.
        conf_level : float, optional
            Confidence level, expressed as a value between 0 and 1. The
            default is 0.95.
        lb : float, optional
            Minimum permitted value for the lower confidence limit. The
            default is negative infinity.
        ub : float, optional
            Maximum permitted value for the upper confidence limit. The
            default is positive infinity.
        test_statistic : {'z', 't'}, optional
            Distribution used to obtain the critical quantiles. The default
            is ``'z'``. The comparison is case-insensitive; any value other
            than ``'t'`` selects the normal distribution.

        Returns
        -------
        limits : dict
            Dictionary containing ``'LCL'`` and ``'UCL'``, representing the
            lower and upper confidence limits.

        Raises
        ------
        ValueError
            If ``ci_type`` is not one of the supported values, or if a
            t-based interval is requested but the degrees of freedom cannot
            be determined (both ``df`` and ``n`` are `None`).
        """
        sd_hat = np.sqrt(sigma2_hat)
        alpha = 1 - conf_level
        test_statistic = test_statistic.lower()
        use_t = test_statistic == "t"

        if use_t and df is None:
            if n is None:
                raise ValueError("df required for t-interval")
            df = n - 1

        # (lower-tail, upper-tail) probabilities; 0.0 / 1.0 mark an open side.
        tail_probs = {
            "two-sided": (alpha/2, 1-alpha/2),
            "lower": (alpha, 1.0),
            "upper": (0.0, 1-alpha)
        }
        if ci_type not in tail_probs:
            raise ValueError(f"Unknown ci_type '{ci_type}'")
        q_lower, q_upper = tail_probs[ci_type]

        def quant(prob):
            # Critical value of the selected reference distribution.
            return t.ppf(prob, df) if use_t else norm.ppf(prob)

        lcl = mu_hat - quant(1-q_lower)*sd_hat if q_lower > 0 else -math.inf
        ucl = mu_hat + quant(q_upper)*sd_hat if q_upper < 1 else math.inf
        return {"LCL": max(lb, lcl), "UCL": min(ub, ucl)}



[docs]
    @staticmethod
    def ci_lnorm_zou(mu_hat, sigma2_hat, n, ci_type, conf_level):
        """
        Compute Zou's confidence interval for the mean of a log-normal
        population (port of R's ``ci.lnorm.zou()``).

        A normal-quantile interval for the log-scale mean and a chi-squared
        interval for half the log-scale variance are combined around the
        pivot ``mu_hat + sigma2_hat / 2``; the combined limits are then
        exponentiated.

        Parameters
        ----------
        mu_hat : float
            Mean of the log-transformed data.
        sigma2_hat : float
            Variance of the log-transformed data.
        n : int
            Sample size. The chi-squared component uses ``n - 1`` degrees
            of freedom.
        ci_type : {'two-sided', 'lower', 'upper'}
            Type of confidence interval (case-insensitive).
        conf_level : float
            Confidence level, expressed as a value between 0 and 1.

        Returns
        -------
        limits : dict
            Dictionary with keys ``'LCL'`` and ``'UCL'``. For a ``'lower'``
            interval ``'UCL'`` is positive infinity; for an ``'upper'``
            interval ``'LCL'`` is negative infinity.

        Raises
        ------
        ValueError
            If ``ci_type`` is not one of the supported values.
        """
        ci_type = ci_type.lower()
        if ci_type not in ("two-sided", "lower", "upper"):
            # Previously any unknown value was silently handled as 'upper'.
            raise ValueError(
                f"Invalid ci_type: {ci_type}. Must be 'two-sided', 'lower', or 'upper'."
            )

        alpha = 1 - conf_level
        # Two-sided intervals split alpha between both tails.
        tail = alpha / 2 if ci_type == "two-sided" else alpha
        df = n - 1

        theta2_hat = sigma2_hat / 2
        pivot = mu_hat + theta2_hat

        # Half-width of the z-based interval for the log-scale mean.
        mean_margin = norm.ppf(1 - tail) * np.sqrt(sigma2_hat) / np.sqrt(n)

        if ci_type == "upper":
            lcl = -math.inf
        else:
            # Lower chi-squared limit for sigma^2 / 2.
            var_lcl = (sigma2_hat * df / chi2.ppf(1 - tail, df)) / 2
            d_lower = mean_margin**2 + (theta2_hat - var_lcl)**2
            lcl = math.exp(pivot - math.sqrt(d_lower))

        if ci_type == "lower":
            ucl = math.inf
        else:
            # Upper chi-squared limit for sigma^2 / 2.
            var_ucl = (sigma2_hat * df / chi2.ppf(tail, df)) / 2
            d_upper = mean_margin**2 + (var_ucl - theta2_hat)**2
            ucl = math.exp(pivot + math.sqrt(d_upper))

        return {"LCL": lcl, "UCL": ucl}




[docs]
    @staticmethod
    def ci_cox(mu_hat, sigma2_hat, n, ci_type="two-sided", conf_level=0.95):
        """
        Compute Cox's confidence interval for the mean of a log-normal
        population.

        The interval is built on the log scale around
        ``mu_hat + sigma2_hat / 2`` with standard error
        ``sqrt(sigma2_hat / n + sigma2_hat**2 / (2 * (n + 1)))`` and a
        Student's t quantile with ``n - 1`` degrees of freedom, then
        exponentiated. The t quantile follows the original author's
        assumption about how R's EnvStats evaluates this interval.

        Parameters
        ----------
        mu_hat : float
            Mean of the log-transformed data.
        sigma2_hat : float
            Variance of the log-transformed data.
        n : int
            Sample size.
        ci_type : {'two-sided', 'lower', 'upper'}, optional
            Type of confidence interval (case-insensitive). The default is
            ``'two-sided'``.
        conf_level : float, optional
            Confidence level, strictly between 0 and 1. The default is 0.95.

        Returns
        -------
        limits : dict
            Dictionary with keys ``'LCL'`` and ``'UCL'``. Both are NaN
            (with a ``RuntimeWarning``) when ``n < 2`` or ``sigma2_hat`` is
            negative. For a ``'lower'`` interval ``'UCL'`` is positive
            infinity; for an ``'upper'`` interval ``'LCL'`` is negative
            infinity.

        Raises
        ------
        ValueError
            If ``conf_level`` is not strictly between 0 and 1, or if
            ``ci_type`` is not one of the supported values.
        """
        if not (0 < conf_level < 1):
            raise ValueError("conf_level must be between 0 and 1.")
        if n < 2:
            # With n = 1 there are no degrees of freedom for the t quantile.
            warnings.warn(f"Sample size n={n} is too small for Cox method. Returning NaN CI.", RuntimeWarning)
            return {"LCL": np.nan, "UCL": np.nan}
        if sigma2_hat < 0:
            warnings.warn("sigma2_hat is negative in ci_cox. Returning NaN CI.", RuntimeWarning)
            return {"LCL": np.nan, "UCL": np.nan}

        ci_type = ci_type.lower()
        if ci_type not in ("two-sided", "lower", "upper"):
            # Validate up front so a zero-variance input cannot mask a bad
            # ci_type (it used to be treated as two-sided in that case).
            raise ValueError(f"Invalid ci_type: {ci_type}. Must be 'two-sided', 'lower', or 'upper'.")

        alpha = 1.0 - conf_level
        n_float = float(n)
        beta_hat = mu_hat + (sigma2_hat / 2.0)

        # Cox standard error of beta_hat; both terms are non-negative here.
        se_beta_hat = math.sqrt(
            sigma2_hat / n_float + (sigma2_hat ** 2) / (2.0 * (n_float + 1.0))
        )

        # Two-sided intervals split alpha between both tails. A zero
        # standard error yields a zero margin, i.e. the point estimate.
        tail = alpha / 2.0 if ci_type == "two-sided" else alpha
        margin = t.ppf(1.0 - tail, n - 1) * se_beta_hat

        def _exp_or_inf(log_value):
            # math.exp raises OverflowError for very large arguments.
            try:
                return math.exp(log_value)
            except OverflowError:
                return float("inf")

        lcl = float("-inf") if ci_type == "upper" else _exp_or_inf(beta_hat - margin)
        ucl = float("inf") if ci_type == "lower" else _exp_or_inf(beta_hat + margin)

        return {"LCL": lcl, "UCL": ucl}


    # Land method starts here

[docs]
    def lands_cond_t_prop_density_polar(theta, nu, zeta):
        """
        Unnormalized density of Land's conditional t distribution expressed
        in the polar angle ``theta``.

        The value returned is
        ``exp((nu - 1) * log(cos(theta)) - (nu / 2) * log(nu)
        + (1 + nu) * zeta * sin(theta))``.

        Parameters
        ----------
        theta : float or array-like
            Angle at which the proportional density is evaluated.
        nu : int
            Degrees of freedom.
        zeta : float
            Parameter multiplying the ``sin(theta)`` term of the exponent.

        Returns
        -------
        density : float or numpy.ndarray
            Proportional (unnormalized) density at ``theta``.
        """
        # Assemble the exponent piece by piece, then exponentiate once.
        cosine_part = (nu - 1) * np.log(np.cos(theta))
        constant_part = (nu / 2) * np.log(nu)
        tilt_part = (1 + nu) * zeta * np.sin(theta)
        log_density = cosine_part - constant_part + tilt_part
        return np.exp(log_density)



[docs]
    def lands_cond_t_prop_density(tau, nu, zeta):
        """
        Unnormalized density of Land's conditional t distribution on the
        ``tau`` scale.

        The value returned is
        ``(nu + tau**2) ** (-(nu + 1) / 2)
        * exp((nu + 1) * zeta * tau / sqrt(nu + tau**2))``.

        Parameters
        ----------
        tau : float or array-like
            Point at which the proportional density is evaluated.
        nu : int
            Degrees of freedom.
        zeta : float
            Parameter scaling the exponential factor.

        Returns
        -------
        density : float or numpy.ndarray
            Proportional (unnormalized) density at ``tau``.
        """
        radius_sq = nu + tau**2
        power_factor = radius_sq ** (-(nu + 1) / 2)
        tilt_factor = np.exp(((nu + 1) * zeta * tau) / np.sqrt(radius_sq))
        return power_factor * tilt_factor




[docs]
    def qlands_t(p, nu, zeta, tol=np.finfo(float).eps**0.9):
        """
        Compute a quantile of Land's conditional t distribution.

        The density is handled in polar coordinates, where it is
        proportional to
        ``exp((nu - 1) * log(cos(theta)) + (1 + nu) * zeta * sin(theta))``
        on ``(-pi/2, pi/2)``. The log-kernel is shifted by its maximum
        before exponentiation so that large ``|zeta|`` or ``nu`` cannot
        overflow, normalized by numerical integration, and the quantile is
        obtained by root finding on the cumulative integral. The angle is
        mapped back with ``sqrt(nu) * tan(theta)``.

        For ``p > 0.5`` the computation uses the identity
        ``Q(p; zeta) = -Q(1 - p; -zeta)``.

        Parameters
        ----------
        p : float
            Cumulative probability at which the quantile is evaluated. Must
            be between 0 and 1.
        nu : int
            Degrees of freedom. Must be greater than or equal to 2.
        zeta : float
            Parameter of Land's conditional t distribution.
        tol : float, optional
            Absolute tolerance (``xtol``) passed to the root finders. The
            default is machine epsilon raised to the power 0.9.

        Returns
        -------
        quantile : float
            Quantile corresponding to cumulative probability ``p``.
            Negative and positive infinity are returned for ``p=0`` and
            ``p=1``, respectively.

        Raises
        ------
        ValueError
            If ``p`` is outside the interval [0, 1] or if ``nu`` is smaller
            than 2.
        RuntimeError
            If the normalizing integral is not a positive finite number.
        """
        if not (0 <= p <= 1):
            raise ValueError("'p' must be between 0 and 1")
        if nu < 2:
            raise ValueError("'nu' must be >= 2")

        if p == 0:
            return -np.inf
        if p == 1:
            return np.inf

        # Work in the lower half of the distribution; mirror for p > 0.5.
        invert = p > 0.5
        new_zeta = -zeta if invert else zeta
        new_p = 1 - p if invert else p

        lower = -np.pi / 2
        upper = np.pi / 2
        # Stay a hair inside the interval: tan() diverges at the end points.
        bracket = [lower + 1e-8, upper - 1e-8]

        def log_kernel(theta):
            # Constant factors are omitted; they cancel in the normalization.
            return (nu - 1) * np.log(np.cos(theta)) + (1 + nu) * new_zeta * np.sin(theta)

        def log_kernel_slope(theta):
            # Derivative of log_kernel; its root is the mode of the density.
            return -(nu - 1) * np.tan(theta) + (1 + nu) * new_zeta * np.cos(theta)

        # The mode is located for new_zeta, i.e. for the density that is
        # actually integrated below.
        theta_max = root_scalar(
            log_kernel_slope, bracket=bracket, method='brentq', xtol=tol, maxiter=10000
        ).root
        log_peak = log_kernel(theta_max)

        def kernel(theta):
            # Shifted so that the peak value is 1: exp() cannot overflow.
            return np.exp(log_kernel(theta) - log_peak)

        def mass_below(theta_val):
            # Tell quad where the peak is whenever it lies inside the range,
            # so that sharply peaked kernels are not missed.
            breakpoints = [theta_max] if theta_max < theta_val else None
            value, _ = quad(kernel, lower, theta_val, points=breakpoints)
            return value

        scaling_factor = mass_below(upper)
        if not (np.isfinite(scaling_factor) and scaling_factor > 0):
            raise RuntimeError("qlands_t could not normalize the conditional t density")

        # Root of (cumulative probability - new_p) in the polar angle.
        def integral_root(theta_val):
            return mass_below(theta_val) / scaling_factor - new_p

        theta_quantile = root_scalar(
            integral_root, bracket=bracket, xtol=tol, maxiter=10000, method='brentq'
        ).root
        quant = np.sqrt(nu) * np.tan(theta_quantile)

        return -quant if invert else quant



[docs]
    @staticmethod
    def lands_C_old(S, nu, conf_level):
        """
        Legacy routine for Land's C constant based on unconstrained
        minimization.

        The constant is found by minimizing the squared difference between
        ``T(m)`` and the ``1 - conf_level`` quantile of Land's conditional
        t distribution (``Stats.qlands_t``) with ``scipy.optimize.minimize``
        and its default solver. :meth:`lands_C` is the newer implementation.

        Parameters
        ----------
        S : float
            Positive scale parameter used in Land's method.
        nu : int
            Degrees of freedom. Must be greater than or equal to 2.
        conf_level : float
            Probability level used to calculate the constant. Must be
            between 0 and 1.

        Returns
        -------
        C : float
            Land's C constant, ``m * sqrt(nu) / S`` at the minimizing ``m``.

        Raises
        ------
        ValueError
            If ``S`` is not positive, ``nu`` is smaller than 2, or
            ``conf_level`` is outside the interval [0, 1].

        See Also
        --------
        lands_C
            Bounded scalar-minimization version of the same calculation.
        """
        if S < np.finfo(float).eps:
            raise ValueError("'S' must be positive")
        if nu < 2:
            raise ValueError("'nu' must be greater than or equal to 2")
        if conf_level > 1 or conf_level < 0:
            raise ValueError("'conf_level' must be between 0 and 1")

        tail_prob = 1 - conf_level
        root_nu_plus_1 = np.sqrt(nu + 1)
        neg_half_S_sq = (-S**2) / 2

        def zeta_for(t_value):
            # zeta associated with a given value of T.
            return (-S * np.sqrt(nu + t_value**2)) / (2 * root_nu_plus_1)

        def squared_gap(m):
            t_value = (root_nu_plus_1 * (neg_half_S_sq - m)) / S
            quantile = Stats.qlands_t(tail_prob, nu, zeta_for(t_value))
            return (t_value - quantile)**2

        # Starting value: one quantile evaluation at the T obtained for m = 0.
        seed_t = Stats.qlands_t(tail_prob, nu, zeta_for((-root_nu_plus_1 * S) / 2))
        seed_m = neg_half_S_sq - (S * seed_t) / root_nu_plus_1

        fit = minimize(squared_gap, seed_m)

        best_m = fit.x[0]
        return (best_m * np.sqrt(nu)) / S



[docs]
    @staticmethod
    def lands_C(S: float, nu: int, conf_level: float, tol: float = 1e-8, maxiter: int = 100) -> float:
        """
        Compute Land's C constant, following R's
        ``lands.C(S, nu, conf.level)``.

        The constant is obtained by minimizing
        ``[T(m) - qlands_t(1 - conf_level; nu, zeta(m))]**2`` over ``m``,
        first with a bounded scalar search on ``m0 +/- S**2`` and, if that
        search does not report success, with an unbounded Brent search
        started from the same interval.

        Parameters
        ----------
        S : float
            Must be > 0.
        nu : int
            Degrees of freedom, an integer >= 2.
        conf_level : float
            Confidence level, strictly between 0 and 1.
        tol : float
            Tolerance passed to the scalar minimizers.
        maxiter : int
            Maximum number of iterations for the bounded search.

        Returns
        -------
        C : float
            ``m * sqrt(nu) / S`` at the minimizing ``m``.

        Raises
        ------
        ValueError
            If ``S``, ``nu`` or ``conf_level`` is outside its permitted
            range.
        RuntimeError
            If neither minimization reports convergence.
        """
        if S <= np.finfo(float).eps:
            raise ValueError("'S' must be positive")
        if nu < 2 or int(nu) != nu:
            raise ValueError("'nu' must be an integer >= 2")
        if not (0 < conf_level < 1):
            raise ValueError("'conf_level' must be between 0 and 1")

        alpha = 1.0 - conf_level
        root_nu1 = np.sqrt(nu + 1)

        def zeta_of(t_value):
            # zeta associated with a given value of T.
            return (-S * np.sqrt(nu + t_value**2)) / (2 * root_nu1)

        def objective(m):
            t_m = (root_nu1 * ((-S**2) / 2 - m)) / S
            return (t_m - Stats.qlands_t(alpha, nu, zeta_of(t_m))) ** 2

        # Starting point for m, following the R implementation.
        t_seed = Stats.qlands_t(1 - conf_level, nu, zeta_of(-root_nu1 * S / 2))
        m_seed = (-S**2) / 2 - (S * t_seed) / root_nu1

        # Search window of half-width S**2 centred on the starting point.
        search_window = (m_seed - S**2, m_seed + S**2)

        outcome = minimize_scalar(
            objective,
            method='bounded',
            bounds=search_window,
            options={'xatol': tol, 'maxiter': maxiter},
        )
        if not outcome.success:
            # Retry without bounds, using the window as the initial bracket.
            outcome = minimize_scalar(objective, bracket=search_window, method='Brent', tol=tol)
            if not outcome.success:
                raise RuntimeError("lands_C minimization failed to converge")

        return (outcome.x * np.sqrt(nu)) / S



[docs]
    @staticmethod
    def ci_land(lambda_, mu_hat, sig_sq_hat, n, nu, gamma_sq, ci_type="two-sided", conf_level=0.95):
        r"""
        Confidence interval from Land's exact method.

        The interval targets a parameter of the form

        .. math::

            \mu + \lambda \sigma^2

        and is built from the point estimate
        ``mu_hat + lambda_ * sig_sq_hat`` plus a scaled C constant obtained
        from :meth:`lands_C`.

        Parameters
        ----------
        lambda_ : float
            Coefficient multiplying the variance term. It must be non-zero.
        mu_hat : float
            Estimate of the location parameter.
        sig_sq_hat : float
            Positive estimate of the variance parameter.
        n : int
            Sample size; only echoed in the returned dictionary.
        nu : int
            Degrees of freedom. Must be an integer greater than or equal to
            2.
        gamma_sq : float
            Positive scaling parameter used in the Land transformation.
        ci_type : {'two-sided', 'lower', 'upper'}, optional
            Type of confidence interval. The default is ``'two-sided'``.
        conf_level : float, optional
            Confidence level. It must be at least 0.5 and smaller than 1.
            The default is 0.95.

        Returns
        -------
        result : dict
            Dictionary containing:

            * ``'LCL'``: lower confidence limit.
            * ``'UCL'``: upper confidence limit.
            * ``'parameter'``: description of the estimated parameter.
            * ``'type'``: confidence-interval type.
            * ``'method'``: confidence-interval method.
            * ``'conf_level'``: requested confidence level.
            * ``'sample_size'``: sample size.
            * ``'dof'``: degrees of freedom.

        Raises
        ------
        ValueError
            If the input parameters are outside their permitted ranges or
            if ``ci_type`` is not one of the supported values.
        """
        tiny = np.finfo(float).eps
        if np.abs(lambda_) < tiny:
            raise ValueError("'lambda' cannot be 0")
        if sig_sq_hat < tiny:
            raise ValueError("'sig_sq_hat' must be larger than 0")
        if nu < 2 or nu != int(nu):
            raise ValueError("'nu' must be an integer greater than or equal to 2")
        if gamma_sq < tiny:
            raise ValueError("'gamma_sq' must be larger than 0")
        if conf_level < 0.5 or conf_level >= 1:
            raise ValueError("'conf_level' must be at least 50% and less than 100%")

        k = (nu + 1) / (2 * lambda_ * gamma_sq)
        S = np.sqrt((2 * lambda_ * sig_sq_hat) / k)

        # Every finite limit has the form: centre + scale * C(S, nu, level).
        centre = mu_hat + lambda_ * sig_sq_hat
        scale = (k * S) / np.sqrt(nu)

        def limit_at(level):
            return centre + scale * Stats.lands_C(S, nu, level)

        if ci_type == "two-sided":
            # Split the non-coverage probability between the two tails.
            alpha = (1 - conf_level) / 2
            lcl = limit_at(alpha)
            ucl = limit_at(1 - alpha)
        elif ci_type == "lower":
            lcl = limit_at(1 - conf_level)
            ucl = np.inf
        elif ci_type == "upper":
            lcl = -np.inf
            ucl = limit_at(conf_level)
        else:
            raise ValueError("Invalid ci_type. Choose from 'two-sided', 'lower', or 'upper'.")

        summary = {"LCL": lcl, "UCL": ucl}
        summary["parameter"] = f"mu + {lambda_}*(sigma^2)"
        summary["type"] = ci_type
        summary["method"] = "Land"
        summary["conf_level"] = conf_level
        summary["sample_size"] = n
        summary["dof"] = nu
        return summary


    

[docs]
    @staticmethod
    def ci_lnorm_land(mu_hat, sigma2_hat, n, ci_type='two-sided', conf_level=0.95):
        r"""
        Land confidence interval for the arithmetic mean of a log-normal
        population.

        :meth:`ci_land` is called for the log-scale parameter

        .. math::

            \mu + \frac{1}{2}\sigma^2

        with ``lambda_ = 0.5``, ``nu = n - 1`` and ``gamma_sq = n``; the
        limits it returns are then exponentiated.

        Parameters
        ----------
        mu_hat : float
            Estimated mean of the log-transformed observations.
        sigma2_hat : float
            Estimated variance of the log-transformed observations.
        n : int
            Sample size. The degrees of freedom are set to ``n - 1``.
        ci_type : {'two-sided', 'lower', 'upper'}, optional
            Type of confidence interval. The default is ``'two-sided'``.
        conf_level : float, optional
            Confidence level. The default is 0.95.

        Returns
        -------
        result : dict
            Dictionary returned by :meth:`ci_land`, with ``'LCL'`` and
            ``'UCL'`` exponentiated and ``'parameter'`` set to ``'mean'``.

        Raises
        ------
        ValueError
            If one of the parameters passed to :meth:`ci_land` is invalid.
        """
        land_args = {
            "lambda_": 0.5,
            "mu_hat": mu_hat,
            "sig_sq_hat": sigma2_hat,
            "n": n,
            "nu": n - 1,
            "gamma_sq": n,
            "ci_type": ci_type,
            "conf_level": conf_level,
        }
        interval = Stats.ci_land(**land_args)

        # Map both log-scale limits back through exp().
        for bound in ("LCL", "UCL"):
            interval[bound] = np.exp(interval[bound])
        interval["parameter"] = "mean"

        return interval