Source code for copul.family.elliptical.gaussian

import numpy as np
import sympy as sp
from scipy.stats import norm

from copul.copula_sampler import CopulaSampler
from copul.family.elliptical.multivar_gaussian import MultivariateGaussian
from copul.family.elliptical.elliptical_copula import EllipticalCopula
from copul.family.frechet.biv_independence_copula import BivIndependenceCopula
from copul.family.frechet.lower_frechet import LowerFrechet
from copul.family.frechet.upper_frechet import UpperFrechet
from copul.wrapper.sympy_wrapper import SymPyFuncWrapper



[docs]
class Gaussian(MultivariateGaussian, EllipticalCopula):
    r"""
    Bivariate Gaussian copula.

    Extends :class:`~copul.family.elliptical.multivar_gaussian.MultivariateGaussian`
    for the 2-dimensional case. Characterized by a correlation parameter
    :math:`\rho \in [-1,1]`.

    **Special cases**

    - :math:`\rho=-1`: Lower Fréchet bound (countermonotone)
    - :math:`\rho=0`: Independence
    - :math:`\rho=1`: Upper Fréchet bound (comonotone)
    """

    # Define generator as a symbolic expression with 't' as the variable
    t = sp.symbols("t", positive=True)
    generator = sp.exp(-t / 2)

    def __new__(cls, *args, **kwargs):
        r"""
        Factory method that handles special cases during initialization.

        Parameters
        ----------
        *args, **kwargs
            Arguments passed to the constructor.

        Returns
        -------
        Copula
            An instance of the appropriate copula class (e.g., Lower/Upper Fréchet
            or Independence) when :math:`\rho \in \{-1,0,1\}`, otherwise a
            :class:`Gaussian`.
        """
        # Handle special cases during initialization with positional args
        if len(args) == 1:
            if args[0] == -1:
                return LowerFrechet()
            elif args[0] == 0:
                return BivIndependenceCopula()
            elif args[0] == 1:
                return UpperFrechet()

        # Default case - proceed with normal initialization
        return super().__new__(cls)

    def __init__(self, *args, **kwargs):
        r"""
        Initialize a bivariate Gaussian copula.

        Parameters
        ----------
        *args : tuple
            Positional arguments corresponding to copula parameters.
        **kwargs : dict
            Keyword arguments to override default symbolic parameters.
        """
        # Handle special cases from __new__
        if len(args) == 1 and isinstance(args[0], (int, float)):
            kwargs["rho"] = args[0]
            args = ()

        # Call parent initializer
        super().__init__(*args, **kwargs)

    def __call__(self, *args, **kwargs):
        r"""
        Create a new instance with updated parameters.

        Special handling for boundary :math:`\rho` values
        (:math:`-1, 0, 1`) returning the corresponding special copulas.

        Parameters
        ----------
        *args, **kwargs
            Updated parameter values.

        Returns
        -------
        Copula
            A new instance with the updated parameters.
        """
        if args is not None and len(args) == 1:
            kwargs["rho"] = args[0]

        if "rho" in kwargs:
            if kwargs["rho"] == -1:
                del kwargs["rho"]
                return LowerFrechet()(**kwargs)
            elif kwargs["rho"] == 0:
                del kwargs["rho"]
                return BivIndependenceCopula()(**kwargs)
            elif kwargs["rho"] == 1:
                del kwargs["rho"]
                return UpperFrechet()(**kwargs)

        return super().__call__(**kwargs)


[docs]
    def rvs(self, n=1, approximate=False, random_state=None, **kwargs):
        r"""
        Generate random samples from the Gaussian copula.

        For the bivariate case, a fast implementation from ``statsmodels`` is used.

        Parameters
        ----------
        n : int, default 1
            Number of samples to generate.
        approximate : bool, default False
            If ``True``, use the project’s generic approximating sampler.
        random_state : int or numpy.random.Generator, optional
            Seed or generator for reproducibility.
        **kwargs
            Passed to the multivariate sampler when ``dim > 2``.

        Returns
        -------
        numpy.ndarray
            Array of shape :math:`(n,2)` with samples on :math:`[0,1]^2`.
        """
        if approximate:
            sampler = CopulaSampler(self, random_state=random_state)
            return sampler.rvs(n, approximate)
        from statsmodels.distributions.copula.elliptical import (
            GaussianCopula as StatsGaussianCopula,
        )

        # For bivariate case, we can use the statsmodels implementation
        if self.dim == 2:
            return StatsGaussianCopula(float(self.rho)).rvs(n)
        else:
            # Otherwise use the multivariate implementation
            return super().rvs(n, **kwargs)


    @property
    def cdf(self):
        """
        Compute the cumulative distribution function of the Gaussian copula.

        For the bivariate case, this can use the statsmodels implementation
        for efficiency.

        Returns
        -------
        callable
            Function that computes the CDF at given points
        """
        from statsmodels.distributions.copula.elliptical import (
            GaussianCopula as StatsGaussianCopula,
        )

        # For bivariate case, we can use the statsmodels implementation
        if self.dim == 2:
            cop = StatsGaussianCopula(float(self.rho))

            def gauss_cdf(u, v):
                if u == 0 or v == 0:
                    return sp.S.Zero
                else:
                    return float(cop.cdf([u, v]))

            return lambda u, v: SymPyFuncWrapper(gauss_cdf(u, v))
        else:
            # Otherwise use the multivariate implementation
            return super().cdf


[docs]
    def cdf_vectorized(self, u, v):
        r"""
        Vectorized CDF for the bivariate Gaussian copula.

        Evaluates :math:`C(u,v)` at many points simultaneously.

        Parameters
        ----------
        u : array_like
            First uniform marginal, values in :math:`[0,1]`.
        v : array_like
            Second uniform marginal, values in :math:`[0,1]`.

        Returns
        -------
        numpy.ndarray
            CDF values at the specified points.

        Notes
        -----
        This implementation leverages the compiled backend in ``statsmodels``. The
        defining relation is

        .. math::

           C(u,v) \;=\; \Phi_{\rho}\!\bigl(\Phi^{-1}(u),\,\Phi^{-1}(v)\bigr),

        where :math:`\Phi` is the standard normal CDF and :math:`\Phi_{\rho}` is the
        bivariate normal CDF with correlation :math:`\rho`.
        """
        # Ensure inputs are numpy arrays for vectorized operations
        u = np.asarray(u)
        v = np.asarray(v)

        # Validate that inputs are within the valid [0, 1] range
        if np.any((u < 0) | (u > 1)) or np.any((v < 0) | (v > 1)):
            raise ValueError("Marginals must be in [0, 1]")

        # Use numpy's broadcasting to handle scalar and array inputs seamlessly
        if u.ndim == 0 and v.ndim > 0:
            u = np.broadcast_to(u, v.shape)
        elif v.ndim == 0 and u.ndim > 0:
            v = np.broadcast_to(v, u.shape)

        # Get the correlation parameter as a standard float
        rho_val = float(self.rho)

        # Handle special cases for correlation extremes with fast, vectorized numpy functions
        if rho_val == -1:
            return np.maximum(u + v - 1, 0)  # Lower Fréchet bound
        if rho_val == 0:
            return u * v  # Independence copula
        if rho_val == 1:
            return np.minimum(u, v)  # Upper Fréchet bound

        # Initialize the result array. The default of 0 correctly handles C(0,v) and C(u,0).
        result = np.zeros_like(u, dtype=float)

        # Identify points that are not on the boundaries of the unit square [0,1]^2
        # These are the only points that require the complex bivariate normal CDF calculation.
        interior_mask = (u > 0) & (u < 1) & (v > 0) & (v < 1)

        # Process interior points if any exist
        if np.any(interior_mask):
            from statsmodels.distributions.copula.elliptical import (
                GaussianCopula as StatsGaussianCopula,
            )

            # Instantiate the statsmodels Gaussian Copula
            # Note: statsmodels expects the correlation matrix parameter named 'corr'
            cop = StatsGaussianCopula(corr=rho_val)

            # Create pairs of (u, v) for the interior points
            uv_pairs = np.column_stack((u[interior_mask], v[interior_mask]))

            # Calculate the CDF for all interior points in a single, fast, vectorized call
            result[interior_mask] = cop.cdf(uv_pairs)

        # Handle the u=1 and v=1 boundary cases.
        # np.where is used for vectorized conditional assignment.
        result[u == 1] = v[u == 1]
        result[v == 1] = u[v == 1]

        return result


    def _conditional_distribution(self, u=None, v=None):
        r"""
        Conditional distribution of the bivariate Gaussian copula.

        Returns a function computing :math:`\mathbb{P}(V \le v \mid U=u)` (or the
        symmetric version) using the Gaussian conditional formula.

        Parameters
        ----------
        u : float, optional
            Conditioning value for :math:`U`.
        v : float, optional
            Conditioning value for :math:`V`.

        Returns
        -------
        callable or float
            A function :math:`v \mapsto C(v\mid u)` / :math:`u \mapsto C(u\mid v)`,
            or its value if both arguments are provided.
        """
        scale = float(np.sqrt(1 - float(self.rho) ** 2))

        def conditional_func(u_, v_):
            return norm.cdf(
                norm.ppf(v_), loc=float(self.rho) * norm.ppf(u_), scale=scale
            )

        if u is None and v is None:
            return conditional_func
        elif u is not None and v is not None:
            return conditional_func(u, v)
        elif u is not None:
            return lambda v_: conditional_func(u, v_)
        else:
            return lambda u_: conditional_func(u_, v)


[docs]
    def cond_distr_1(self, u=None, v=None):
        r"""
        First conditional distribution :math:`C(v\mid u)`.

        Parameters
        ----------
        u : float, optional
            Conditioning value.
        v : float, optional
            Evaluation point.

        Returns
        -------
        SymPyFuncWrapper
            Wrapped conditional distribution function or value.
        """
        if v in [0, 1]:
            return SymPyFuncWrapper(sp.Number(v))
        return SymPyFuncWrapper(sp.Number(self._conditional_distribution(u, v)))



[docs]
    def cond_distr_2(self, u=None, v=None):
        r"""
        Second conditional distribution :math:`C(u\mid v)`.

        Parameters
        ----------
        u : float, optional
            Evaluation point.
        v : float, optional
            Conditioning value.

        Returns
        -------
        SymPyFuncWrapper
            Wrapped conditional distribution function or value.
        """
        if u in [0, 1]:
            return SymPyFuncWrapper(sp.Number(u))
        return SymPyFuncWrapper(sp.Number(self._conditional_distribution(v, u)))


    @property
    def pdf(self):
        r"""
        Probability density function of the Gaussian copula.

        In the bivariate case, this uses the optimized ``statsmodels`` implementation.

        Returns
        -------
        callable
            Function that computes :math:`c(u,v)` at given points :math:`(u,v)\in(0,1)^2`.
        """
        from statsmodels.distributions.copula.elliptical import (
            GaussianCopula as StatsGaussianCopula,
        )

        # For bivariate case, we can use the statsmodels implementation
        if self.dim == 2:
            return lambda u, v: SymPyFuncWrapper(
                sp.Number(StatsGaussianCopula(float(self.rho)).pdf([u, v]))
            )
        else:
            # Otherwise use the multivariate implementation
            return super().pdf


[docs]
    def chatterjees_xi(self, *args, **kwargs):
        r"""
        Chatterjee's :math:`\xi` dependence measure for the Gaussian copula.

        Returns
        -------
        float
            Value of :math:`\xi`.
        """
        self._set_params(args, kwargs)
        return 3 / np.pi * np.arcsin(1 / 2 + float(self.rho) ** 2 / 2) - 0.5



[docs]
    def blests_nu(self):
        return self.spearmans_rho()



[docs]
    def spearmans_rho(self, *args, **kwargs):
        r"""
        Spearman's rank correlation :math:`\rho_{\!S}` for the Gaussian copula.

        Returns
        -------
        float
            Value of :math:`\rho_{\!S}`.
        """
        self._set_params(args, kwargs)
        return 6 / np.pi * np.arcsin(float(self.rho) / 2)



[docs]
    def kendalls_tau(self, *args, **kwargs):
        r"""
        Kendall's :math:`\tau` for the Gaussian copula.

        Returns
        -------
        float
            Value of :math:`\tau`.
        """
        self._set_params(args, kwargs)
        return 2 / np.pi * np.arcsin(float(self.rho))



[docs]
    def spearman_footrule(self, *args, **kwargs) -> float:
        r"""
        Spearman's footrule :math:`\psi` for the Gaussian copula.

        Closed form, via a trivariate normal orthant probability:

        .. math::
           \psi(\rho) \;=\; \frac{3}{\pi}\,\arcsin\!\Bigl(\frac{1+\rho}{2}\Bigr) \;-\; \tfrac{1}{2}.

        Returns
        -------
        float
            Footrule value in :math:`[-\tfrac12, 1]`.
        """
        self._set_params(args, kwargs)
        rho = float(self.rho)

        # numeric safety: clamp to [-1, 1]
        rho = max(-1.0, min(1.0, rho))

        footrule = (3.0 / np.pi) * np.arcsin((1.0 + rho) / 2.0) - 0.5
        return footrule



[docs]
    def spearmans_footrule(self, *args, **kwargs) -> float:
        r"""Alias for :meth:`spearman_footrule`."""
        return self.spearman_footrule(*args, **kwargs)


    # ------------------------------------------------------------------
    # Dependence measures with known closed forms
    # ------------------------------------------------------------------


[docs]
    def schweizer_wolff_sigma(self, *args, **kwargs):
        r"""
        Schweizer–Wolff :math:`\sigma` for the Gaussian copula.

        The bivariate Gaussian copula is PQD when :math:`\rho \ge 0` and
        NQD when :math:`\rho < 0`, so the absolute value in the definition
        of :math:`\sigma` is redundant:

        .. math::

           \sigma(\rho)
             = \lvert\rho_S\rvert
             = \frac{6}{\pi}\,\bigl|\!\arcsin(\rho/2)\bigr|

        Returns
        -------
        float
        """
        self._set_params(args, kwargs)
        rho = float(self.rho)
        rho = max(-1.0, min(1.0, rho))
        return (6.0 / np.pi) * abs(np.arcsin(rho / 2.0))



[docs]
    def hoeffdings_d(self, *args, **kwargs):
        r"""
        Hoeffding's :math:`D` for the Gaussian copula (numerical).

        No simple closed form is known.  Falls back to base-class
        numerical quadrature.

        Returns
        -------
        float
        """
        self._set_params(args, kwargs)
        return self._hoeffdings_d_numerical()



[docs]
    def gini_gamma(self, *args, **kwargs):
        r"""
        Gini's :math:`\gamma` for the Gaussian copula.

        .. math::

           \gamma(\rho)
             = \frac{2}{\pi}\Bigl(\arcsin\Bigl(\frac{1+\rho}{2}\Bigr)
               - \arcsin\Bigl(\frac{1-\rho}{2}\Bigr)\Bigr)

        obtained by expressing the diagonal and anti-diagonal integrals of
        the copula as trivariate normal orthant probabilities.

        Returns
        -------
        float
        """
        self._set_params(args, kwargs)
        rho = float(self.rho)
        rho = max(-1.0, min(1.0, rho))
        return (2.0 / np.pi) * (
            np.arcsin((1.0 + rho) / 2.0) - np.arcsin((1.0 - rho) / 2.0)
        )



[docs]
    def blomqvists_beta(self, *args, **kwargs):
        r"""
        Blomqvist's :math:`\beta` for the Gaussian copula.

        .. math::

           \beta(\rho) = \frac{2}{\pi}\,\arcsin(\rho)

        Returns
        -------
        float
        """
        if args or kwargs:
            self._set_params(args, kwargs)
        rho = float(self.rho)
        rho = max(-1.0, min(1.0, rho))
        return (2.0 / np.pi) * np.arcsin(rho)



[docs]
    def lambda_L(self):
        r"""Lower tail dependence for the Gaussian copula.

        The Gaussian copula has **no tail dependence** for
        :math:`\rho < 1`:

        .. math::

           \lambda_L = 0 \quad\text{for } \rho \in [-1, 1).

        Returns
        -------
        float
            Always 0 (unless :math:`\rho = 1`, comonotonic limit).
        """
        rho_val = float(self.rho)
        if rho_val >= 1.0:
            return 1.0
        return 0.0



[docs]
    def lambda_U(self):
        r"""Upper tail dependence for the Gaussian copula.

        Same as :meth:`lambda_L` — zero for :math:`\rho < 1`.

        Returns
        -------
        float
        """
        return self.lambda_L()



[docs]
    def tail_order(self):
        r"""Tail order for the Gaussian copula.

        .. math::

           \kappa_L = \kappa_U = \frac{2}{1 + \rho}

        for :math:`-1 < \rho \le 1`, see Hua & Joe (2011), *Tail order and
        intermediate tail dependence of multivariate copulas*, JMVA 102,
        Example 2.

        Returns
        -------
        dict
        """
        rho_val = float(self.rho)
        if rho_val >= 1.0:
            kappa = 1.0
        elif rho_val <= -1.0:
            kappa = float("inf")
        else:
            kappa = 2.0 / (1.0 + rho_val)
        return {"lower": kappa, "upper": kappa}