sktime · ShreeshaM07 · Jul 17, 2024 · Jul 18, 2024 · Jul 24, 2024 · Jul 25, 2024
diff --git a/skpro/distributions/cmp_pois_gam.py b/skpro/distributions/cmp_pois_gam.py
@@ -0,0 +1,221 @@
+# copyright: skpro developers, BSD-3-Clause License (see LICENSE file)
+"""Compound poisson gamma probability distribution."""
+
+__author__ = ["ShreeshaM07"]
+
+import math
+
+import numpy as np
+
+from skpro.distributions.base import BaseDistribution
+
+
+class CmpPoissonGamma(BaseDistribution):
+    """Compound Poisson Gamma Distribution.
+
+    Distribution of ``Y = X_1 + ... + X_N`` where ``N`` is Poisson with rate
+    ``lambda_`` and the ``X_i`` are i.i.d. Gamma with shape ``alpha`` and rate
+    ``beta``, independent of ``N``. ``Y`` has a point mass ``exp(-lambda_)``
+    at zero (the event ``N = 0``) and is continuous on the positive half-line.
+
+    Parameters
+    ----------
+    lambda_ : float or array of float (1D or 2D)
+        The rate parameter of the Poisson distribution.
+    alpha : float or array of float (1D or 2D)
+        The shape parameter of the Gamma distribution.
+    beta : float or array of float (1D or 2D)
+        The rate parameter (inverse scale) of the Gamma distribution.
+    index : pd.Index, optional, default = RangeIndex
+    columns : pd.Index, optional, default = RangeIndex
+    """
+
+    # NOTE(review): "mean", "var", "energy" and "ppf" are declared exact below
+    # although this class defines no ``_mean``/``_var``/``_energy``/``_ppf``;
+    # confirm the base class provides suitable fallbacks for them.
+    _tags = {
+        "capabilities:approx": ["pdfnorm"],
+        "capabilities:exact": [
+            "mean",
+            "var",
+            "energy",
+            "pdf",
+            "log_pdf",
+            "cdf",
+            "ppf",
+            "pmf",
+            "log_pmf",
+        ],
+        "distr:measuretype": "mixed",
+        "distr:paramtype": "parametric",
+        "broadcast_init": "on",
+    }
+
+    def __init__(self, lambda_, alpha, beta, index=None, columns=None):
+        self.lambda_ = lambda_
+        self.alpha = alpha
+        self.beta = beta
+        super().__init__(index=index, columns=columns)
+
+    def _pdf(self, x):
+        """Probability density function.
+
+        Evaluates the absolutely continuous part of the distribution, for
+        ``y > 0``::
+
+            f(y) = exp(-lambda_ - beta * y) / y
+                   * sum_{n >= 1} (lambda_ * (beta * y) ** alpha) ** n
+                                  / (n! * Gamma(n * alpha))
+
+        This part integrates to ``1 - exp(-lambda_)``; the remaining mass sits
+        at zero and is reported by ``_pmf``. The series is accumulated in log
+        space so that large arguments do not overflow.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pdf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            pdf values at the given points
+        """
+        from scipy.special import gammaln
+
+        x = np.asarray(x, dtype=float)
+        lam = np.broadcast_to(np.asarray(self.lambda_, dtype=float), x.shape)
+        alpha = np.broadcast_to(np.asarray(self.alpha, dtype=float), x.shape)
+        beta = np.broadcast_to(np.asarray(self.beta, dtype=float), x.shape)
+
+        # float output even for integer-typed x; zero for x <= 0, NaN for NaN
+        pdf_value = np.where(np.isnan(x), np.nan, 0.0)
+        pos = x > 0
+        if not pos.any():
+            return pdf_value
+
+        y, lam, alpha, beta = x[pos], lam[pos], alpha[pos], beta[pos]
+        # log of the base of the power series: lambda * (beta * y) ** alpha
+        log_base = np.log(lam) + alpha * np.log(beta * y)
+        log_tol = math.log(1e-10)  # relative size below which terms are dropped
+        max_terms = 1000  # safeguard to bound the number of series terms
+
+        log_sum = np.full(y.shape, -np.inf)
+        prev_term = np.full(y.shape, -np.inf)
+        for n in range(1, max_terms + 1):
+            log_term = n * log_base - gammaln(n + 1) - gammaln(n * alpha)
+            log_sum = np.logaddexp(log_sum, log_term)
+            # stop once every series is past its peak and its current term is
+            # negligible relative to the accumulated sum
+            past_peak = log_term < prev_term
+            if np.all(past_peak & (log_term < log_sum + log_tol)):
+                break
+            prev_term = log_term
+
+        pdf_value[pos] = np.exp(log_sum - lam - beta * y - np.log(y))
+        return pdf_value
+
+    def _pmf(self, k):
+        """Probability mass function.
+
+        The only atom of the distribution is at zero, with mass
+        ``exp(-lambda_)`` (the probability that the Poisson count is zero);
+        every other point has probability mass zero.
+
+        Parameters
+        ----------
+        k : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pmf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            pmf values at the given points
+        """
+        k = np.asarray(k)
+        lambda_ = np.broadcast_to(np.asarray(self.lambda_, dtype=float), k.shape)
+        return np.where(k == 0, np.exp(-lambda_), 0.0)
+
+    def _compute_crj(self, r, j, rho):
+        """Coefficient ``c_{r,j}`` used by ``_compute_hr``.
+
+        Sums ``prod_i comb(rho + 1 + s_i, s_i + 2)`` over all ordered tuples
+        ``(s_1, ..., s_j)`` of positive integers with ``s_1 + ... + s_j = r``
+        and scales the result by ``(rho**2 + rho) ** (-r / 2 - j)``.
+        Returns 0 when no such tuple exists.
+        """
+        from itertools import combinations_with_replacement, permutations
+
+        from scipy.special import comb
+
+        # unordered partitions of r into exactly j positive parts
+        partitions = [
+            p
+            for p in combinations_with_replacement(range(1, r + 1), j)
+            if sum(p) == r
+        ]
+        # guard before stacking: np.vstack raises on an empty list
+        if not partitions:
+            return 0
+
+        # expand each partition into its distinct orderings, one per row
+        compositions = np.vstack(
+            [np.array(list(set(permutations(p)))) for p in partitions]
+        )
+
+        term = np.prod(
+            [comb(rho + 1 + s_i, s_i + 2) for s_i in compositions.T], axis=0
+        )
+        c_rj = np.sum(term)
+        c_rj *= (rho**2 + rho) ** (-r / 2 - j)
+        return c_rj
+
+    def _compute_hr(self, x, r, rho):
+        """Evaluate the ``r``-th correction term of the cdf expansion.
+
+        Computes ``sum_{j=1}^{r} He_{r + 2j - 1}(x) * c_{r,j} / j!`` where
+        ``He_n`` is ``scipy.special.eval_hermitenorm(n, .)`` and ``c_{r,j}``
+        comes from ``_compute_crj``.
+        """
+        from scipy.special import eval_hermitenorm, factorial
+
+        hr = np.zeros_like(x, dtype=float)
+        for j in range(1, r + 1):
+            H = eval_hermitenorm(r + 2 * j - 1, x)
+            crj = self._compute_crj(r, j, rho)
+            hr += H * crj / factorial(j)
+        return hr
+
+    def _cdf(self, x):
+        """Cumulative distribution function.
+
+        Approximates the cdf by a normal cdf corrected with a truncated series
+        in powers of ``lambda_ ** (-1 / 2)`` (the first ``max_r = 10`` terms).
+
+        NOTE(review): ``x`` is used as-is (not standardised), ``beta`` does not
+        enter the computation, and ``phi_x`` has no ``1 / sqrt(2 * pi)`` factor;
+        confirm these against the derivation this expansion is taken from.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the cdf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            cdf values at the given points
+        """
+        from scipy.stats import norm
+
+        lambda_ = self.lambda_
+        rho = self.alpha
+        max_r = 10
+        phi_x = np.exp(-(x**2) / 2)
+        Phi_x = norm.cdf(x)
+        series_sum = np.zeros_like(x, dtype=float)
+        for r in range(1, max_r + 1):
+            hr_x = self._compute_hr(x, r, rho)
+            series_sum += pow(lambda_, -r / 2) * hr_x
+        cdf = Phi_x - phi_x * series_sum
+        return cdf
diff --git a/skpro/distributions/tweedie.py b/skpro/distributions/tweedie.py
@@ -0,0 +1,202 @@
+# copyright: skpro developers, BSD-3-Clause License (see LICENSE file)
+"""Tweedie probability distribution."""
+
+__author__ = ["ShreeshaM07"]
+
+import numpy as np
+
+from skpro.distributions.base import BaseDistribution
+
+
+class Tweedie(BaseDistribution):
+    """Tweedie Distribution.
+
+    Dispatches on the power parameter to a concrete distribution: Normal for
+    ``pow == 0``, Poisson for ``pow == 1``, compound Poisson-Gamma for
+    ``1 < pow < 2`` and Gamma for ``pow == 2``. Other powers are not supported.
+
+    Parameters
+    ----------
+    pow : float
+        Power parameter, compared as a scalar: 0, 1, 2 or a value strictly
+        between 1 and 2.
+    mu : float or array of float (1D or 2D)
+        mean of the distribution
+    scale : float or array of float (1D or 2D)
+        scale parameter; passed as ``sigma`` in the Normal case, converted so
+        that the variance is ``scale ** 2`` in the compound Poisson-Gamma case
+        (and in the Gamma case, assuming a shape/rate Gamma), and unused in
+        the Poisson case.
+    index : pd.Index, optional, default = RangeIndex
+    columns : pd.Index, optional, default = RangeIndex
+    """
+
+    # NOTE(review): "mean", "var", "energy" are declared exact below although
+    # this class defines no ``_mean``/``_var``/``_energy``; confirm the base
+    # class provides suitable fallbacks for them.
+    _tags = {
+        "capabilities:approx": ["pdfnorm"],
+        "capabilities:exact": [
+            "mean",
+            "var",
+            "energy",
+            "pdf",
+            "log_pdf",
+            "cdf",
+            "ppf",
+            "pmf",
+            "log_pmf",
+        ],
+        "distr:measuretype": "mixed",
+        "distr:paramtype": "parametric",
+        "broadcast_init": "on",
+    }
+
+    def __init__(self, pow, mu, scale, index=None, columns=None):
+        from skpro.distributions.cmp_pois_gam import CmpPoissonGamma
+        from skpro.distributions.gamma import Gamma
+        from skpro.distributions.normal import Normal
+        from skpro.distributions.poisson import Poisson
+
+        self.pow = pow
+        self.mu = mu
+        self.scale = scale
+        mu = np.array(mu)
+        scale = np.array(scale)
+        if pow == 0:
+            self._norm = Normal(mu=mu, sigma=scale, index=index, columns=columns)
+        elif pow == 1:
+            self._pois = Poisson(mu=mu, index=index, columns=columns)
+        elif pow > 1 and pow < 2:
+            # map (pow, mu, scale) to compound Poisson-Gamma parameters such that
+            # the mean is mu and the variance is scale ** 2
+            # NOTE(review): treats scale as a standard deviation, in line with
+            # the Normal and Gamma branches - confirm this is the intended meaning
+            lambda_ = mu**2 / ((2 - pow) * scale**2)
+            alpha = (2 - pow) / (pow - 1)
+            beta = mu / ((pow - 1) * scale**2)
+            self._cmp_pg = CmpPoissonGamma(
+                lambda_=lambda_, alpha=alpha, beta=beta, index=index, columns=columns
+            )
+        elif pow == 2:
+            alpha = (mu / scale) ** 2
+            beta = mu / scale**2
+            self._gam = Gamma(alpha=alpha, beta=beta, index=index, columns=columns)
+
+        super().__init__(index=index, columns=columns)
+
+    def _tweedie_component(self):
+        """Return the component distribution selected by ``self.pow``.
+
+        The callers forward to the public methods of the returned object.
+        NOTE(review): confirm that public ``pdf``/``cdf``/... return types are
+        what the private ``_pdf``/``_cdf``/... methods here should return.
+
+        Raises
+        ------
+        NotImplementedError
+            if ``self.pow`` is not 0, 1, 2 or strictly between 1 and 2
+        """
+        pow = self.pow
+        if pow == 0:
+            return self._norm
+        if pow == 1:
+            return self._pois
+        if 1 < pow < 2:
+            return self._cmp_pg
+        if pow == 2:
+            return self._gam
+        raise NotImplementedError(
+            "Tweedie is only implemented for pow in {0, 1, 2} or 1 < pow < 2, "
+            f"but found pow={pow}"
+        )
+
+    def _pdf(self, x):
+        """Probability density function.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pdf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            pdf values at the given points
+        """
+        return self._tweedie_component().pdf(x)
+
+    def _pmf(self, x):
+        """Probability mass function.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pmf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            pmf values at the given points
+        """
+        return self._tweedie_component().pmf(x)
+
+    def _log_pdf(self, x):
+        """Logarithmic probability density function.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pdf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            log pdf values at the given points
+        """
+        return self._tweedie_component().log_pdf(x)
+
+    def _log_pmf(self, x):
+        """Logarithmic probability mass function.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the pmf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            log pmf values at the given points
+        """
+        return self._tweedie_component().log_pmf(x)
+
+    def _cdf(self, x):
+        """Cumulative distribution function.
+
+        Parameters
+        ----------
+        x : 2D np.ndarray, same shape as ``self``
+            values to evaluate the cdf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            cdf values at the given points
+        """
+        return self._tweedie_component().cdf(x)
+
+    def _ppf(self, p):
+        """Quantile function = percent point function = inverse cdf.
+
+        Parameters
+        ----------
+        p : 2D np.ndarray, same shape as ``self``
+            values to evaluate the ppf at
+
+        Returns
+        -------
+        2D np.ndarray, same shape as ``self``
+            ppf values at the given points
+        """
+        return self._tweedie_component().ppf(p)