§
    M/PhqS  ã                   óœ  — d Z ddlmZ ddlZddlmZ ddlmZ ddl	m
Z d„ Zd?d„Zd„ ZeZd„ Zd„ Zd„ Zd„ Zd„ Zi Zeeeeeeedœed<   d„ Zd„ d„ d„ dœed<   deied<    G d„ d¦  «        Zd@d „ZdAd!„ZdBd#„ZdCd$„Z G d%„ d&¦  «        Zed'k    r<dd(lmZ ej          !                    d)d"¬*¦  «        Z! e"d+¦  «          e" ee!d,¦  «        ¦  «          ee!d,¦  «        Z# e"e# $                    ¦   «         ¦  «         g d-¢Z%e%D ]"Z& e"e&e# $                    e&d¦  «        ¦  «         Œ# e"d.¦  «         dd/l'm(Z(  e(e)¦  «        Z*d"Z+ e,d¦  «        D ]hZ-ej.         /                    e+¦  «        Z! ee!d,¦  «        Z#e%D ]=Z&e*e&          0                    e# $                    e&d¦  «        d         d0         ¦  «         Œ>Œi ej1        d1„ e%D ¦   «         ¦  «        Z2 e"d2d3 3                    e%¦  «        ¦  «          e"d4e2d5k      4                    d0¦  «        ¦  «          e"d6e2d7k      4                    d0¦  «        ¦  «          e"d8e2d9k      4                    d0¦  «        ¦  «          ed:„ d,d"¬;¦  «         d"Z+dZ5 e e¦   «         d<e+e5d¬=¦  «        Z6 ej7        e5 ej1        g d>¢¦  «        z  ¦  «         8                    e9¦  «        Z: e"e6e:         ¦  «         dS dS )Dat  More Goodness of fit tests

contains

GOF : 1 sample gof tests based on Stephens 1970, plus AD A^2
bootstrap : vectorized bootstrap p-values for gof test with fitted parameters


Created : 2011-05-21
Author : Josef Perktold

parts based on ks_2samp and kstest from scipy.stats
(license: Scipy BSD, but were completely rewritten by Josef Perktold)


References
----------

é    )ÚlmapN)Údistributions)Úcache_readonly)Ú
kolmogorovc                 óš  — t          t          j        | |f¦  «        \  } }| j        d         }|j        d         }t	          | ¦  «        }t	          |¦  «        }t          j        | ¦  «        } t          j        |¦  «        }t          j        | |g¦  «        }t          j        | |d¬¦  «        d|z  z  }t          j        ||d¬¦  «        d|z  z  }t          j        t          j	        ||z
  ¦  «        ¦  «        }t          j
        ||z  t          ||z   ¦  «        z  ¦  «        }	 t          |dz   d|z  z   |z  ¦  «        }	n	#  d}	Y nxY w||	fS )aA  
    Computes the Kolmogorov-Smirnof statistic on 2 samples.

    This is a two-sided test for the null hypothesis that 2 independent samples
    are drawn from the same continuous distribution.

    Parameters
    ----------
    a, b : sequence of 1-D ndarrays
        two arrays of sample observations assumed to be drawn from a continuous
        distribution, sample sizes can be different


    Returns
    -------
    D : float
        KS statistic
    p-value : float
        two-tailed p-value


    Notes
    -----

    This tests whether 2 samples are drawn from the same distribution. Note
    that, like in the case of the one-sample K-S test, the distribution is
    assumed to be continuous.

    This is the two-sided test, one-sided tests are not implemented.
    The test uses the two-sided asymptotic Kolmogorov-Smirnov distribution.

    If the K-S statistic is small or the p-value is high, then we cannot
    reject the hypothesis that the distributions of the two samples
    are the same.

    Examples
    --------

    >>> from scipy import stats
    >>> import numpy as np
    >>> from scipy.stats import ks_2samp

    >>> #fix random seed to get the same result
    >>> np.random.seed(12345678)

    >>> n1 = 200  # size of first sample
    >>> n2 = 300  # size of second sample

    different distribution
    we can reject the null hypothesis since the pvalue is below 1%

    >>> rvs1 = stats.norm.rvs(size=n1,loc=0.,scale=1)
    >>> rvs2 = stats.norm.rvs(size=n2,loc=0.5,scale=1.5)
    >>> ks_2samp(rvs1,rvs2)
    (0.20833333333333337, 4.6674975515806989e-005)

    slightly different distribution
    we cannot reject the null hypothesis at a 10% or lower alpha since
    the pvalue at 0.144 is higher than 10%

    >>> rvs3 = stats.norm.rvs(size=n2,loc=0.01,scale=1.0)
    >>> ks_2samp(rvs1,rvs3)
    (0.10333333333333333, 0.14498781825751686)

    identical distribution
    we cannot reject the null hypothesis since the pvalue is high, 41%

    >>> rvs4 = stats.norm.rvs(size=n2,loc=0.0,scale=1.0)
    >>> ks_2samp(rvs1,rvs4)
    (0.07999999999999996, 0.41126949729859719)
    r   Úright)Úsideç      ð?ç¸…ëQ¸¾?ç)\Âõ(¼?)r   ÚnpÚasarrayÚshapeÚlenÚsortÚconcatenateÚsearchsortedÚmaxÚabsoluteÚsqrtÚfloatÚksprob)
Údata1Údata2Ún1Ún2Údata_allÚcdf1Úcdf2ÚdÚenÚprobs
             úi/var/www/html/test/jupyter/venv/lib/python3.11/site-packages/statsmodels/sandbox/distributions/gof_new.pyÚks_2sampr$      s4  € õP œ
 U¨E NÑ3Ô3L€Eˆ5Ø	ŒQŒ€BØ	ŒQŒ€BÝ	ˆU‰Œ€BÝ	ˆU‰Œ€BÝŒGE‰NŒN€EÝŒGE‰NŒN€EÝŒ~˜u U˜mÑ,Ô,€HåŒ?˜5 ¨wÐ7Ñ7Ô7¸¸R¹Ñ@€DÝŒO˜E (°Ð8Ñ8Ô8¸3¸r¹6ÑB€DÝ
ŒrŒ{˜4 ™9Ñ%Ô%Ñ&Ô&€Aå	ŒB‘•u˜R ™U‘|”|Ñ#Ñ	$Ô	$€BðÝr˜$‘w˜t B™w‘¨Ñ)Ñ*Ô*ˆˆøðØˆˆˆøøøØˆdˆ7€Ns   Ä$E  Å E© é   Ú	two_sidedÚapproxc                 óL  — t          | t          ¦  «        rL|r|| k    r5t          t          | ¦  «        j        }t          t          | ¦  «        j        } nt          d¦  «        ‚t          |t          ¦  «        rt          t          |¦  «        j        }t          | ¦  «        rd|i}t          j	         | |i |¤Ž¦  «        }n#t          j	        | ¦  «        }t          |¦  «        } ||g|¢R Ž }|dv rXt          j        d|dz   ¦  «        |z  |z
                       ¦   «         }	|dk    r"|	t          j                             |	|¦  «        fS |dv rU|t          j        d|¦  «        |z  z
                       ¦   «         }
|d	k    r"|
t          j                             |
|¦  «        fS |d
k    rüt          j        |	|
g¦  «        }|dk    r6|t          j                             |t          j        |¦  «        z  ¦  «        fS |dk    r¦t          j                             |t          j        |¦  «        z  ¦  «        }|dk    s|d|dz  dz  z
  k    r6|t          j                             |t          j        |¦  «        z  ¦  «        fS |t          j                             ||¦  «        dz  fS dS dS )aÉ  
    Perform the Kolmogorov-Smirnov test for goodness of fit

    This performs a test of the distribution G(x) of an observed
    random variable against a given distribution F(x). Under the null
    hypothesis the two distributions are identical, G(x)=F(x). The
    alternative hypothesis can be either 'two_sided' (default), 'less'
    or 'greater'. The KS test is only valid for continuous distributions.

    Parameters
    ----------
    rvs : str or array or callable
        string: name of a distribution in scipy.stats

        array: 1-D observations of random variables

        callable: function to generate random variables, requires keyword
        argument `size`

    cdf : str or callable
        string: name of a distribution in scipy.stats, if rvs is a string then
        cdf can evaluate to `False` or be the same as rvs
        callable: function to evaluate cdf

    args : tuple, sequence
        distribution parameters, used if rvs or cdf are strings
    N : int
        sample size if rvs is string or callable
    alternative : 'two_sided' (default), 'less' or 'greater'
        defines the alternative hypothesis (see explanation)

    mode : 'approx' (default) or 'asymp'
        defines the distribution used for calculating p-value

        'approx' : use approximation to exact distribution of test statistic

        'asymp' : use asymptotic distribution of test statistic


    Returns
    -------
    D : float
        KS test statistic, either D, D+ or D-
    p-value :  float
        one-tailed or two-tailed p-value

    Notes
    -----

    In the one-sided test, the alternative is that the empirical
    cumulative distribution function of the random variable is "less"
    or "greater" than the cumulative distribution function F(x) of the
    hypothesis, G(x)<=F(x), resp. G(x)>=F(x).

    Examples
    --------

    >>> from scipy import stats
    >>> import numpy as np
    >>> from scipy.stats import kstest

    >>> x = np.linspace(-15,15,9)
    >>> kstest(x,'norm')
    (0.44435602715924361, 0.038850142705171065)

    >>> np.random.seed(987654321) # set random seed to get the same result
    >>> kstest('norm','',N=100)
    (0.058352892479417884, 0.88531190944151261)

    is equivalent to this

    >>> np.random.seed(987654321)
    >>> kstest(stats.norm.rvs(size=100),'norm')
    (0.058352892479417884, 0.88531190944151261)

    Test against one-sided alternative hypothesis:

    >>> np.random.seed(987654321)

    Shift distribution to larger values, so that cdf_dgp(x)< norm.cdf(x):

    >>> x = stats.norm.rvs(loc=0.2, size=100)
    >>> kstest(x,'norm', alternative = 'less')
    (0.12464329735846891, 0.040989164077641749)

    Reject equal distribution against alternative hypothesis: less

    >>> kstest(x,'norm', alternative = 'greater')
    (0.0072115233216311081, 0.98531158590396395)

    Do not reject equal distribution against alternative hypothesis: greater

    >>> kstest(x,'norm', mode='asymp')
    (0.12464329735846891, 0.08944488871182088)


    Testing t distributed random variables against normal distribution:

    With 100 degrees of freedom the t distribution looks close to the normal
    distribution, and the kstest does not reject the hypothesis that the sample
    came from the normal distribution

    >>> np.random.seed(987654321)
    >>> stats.kstest(stats.t.rvs(100,size=100),'norm')
    (0.072018929165471257, 0.67630062862479168)

    With 3 degrees of freedom the t distribution looks sufficiently different
    from the normal distribution, that we can reject the hypothesis that the
    sample came from the normal distribution at a alpha=10% level

    >>> np.random.seed(987654321)
    >>> stats.kstest(stats.t.rvs(3,size=100),'norm')
    (0.131016895759829, 0.058826222555312224)
    ú5if rvs is string, cdf has to be the same distributionÚsize)r'   Úgreaterr
   é   r,   )r'   Úlessç        r.   r'   Úasympr(   éj
  çš™™™™™é?ç333333Ó?ç     @@é   N)Ú
isinstanceÚstrÚgetattrr   ÚcdfÚrvsÚAttributeErrorÚcallabler   r   r   Úaranger   ÚksoneÚsfÚ	kstwobignr   )r:   r9   ÚargsÚNÚalternativeÚmodeÚkwdsÚvalsÚcdfvalsÚDplusÚDminÚDÚpval_twos                r#   ÚkstestrL   }   s  € õf #•sÑÔð Zàð 	Z˜ š˜Ý-¨Ñ-Ô-Ô1ˆCÝ-¨Ñ-Ô-Ô1ˆCˆCå Ð!XÑYÔYÐYõ #•sÑÔð .Ý•m SÑ)Ô)Ô-ˆÝ}„}ð ØqˆzˆÝŒwss˜DÐ( 4Ð(Ð(Ñ)Ô)ˆˆåŒws‰|Œ|ˆÝ‰IŒIˆØˆc$Ð˜ÐÐÐ€GàÐ.Ð.Ð.Ý”˜3  !¡Ñ$Ô$ QÑ&¨Ñ0×5Ò5Ñ7Ô7ˆØ˜)Ò#Ð#Ø-Ô-×0Ò0°°qÑ9Ô9Ð9Ð9àÐ+Ð+Ð+Ø"œ) C¨Ñ+Ô+¨AÑ-Ñ-×2Ò2Ñ4Ô4ˆØ˜&Ò Ð ØÔ,×/Ò/°°QÑ7Ô7Ð7Ð7àkÒ!Ð!ÝŒFE˜$<Ñ Ô ˆØ7Š?ˆ?Ø•mÔ-×0Ò0°µ2´7¸1±:´:±Ñ>Ô>Ð>Ð>Ø8ÒÐÝ$Ô.×1Ò1°!µB´G¸A±J´J±,Ñ?Ô?ˆHØ4Šxˆx˜8 d¨Q¨s©U°6©\Ñ&9Ò9Ð9Ø-Ô1×4Ò4°Qµr´w¸q±z´z±\ÑBÔBÐBÐBà-Ô-×0Ò0°°1Ñ5Ô5°aÑ7Ð7Ð7ð "Ð!ð Ðó    c                 ó   — t          j        |¦  «        dz   dt          j        |¦  «        z  z   }| |z  }t          j        d|dz  z  ¦  «        }t          j        | t          j        g d¢¦  «        k    ¦  «        }|||fS )Nr   r   éþÿÿÿr5   )ç=
×£p=ê?rP   r
   ©r   r   ÚexpÚsumÚarray©ÚstatÚnobsÚ
mod_factorÚstat_modifiedÚpvalÚdigitss         r#   Údplus_st70_uppr\     s{   € Ý”˜‘” Ñ%¨­r¬w°t©}¬}Ñ(<Ñ<€JØ˜:Ñ%€MÝŒ6"} aÑ'Ñ'Ñ(Ô(€DÝŒVD2œ8Ð$6Ð$6Ð$6Ñ7Ô7Ò7Ñ8Ô8€Fà˜$ Ð&Ð&rM   c                 ó  — t          j        |¦  «        dz   dt          j        |¦  «        z  z   }| |z  }dt          j        d|dz  z  ¦  «        z  }t          j        | t          j        g d¢¦  «        k    ¦  «        }|||fS )Nr   r   r5   rO   )ç…ëQ¸í?r^   gHáz®Gñ?rQ   rU   s         r#   Ú
d_st70_uppr_   &  s€   € Ý”˜‘” Ñ%¨­r¬w°t©}¬}Ñ(<Ñ<€JØ˜:Ñ%€MØrŒvb˜=¨!Ñ+Ñ+Ñ,Ô,Ñ,€DÝŒVD2œ8Ð$6Ð$6Ð$6Ñ7Ô7Ò7Ñ8Ô8€Fà˜$ Ð&Ð&rM   c                 ó  — t          j        |¦  «        dz   dt          j        |¦  «        z  z   }| |z  }|dz  }d|z  dz
  t          j        d|z  ¦  «        z  }t          j        | t          j        g d¢¦  «        k    ¦  «        }|||fS )Ng×£p=
×Ã?g¸…ëQ¸Î?r5   é   rO   )çö(\Âõð?rb   g)\Âõ(ô?rQ   )rV   rW   rX   rY   ÚzsqurZ   r[   s          r#   Ú
v_st70_upprd   .  sŒ   € Ý”˜‘” Ñ&¨µ´¸±´Ñ)=Ñ=€Jà˜:Ñ%€MØ˜!Ñ€DØ‰Hq‰LBœF 2¨¡9Ñ-Ô-Ñ-€DÝŒVD2œ8Ð$6Ð$6Ð$6Ñ7Ô7Ò7Ñ8Ô8€FØ˜$ Ð&Ð&rM   c                 ó–   — d|z  }| d|z  z
  d|dz  z  z   d|z   z  }dt          j        dd|z  z
  ¦  «        z  }t           j        }|||fS )	Nr
   gš™™™™™Ù?g333333ã?r5   r-   çš™™™™™©?gR¸…ëQ@é   )r   rR   Únan©rV   rW   ÚnobsinvrY   rZ   r[   s         r#   Úwsqu_st70_upprk   7  sb   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<ÀÀWÁÑM€MØ•"”&˜  MÑ 1Ñ1Ñ2Ô2Ñ2€DÝŒV€Fà˜$ Ð&Ð&rM   c                 óú   — d|z  }| d|z  z
  d|dz  z  z   }|dd|z  z   z  }dt          j        d|z  t           j        dz  z  ¦  «        z  }t          j        | t          j        g d¢¦  «        k    ¦  «        }|||fS )Nr
   çš™™™™™¹?r5   r-   r2   rO   )çÂõ(\Ò?rn   gÃõ(\ÂÕ?©r   rR   ÚpirS   rT   ri   s         r#   Úusqu_st70_upprq   ?  s   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<€MØa˜# ™-Ñ'Ñ(€MØrŒvc˜MÑ)­B¬E°1©HÑ4Ñ5Ô5Ñ5€DÝŒVD2œ8Ð$6Ð$6Ð$6Ñ7Ô7Ò7Ñ8Ô8€Fà˜$ Ð&Ð&rM   c                 ó   — d|z  }| d|z  z
  d|dz  z  z   }|dd|z  z   z  }dt          j        d|z  d	z  t           j        dz  z  ¦  «        z  }t          j        | t          j        g d
¢¦  «        k    ¦  «        }|||fS )Nr
   gffffffæ?çÍÌÌÌÌÌì?r5   r-   g®Gáz®ó?g‘í|?5^ô?rO   ç       @)r   r   g!°rh‘íÜ?ro   ri   s         r#   Ú
a_st70_uppru   H  s•   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<€MØa˜$ ™.Ñ(Ñ)€MØ•2”6˜# Ñ-°Ñ2µR´U¸A±XÑ=Ñ>Ô>Ñ>€DÝŒVD2œ8Ð$7Ð$7Ð$7Ñ8Ô8Ò8Ñ9Ô9€Fà˜$ Ð&Ð&rM   )Úd_plusÚd_minusr    ÚvÚwsquÚusquÚaÚstephens70uppc                 óv  — t           j                             | t          j        |¦  «        z  ¦  «        }|dk    s|d|dz  dz  z
  k    rA| t           j                             | t          j        |¦  «        z  ¦  «        t          j        fS | t           j                             | |¦  «        dz  t          j        fS )Nr1   r2   r3   r4   r5   )r   r@   r?   r   r   rh   r>   )rJ   rB   rK   s      r#   Úpval_kstest_approxr~   ^  s—   € ÝÔ&×)Ò)¨!­B¬G°A©J¬J©,Ñ7Ô7€HØˆ4‚x€x8˜d Q s¡U¨6¡\Ñ1Ò1Ð1Ø•-Ô)×,Ò,¨Q­r¬w°q©z¬z©\Ñ:Ô:½B¼FÐBÐBà•-Ô%×(Ò(¨¨1Ñ-Ô-¨aÑ/µ´Ð7Ð7rM   c                 ó\   — | t           j                             | |¦  «        t          j        fS ©N©r   r>   r?   r   rh   )rH   rB   s     r#   ú<lambda>r‚   f  s"   €  ­Ô(;×(>Ò(>¸uÀaÑ(HÔ(HÍ"Ì&Ð Q€ rM   c                 ó\   — | t           j                             | |¦  «        t          j        fS r€   r   )rI   rB   s     r#   r‚   r‚   g  s"   €  ¥}Ô':×'=Ò'=¸dÀ1Ñ'EÔ'EÅrÄvÐ N€ rM   c                 ó„   — | t           j                             | t          j        |¦  «        z  ¦  «        t          j        fS r€   )r   r@   r?   r   r   rh   )rJ   rB   s     r#   r‚   r‚   h  s,   € ˜=Ô2×5Ò5°a½¼À¹
¼
±lÑCÔCÅRÄVÐL€ rM   )rv   rw   r    Úscipyr    Úscipy_approxc                   óÒ   — e Zd ZdZdd„Zed„ ¦   «         Zed„ ¦   «         Zed„ ¦   «         Zed„ ¦   «         Z	ed	„ ¦   «         Z
ed
„ ¦   «         Zed„ ¦   «         Zed„ ¦   «         Zdd„ZdS )ÚGOFaP  One Sample Goodness of Fit tests

    includes Kolmogorov-Smirnov D, D+, D-, Kuiper V, Cramer-von Mises W^2, U^2 and
    Anderson-Darling A, A^2. The p-values for all tests except for A^2 are based on
    the approximatiom given in Stephens 1970. A^2 has currently no p-values. For
    the Kolmogorov-Smirnov test the tests as given in scipy.stats are also available
    as options.


    design: I might want to retest with different distributions, to calculate
    data summary statistics only once, or add separate class that holds
    summary statistics and data (sounds good).


    r%   r&   c                 ó  — t          |t          ¦  «        rL|r||k    r5t          t          |¦  «        j        }t          t          |¦  «        j        }nt          d¦  «        ‚t          |t          ¦  «        rt          t          |¦  «        j        }t          |¦  «        rd|i}t          j	         ||i |¤Ž¦  «        }n#t          j	        |¦  «        }t          |¦  «        } ||g|¢R Ž }|| _        || _        || _        d S )Nr*   r+   )r6   r7   r8   r   r9   r:   r;   r<   r   r   r   rW   Úvals_sortedrG   )Úselfr:   r9   rA   rB   rE   rF   rG   s           r#   Ú__init__zGOF.__init__†  s  € Ýc3ÑÔð 	^àð ^˜S CšZ˜ZÝm¨SÑ1Ô1Ô5Ým¨SÑ1Ô1Ô5å$Ð%\Ñ]Ô]Ð]õ c3ÑÔð 	2Ý-¨Ñ-Ô-Ô1ˆCÝC‰=Œ=ð 	Ø˜1:ˆDÝ”7˜3˜3 Ð, tÐ,Ð,Ñ-Ô-ˆDˆDå”7˜3‘<”<ˆDÝD‘	”	ˆAØ#dÐ"˜TÐ"Ð"Ð"ˆàˆŒ	ØˆÔØˆŒˆˆrM   c                 ó~   — | j         }| j        }t          j        d|dz   ¦  «        |z  |z
                       ¦   «         S )Nr
   r-   ©rW   rG   r   r=   r   ©r‹   rW   rG   s      r#   rv   z
GOF.d_plus   s<   € àŒyˆØ”,ˆÝ”	˜#˜t A™vÑ&Ô& tÑ+¨gÑ5×:Ò:Ñ<Ô<Ð<rM   c                 óx   — | j         }| j        }|t          j        d|¦  «        |z  z
                       ¦   «         S )Nr/   rŽ   r   s      r#   rw   zGOF.d_minus¦  s8   € àŒyˆØ”,ˆØ"œ) C¨Ñ.Ô.¨tÑ3Ñ3×8Ò8Ñ:Ô:Ð:rM   c                 óB   — t          j        | j        | j        g¦  «        S r€   )r   r   rv   rw   ©r‹   s    r#   r    zGOF.d¬  s   € åŒvt”{ D¤LÐ1Ñ2Ô2Ð2rM   c                 ó    — | j         | j        z   S )ÚKuiper)rv   rw   r’   s    r#   rx   zGOF.v°  s   € ð Œ{˜Tœ\Ñ)Ð)rM   c                 ó¬   — | j         }| j        }|dt          j        d|dz   ¦  «        z  dz
  |z  dz  z
  dz                       ¦   «         d|z  dz  z   }|S )zCramer von Misesrt   r
   r-   r5   g      (@)rW   rG   r   r=   rS   )r‹   rW   rG   ry   s       r#   ry   zGOF.wsquµ  sf   € ð ŒyˆØ”,ˆà˜B¥¤¨2¨t°A©vÑ!6Ô!6Ñ6¸Ñ:¸DÑ@ÀÑCÑCÀaÑG×LÒLÑNÔNØD‘˜‘ñˆàˆrM   c                 ól   — | j         }| j        }| j        ||                     ¦   «         dz
  dz  z  z
  }|S )Nç      à?r5   )rW   rG   ry   Úmean)r‹   rW   rG   rz   s       r#   rz   zGOF.usqu¿  s8   € àŒyˆØ”,ˆàŒy˜4 7§<¢<¡>¤>°CÑ#7¸!Ñ";Ñ;Ñ;ˆØˆrM   c                 óä   — | j         }| j        }d}t          d|¦  «        D ]@}||         |d |…         z
  }|dk    }d||         z
  ||<   ||                     ¦   «         z  }ŒA|dz  d|z  |z  z
  }|S )Nr   r-   r—   g      @rt   )rW   rG   ÚrangerS   )r‹   rW   rG   ÚmsumÚjÚmjÚmaskr{   s           r#   r{   zGOF.aÇ  sŽ   € àŒyˆØ”,ˆð ˆÝq˜‘”ð 	ð 	ˆAØ˜”˜g b q bœkÑ)ˆBØ˜’HˆDØ˜2˜dœ8‘|ˆBˆt‰HØB—F’F‘H”HÑˆDˆDà2‰I˜˜T™	 DÑ(Ñ(ˆØˆrM   c           	      óü   — | j         }| j        }dt          j        d|dz   ¦  «        z  dz
  t          j        |¦  «        t          j        d|ddd…         z
  ¦  «        z   z                       ¦   «          |z  |z
  }|S )z4Stephens 1974, does not have p-value formula for A^2rt   r
   r-   Néÿÿÿÿ)rW   rG   r   r=   ÚlogrS   )r‹   rW   rG   Úasqus       r#   r¢   zGOF.asqu×  s†   € ð ŒyˆØ”,ˆà•r”y  T¨!¡VÑ,Ô,Ñ,¨qÑ0Ý”˜‘”¥2¤6¨!¨G°D°D°b°D¬M©/Ñ#:Ô#:Ñ:ñ=ß>Aºc¹e¼eðDØDHñIØKOñPˆð ˆrM   r    r|   c                 ó¶   — t          | |¦  «        }|dk    r#t          |         |         || j        ¦  «        |fS t          |         |         || j        ¦  «        S )z


        r|   )r8   Ú	gof_pvalsrW   )r‹   ÚtestidÚpvalsrV   s       r#   Úget_testzGOF.get_testã  s[   € õ
 t˜VÑ$Ô$ˆØOÒ#Ð#Ý˜UÔ# FÔ+¨D°$´)Ñ<Ô<¸dÐBÐBå˜UÔ# FÔ+¨D°$´)Ñ<Ô<Ð<rM   N)r%   r&   )r    r|   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__rŒ   r   rv   rw   r    rx   ry   rz   r{   r¢   r§   r%   rM   r#   rˆ   rˆ   n  s  € € € € € ðð ð.ð ð ð ð4 ð=ð =ñ „^ð=ð
 ð;ð ;ñ „^ð;ð
 ð3ð 3ñ „^ð3ð ð*ð *ñ „^ð*ð ðð ñ „^ðð ðð ñ „^ðð ðð ñ „^ðð ðð ñ „^ðð	=ð 	=ð 	=ð 	=ð 	=ð 	=rM   rˆ   éd   c                 óœ  ‡	— ddl m}  |t          ¦  «        Š	t          d¦  «        D ]b} | |¦  «        }t	          ||¦  «        }t
          D ]=}‰	|                              |                     |d¦  «        d         d         ¦  «         Œ>Œct          j	        ˆ	fd„t
          D ¦   «         ¦  «        }t          dd                     t
          ¦  «        ¦  «         t          d	|d
k                          d¦  «        ¦  «         t          d|dk                          d¦  «        ¦  «         t          d|dk                          d¦  «        ¦  «         d S )Nr   ©Údefaultdictiè  r|   r-   c                 ó    •— g | ]
}‰|         ‘ŒS r%   r%   )Ú.0ÚtiÚresultss     €r#   ú
<listcomp>zgof_mc.<locals>.<listcomp>   s   ø€ Ð6Ð6Ð6 rw˜r”{Ð6Ð6Ð6rM   ú	         ú      úat 0.01:ç{®Gáz„?úat 0.05:rf   úat 0.10:rm   )Úcollectionsr¯   Úlistrš   rˆ   Úall_gofsÚappendr§   r   rT   ÚprintÚjoinr˜   )
ÚrandfnÚdistrrW   r¯   Úir:   Úgoftr²   Úresarrr³   s
            @r#   Úgof_mcrÆ   õ  sM  ø€ à'Ð'Ð'Ð'Ð'Ð'àˆk$ÑÔ€GÝ4‰[Œ[ð Ið IˆØˆfT‰lŒlˆÝ3˜‰ŒˆÝð 	Ið 	IˆBØBŒK×Ò˜tŸ}š}¨R°ÑAÔAÀ!ÔDÀQÔGÑHÔHÐHÐHð	Iõ ŒXÐ6Ð6Ð6Ð6­XÐ6Ñ6Ô6Ñ7Ô7€FÝ	ˆ+x—}’}¥XÑ.Ô.Ñ/Ô/Ð/Ý	ˆ*v ’}×*Ò*¨1Ñ-Ô-Ñ.Ô.Ð.Ý	ˆ*v ’}×*Ò*¨1Ñ-Ô-Ñ.Ô.Ð.Ý	ˆ*v ’|×)Ò)¨!Ñ,Ô,Ñ-Ô-Ð-Ð-Ð-rM   c           	      óÜ  — t          | j        ¦  «        }| j        |         }t          d¦  «        g|z  }dg|z  }t          d¦  «        ||<   t          ddd¦  «        ||<   dt          j        d|dz   ¦  «        t          |¦  «                 z  dz
  t          j        | ¦  «        t          j        d| t          |¦  «                 z
  ¦  «        z   z  |z                       |¦  «         |z
  }|S )z.vectorized Anderson Darling A^2, Stephens 1974Nr    rt   r
   r-   )r   r   Úslicer   r=   Útupler¡   rS   )rG   ÚaxisÚndimrW   Úslice_reverseÚislicer¢   s          r#   ÚasquarerÎ     så   € åˆwŒ}ÑÔ€DØŒ=˜Ô€DÝ˜4‘[”[M DÑ(€MØˆVd‰]€FÝ˜‘;”;€Fˆ4LÝ  d¨BÑ/Ô/€M$ÑØ•2”9˜R  a¡Ñ(Ô(­¨v©¬Ô7Ñ7¸!Ñ;ÝŒVG‰_Œ_rœv a¨µ°mÑ0DÔ0DÔ(EÑ&EÑFÔFÑFñHØHLñMßNQÊcÐRVÉiÌiðXàñ€Dð €KrM   éÈ   c                 óF  — |û|€t          d¦  «        ‚t          t          j        |t	          |¦  «        z  ¦  «        ¦  «        }d}t          |¦  «        D ]’} | j        |fi d||fi¤Ž}	|                      |	d¬¦  «        }
t          d„ |
¦  «        }
t          j	        |  
                    |	|
¦  «        d¬¦  «        }t          |d¬¦  «        }|||k                         ¦   «         z  }Œ“|t	          ||z  ¦  «        z  S  | j        |fi d||fi¤Ž}	|                      |	d¬¦  «        }
t          d„ |
¦  «        }
t          j	        |  
                    |	|
¦  «        d¬¦  «        }t          |d¬¦  «        }|€t          j	        |¦  «        }|S ||k                         ¦   «         S )	a  Monte Carlo (or parametric bootstrap) p-values for gof

    currently hardcoded for A^2 only

    assumes vectorized fit_vec method,
    builds and analyses (nobs, nrep) sample in one step

    rename function to less generic

    this works also with nrep=1

    Nzusing batching requires a valuer   r+   r-   ©rÊ   c                 ó,   — t          j        | d¦  «        S ©Nr-   ©r   Úexpand_dims©Úxs    r#   r‚   zbootstrap.<locals>.<lambda>;  s   € ¥B¤N°1°aÑ$8Ô$8€ rM   c                 ó,   — t          j        | d¦  «        S rÓ   rÔ   rÖ   s    r#   r‚   zbootstrap.<locals>.<lambda>D  s   € ¥¤¨q°!Ñ 4Ô 4€ rM   )Ú
ValueErrorÚintr   Úceilr   rš   r:   Úfit_vecr   r   r9   rÎ   rS   r˜   )rÂ   rA   rW   ÚnrepÚvalueÚ
batch_sizeÚn_batchÚcountÚirepr:   ÚparamsrG   rV   Ústat_sorteds                 r#   Ú	bootstraprå     s½  € ð, ÐØˆ=ÝÐ>Ñ?Ô?Ð?Ý•b”g˜d¥5¨Ñ#4Ô#4Ñ4Ñ5Ô5Ñ6Ô6ˆØˆÝ˜'‘N”Nð 	+ð 	+ˆDØ%”)˜DÐ@Ð@ V¨Z¸Ð,>Ð$?Ð@Ð@ˆCØ—]’] 3¨Q]Ñ/Ô/ˆFÝÐ8Ð8¸&ÑAÔAˆFÝ”g˜eŸiši¨¨VÑ4Ô4¸1Ð=Ñ=Ô=ˆGÝ˜7¨Ð+Ñ+Ô+ˆDØd˜e’m×(Ò(Ñ*Ô*Ñ*ˆEˆEØ•u˜W zÑ1Ñ2Ô2Ñ2Ð2ð ˆeŒi˜Ð6Ð6 ¨¨t¨Ð 5Ð6Ð6ˆØ—’˜s¨Ñ+Ô+ˆÝÐ4Ð4°fÑ=Ô=ˆÝ”'˜%Ÿ)š) C¨Ñ0Ô0°qÐ9Ñ9Ô9ˆÝw QÐ'Ñ'Ô'ˆØˆ=Ýœ' $™-œ-ˆKØÐà˜E’M×'Ò'Ñ)Ô)Ð)rM   c                 ó  — d}t          |¦  «        D ]i} |j        |fi d|i¤Ž}|                     |¦  «        }t          j        |                     ||¦  «        ¦  «        }	t          |	d¬¦  «        }
||
| k    z  }Œj|dz  |z  S )zþMonte Carlo (or parametric bootstrap) p-values for gof

    currently hardcoded for A^2 only

    non vectorized, loops over all parametric bootstrap replications and calculates
    and returns specific p-value,

    rename function to less generic

    r   r+   rÑ   r
   )rš   r:   rÜ   r   r   r9   rÎ   )rÞ   rÂ   rA   rW   rÝ   rá   râ   r:   rã   rG   rV   s              r#   Ú
bootstrap2rç   O  sš   € ð$ €EÝd‘”ð !ð !ˆàˆeŒi˜Ð.Ð. ¨ Ð.Ð.ˆØ—’˜sÑ#Ô#ˆÝ”'˜%Ÿ)š) C¨Ñ0Ô0Ñ1Ô1ˆÝw QÐ'Ñ'Ô'ˆØ$˜%’-Ñ ˆˆØ2‰:˜ÑÐrM   c                   ó&   — e Zd ZdZdd„Zd„ Zd„ ZdS )ÚNewNormz-just a holder for modified distributions
    r   c                 óV   — |                      |¦  «        |                     |¦  «        fS r€   )r˜   Ústd)r‹   r×   rÊ   s      r#   rÜ   zNewNorm.fit_vecp  s!   € ØvŠvd‰|Œ|˜QŸUšU 4™[œ[Ð(Ð(rM   c                 ó^   — t           j                             ||d         |d         ¬¦  «        S )Nr   r-   )ÚlocÚscale)r   Únormr9   )r‹   r×   rA   s      r#   r9   zNewNorm.cdfs  s(   € ÝÔ!×%Ò% a¨T°!¬W¸DÀ¼GÐ%ÑDÔDÐDrM   c                 ón   — |d         }|d         }||t           j                             |¬¦  «        z  z   S )Nr   r-   ©r+   )r   rï   r:   )r‹   rA   r+   rí   rî   s        r#   r:   zNewNorm.rvsv  s8   € ØŒGˆØ1ŒgˆØU]Ô/×3Ò3¸Ð3Ñ>Ô>Ñ>Ñ>Ð>rM   N©r   )r¨   r©   rª   r«   rÜ   r9   r:   r%   rM   r#   ré   ré   l  sS   € € € € € ðð ð)ð )ð )ð )ðEð Eð Eð?ð ?ð ?ð ?ð ?rM   ré   Ú__main__)Ústatsé   rñ   zscipy kstestrï   )r    rv   rw   rx   ry   rz   r{   z
Is it correctly sized?r®   r-   c                 ó(   — g | ]}t           |         ‘ŒS r%   )r³   )r±   r²   s     r#   r´   r´   —  s   € Ð6Ð6Ð6 r•w˜r”{Ð6Ð6Ð6rM   rµ   r¶   r·   r¸   r¹   rf   rº   rm   c                 óD   — t           j                             d| ¬¦  «        S )Nrõ   rñ   )rô   Útr:   ©rW   s    r#   r‚   r‚     s   € œŸš A¨D˜Ñ1Ô1€ rM   rù   )r   r-   )rA   rW   rÝ   rÞ   )g®Gáz®ï?gffffffî?rs   )r%   r&   r'   r(   )r¬   rò   )r%   rÏ   r¬   NN)r%   rÏ   r¬   );r«   Ústatsmodels.compat.pythonr   Únumpyr   Úscipy.statsr   Ústatsmodels.tools.decoratorsr   Úscipy.specialr   r   r$   rL   r\   Údminus_st70_uppr_   rd   rk   rq   ru   r¤   r~   rˆ   rÆ   rÎ   rå   rç   ré   r¨   r…   rô   rø   r:   r¿   rÄ   r§   r½   r²   r»   r¯   r¼   r³   rW   rš   rÃ   ÚrandomÚrandnr¾   rT   rÅ   rÀ   r˜   rÝ   ÚbtÚfloorÚastyperÚ   Ú
quantindexr%   rM   r#   ú<module>r     sé  ððð ð& +Ð *Ð *Ð *Ð *Ð *Ø Ð Ð Ð à %Ð %Ð %Ð %Ð %Ð %à 7Ð 7Ð 7Ð 7Ð 7Ð 7à .Ð .Ð .Ð .Ð .Ð .ðZð Zð Zð~Y8ð Y8ð Y8ð Y8ð|'ð 'ð 'ð !€ð'ð 'ð 'ð'ð 'ð 'ð'ð 'ð 'ð'ð 'ð 'ð'ð 'ð 'ð €	ð ØØ
Ø
ØØØ
ðð €	ˆ/Ñ ð8ð 8ð 8ð RÐQØNÐNØ
LÐ
Lðð €	ˆ'Ñ ð Ð
ð€	ˆ.Ñ ð~=ð ~=ð ~=ð ~=ð ~=ñ ~=ô ~=ð ~=ðN.ð .ð .ð .ð"ð ð ð ð..*ð .*ð .*ð .*ðdð ð ð ð:?ð ?ð ?ð ?ð ?ñ ?ô ?ð ?ð& ˆzÒÑØÐÐÐÐÐà
Œ'+Š+a˜cˆ+Ñ
"Ô
"€CØ	€Eˆ.ÑÔÐØ	€Eˆ&ˆ&fÑ
Ô
ÑÔÐØˆ3ˆsFÑÔ€DØ	€Eˆ$-Š-‰/Œ/ÑÔÐàCÐCÐC€HØð 6ð 6ˆØˆˆb$—-’-  OÑ4Ô4Ñ5Ô5Ð5Ð5à	€EÐ
$Ñ%Ô%Ð%Ø'Ð'Ð'Ð'Ð'Ð'àˆk˜$ÑÔ€GØ€DØˆU3‰ZŒZð Ið IˆØŒioŠo˜dÑ#Ô#ˆØˆs3˜ÑÔˆØð 	Ið 	IˆBØBŒK×Ò˜tŸ}š}¨R°ÑAÔAÀ!ÔDÀQÔGÑHÔHÐHÐHð	Ið ˆRŒXÐ6Ð6¨XÐ6Ñ6Ô6Ñ7Ô7€FØ	€Eˆ+x—}’} XÑ.Ô.Ñ/Ô/Ð/Ø	€Eˆ*v ’}×*Ò*¨1Ñ-Ô-Ñ.Ô.Ð.Ø	€Eˆ*v ’}×*Ò*¨1Ñ-Ô-Ñ.Ô.Ð.Ø	€Eˆ*v ’|×)Ò)¨!Ñ,Ô,Ñ-Ô-Ð-à
€FÐ1Ð1°6ÀÐDÑDÔDÐDà€DØ€DØ	ˆ77‘9”9 5¨t¸$ÀdÐ	KÑ	KÔ	K€BØ”˜$  ¤Ð*;Ð*;Ð*;Ñ!<Ô!<Ñ<Ñ=Ô=×DÒDÀSÑIÔI€JØ	€Eˆ"ˆZŒ.ÑÔÐðð ðQ ÐrM   