Ë
    !£¯gqS  ã                   óì  — d Z ddlmZ ddlZddlmZ ddlmZ ddl	m
Z d„ Zd:d„Zd	„ ZeZd
„ Zd„ Zd„ Zd„ Zd„ Zi Zeeeeeeedœed<   d„ Zd„ d„ d„ dœed<   deied<    G d„ d«      Zd;d„Zd<d„Zd=d„Zd>d „Z G d!„ d"«      Zed#k(  rçdd$lmZ ej@                  jC                  d%d¬&«      Z! e"d'«        e" ee!d(«      «        ee!d(«      Z# e"e#jI                  «       «       g d)¢Z%e%D ]  Z& e"e&e#jI                  e&d«      «       Œ  e"d*«       dd+l'm(Z(  e(e)«      Z*dZ+ e,d«      D ]W  Z-ej\                  j_                  e+«      Z! ee!d(«      Z#e%D ],  Z&e*e&   ja                  e#jI                  e&d«      d   d,   «       Œ. ŒY  ejb                  e%D  cg c]  } e*|    ‘Œ	 c} «      Z2 e"d-d.jg                  e%«      «        e"d/e2d0k  ji                  d,«      «        e"d1e2d2k  ji                  d,«      «        e"d3e2d4k  ji                  d,«      «        ed5„ d(d¬6«       dZ+dZ5 e e«       d7e+e5d¬8«      Z6 ejn                  e5 ejb                  g d9¢«      z  «      jq                  e9«      Z: e"e6e:   «       yyc c} w )?at  More Goodness of fit tests

contains

GOF : 1 sample gof tests based on Stephens 1970, plus AD A^2
bootstrap : vectorized bootstrap p-values for gof test with fitted parameters


Created : 2011-05-21
Author : Josef Perktold

parts based on ks_2samp and kstest from scipy.stats
(license: Scipy BSD, but were completely rewritten by Josef Perktold)


References
----------

é    )ÚlmapN)Údistributions)Úcache_readonly)Ú
kolmogorovc                 ó–  — t        t        j                  | |f«      \  } }| j                  d   }|j                  d   }t	        | «      }t	        |«      }t        j
                  | «      } t        j
                  |«      }t        j                  | |g«      }t        j                  | |d¬«      d|z  z  }t        j                  ||d¬«      d|z  z  }t        j                  t        j                  ||z
  «      «      }t        j                  ||z  t        ||z   «      z  «      }	 t        |dz   d|z  z   |z  «      }	||	fS #  d}	Y ||	fS xY w)aA  
    Computes the Kolmogorov-Smirnof statistic on 2 samples.

    This is a two-sided test for the null hypothesis that 2 independent samples
    are drawn from the same continuous distribution.

    Parameters
    ----------
    a, b : sequence of 1-D ndarrays
        two arrays of sample observations assumed to be drawn from a continuous
        distribution, sample sizes can be different


    Returns
    -------
    D : float
        KS statistic
    p-value : float
        two-tailed p-value


    Notes
    -----

    This tests whether 2 samples are drawn from the same distribution. Note
    that, like in the case of the one-sample K-S test, the distribution is
    assumed to be continuous.

    This is the two-sided test, one-sided tests are not implemented.
    The test uses the two-sided asymptotic Kolmogorov-Smirnov distribution.

    If the K-S statistic is small or the p-value is high, then we cannot
    reject the hypothesis that the distributions of the two samples
    are the same.

    Examples
    --------

    >>> from scipy import stats
    >>> import numpy as np
    >>> from scipy.stats import ks_2samp

    >>> #fix random seed to get the same result
    >>> np.random.seed(12345678)

    >>> n1 = 200  # size of first sample
    >>> n2 = 300  # size of second sample

    different distribution
    we can reject the null hypothesis since the pvalue is below 1%

    >>> rvs1 = stats.norm.rvs(size=n1,loc=0.,scale=1)
    >>> rvs2 = stats.norm.rvs(size=n2,loc=0.5,scale=1.5)
    >>> ks_2samp(rvs1,rvs2)
    (0.20833333333333337, 4.6674975515806989e-005)

    slightly different distribution
    we cannot reject the null hypothesis at a 10% or lower alpha since
    the pvalue at 0.144 is higher than 10%

    >>> rvs3 = stats.norm.rvs(size=n2,loc=0.01,scale=1.0)
    >>> ks_2samp(rvs1,rvs3)
    (0.10333333333333333, 0.14498781825751686)

    identical distribution
    we cannot reject the null hypothesis since the pvalue is high, 41%

    >>> rvs4 = stats.norm.rvs(size=n2,loc=0.0,scale=1.0)
    >>> ks_2samp(rvs1,rvs4)
    (0.07999999999999996, 0.41126949729859719)
    r   Úright)Úsideç      ð?ç¸…ëQ¸¾?ç)\Âõ(¼?)r   ÚnpÚasarrayÚshapeÚlenÚsortÚconcatenateÚsearchsortedÚmaxÚabsoluteÚsqrtÚfloatÚksprob)
Údata1Údata2Ún1Ún2Údata_allÚcdf1Úcdf2ÚdÚenÚprobs
             úf/var/www/dash_apps/app1/venv/lib/python3.12/site-packages/statsmodels/sandbox/distributions/gof_new.pyÚks_2sampr$      s%  € ôP œŸ
™
 U¨E NÓ3L€Eˆ5Ø	‰Q‰€BØ	‰Q‰€BÜ	ˆU‹€BÜ	ˆU‹€BÜG‰GE‹N€EÜG‰GE‹N€EÜ~‰~˜u U˜mÓ,€Hä?‰?˜5 ¨wÔ7¸¸R¹Ñ@€DÜO‰O˜E (°Ô8¸3¸r¹6ÑB€DÜ
‰Œr{‰{˜4 ™9Ó%Ó&€Aä	‰B‘”u˜R ™U“|Ñ#Ó	$€BðÜr˜$‘w˜t B™w‘¨Ñ)Ó*ˆð ˆdˆ7€NøðØ‰Øˆdˆ7€Nús   Ä$D? Ä?Ec                 ó  — t        | t        «      rG|r|| k(  r5t        t        | «      j                  }t        t        | «      j
                  } nt        d«      ‚t        |t        «      rt        t        |«      j                  }t        | «      r d|i}t        j                   | |i |¤Ž«      }n t        j                  | «      }t        |«      } ||g|¢­Ž }|dv rTt        j                  d|dz   «      |z  |z
  j                  «       }	|dk(  r"|	t        j                  j                  |	|«      fS |dv rQ|t        j                  d|«      |z  z
  j                  «       }
|d	k(  r"|
t        j                  j                  |
|«      fS |d
k(  rýt        j                  	
g«      }|dk(  r7|t        j                  j                  |t        j                   |«      z  «      fS |dk(  r¤t        j                  j                  |t        j                   |«      z  «      }|dkD  s|d|dz  dz  z
  kD  r7|t        j                  j                  |t        j                   |«      z  «      fS |t        j                  j                  ||«      dz  fS yy)aÉ  
    Perform the Kolmogorov-Smirnov test for goodness of fit

    This performs a test of the distribution G(x) of an observed
    random variable against a given distribution F(x). Under the null
    hypothesis the two distributions are identical, G(x)=F(x). The
    alternative hypothesis can be either 'two_sided' (default), 'less'
    or 'greater'. The KS test is only valid for continuous distributions.

    Parameters
    ----------
    rvs : str or array or callable
        string: name of a distribution in scipy.stats

        array: 1-D observations of random variables

        callable: function to generate random variables, requires keyword
        argument `size`

    cdf : str or callable
        string: name of a distribution in scipy.stats, if rvs is a string then
        cdf can evaluate to `False` or be the same as rvs
        callable: function to evaluate cdf

    args : tuple, sequence
        distribution parameters, used if rvs or cdf are strings
    N : int
        sample size if rvs is string or callable
    alternative : 'two_sided' (default), 'less' or 'greater'
        defines the alternative hypothesis (see explanation)

    mode : 'approx' (default) or 'asymp'
        defines the distribution used for calculating p-value

        'approx' : use approximation to exact distribution of test statistic

        'asymp' : use asymptotic distribution of test statistic


    Returns
    -------
    D : float
        KS test statistic, either D, D+ or D-
    p-value :  float
        one-tailed or two-tailed p-value

    Notes
    -----

    In the one-sided test, the alternative is that the empirical
    cumulative distribution function of the random variable is "less"
    or "greater" than the cumulative distribution function F(x) of the
    hypothesis, G(x)<=F(x), resp. G(x)>=F(x).

    Examples
    --------

    >>> from scipy import stats
    >>> import numpy as np
    >>> from scipy.stats import kstest

    >>> x = np.linspace(-15,15,9)
    >>> kstest(x,'norm')
    (0.44435602715924361, 0.038850142705171065)

    >>> np.random.seed(987654321) # set random seed to get the same result
    >>> kstest('norm','',N=100)
    (0.058352892479417884, 0.88531190944151261)

    is equivalent to this

    >>> np.random.seed(987654321)
    >>> kstest(stats.norm.rvs(size=100),'norm')
    (0.058352892479417884, 0.88531190944151261)

    Test against one-sided alternative hypothesis:

    >>> np.random.seed(987654321)

    Shift distribution to larger values, so that cdf_dgp(x)< norm.cdf(x):

    >>> x = stats.norm.rvs(loc=0.2, size=100)
    >>> kstest(x,'norm', alternative = 'less')
    (0.12464329735846891, 0.040989164077641749)

    Reject equal distribution against alternative hypothesis: less

    >>> kstest(x,'norm', alternative = 'greater')
    (0.0072115233216311081, 0.98531158590396395)

    Do not reject equal distribution against alternative hypothesis: greater

    >>> kstest(x,'norm', mode='asymp')
    (0.12464329735846891, 0.08944488871182088)


    Testing t distributed random variables against normal distribution:

    With 100 degrees of freedom the t distribution looks close to the normal
    distribution, and the kstest does not reject the hypothesis that the sample
    came from the normal distribution

    >>> np.random.seed(987654321)
    >>> stats.kstest(stats.t.rvs(100,size=100),'norm')
    (0.072018929165471257, 0.67630062862479168)

    With 3 degrees of freedom the t distribution looks sufficiently different
    from the normal distribution, that we can reject the hypothesis that the
    sample came from the normal distribution at a alpha=10% level

    >>> np.random.seed(987654321)
    >>> stats.kstest(stats.t.rvs(3,size=100),'norm')
    (0.131016895759829, 0.058826222555312224)
    ú5if rvs is string, cdf has to be the same distributionÚsize)Ú	two_sidedÚgreaterr
   é   r)   )r(   Úlessç        r+   r(   ÚasympÚapproxéj
  çš™™™™™é?ç333333Ó?ç     @@é   N)Ú
isinstanceÚstrÚgetattrr   ÚcdfÚrvsÚAttributeErrorÚcallabler   r   r   Úaranger   ÚksoneÚsfÚ	kstwobignr   )r8   r7   ÚargsÚNÚalternativeÚmodeÚkwdsÚvalsÚcdfvalsÚDplusÚDminÚDÚpval_twos                r#   ÚkstestrJ   }   s>  € ôf #”sÔá˜ šÜœ-¨Ó-×1Ñ1ˆCÜœ-¨Ó-×1Ñ1‰Cä Ð!XÓYÐYô #”sÔÜ”m SÓ)×-Ñ-ˆÜ„}ØqˆzˆÜw‰w‘s˜DÐ( 4Ñ(Ó)‰äw‰ws‹|ˆÜ‹IˆÙ$Ð˜Ò€GàÐ.Ñ.Ü—‘˜3  !¡Ó$ QÑ&¨Ñ0×5Ñ5Ó7ˆØ˜)Ò#Øœ-×-Ñ-×0Ñ0°°qÓ9Ð9Ð9àÐ+Ñ+Øœ"Ÿ)™) C¨Ó+¨AÑ-Ñ-×2Ñ2Ó4ˆØ˜&Ò Øœ×,Ñ,×/Ñ/°°QÓ7Ð7Ð7àkÒ!ÜF‰FE˜$<Ó ˆØ7Š?Ø”m×-Ñ-×0Ñ0°´2·7±7¸1³:±Ó>Ð>Ð>Ø8ÒÜ$×.Ñ.×1Ñ1°!´B·G±G¸A³J±,Ó?ˆHØ4Šx˜8 d¨Q¨s©U°6©\Ñ&9Ò9Øœ-×1Ñ1×4Ñ4°Q´r·w±w¸q³z±\ÓBÐBÐBàœ-×-Ñ-×0Ñ0°°1Ó5°aÑ7Ð7Ð7ð ð	 "ó    c                 ó  — t        j                  |«      dz   dt        j                  |«      z  z   }| |z  }t        j                  d|dz  z  «      }t        j                  | t        j                  g d¢«      kD  «      }|||fS )Nr   r   éþÿÿÿr3   )ç=
×£p=ê?rN   r
   ©r   r   ÚexpÚsumÚarray©ÚstatÚnobsÚ
mod_factorÚstat_modifiedÚpvalÚdigitss         r#   Údplus_st70_upprZ     sr   € Ü—‘˜“ Ñ%¨¬r¯w©w°t«}Ñ(<Ñ<€JØ˜:Ñ%€MÜ6‰6"} aÑ'Ñ'Ó(€DÜV‰VDœ2Ÿ8™8Ò$6Ó7Ñ7Ó8€Fà˜$ Ð&Ð&rK   c                 ó  — t        j                  |«      dz   dt        j                  |«      z  z   }| |z  }dt        j                  d|dz  z  «      z  }t        j                  | t        j                  g d¢«      kD  «      }|||fS )Nr   r   r3   rM   )ç…ëQ¸í?r\   gHáz®Gñ?rO   rS   s         r#   Ú
d_st70_uppr]   &  sw   € Ü—‘˜“ Ñ%¨¬r¯w©w°t«}Ñ(<Ñ<€JØ˜:Ñ%€MØŒrv‰vb˜=¨!Ñ+Ñ+Ó,Ñ,€DÜV‰VDœ2Ÿ8™8Ò$6Ó7Ñ7Ó8€Fà˜$ Ð&Ð&rK   c                 ó  — t        j                  |«      dz   dt        j                  |«      z  z   }| |z  }|dz  }d|z  dz
  t        j                  d|z  «      z  }t        j                  | t        j                  g d¢«      kD  «      }|||fS )Ng×£p=
×Ã?g¸…ëQ¸Î?r3   é   rM   )çö(\Âõð?r`   g)\Âõ(ô?rO   )rT   rU   rV   rW   ÚzsqurX   rY   s          r#   Ú
v_st70_upprb   .  sƒ   € Ü—‘˜“ Ñ&¨´·±¸³Ñ)=Ñ=€Jà˜:Ñ%€MØ˜!Ñ€DØ‰Hq‰LœBŸF™F 2¨¡9Ó-Ñ-€DÜV‰VDœ2Ÿ8™8Ò$6Ó7Ñ7Ó8€FØ˜$ Ð&Ð&rK   c                 ó    — d|z  }| d|z  z
  d|dz  z  z   d|z   z  }dt        j                  dd|z  z
  «      z  }t         j                  }|||fS )	Nr
   gš™™™™™Ù?g333333ã?r3   r*   çš™™™™™©?gR¸…ëQ@é   )r   rP   Únan©rT   rU   ÚnobsinvrW   rX   rY   s         r#   Úwsqu_st70_uppri   7  sc   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<ÀÀWÁÑM€MØ”"—&‘&˜  MÑ 1Ñ1Ó2Ñ2€DÜV‰V€Fà˜$ Ð&Ð&rK   c                 ó  — d|z  }| d|z  z
  d|dz  z  z   }|dd|z  z   z  }dt        j                  d|z  t         j                  dz  z  «      z  }t        j                  | t        j                  g d¢«      kD  «      }|||fS )Nr
   çš™™™™™¹?r3   r*   r0   rM   )çÂõ(\Ò?rl   gÃõ(\ÂÕ?©r   rP   ÚpirQ   rR   rg   s         r#   Úusqu_st70_uppro   ?  s‰   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<€MØa˜# ™-Ñ'Ñ(€MØŒrv‰vc˜MÑ)¬B¯E©E°1©HÑ4Ó5Ñ5€DÜV‰VDœ2Ÿ8™8Ò$6Ó7Ñ7Ó8€Fà˜$ Ð&Ð&rK   c                 ó  — d|z  }| d|z  z
  d|dz  z  z   }|dd|z  z   z  }dt        j                  d|z  d	z  t         j                  dz  z  «      z  }t        j                  | t        j                  g d
¢«      kD  «      }|||fS )Nr
   gffffffæ?çÍÌÌÌÌÌì?r3   r*   g®Gáz®ó?g‘í|?5^ô?rM   ç       @)r   r   g!°rh‘íÜ?rm   rg   s         r#   Ú
a_st70_upprs   H  sŽ   € Ø4‰i€GØ˜C '™MÑ)¨C°'¸1±*Ñ,<Ñ<€MØa˜$ ™.Ñ(Ñ)€MØ”2—6‘6˜# Ñ-°Ñ2´R·U±U¸A±XÑ=Ó>Ñ>€DÜV‰VDœ2Ÿ8™8Ò$7Ó8Ñ8Ó9€Fà˜$ Ð&Ð&rK   )Úd_plusÚd_minusr    ÚvÚwsquÚusquÚaÚstephens70uppc                 ó†  — t         j                  j                  | t        j                  |«      z  «      }|dkD  s|d|dz  dz  z
  kD  rF| t         j                  j                  | t        j                  |«      z  «      t        j
                  fS | t         j                  j                  | |«      dz  t        j
                  fS )Nr/   r0   r1   r2   r3   )r   r>   r=   r   r   rf   r<   )rH   r@   rI   s      r#   Úpval_kstest_approxr|   ^  s–   € Ü×&Ñ&×)Ñ)¨!¬B¯G©G°A«J©,Ó7€HØˆ4‚x8˜d Q s¡U¨6¡\Ñ1Ò1Ø”-×)Ñ)×,Ñ,¨Q¬r¯w©w°q«z©\Ó:¼B¿F¹FÐBÐBà”-×%Ñ%×(Ñ(¨¨1Ó-¨aÑ/´·±Ð7Ð7rK   c                 ód   — | t         j                  j                  | |«      t        j                  fS ©N©r   r<   r=   r   rf   )rF   r@   s     r#   ú<lambda>r€   f  s$   €  ¬×(;Ñ(;×(>Ñ(>¸uÀaÓ(HÌ"Ï&É&Ð Q€ rK   c                 ód   — | t         j                  j                  | |«      t        j                  fS r~   r   )rG   r@   s     r#   r€   r€   g  s$   €  ¤}×':Ñ':×'=Ñ'=¸dÀ1Ó'EÄrÇvÁvÐ N€ rK   c                 óŽ   — | t         j                  j                  | t        j                  |«      z  «      t        j
                  fS r~   )r   r>   r=   r   r   rf   )rH   r@   s     r#   r€   r€   h  s.   € ˜œ=×2Ñ2×5Ñ5°a¼¿¹À»
±lÓCÄRÇVÁVÐL€ rK   )rt   ru   r    Úscipyr    Úscipy_approxc                   ó    — e Zd ZdZdd„Zed„ «       Zed„ «       Zed„ «       Zed„ «       Z	ed„ «       Z
ed„ «       Zed	„ «       Zed
„ «       Zdd„Zy)ÚGOFaP  One Sample Goodness of Fit tests

    includes Kolmogorov-Smirnov D, D+, D-, Kuiper V, Cramer-von Mises W^2, U^2 and
    Anderson-Darling A, A^2. The p-values for all tests except for A^2 are based on
    the approximatiom given in Stephens 1970. A^2 has currently no p-values. For
    the Kolmogorov-Smirnov test the tests as given in scipy.stats are also available
    as options.


    design: I might want to retest with different distributions, to calculate
    data summary statistics only once, or add separate class that holds
    summary statistics and data (sounds good).


    c                 óØ  — t        |t        «      rG|r||k(  r5t        t        |«      j                  }t        t        |«      j
                  }nt        d«      ‚t        |t        «      rt        t        |«      j                  }t        |«      r d|i}t        j                   ||i |¤Ž«      }n t        j                  |«      }t        |«      } ||g|¢­Ž }|| _        || _        || _        y )Nr&   r'   )r4   r5   r6   r   r7   r8   r9   r:   r   r   r   rU   Úvals_sortedrE   )Úselfr8   r7   r?   r@   rC   rD   rE   s           r#   Ú__init__zGOF.__init__†  sÆ   € Ücœ3Ôá˜S CšZÜœm¨SÓ1×5Ñ5Üœm¨SÓ1×5Ñ5‘ä$Ð%\Ó]Ð]ô cœ3ÔÜœ-¨Ó-×1Ñ1ˆCÜCŒ=Ø˜1:ˆDÜ—7‘7™3 Ð, tÑ,Ó-‰Dä—7‘7˜3“<ˆDÜD“	ˆAÙdÐ"˜TÒ"ˆàˆŒ	ØˆÔØˆrK   c                 óŒ   — | j                   }| j                  }t        j                  d|dz   «      |z  |z
  j	                  «       S )Nr
   r*   ©rU   rE   r   r;   r   ©r‰   rU   rE   s      r#   rt   z
GOF.d_plus   s<   € ày‰yˆØ—,‘,ˆÜ—	‘	˜#˜t A™vÓ& tÑ+¨gÑ5×:Ñ:Ó<Ð<rK   c                 ó†   — | j                   }| j                  }|t        j                  d|«      |z  z
  j	                  «       S )Nr,   rŒ   r   s      r#   ru   zGOF.d_minus¦  s8   € ày‰yˆØ—,‘,ˆØœ"Ÿ)™) C¨Ó.¨tÑ3Ñ3×8Ñ8Ó:Ð:rK   c                 óX   — t        j                  | j                  | j                  g«      S r~   )r   r   rt   ru   ©r‰   s    r#   r    zGOF.d¬  s   € äv‰vt—{‘{ D§L¡LÐ1Ó2Ð2rK   c                 ó4   — | j                   | j                  z   S )ÚKuiper)rt   ru   r   s    r#   rv   zGOF.v°  s   € ð {‰{˜TŸ\™\Ñ)Ð)rK   c                 óº   — | j                   }| j                  }|dt        j                  d|dz   «      z  dz
  |z  dz  z
  dz  j	                  «       d|z  dz  z   }|S )zCramer von Misesrr   r
   r*   r3   g      (@)rU   rE   r   r;   rQ   )r‰   rU   rE   rw   s       r#   rw   zGOF.wsquµ  sf   € ð y‰yˆØ—,‘,ˆà˜B¤§¡¨2¨t°A©vÓ!6Ñ6¸Ñ:¸DÑ@ÀÑCÑCÀaÑG×LÑLÓNØD‘˜‘ñˆàˆrK   c                 ó‚   — | j                   }| j                  }| j                  ||j                  «       dz
  dz  z  z
  }|S )Nç      à?r3   )rU   rE   rw   Úmean)r‰   rU   rE   rx   s       r#   rx   zGOF.usqu¿  s<   € ày‰yˆØ—,‘,ˆày‰y˜4 7§<¡<£>°CÑ#7¸!Ñ";Ñ;Ñ;ˆØˆrK   c                 óÔ   — | j                   }| j                  }d}t        d|«      D ]0  }||   |d | z
  }|dkD  }d||   z
  ||<   ||j                  «       z  }Œ2 |dz  d|z  |z  z
  }|S )Nr   r*   r•   g      @rr   )rU   rE   ÚrangerQ   )r‰   rU   rE   ÚmsumÚjÚmjÚmaskry   s           r#   ry   zGOF.aÇ  sŒ   € ày‰yˆØ—,‘,ˆð ˆÜq˜“ò 	ˆAØ˜‘˜g b q˜kÑ)ˆBØ˜‘HˆDØ˜2˜d™8‘|ˆBˆt‰HØB—F‘F“HÑ‰Dð		ð 2‰I˜˜T™	 DÑ(Ñ(ˆØˆrK   c           	      ó  — | j                   }| j                  }dt        j                  d|dz   «      z  dz
  t        j                  |«      t        j                  d|ddd…   z
  «      z   z  j                  «        |z  |z
  }|S )z4Stephens 1974, does not have p-value formula for A^2rr   r
   r*   Néÿÿÿÿ)rU   rE   r   r;   ÚlogrQ   )r‰   rU   rE   Úasqus       r#   r    zGOF.asqu×  s„   € ð y‰yˆØ—,‘,ˆà”r—y‘y  T¨!¡VÓ,Ñ,¨qÑ0Ü—‘˜“¤2§6¡6¨!¨G±D°b°D©M©/Ó#:Ñ:ñ=ß>A¹c»eðDØDHñIØKOñPˆð ˆrK   c                 ó˜   — t        | |«      }|dk(  rt        |   |   || j                  «      |fS t        |   |   || j                  «      S )z


        rz   )r6   Ú	gof_pvalsrU   )r‰   ÚtestidÚpvalsrT   s       r#   Úget_testzGOF.get_testã  sS   € ô
 t˜VÓ$ˆØOÒ#Ü˜UÑ# FÑ+¨D°$·)±)Ó<¸dÐBÐBä˜UÑ# FÑ+¨D°$·)±)Ó<Ð<rK   N)© é   )r    rz   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__rŠ   r   rt   ru   r    rv   rw   rx   ry   r    r¥   r¦   rK   r#   r†   r†   n  s±   „ ñó.ð4 ñ=ó ð=ð
 ñ;ó ð;ð
 ñ3ó ð3ð ñ*ó ð*ð ñó ðð ñó ðð ñó ðð ñó ðô	=rK   r†   éd   c                 ó*  — ddl m}  |t        «      }t        d«      D ]K  } | |«      }t	        ||«      }t
        D ],  }||   j                  |j                  |d«      d   d   «       Œ. ŒM t        j                  t
        D cg c]  }||   ‘Œ	 c}«      }	t        ddj                  t
        «      «       t        d|	d	k  j                  d«      «       t        d
|	dk  j                  d«      «       t        d|	dk  j                  d«      «       y c c}w )Nr   ©Údefaultdictiè  rz   r*   ú	         ú      úat 0.01:ç{®Gáz„?úat 0.05:rd   úat 0.10:rk   )Úcollectionsr¯   Úlistr˜   r†   Úall_gofsÚappendr¥   r   rR   ÚprintÚjoinr–   )
ÚrandfnÚdistrrU   r¯   ÚresultsÚir8   ÚgoftÚtiÚresarrs
             r#   Úgof_mcrÃ   õ  sò   € å'áœ$Ó€GÜ4‹[ò IˆÙT‹lˆÜ3˜‹ˆÜò 	IˆBØB‰K×Ñ˜tŸ}™}¨R°ÓAÀ!ÑDÀQÑGÕHñ	IðIô X‰X¬XÖ6 rw˜r“{Ò6Ó7€FÜ	ˆ+x—}‘}¤XÓ.Ô/Ü	ˆ*v ‘}×*Ñ*¨1Ó-Ô.Ü	ˆ*v ‘}×*Ñ*¨1Ó-Ô.Ü	ˆ*v ‘|×)Ñ)¨!Ó,Õ-ùò	 7s   ÂDc           	      ó¬  — t        | j                  «      }| j                  |   }t        d«      g|z  }dg|z  }t        d«      ||<   t        ddd«      ||<   dt        j                  d|dz   «      t        |«         z  dz
  t        j                  | «      t        j                  d| t        |«         z
  «      z   z  |z  j                  |«       |z
  }|S )z.vectorized Anderson Darling A^2, Stephens 1974Nrž   rr   r
   r*   )r   r   Úslicer   r;   ÚtuplerŸ   rQ   )rE   ÚaxisÚndimrU   Úslice_reverseÚislicer    s          r#   ÚasquarerË     sÖ   € äˆw}‰}Ó€DØ=‰=˜Ñ€DÜ˜4“[M DÑ(€MØˆVd‰]€FÜ˜“;€Fˆ4LÜ  d¨BÓ/€M$ÑØ”2—9‘9˜R  a¡Ó(¬¨v«Ñ7Ñ7¸!Ñ;ÜV‰VG‹_œrŸv™v a¨´°mÓ0DÑ(EÑ&EÓFÑFñHØHLñMßNQÉcÐRVËiðXàñ€Dð €KrK   éÈ   c                 óê  — |Û|€t        d«      ‚t        t        j                  |t	        |«      z  «      «      }d}t        |«      D ]ƒ  } | j                  |fi d||fi¤Ž}	| j                  |	d¬«      }
t        d„ |
«      }
t        j                  | j                  |	|
«      d¬«      }t        |d¬«      }|||k\  j                  «       z  }Œ… |t	        ||z  «      z  S  | j                  |fi d||fi¤Ž}	| j                  |	d¬«      }
t        d„ |
«      }
t        j                  | j                  |	|
«      d¬«      }t        |d¬«      }|€t        j                  |«      }|S ||k\  j                  «       S )a  Monte Carlo (or parametric bootstrap) p-values for gof

    currently hardcoded for A^2 only

    assumes vectorized fit_vec method,
    builds and analyses (nobs, nrep) sample in one step

    rename function to less generic

    this works also with nrep=1

    zusing batching requires a valuer   r'   r*   ©rÇ   c                 ó.   — t        j                  | d«      S ©Nr*   ©r   Úexpand_dims©Úxs    r#   r€   zbootstrap.<locals>.<lambda>;  s   € ¤B§N¡N°1°aÓ$8€ rK   c                 ó.   — t        j                  | d«      S rÐ   rÑ   rÓ   s    r#   r€   zbootstrap.<locals>.<lambda>D  s   € ¤§¡¨q°!Ó 4€ rK   )Ú
ValueErrorÚintr   Úceilr   r˜   r8   Úfit_vecr   r   r7   rË   rQ   r–   )r½   r?   rU   ÚnrepÚvalueÚ
batch_sizeÚn_batchÚcountÚirepr8   ÚparamsrE   rT   Ústat_sorteds                 r#   Ú	bootstraprâ     st  € ð, ÐØˆ=ÜÐ>Ó?Ð?Ü”b—g‘g˜d¤5¨Ó#4Ñ4Ó5Ó6ˆØˆÜ˜'“Nò 	+ˆDØ%—)‘)˜DÑ@ V¨Z¸Ð,>Ð$?Ñ@ˆCØ—]‘] 3¨Q]Ó/ˆFÜÑ8¸&ÓAˆFÜ—g‘g˜eŸi™i¨¨VÓ4¸1Ô=ˆGÜ˜7¨Ô+ˆDØd˜e‘m×(Ñ(Ó*Ñ*‰Eð	+ð ”u˜W zÑ1Ó2Ñ2Ð2ð ˆei‰i˜Ñ6 ¨¨t¨Ð 5Ñ6ˆØ—‘˜s¨Ó+ˆÜÑ4°fÓ=ˆÜ—'‘'˜%Ÿ)™) C¨Ó0°qÔ9ˆÜw QÔ'ˆØˆ=ÜŸ'™' $›-ˆKØÐà˜E‘M×'Ñ'Ó)Ð)rK   c                 óö   — d}t        |«      D ]b  } |j                  |fi d|i¤Ž}|j                  |«      }t        j                  |j                  ||«      «      }	t        |	d¬«      }
||
| k\  z  }Œd |dz  |z  S )zþMonte Carlo (or parametric bootstrap) p-values for gof

    currently hardcoded for A^2 only

    non vectorized, loops over all parametric bootstrap replications and calculates
    and returns specific p-value,

    rename function to less generic

    r   r'   rÎ   r
   )r˜   r8   rÙ   r   r   r7   rË   )rÛ   r½   r?   rU   rÚ   rÞ   rß   r8   rà   rE   rT   s              r#   Ú
bootstrap2rä   O  s‡   € ð$ €EÜd“ò !ˆàˆei‰i˜Ñ. ¨ Ñ.ˆØ—‘˜sÓ#ˆÜ—'‘'˜%Ÿ)™) C¨Ó0Ó1ˆÜw QÔ'ˆØ$˜%‘-Ñ ‰ð!ð 2‰:˜ÑÐrK   c                   ó$   — e Zd ZdZdd„Zd„ Zd„ Zy)ÚNewNormz-just a holder for modified distributions
    c                 óF   — |j                  |«      |j                  |«      fS r~   )r–   Ústd)r‰   rÔ   rÇ   s      r#   rÙ   zNewNorm.fit_vecp  s   € Øv‰vd‹|˜QŸU™U 4›[Ð(Ð(rK   c                 óR   — t         j                  j                  ||d   |d   ¬«      S )Nr   r*   )ÚlocÚscale)r   Únormr7   )r‰   rÔ   r?   s      r#   r7   zNewNorm.cdfs  s(   € Ü×!Ñ!×%Ñ% a¨T°!©W¸DÀ¹GÐ%ÓDÐDrK   c                 ób   — |d   }|d   }||t         j                  j                  |¬«      z  z   S )Nr   r*   ©r'   )r   rì   r8   )r‰   r?   r'   rê   rë   s        r#   r8   zNewNorm.rvsv  s8   € Ø‰GˆØ1‰gˆØUœ]×/Ñ/×3Ñ3¸Ð3Ó>Ñ>Ñ>Ð>rK   N©r   )r¨   r©   rª   r«   rÙ   r7   r8   r¦   rK   r#   ræ   ræ   l  s   „ ñó)òEó?rK   ræ   Ú__main__)Ústatsé   rî   zscipy kstestrì   )r    rt   ru   rv   rw   rx   ry   z
Is it correctly sized?r®   r*   r°   r±   r²   r³   r´   rd   rµ   rk   c                 óD   — t         j                  j                  d| ¬«      S )Nrò   rî   )rñ   Útr8   ©rU   s    r#   r€   r€     s   € œŸ™Ÿ™ A¨D˜Ó1€ rK   rõ   )r   r*   )r?   rU   rÚ   rÛ   )g®Gáz®ï?gffffffî?rq   )r¦   r§   r(   r.   )r¬   rï   )r¦   rÌ   r¬   NN)r¦   rÌ   r¬   );r«   Ústatsmodels.compat.pythonr   Únumpyr   Úscipy.statsr   Ústatsmodels.tools.decoratorsr   Úscipy.specialr   r   r$   rJ   rZ   Údminus_st70_uppr]   rb   ri   ro   rs   r¢   r|   r†   rÃ   rË   râ   rä   ræ   r¨   rƒ   rñ   rô   r8   rº   rÀ   r¥   r¸   rÁ   r¶   r¯   r·   r¾   rU   r˜   r¿   ÚrandomÚrandnr¹   rR   rÂ   r»   r–   rÚ   ÚbtÚfloorÚastyper×   Ú
quantindex)rÁ   s   0r#   ú<module>r     sÌ  ðñõ& +Û å %å 7å .òZó~Y8ò|'ð !€ò'ò'ò'ò'ò'ð €	ð ØØ
Ø
ØØØ
ñ€	ˆ/Ñ ò8ñ RÙNÙ
Lñ€	ˆ'Ñ ð Ð
ð€	ˆ.Ñ ÷~=ñ ~=óN.ó"ó..*ód÷:?ñ ?ð& ˆzÓÝà
'‰'+‰+a˜cˆ+Ó
"€CÙ	ˆ.ÔÙ	‰&fÓ
ÔÙˆsFÓ€DÙ	ˆ$-‰-‹/ÔâC€HØò 6ˆÙˆb$—-‘-  OÓ4Õ5ð6ñ 
Ð
$Ô%Ý'á˜$Ó€GØ€DÙ3‹Zò IˆØi‰io‰o˜dÓ#ˆÙ3˜ÓˆØò 	IˆBØB‰K×Ñ˜tŸ}™}¨R°ÓAÀ!ÑDÀQÑGÕHñ	IðIð ˆRX‰X¨XÖ6 rw˜r“{Ò6Ó7€FÙ	ˆ+x—}‘} XÓ.Ô/Ù	ˆ*v ‘}×*Ñ*¨1Ó-Ô.Ù	ˆ*v ‘}×*Ñ*¨1Ó-Ô.Ù	ˆ*v ‘|×)Ñ)¨!Ó,Ô-á
Ñ1°6ÀÕDà€DØ€DÙ	‘7“9 5¨t¸$ÀdÔ	K€BØ—‘˜$  §¡Ò*;Ó!<Ñ<Ó=×DÑDÀSÓI€JÙ	ˆ"ˆZ‰.ÔððQ ùò0 7s   ÆI1