some new features

2025-07-30 17:09:11 +03:00
parent db5d46760a
commit 8019bd3b7c
20616 changed files with 4375466 additions and 8 deletions
--- a/.venv/lib/python3.12/site-packages/statsmodels/stats/base.py
+++ b/.venv/lib/python3.12/site-packages/statsmodels/stats/base.py
@ -0,0 +1,128 @@
+"""Base classes for statistical test results
+
+Created on Mon Apr 22 14:03:21 2013
+
+Author: Josef Perktold
+"""
+from statsmodels.compat.python import lzip
+import numpy as np
+from statsmodels.tools.testing import Holder
+
+
+class HolderTuple(Holder):
+    """Holder class with indexing
+
+    """
+
+    def __init__(self, tuple_=None, **kwds):
+        super().__init__(**kwds)
+        if tuple_ is not None:
+            self.tuple = tuple(getattr(self, att) for att in tuple_)
+        else:
+            self.tuple = (self.statistic, self.pvalue)
+
+    def __iter__(self):
+        yield from self.tuple
+
+    def __getitem__(self, idx):
+        return self.tuple[idx]
+
+    def __len__(self):
+        return len(self.tuple)
+
+    def __array__(self, dtype=None, copy=True):
+        return np.array(list(self.tuple), dtype=dtype, copy=copy)
+
+
+class AllPairsResults:
+    '''Results class for pairwise comparisons, based on p-values
+
+    Parameters
+    ----------
+    pvals_raw : array_like, 1-D
+        p-values from a pairwise comparison test
+    all_pairs : list of tuples
+        list of indices, one pair for each comparison
+    multitest_method : str
+        method that is used by default for p-value correction. This is used
+        as default by the methods like if the multiple-testing method is not
+        specified as argument.
+    levels : {list[str], None}
+        optional names of the levels or groups
+    n_levels : None or int
+        If None, then the number of levels or groups is inferred from the
+        other arguments. It can be explicitly specified, if the inferred
+        number is incorrect.
+
+    Notes
+    -----
+    This class can also be used for other pairwise comparisons, for example
+    comparing several treatments to a control (as in Dunnet's test).
+
+    '''
+
+    def __init__(self, pvals_raw, all_pairs, multitest_method='hs',
+                 levels=None, n_levels=None):
+        self.pvals_raw = pvals_raw
+        self.all_pairs = all_pairs
+        if n_levels is None:
+            # for all_pairs nobs*(nobs-1)/2
+            self.n_levels = np.max(all_pairs) + 1
+        else:
+            self.n_levels = n_levels
+
+        self.multitest_method = multitest_method
+        self.levels = levels
+        if levels is None:
+            self.all_pairs_names = [
+                f'{pairs!r}' for pairs in all_pairs
+            ]
+        else:
+            self.all_pairs_names = [
+                '{}-{}'.format(
+                    levels[pairs[0]], levels[pairs[1]]
+                ) for pairs in all_pairs
+            ]
+
+    def pval_corrected(self, method=None):
+        '''p-values corrected for multiple testing problem
+
+        This uses the default p-value correction of the instance stored in
+        ``self.multitest_method`` if method is None.
+
+        '''
+        import statsmodels.stats.multitest as smt
+        if method is None:
+            method = self.multitest_method
+        # TODO: breaks with method=None
+        return smt.multipletests(self.pvals_raw, method=method)[1]
+
+    def __str__(self):
+        return self.summary()
+
+    def pval_table(self):
+        '''create a (n_levels, n_levels) array with corrected p_values
+
+        this needs to improve, similar to R pairwise output
+        '''
+        k = self.n_levels
+        pvals_mat = np.zeros((k, k))
+        # if we do not assume we have all pairs
+        pvals_mat[lzip(*self.all_pairs)] = self.pval_corrected()
+        return pvals_mat
+
+    def summary(self):
+        '''returns text summarizing the results
+
+        uses the default pvalue correction of the instance stored in
+        ``self.multitest_method``
+        '''
+        import statsmodels.stats.multitest as smt
+        maxlevel = max(len(ss) for ss in self.all_pairs_names)
+
+        text = ('Corrected p-values using %s p-value correction\n\n'
+                % smt.multitest_methods_names[self.multitest_method])
+        text += 'Pairs' + (' ' * (maxlevel - 5 + 1)) + 'p-values\n'
+        text += '\n'.join(f'{pairs}  {pv:6.4g}' for (pairs, pv) in
+                          zip(self.all_pairs_names, self.pval_corrected()))
+        return text