Merge pull request #11 from lizgehret/mann-whitney-tests

TEST: stats unit tests for mann-whitney-u and wilcoxon-srt
qiime2 · May 3, 2022 · 96d5be8 · 96d5be8
2 parents 85c4cad + 2f2e53b
commit 96d5be8
Show file tree

Hide file tree

Showing 3 changed files with 110 additions and 16 deletions.
diff --git a/q2_fmt/_engraftment.py b/q2_fmt/_engraftment.py
@@ -11,12 +11,6 @@
 
 import qiime2
 
-#TODO: add in control comparison hypothesis
-# Questions from Greg's study
-# Increase in alpha div from baseline
-# Difference in alpha at a single timepoint (week vs. control)
-# Beta: is distance to donor significantly *lower* (not just different) than it was at baseline (week 0, pre-FMT)
-# Beta[donor, subject]_w < Beta[donor, subject]_0
 
 def engraftment(
     ctx, diversity_measure, metadata, hypothesis, time_column,

diff --git a/q2_fmt/_stats.py b/q2_fmt/_stats.py
@@ -26,11 +26,15 @@ def mann_whitney_u(distribution: pd.DataFrame, hypothesis: str,
                                       against_each=against_each)
     elif hypothesis == 'all-pairwise':
         if reference_group is not None:
-            raise ValueError("you are confused, pls try again")
+            raise ValueError("`all-pairwise` was selected as the hypothesis,"
+                             " but a `reference_group` was added. Please either"
+                             " select `reference` as the hypothesis, or remove"
+                             " the `reference_group` parameter from your command.")
         comparisons = _comp_all_pairwise(distribution,
                                          against_each=against_each)
     else:
-        raise ValueError()
+        raise ValueError("Invalid hypothesis. Please either choose `reference` or"
+                         " `all-pairwise` as your hypothesis.")
 
     table = []
     for (idx_a, comp_a), (idx_b, comp_b) in comparisons:
@@ -127,10 +131,14 @@ def wilcoxon_srt(distribution: pd.DataFrame, hypothesis: str,
         comparisons = _comp_baseline(distribution, baseline_group)
     elif hypothesis == 'consecutive':
         if baseline_group is not None:
-            raise ValueError()
+            raise ValueError("`consecutive` was selected as the hypothesis,"
+                             " but a `baseline_group` was added. Please either"
+                             " select `baseline` as the hypothesis, or remove"
+                             " the `baseline_group` parameter from your command.")
         comparisons = _comp_consecutive(distribution)
     else:
-        raise ValueError()
+        raise ValueError("Invalid hypothesis. Please either choose `baseline` or"
+                         " `consecutive` as your hypothesis.")
 
     table = []
     for comp_a, comp_b in comparisons:

diff --git a/q2_fmt/tests/test_engraftment.py b/q2_fmt/tests/test_engraftment.py
@@ -14,7 +14,8 @@
 
 from q2_fmt._engraftment import group_timepoints
 from q2_fmt._stats import wilcoxon_srt, mann_whitney_u
-from q2_fmt._examples import faithpd_timedist_factory
+from q2_fmt._examples import faithpd_timedist_factory, faithpd_refdist_factory
+
 
 class TestBase(TestPluginBase):
     package='q2_fmt.tests'
@@ -29,6 +30,8 @@ def setUp(self):
         self.alpha = pd.read_csv(self.get_data_path('alpha_div.tsv'), sep='\t', index_col=0, squeeze=True)
 
         self.faithpd_timedist = faithpd_timedist_factory().view(pd.DataFrame)
+        self.faithpd_refdist = faithpd_refdist_factory().view(pd.DataFrame)
+
 
 class ErrorMixins:
     def test_with_time_column_input_not_in_metadata(self):
@@ -441,6 +444,10 @@ def test_examples(self):
 
 class TestStats(TestBase):
     # Wilcoxon SRT test cases
+
+    # Data in the exp_stats_data dataframes were pulled from Greg Caporaso's
+    # Autism study repo on github, which can be found here:
+    # https://github.com/caporaso-lab/autism-fmt1/blob/18-month-followup/16S/engraftment.ipynb
     def test_wilcoxon_with_faith_pd_baseline0_asymptotic(self):
         exp_stats_data = pd.DataFrame({
             'A:group': [0.0, 0.0, 0.0, 0.0],
@@ -476,13 +483,98 @@ def test_wilcoxon_with_faith_pd_consecutive_asymptotic(self):
 
         stats_data = wilcoxon_srt(distribution=self.faithpd_timedist,
                                   hypothesis='consecutive', p_val_approx='asymptotic')
-        print(stats_data['B:measure'])
+
         pd.testing.assert_frame_equal(stats_data, exp_stats_data)
 
+    def test_wilcoxon_consecutive_hypothesis_with_baseline_group(self):
+        with self.assertRaisesRegex(ValueError, "`consecutive` was selected as the hypothesis,"
+                                    " but a `baseline_group` was added."):
+            wilcoxon_srt(distribution=self.faithpd_timedist,
+                         hypothesis='consecutive', baseline_group='reference')
+
+    def test_wilcoxon_invalid_hypothesis(self):
+        with self.assertRaisesRegex(ValueError, "Invalid hypothesis. Please either choose"
+                                    " `baseline` or `consecutive` as your hypothesis."):
+            wilcoxon_srt(distribution=self.faithpd_timedist, hypothesis='foo')
+
+    def test_wilcoxon_invalid_baseline_group(self):
+        with self.assertRaisesRegex(ValueError, "'foo' was not found as a group"
+                                    " within the distribution."):
+            wilcoxon_srt(distribution=self.faithpd_timedist,
+                         hypothesis='baseline', baseline_group='foo')
+
     # Mann-Whitney U test cases
-    # search for any online refs for datasets with given results to compare
+
+    # Data in the exp_stats_data dataframes were calculated 'by hand' in a jupyter notebook
+    # using the same data, manually organized into groups and subsequently compared using
+    # scipy.stats.mannwhitneyu to calculate the test-statistic and p-values
+    # Notebook can be found here, for reference:
+    # https://gist.github.com/lizgehret/c9add7b451e5e91b1017a2a963276bff
+    def test_mann_whitney_pairwise_against_each(self):
+        exp_stats_data = pd.DataFrame({
+            'A:group': ['control', 'control', 'control', 'control', 'control',
+                        'reference', 'reference', 'reference', 'reference', 'reference'],
+            'A:n': [23, 23, 23, 23, 23, 5, 5, 5, 5, 5],
+            'A:measure': [11.64962736, 11.64962736, 11.64962736, 11.64962736, 11.64962736,
+                          10.24883918, 10.24883918, 10.24883918, 10.24883918, 10.24883918],
+            'B:group': [0, 3, 10, 18, 100, 0, 3, 10, 18, 100],
+            'B:n': [18, 17, 18, 18, 16, 18, 17, 18, 18, 16],
+            'B:measure': [9.54973486, 9.592979726, 10.9817719, 11.39392352, 12.97286672,
+                          9.54973486, 9.592979726, 10.9817719, 11.39392352, 12.97286672],
+            'n': [41, 40, 41, 41, 39, 23, 22, 23, 23, 21],
+            'test-statistic': [282.0, 260.0, 194.0, 190.0, 104.0,
+                               49.0, 43.0, 20.0, 14.0, 6.0],
+            'p-value': [0.050330911733538534, 0.07994303215567311, 0.7426248650660427,
+                        0.6646800940267454, 0.02321456407322841, 0.7941892150565809,
+                        1.0, 0.06783185968744732, 0.023005953105134484,
+                        0.0056718704407604376],
+            'q-value': [0.12582728, 0.13323839, 0.92828108, 0.94954299, 0.07738188,
+                        0.88243246, 1.0, 0.13566372, 0.11502977, 0.0567187],
+        })
+
+        stats_data = mann_whitney_u(distribution=self.faithpd_refdist,
+                                    against_each=self.faithpd_timedist,
+                                    hypothesis='all-pairwise',
+                                    p_val_approx='asymptotic')
+
+        pd.testing.assert_frame_equal(stats_data, exp_stats_data)
+
     def test_mann_whitney_reference(self):
-        pass
+        exp_stats_data = pd.DataFrame({
+            'A:group': ['reference'],
+            'A:n': [5],
+            'A:measure': [10.2488392],
+            'B:group': ['control'],
+            'B:n': [23],
+            'B:measure': [11.6496274],
+            'n': [28],
+            'test-statistic': [37.0],
+            'p-value': [0.23025583],
+            'q-value': [0.23025583],
+        })
+
+        stats_data = mann_whitney_u(distribution=self.faithpd_refdist,
+                                    hypothesis='reference',
+                                    reference_group='reference',
+                                    p_val_approx='asymptotic')
+
+        pd.testing.assert_frame_equal(stats_data, exp_stats_data)
 
-    def test_mann_whitney_pairwise(self):
-        pass
+    def test_mann_whitney_all_pairwise_hypothesis_with_reference_group(self):
+        with self.assertRaisesRegex(ValueError, "`all-pairwise` was selected as the"
+                                    " hypothesis, but a `reference_group` was added."):
+            mann_whitney_u(distribution=self.faithpd_refdist,
+                           hypothesis='all-pairwise',
+                           reference_group='reference')
+
+    def test_mann_whitney_invalid_hypothesis(self):
+        with self.assertRaisesRegex(ValueError, "Invalid hypothesis. Please either"
+                         " choose `reference` or `all-pairwise` as your hypothesis."):
+            mann_whitney_u(distribution=self.faithpd_refdist,
+                           hypothesis='foo')
+
+    def test_mann_whitney_invalid_reference_group(self):
+        with self.assertRaisesRegex(ValueError, "'foo' was not found as a group"
+                                    " within the distribution."):
+            mann_whitney_u(distribution=self.faithpd_refdist,
+                           hypothesis='reference', reference_group='foo')