Quantco · YYYasin19 · Jun 30, 2022 · Jun 23, 2022 · Jun 23, 2022 · Jun 24, 2022
diff --git a/src/datajudge/constraints/stats.py b/src/datajudge/constraints/stats.py
@@ -1,12 +1,12 @@
 import math
 import warnings
-from typing import Any, Optional, Tuple
+from typing import Any, Optional
 
 import sqlalchemy as sa
 
 from .. import db_access
 from ..db_access import DataReference
-from .base import Constraint, OptionalSelections, TestResult
+from .base import Constraint, TestResult
 
 
 class KolmogorovSmirnov2Sample(Constraint):
@@ -16,13 +16,6 @@ def __init__(
         self.significance_level = significance_level
         super().__init__(ref, ref2=ref2)
 
-    def retrieve(
-        self, engine: sa.engine.Engine, ref: DataReference
-    ) -> Tuple[Any, OptionalSelections]:
-        sel = ref.get_selection(engine)  # table selection incl. WHERE condition
-        col = ref.get_column(engine)  # column name
-        return sel, col
-
     @staticmethod
     def approximate_p_value(
         d: float, n_samples: int, m_samples: int
@@ -56,12 +49,12 @@ def approximate_p_value(
     @staticmethod
     def check_acceptance(
         d_statistic: float, n_samples: int, m_samples: int, accepted_level: float
-    ):
+    ) -> bool:
         """
         For a given test statistic, d, and the respective sample sizes `n` and `m`, this function
         checks whether the null hypothesis can be rejected for an accepted significance level.
 
-        For more information, check out the `Wikipedia entry <https://w.wiki/5May>`.
+        For more information, check out the `Wikipedia entry <https://w.wiki/5May>`_.
         """
 
         def c(alpha: float):
@@ -72,24 +65,26 @@ def c(alpha: float):
         )
 
     @staticmethod
-    def calculate_statistic(engine, table1, table2) -> Any:
+    def calculate_statistic(engine, table1_def: tuple, table2_def: tuple) -> Any:
 
         # retrieve test statistic d, as well as sample sizes m and n
-        d_statistic, m, n = db_access.get_ks_2sample(
-            engine, table1=table1, table2=table2
+        d_statistic, n_samples, m_samples = db_access.get_ks_2sample(
+            engine, table1=table1_def, table2=table2_def
         )
 
         # calculate approximate p-value
-        p_value = KolmogorovSmirnov2Sample.approximate_p_value(d_statistic, m, n)
+        p_value = KolmogorovSmirnov2Sample.approximate_p_value(
+            d_statistic, n_samples, m_samples
+        )
 
-        return d_statistic, p_value, n, m
+        return d_statistic, p_value, n_samples, m_samples
 
     def test(self, engine: sa.engine.Engine) -> TestResult:
 
         # get query selections and column names for target columns
-        selection1 = str(self.ref.data_source.get_clause(engine))
+        selection1 = self.ref.data_source.get_clause(engine)
         column1 = self.ref.get_column(engine)
-        selection2 = str(self.ref2.data_source.get_clause(engine))
+        selection2 = self.ref2.data_source.get_clause(engine)
         column2 = self.ref2.get_column(engine)
 
         d_statistic, p_value, n_samples, m_samples = self.calculate_statistic(
@@ -105,11 +100,11 @@ def test(self, engine: sa.engine.Engine) -> TestResult:
             f"Null hypothesis (H0) for the 2-sample Kolmogorov-Smirnov test was rejected, i.e., "
             f"the two samples ({self.ref.get_string()} and {self.target_prefix})"
             f" do not originate from the same distribution."
+            f" The test results are d={d_statistic}"
         )
-        if p_value:
-            assertion_text += f"\n p-value: {p_value}"
+        if p_value is not None:
+            assertion_text += f" and {p_value=}"
 
-        # store values s.t. they can be checked later
         if not result:
             return TestResult.failure(assertion_text)
 

diff --git a/src/datajudge/db_access.py b/src/datajudge/db_access.py
@@ -908,16 +908,14 @@ def get_ks_2sample(engine: sa.engine.Engine, table1: tuple, table2: tuple):
     """
     Runs the query for the two-sample Kolmogorov-Smirnov test and returns the test statistic d.
     """
-    table1_selection, col1 = table1
-    table2_selection, col2 = table2
-
-    if is_mssql(engine):
-        table1_selection = str(table1_selection).replace(
-            '"', ""
-        )  # tempdb.dbo.int_table
-        table2_selection = str(table2_selection).replace(
-            '"', ""
-        )  # "tempdb.dbo".int_table
+
+    # make sure we have a string representation here
+    table1_selection, col1 = str(table1[0]), str(table1[1])
+    table2_selection, col2 = str(table2[0]), str(table2[1])
+
+    if is_mssql(engine):  # "tempdb.dbo".table_name -> tempdb.dbo.table_name
+        table1_selection = table1_selection.replace('"', "")
+        table2_selection = table2_selection.replace('"', "")
 
     # for RawQueryDataSource this could be a whole subquery and will therefore need to be wrapped
     if "SELECT" in table1_selection:

diff --git a/tests/integration/test_integration.py b/tests/integration/test_integration.py
@@ -3,7 +3,6 @@
 import pytest
 
 import datajudge.requirements as requirements
-from datajudge import db_access
 from datajudge.constraints.stats import KolmogorovSmirnov2Sample
 from datajudge.db_access import (
     Condition,
@@ -1856,9 +1855,9 @@ def test_ks_2sample_implementation(engine, random_normal_table, configuration):
     ref2 = DataReference(tds, columns=[col_2])
 
     # retrieve table selections from data references
-    selection1 = str(ref.data_source.get_clause(engine))
+    selection1 = ref.data_source.get_clause(engine)
     column1 = ref.get_column(engine)
-    selection2 = str(ref2.data_source.get_clause(engine))
+    selection2 = ref2.data_source.get_clause(engine)
     column2 = ref2.get_column(engine)
 
     (
@@ -1870,10 +1869,6 @@ def test_ks_2sample_implementation(engine, random_normal_table, configuration):
         engine, (selection1, column1), (selection2, column2)
     )
 
-    # compare with scipy implementation
-    data1, _ = db_access.get_column(engine, ref)
-    data2, _ = db_access.get_column(engine, ref2)
-
     assert (
         abs(d_statistic - expected_d) <= 1e-10
     ), f"The test statistic does not match: {expected_d} vs {d_statistic}"