Skip to content

Commit 980ce50

Browse files
authored
Merge pull request #1178 from Giskard-AI/task/GSK-1078
[GSK-1078] Correlation detector
2 parents e0de872 + d4ae7ae commit 980ce50

17 files changed

Lines changed: 420 additions & 71 deletions

python-client/giskard/core/model_validation.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -72,7 +72,7 @@ def _do_validate_model(model: BaseModel, validate_ds: Optional[Dataset] = None):
7272
else: # Classification with target = None
7373
validate_model_execution(model, validate_ds)
7474

75-
if model.meta.model_type == SupportedModelTypes.CLASSIFICATION:
75+
if model.meta.model_type == SupportedModelTypes.CLASSIFICATION and validate_ds.target is not None:
7676
validate_order_classifcation_labels(model, validate_ds)
7777

7878

python-client/giskard/scanner/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -12,6 +12,7 @@
1212
".stochasticity.stochasticity_detector",
1313
".calibration.overconfidence_detector",
1414
".calibration.underconfidence_detector",
15+
".correlation.spurious_correlation_detector",
1516
".llm.toxicity_detector",
1617
]
1718

python-client/giskard/scanner/calibration/underconfidence_detector.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,8 @@
1414

1515
@detector(name="underconfidence", tags=["underconfidence", "classification"])
1616
class UnderconfidenceDetector(LossBasedDetector):
17+
_needs_target = False
18+
1719
def __init__(self, threshold=0.1, p_threshold=0.95, method="tree"):
1820
self.threshold = threshold
1921
self.p_threshold = p_threshold

python-client/giskard/scanner/common/examples.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,9 @@ def get_examples_dataframe(self, n=3, with_prediction: Union[int, bool] = 1):
2222
examples = dataset.df.copy()
2323

2424
# Keep only interesting columns
25-
cols_to_show = issue.features + [issue.dataset.target]
25+
cols_to_show = issue.features
26+
if issue.dataset.target is not None:
27+
cols_to_show += [issue.dataset.target]
2628
examples = examples.loc[:, cols_to_show]
2729

2830
# If metadata slice, add the metadata column
@@ -54,7 +56,10 @@ def get_examples_dataframe(self, n=3, with_prediction: Union[int, bool] = 1):
5456
else:
5557
pred_examples = model_pred.prediction
5658

57-
examples[f"Predicted `{issue.dataset.target}`"] = pred_examples
59+
predicted_label = "Predicted"
60+
if issue.dataset.target is not None:
61+
predicted_label += f" `{issue.dataset.target}`"
62+
examples[predicted_label] = pred_examples
5863

5964
n = min(len(examples), n)
6065
if n > 0:

python-client/giskard/scanner/common/loss_based_detector.py

Lines changed: 16 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -4,13 +4,12 @@
44
from typing import Sequence
55
from abc import abstractmethod
66

7+
from ...slicing.slice_finder import SliceFinder
8+
79
from ..registry import Detector
810

911
from ...models.base import BaseModel
1012
from ...datasets.base import Dataset
11-
from ...slicing.utils import get_slicer
12-
from ...slicing.text_slicer import TextSlicer
13-
from ...slicing.category_slicer import CategorySlicer
1413
from ...ml_worker.testing.registry.slicing_function import SlicingFunction
1514
from ..logger import logger
1615
from ..issues import Issue
@@ -21,7 +20,13 @@ class LossBasedDetector(Detector):
2120
MAX_DATASET_SIZE = 10_000_000
2221
LOSS_COLUMN_NAME = "__gsk__loss"
2322

23+
_needs_target = True
24+
2425
def run(self, model: BaseModel, dataset: Dataset):
26+
if self._needs_target and dataset.target is None:
27+
logger.info(f"{self.__class__.__name__}: Skipping detection because the dataset has no target column.")
28+
return []
29+
2530
logger.info(f"{self.__class__.__name__}: Running")
2631

2732
# Check if we have enough data to run the scan
@@ -48,8 +53,7 @@ def run(self, model: BaseModel, dataset: Dataset):
4853
# Find slices
4954
logger.info(f"{self.__class__.__name__}: Finding data slices")
5055
start = perf_counter()
51-
dataset_to_slice = dataset.select_columns(model.meta.feature_names) if model.meta.feature_names else dataset
52-
slices = self._find_slices(dataset_to_slice, meta)
56+
slices = self._find_slices(model, dataset, meta)
5357
elapsed = perf_counter() - start
5458
logger.info(
5559
f"{self.__class__.__name__}: {len(slices)} slices found (took {datetime.timedelta(seconds=elapsed)})"
@@ -70,7 +74,9 @@ def run(self, model: BaseModel, dataset: Dataset):
7074
def _numerical_slicer_method(self):
7175
return "tree"
7276

73-
def _find_slices(self, dataset: Dataset, meta: pd.DataFrame):
77+
def _find_slices(self, model: BaseModel, dataset: Dataset, meta: pd.DataFrame):
78+
features = model.meta.feature_names or dataset.columns.drop(dataset.target, errors="ignore")
79+
7480
df_with_meta = dataset.df.join(meta, how="right")
7581

7682
column_types = dataset.column_types.copy()
@@ -85,28 +91,10 @@ def _find_slices(self, dataset: Dataset, meta: pd.DataFrame):
8591
# For performance
8692
dataset_with_meta.load_metadata_from_instance(dataset.column_meta)
8793

88-
# Columns by type
89-
cols_by_type = {
90-
type_val: [col for col, col_type in dataset.column_types.items() if col_type == type_val]
91-
for type_val in ["numeric", "category", "text"]
92-
}
93-
94-
# Numerical features
95-
slicer = get_slicer(self._numerical_slicer_method, dataset_with_meta, self.LOSS_COLUMN_NAME)
96-
97-
slices = []
98-
for col in cols_by_type["numeric"]:
99-
slices.extend(slicer.find_slices([col]))
100-
101-
# Categorical features
102-
slicer = CategorySlicer(dataset_with_meta, target=self.LOSS_COLUMN_NAME)
103-
for col in cols_by_type["category"]:
104-
slices.extend(slicer.find_slices([col]))
105-
106-
# Text features
107-
slicer = TextSlicer(dataset_with_meta, target=self.LOSS_COLUMN_NAME, slicer=self._numerical_slicer_method)
108-
for col in cols_by_type["text"]:
109-
slices.extend(slicer.find_slices([col]))
94+
# Find slices
95+
sf = SliceFinder(numerical_slicer=self._numerical_slicer_method)
96+
sliced = sf.run(dataset_with_meta, features, target=self.LOSS_COLUMN_NAME)
97+
slices = sum(sliced.values(), start=[])
11098

11199
# Keep only slices of size at least 5% of the dataset or 20 samples (whatever is larger)
112100
slices = [s for s in slices if max(0.05 * len(dataset), 20) <= len(dataset_with_meta.slice(s))]
Lines changed: 151 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,151 @@
1+
from dataclasses import dataclass
2+
import pandas as pd
3+
from sklearn.metrics import adjusted_mutual_info_score, mutual_info_score
4+
from scipy import stats
5+
6+
from ..common.examples import ExampleExtractor
7+
from ...ml_worker.testing.registry.slicing_function import SlicingFunction
8+
from ..issues import Issue
9+
from ...slicing.slice_finder import SliceFinder
10+
from ..logger import logger
11+
from ...datasets.base import Dataset
12+
from ...models.base import BaseModel
13+
from ..registry import Detector
14+
from ..decorators import detector
15+
16+
17+
@detector(name="spurious_correlation", tags=["spurious_correlation", "classification"])
18+
class SpuriousCorrelationDetector(Detector):
19+
def __init__(self, method="theil", threshold=0.5) -> None:
20+
self.threshold = threshold
21+
self.method = method
22+
23+
def run(self, model: BaseModel, dataset: Dataset):
24+
logger.info(f"{self.__class__.__name__}: Running")
25+
26+
# Dataset prediction
27+
ds_predictions = pd.Series(model.predict(dataset).prediction, dataset.df.index)
28+
29+
# Keep only interesting features
30+
features = model.meta.feature_names or dataset.columns.drop(dataset.target, errors="ignore")
31+
32+
# Warm up text metadata
33+
for f in features:
34+
if dataset.column_types[f] == "text":
35+
dataset.column_meta[f, "text"]
36+
37+
# Prepare dataset for slicing
38+
df = dataset.df.copy()
39+
if dataset.target is not None:
40+
df.drop(columns=dataset.target, inplace=True)
41+
df["__gsk__target"] = pd.Categorical(ds_predictions)
42+
wdata = Dataset(df, target="__gsk__target", column_types=dataset.column_types)
43+
wdata.load_metadata_from_instance(dataset.column_meta)
44+
45+
# Find slices
46+
sliced_cols = SliceFinder("tree").run(wdata, features, target=wdata.target)
47+
48+
measure_fn, measure_name = self._get_measure_fn()
49+
issues = []
50+
for col, slices in sliced_cols.items():
51+
if not slices:
52+
continue
53+
54+
for slice_fn in slices:
55+
data_slice = dataset.slice(slice_fn)
56+
57+
# Skip small slices
58+
if len(data_slice) < 20 or len(data_slice) < 0.05 * len(dataset):
59+
continue
60+
61+
dx = pd.DataFrame(
62+
{
63+
"feature": dataset.df.index.isin(data_slice.df.index).astype(int),
64+
"prediction": ds_predictions,
65+
},
66+
index=dataset.df.index,
67+
)
68+
dx.dropna(inplace=True)
69+
70+
metric_value = measure_fn(dx.feature, dx.prediction)
71+
logger.info(f"{self.__class__.__name__}: {slice_fn}\tAssociation = {metric_value:.3f}")
72+
73+
if metric_value > self.threshold:
74+
predictions = dx[dx.feature > 0].prediction.value_counts(normalize=True)
75+
info = SpuriousCorrelationInfo(col, slice_fn, metric_value, measure_name, predictions)
76+
issues.append(SpuriousCorrelationIssue(model, dataset, "info", info))
77+
78+
return issues
79+
80+
def _get_measure_fn(self):
81+
if self.method == "theil":
82+
return _theil_u, "Theil's U"
83+
if self.method == "mutual_information" or self.method == "mi":
84+
return _mutual_information, "Mutual information"
85+
if self.method == "cramer":
86+
return _cramer_v, "Cramer's V"
87+
raise ValueError(f"Unknown method `{self.method}`")
88+
89+
90+
def _cramer_v(x, y):
91+
ct = pd.crosstab(x, y)
92+
return stats.contingency.association(ct, method="cramer")
93+
94+
95+
def _mutual_information(x, y):
96+
return adjusted_mutual_info_score(x, y)
97+
98+
99+
def _theil_u(x, y):
100+
return mutual_info_score(x, y) / stats.entropy(pd.Series(y).value_counts(normalize=True))
101+
102+
103+
@dataclass
104+
class SpuriousCorrelationInfo:
105+
feature: str
106+
slice_fn: SlicingFunction
107+
metric_value: float
108+
metric_name: str
109+
predictions: pd.DataFrame
110+
111+
112+
class SpuriousCorrelationIssue(Issue):
113+
group = "Spurious correlation"
114+
115+
@property
116+
def features(self):
117+
return [self.info.feature]
118+
119+
@property
120+
def domain(self) -> str:
121+
return str(self.info.slice_fn)
122+
123+
@property
124+
def metric(self) -> str:
125+
return f"Nominal association ({self.info.metric_name})"
126+
127+
@property
128+
def deviation(self) -> str:
129+
plabel, p = self.info.predictions.index[0], self.info.predictions.iloc[0]
130+
131+
return f"Prediction {self.dataset.target} = `{plabel}` for {p * 100:.2f}% of samples in the slice"
132+
133+
@property
134+
def slicing_fn(self):
135+
return self.info.slice_fn
136+
137+
@property
138+
def description(self) -> str:
139+
pred = self.model.predict(self.dataset.slice(self.info.slice_fn)).prediction
140+
classes = pd.Series(pred).value_counts(normalize=True)
141+
plabel, p = classes.index[0], classes.iloc[0]
142+
return f"Data slice {self.info.slice_fn} seems to be highly associated to prediction {self.dataset.target} = `{plabel}` ({p * 100:.2f}% of predictions in the data slice)."
143+
144+
# @lru_cache
145+
def examples(self, n=3):
146+
extractor = ExampleExtractor(self)
147+
return extractor.get_examples_dataframe(n, with_prediction=1)
148+
149+
@property
150+
def importance(self) -> float:
151+
return self.info.metric_value

python-client/giskard/scanner/result.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -46,10 +46,13 @@ def _repr_html_(self):
4646
issues=self.issues,
4747
issues_by_group=issues_by_group,
4848
num_major_issues={
49-
group: len([i for i in issues if i.is_major]) for group, issues in issues_by_group.items()
49+
group: len([i for i in issues if i.level == "major"]) for group, issues in issues_by_group.items()
5050
},
5151
num_medium_issues={
52-
group: len([i for i in issues if not i.is_major]) for group, issues in issues_by_group.items()
52+
group: len([i for i in issues if i.level == "medium"]) for group, issues in issues_by_group.items()
53+
},
54+
num_info_issues={
55+
group: len([i for i in issues if i.level == "info"]) for group, issues in issues_by_group.items()
5356
},
5457
)
5558

Lines changed: 37 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,37 @@
1+
<tr class="gsk-issue text-sm group peer text-left cursor-pointer hover:bg-zinc-700">
2+
<td class="p-3">
3+
<code class="mono text-blue-300">
4+
{{issue.domain|replace("&", "<br>")|safe}}
5+
</code>
6+
</td>
7+
<td class="p-3">
8+
{{ issue.metric }} = {{ issue.info.metric_value|format_metric }}
9+
</td>
10+
<td class="p-3 text-amber-200">
11+
{{ issue.deviation }}
12+
</td>
13+
<td class="p-3">
14+
<span class="text-gray-400">
15+
<!-- {{ issue.description }} -->
16+
</span>
17+
</td>
18+
<td class="p-3 text-xs text-right space-x-1">
19+
<a href="#"
20+
class="gsk-issue-detail-btn inline-block group-[.open]:hidden border border-zinc-100/50 text-zinc-100/90 hover:bg-zinc-500 hover:border-zinc-500 hover:text-white px-2 py-0.5 rounded-sm">Show details</a>
21+
<a href="#"
22+
class="hidden group-[.open]:inline-block gsk-issue-detail-btn border border-zinc-500 text-zinc-100/90 bg-zinc-500 hover:bg-zinc-400 hover:text-white px-2 py-0.5 rounded-sm">Hide details</a>
23+
</td>
24+
</tr>
25+
<tr class="gsk-issue-detail text-left collapse peer-[.open]:visible border-b border-zinc-500 bg-zinc-700">
26+
<td colspan="5" class="p-3">
27+
<h4 class="font-bold text-sm">Description</h4>
28+
{{ issue.description | safe }}
29+
30+
{% if issue.examples(3)|length %}
31+
<h4 class="font-bold text-sm mt-4">Examples</h4>
32+
<div class="text-white max-w-xl text-sm overflow-scroll" style="max-width: 920px">
33+
{{ issue.examples(3).to_html(notebook=True) | replace("\\n", "<br>") | safe }}
34+
</div>
35+
{% endif %}
36+
</td>
37+
</tr>

python-client/giskard/scanner/templates/_issues_table.html

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,8 @@
1616
{% include "_issues/stochasticity.html" %}
1717
{% elif issue.__class__.__name__ == 'LLMToxicityIssue' %}
1818
{% include "_issues/llm_toxicity.html" %}
19+
{% elif issue.__class__.__name__ == 'SpuriousCorrelationIssue' %}
20+
{% include "_issues/spurious_correlation.html" %}
1921
{% else %}
2022
{% include "_issues/default.html" %}
2123
{% endif %}

python-client/giskard/scanner/templates/_main_content.html

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -85,6 +85,12 @@
8585
Your model seems to exhibit offensive behaviour when we use adversarial “Do Anything Now” (DAN)
8686
prompts.
8787
</p>
88+
{% elif issues[0].__class__.__name__ == "SpuriousCorrelationIssue" %}
89+
<p>
90+
We found potential spurious correlations between your data and the model predictions. Spurious
91+
correlations may occur when the model overfits on relations that are not causal. We recommend that you
92+
verify the causal relationship between the detected data slices and the target variable.
93+
</p>
8894
{% else %}
8995
<p>Found issues for {{ issues[0].group }}</p>
9096
{% endif %}
@@ -101,6 +107,10 @@ <h2 class="uppercase my-4 mr-2 font-medium">Issues</h2>
101107
<span class="text-xs border rounded px-1 uppercase text-amber-200 border-amber-200">{{num_medium_issues[group]}}
102108
medium</span>
103109
{% endif %}
110+
{% if num_info_issues[group] > 0 %}
111+
<span class="text-xs border rounded px-1 uppercase text-blue-200 border-blue-200">{{num_info_issues[group]}}
112+
info</span>
113+
{% endif %}
104114
</div>
105115

106116
{% include "_issues_table.html" %}

0 commit comments

Comments (0)