fix(plot): validate input shape in beeswarm_plot and sentence_plot

claude · claude · commit 038319404718 · 2026-04-20T19:51:18.000Z
Both functions previously accepted malformed input silently: (1) beeswarm_plot with data.shape[1] != n_players would plot a subset of the columns or scramble them without warning; (2) sentence_plot with len(words) != n_players would index past the InteractionValues or silently drop entries. Each function now raises a ValueError with a clear message when the sizes do not match. This also re-enables the two previously dropped edge-case tests in TestPlotEdgeCases. https://claude.ai/code/session_01DHsGf4an1Dnnw4qTnmdB22
diff --git a/src/shapiq/plot/beeswarm.py b/src/shapiq/plot/beeswarm.py
@@ -202,6 +202,12 @@ def beeswarm_plot(
     n_samples = len(data)
     n_players = interaction_values_list[0].n_players
 
+    if data.shape[1] != n_players:
+        error_message = (
+            f"data must have {n_players} columns to match n_players, but got {data.shape[1]}."
+        )
+        raise ValueError(error_message)
+
     if feature_names is not None:
         if abbreviate:
             feature_names = abbreviate_feature_names(feature_names)
diff --git a/src/shapiq/plot/sentence.py b/src/shapiq/plot/sentence.py
@@ -91,6 +91,13 @@ def sentence_plot(
         :align: center
 
     """
+    if len(words) != interaction_values.n_players:
+        error_message = (
+            f"Number of words ({len(words)}) must match "
+            f"interaction_values.n_players ({interaction_values.n_players})."
+        )
+        raise ValueError(error_message)
+
     # set all the size parameters
     fontsize = 20
     word_spacing = 15
diff --git a/tests/shapiq/test_plots.py b/tests/shapiq/test_plots.py
@@ -421,3 +421,17 @@ def test_max_display_below_n_features(self, sample_iv):
             max_display=2,
         )
         assert ax is not None
+
+    def test_sentence_plot_word_count_mismatch_raises(self):
+        """``sentence_plot`` must raise when len(words) != n_players."""
+        iv = _build_iv(n=3).get_n_order(order=1)
+        with pytest.raises(ValueError, match="must match"):
+            sentence_plot(iv, words=["only-one"])
+        with pytest.raises(ValueError, match="must match"):
+            sentence_plot(iv, words=["a", "b", "c", "d", "e"])
+
+    def test_beeswarm_plot_data_column_mismatch_raises(self, sample_iv_list):
+        """``beeswarm_plot`` must raise when data has wrong number of columns."""
+        bad_data = np.random.default_rng(0).normal(size=(len(sample_iv_list), 99))
+        with pytest.raises(ValueError, match="columns"):
+            beeswarm_plot(sample_iv_list, data=bad_data, show=False)