From 6914faf82f13b162431f9e750b08bcdea5328b70 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 3 Jun 2025 17:24:40 +0000
Subject: [PATCH 1/2] Initial plan for issue


From 6cbedfde5b71db144c143d79c0b7e2fe5fd7ba71 Mon Sep 17 00:00:00 2001
From: "copilot-swe-agent[bot]" <198982749+Copilot@users.noreply.github.com>
Date: Tue, 3 Jun 2025 17:33:28 +0000
Subject: [PATCH 2/2] Implement dynamic color scaling with mean/std
 normalization

Co-authored-by: eh-main-bot <171766998+eh-main-bot@users.noreply.github.com>
---
 tab_right/plotting/plot_segmentations.py  | 173 +++++++++++++++++++---
 tests/plotting/test_plot_segmentations.py |  90 +++++++++++
 2 files changed, 242 insertions(+), 21 deletions(-)

diff --git a/tab_right/plotting/plot_segmentations.py b/tab_right/plotting/plot_segmentations.py
index 6569159..ae57495 100644
--- a/tab_right/plotting/plot_segmentations.py
+++ b/tab_right/plotting/plot_segmentations.py
@@ -42,6 +42,51 @@
 ColorMap = Union[str, list]
 
 
+def normalize_scores(scores: np.ndarray, method: str = "minmax", k: float = 2.0) -> np.ndarray:
+    """Normalize scores to the [0, 1] range for color mapping, ignoring NaN entries.
+
+    Parameters
+    ----------
+    scores : np.ndarray
+        Array of scores to normalize. May be empty or contain NaN values.
+    method : str, default="minmax"
+        Scaling method to use. Options:
+        - "minmax": Min-max normalization using actual min and max values
+        - "std": Standard deviation based scaling using mean ± k*std
+    k : float, default=2.0
+        Number of standard deviations to use for "std" method scaling range.
+
+    Returns
+    -------
+    np.ndarray
+        Float array shaped like ``scores`` with values in [0, 1]; NaN inputs stay NaN.
+
+    Raises
+    ------
+    ValueError
+        If an unknown scaling method is provided.
+
+    """
+    if method not in ("minmax", "std"):
+        raise ValueError(f"Unknown method: {method}. Supported methods are 'minmax' and 'std'.")
+
+    values = np.asarray(scores, dtype=float)  # float output even for integer input
+    missing = np.isnan(values)
+    valid = values[~missing]
+    if valid.size == 0:  # empty or all-NaN input: nothing to scale
+        return values.copy()
+
+    if method == "std":
+        center, spread = valid.mean(), k * valid.std()
+        vmin, vmax = center - spread, center + spread
+    else:
+        vmin, vmax = valid.min(), valid.max()
+    if vmax - vmin == 0:  # zero spread: avoid division by zero, map valid entries to 0
+        return np.where(missing, np.nan, 0.0)
+    # Clip to the computed range (NaN passes through np.clip) and rescale to [0, 1]
+    return (np.clip(values, vmin, vmax) - vmin) / (vmax - vmin)
+
+
 def _prepare_data(df: pd.DataFrame) -> pd.DataFrame:
     """Prepare data for segmentation plotting by sorting.
 
@@ -86,7 +131,13 @@ def _get_color_scheme(lower_is_better: bool = True, backend: Backend = "plotly")
         return {"cmap": "RdYlGn"}  # Red (low/bad) to Green (high/good)
 
 
-def plot_single_segmentation(df: pd.DataFrame, lower_is_better: bool = True, backend: Backend = "plotly") -> Figure:
+def plot_single_segmentation(
+    df: pd.DataFrame,
+    lower_is_better: bool = True,
+    backend: Backend = "plotly",
+    scaling_method: str = "minmax",
+    scaling_k: float = 2.0,
+) -> Figure:
     """Plot the single segmentation of a given DataFrame as a bar chart.
 
     This function can use either Plotly or Matplotlib as backend.
@@ -99,6 +150,10 @@ def plot_single_segmentation(df: pd.DataFrame, lower_is_better: bool = True, bac
         Whether lower values of the metric indicate better performance.
     backend : str, default="plotly"
         The plotting backend to use. Either "plotly" or "matplotlib".
+    scaling_method : str, default="minmax"
+        Method for scaling colors. Options: "minmax" or "std".
+    scaling_k : float, default=2.0
+        Number of standard deviations for "std" scaling method.
 
     Returns
     -------
@@ -107,12 +162,14 @@ def plot_single_segmentation(df: pd.DataFrame, lower_is_better: bool = True, bac
 
     """
     if backend == "plotly":
-        return _plot_single_segmentation_plotly(df, lower_is_better)
+        return _plot_single_segmentation_plotly(df, lower_is_better, scaling_method, scaling_k)
     else:
-        return _plot_single_segmentation_matplotlib(df, lower_is_better)
+        return _plot_single_segmentation_matplotlib(df, lower_is_better, scaling_method, scaling_k)
 
 
-def _plot_single_segmentation_plotly(df: pd.DataFrame, lower_is_better: bool = True) -> PlotlyFigure:
+def _plot_single_segmentation_plotly(
+    df: pd.DataFrame, lower_is_better: bool = True, scaling_method: str = "minmax", scaling_k: float = 2.0
+) -> PlotlyFigure:
     """Implement the single segmentation plot as a Plotly bar chart.
 
     Parameters
@@ -121,6 +178,10 @@ def _plot_single_segmentation_plotly(df: pd.DataFrame, lower_is_better: bool = T
         See module docstring for format details.
     lower_is_better : bool, default=True
         Whether lower values of the metric indicate better performance.
+    scaling_method : str, default="minmax"
+        Method for scaling colors. Options: "minmax" or "std".
+    scaling_k : float, default=2.0
+        Number of standard deviations for "std" scaling method.
 
     Returns
     -------
@@ -134,6 +195,9 @@ def _plot_single_segmentation_plotly(df: pd.DataFrame, lower_is_better: bool = T
     # Get color scheme
     color_scheme = _get_color_scheme(lower_is_better, "plotly")
 
+    # Normalize scores for color mapping
+    normalized_scores = normalize_scores(df_sorted["score"].values, method=scaling_method, k=scaling_k)
+
     # Create a bar chart
     fig = go.Figure(
         data=[
@@ -141,7 +205,7 @@ def _plot_single_segmentation_plotly(df: pd.DataFrame, lower_is_better: bool = T
                 x=df_sorted["segment_name"].astype(str),
                 y=df_sorted["score"],
                 marker=dict(
-                    color=df_sorted["score"],
+                    color=normalized_scores,
                     colorscale=color_scheme["colorscale"],
                     colorbar=dict(title="Score"),
                 ),
@@ -163,7 +227,9 @@ def _plot_single_segmentation_plotly(df: pd.DataFrame, lower_is_better: bool = T
     return fig
 
 
-def _plot_single_segmentation_matplotlib(df: pd.DataFrame, lower_is_better: bool = True) -> MatplotlibFigure:
+def _plot_single_segmentation_matplotlib(
+    df: pd.DataFrame, lower_is_better: bool = True, scaling_method: str = "minmax", scaling_k: float = 2.0
+) -> MatplotlibFigure:
     """Implement the single segmentation plot as a Matplotlib bar chart.
 
     Parameters
@@ -172,6 +238,10 @@ def _plot_single_segmentation_matplotlib(df: pd.DataFrame, lower_is_better: bool
         See module docstring for format details.
     lower_is_better : bool, default=True
         Whether lower values of the metric indicate better performance.
+    scaling_method : str, default="minmax"
+        Method for scaling colors. Options: "minmax" or "std".
+    scaling_k : float, default=2.0
+        Number of standard deviations for "std" scaling method.
 
     Returns
     -------
@@ -191,14 +261,22 @@ def _plot_single_segmentation_matplotlib(df: pd.DataFrame, lower_is_better: bool
     cmap_name = color_scheme["cmap"]
     assert isinstance(cmap_name, str), "matplotlib cmap should be a string"
 
-    # Normalize the scores for colormapping
-    if len(df_sorted) > 1:
-        norm = plt.Normalize(float(df_sorted["score"].min()), float(df_sorted["score"].max()))
-    else:
+    # Normalize scores for color mapping
+    normalized_scores = normalize_scores(df_sorted["score"].values, method=scaling_method, k=scaling_k)
+
+    # Create normalization based on the scaling method
+    if scaling_method == "std":
+        # For std method, use [0, 1] range since normalized_scores are already in that range
         norm = plt.Normalize(0, 1)
+    else:
+        # For minmax method, use the actual score range for the colorbar
+        if len(df_sorted) > 1:
+            norm = plt.Normalize(float(df_sorted["score"].min()), float(df_sorted["score"].max()))
+        else:
+            norm = plt.Normalize(0, 1)
 
     cmap = plt.get_cmap(cmap_name)
-    colors = cmap(norm(df_sorted["score"].values.astype(np.float64)))
+    colors = cmap(normalized_scores)
 
     # Create bar chart
     bars = ax.bar(df_sorted["segment_name"].astype(str), df_sorted["score"], color=colors)
@@ -210,8 +288,14 @@ def _plot_single_segmentation_matplotlib(df: pd.DataFrame, lower_is_better: bool
             bar.get_x() + bar.get_width() / 2.0, height + 0.01, f"{height:.3f}", ha="center", va="bottom", fontsize=9
         )
 
-    # Create colorbar
-    sm = plt.cm.ScalarMappable(cmap=cmap, norm=norm)
+    # Create colorbar - use the original score values for the colorbar scale
+    if scaling_method == "std":
+        # For std method, create a colorbar that shows the normalized range
+        sm = plt.cm.ScalarMappable(cmap=cmap, norm=plt.Normalize(0, 1))
+    else:
+        # For minmax method, use the actual score range
+        sm = plt.cm.ScalarMappable(cmap=cmap, norm=norm)
+
     sm.set_array([])
     cbar = plt.colorbar(sm, ax=ax)
     cbar.set_label("Score")
@@ -227,7 +311,9 @@ def _plot_single_segmentation_matplotlib(df: pd.DataFrame, lower_is_better: bool
 
 
 # For backward compatibility
-def plot_single_segmentation_mp(df: pd.DataFrame, lower_is_better: bool = True) -> MatplotlibFigure:
+def plot_single_segmentation_mp(
+    df: pd.DataFrame, lower_is_better: bool = True, scaling_method: str = "minmax", scaling_k: float = 2.0
+) -> MatplotlibFigure:
     """Plot the single segmentation using matplotlib (compatibility function).
 
     This is a wrapper around plot_single_segmentation with backend="matplotlib" for backwards compatibility.
@@ -238,6 +324,10 @@ def plot_single_segmentation_mp(df: pd.DataFrame, lower_is_better: bool = True)
         See module docstring for format details.
     lower_is_better : bool, default=True
         Whether lower values indicate better performance.
+    scaling_method : str, default="minmax"
+        Method for scaling colors. Options: "minmax" or "std".
+    scaling_k : float, default=2.0
+        Number of standard deviations for "std" scaling method.
 
     Returns
     -------
@@ -245,11 +335,15 @@ def plot_single_segmentation_mp(df: pd.DataFrame, lower_is_better: bool = True)
         A matplotlib bar chart showing each segment with its corresponding score.
 
     """
-    return plot_single_segmentation(df, lower_is_better, backend="matplotlib")
+    return plot_single_segmentation(
+        df, lower_is_better, backend="matplotlib", scaling_method=scaling_method, scaling_k=scaling_k
+    )
 
 
 # For backward compatibility
-def plot_single_segmentation_impl(df: pd.DataFrame, lower_is_better: bool = True) -> PlotlyFigure:
+def plot_single_segmentation_impl(
+    df: pd.DataFrame, lower_is_better: bool = True, scaling_method: str = "minmax", scaling_k: float = 2.0
+) -> PlotlyFigure:
     """Implement the single segmentation plot as a Plotly bar chart (compatibility function).
 
     This is kept for backwards compatibility and wraps _plot_single_segmentation_plotly.
@@ -260,6 +354,10 @@ def plot_single_segmentation_impl(df: pd.DataFrame, lower_is_better: bool = True
         See module docstring for format details.
     lower_is_better : bool, default=True
         Whether lower values indicate better performance.
+    scaling_method : str, default="minmax"
+        Method for scaling colors. Options: "minmax" or "std".
+    scaling_k : float, default=2.0
+        Number of standard deviations for "std" scaling method.
 
     Returns
     -------
@@ -267,7 +365,7 @@ def plot_single_segmentation_impl(df: pd.DataFrame, lower_is_better: bool = True
         A Plotly bar chart.
 
     """
-    return _plot_single_segmentation_plotly(df, lower_is_better)
+    return _plot_single_segmentation_plotly(df, lower_is_better, scaling_method, scaling_k)
 
 
 @dataclass
@@ -284,6 +382,8 @@ class DoubleSegmPlotting:
     metric_name: str = "score"
     lower_is_better: bool = True
     backend: Backend = "plotly"
+    scaling_method: str = "minmax"
+    scaling_k: float = 2.0
 
     def get_heatmap_df(self) -> pd.DataFrame:
         """Get the DataFrame for the heatmap from the double segmentation df.
@@ -315,10 +415,25 @@ def _plot_heatmap_plotly(self) -> PlotlyFigure:
         # Get color scheme
         color_scheme = _get_color_scheme(self.lower_is_better, "plotly")
 
+        # Normalize scores for color mapping
+        scores = heatmap_df.values.flatten()
+        # Remove NaN values for normalization
+        valid_scores = scores[~np.isnan(scores)]
+        if len(valid_scores) > 0:
+            normalized_scores = normalize_scores(valid_scores, method=self.scaling_method, k=self.scaling_k)
+            # Create a normalized version of the heatmap
+            normalized_heatmap = np.full_like(heatmap_df.values, np.nan)
+            valid_mask = ~np.isnan(heatmap_df.values)
+            if len(valid_scores) > 0:
+                # Map back the normalized scores to the heatmap structure
+                normalized_heatmap[valid_mask] = normalized_scores
+        else:
+            normalized_heatmap = heatmap_df.values
+
         # Create heatmap
         fig = go.Figure(
             data=go.Heatmap(
-                z=heatmap_df.values,
+                z=normalized_heatmap,
                 x=heatmap_df.columns,
                 y=heatmap_df.index,
                 colorscale=color_scheme["colorscale"],
@@ -362,13 +477,27 @@ def _plot_heatmap_matplotlib(self) -> MatplotlibFigure:
         cmap = color_scheme["cmap"]
         assert isinstance(cmap, str), "matplotlib cmap should be a string"
 
+        # Normalize scores for color mapping
+        scores = heatmap_df.values.flatten()
+        # Remove NaN values for normalization
+        valid_scores = scores[~np.isnan(scores)]
+
+        if len(valid_scores) > 0:
+            normalized_scores = normalize_scores(valid_scores, method=self.scaling_method, k=self.scaling_k)
+            # Create a normalized version of the heatmap
+            normalized_heatmap = np.full_like(heatmap_df.values, np.nan)
+            valid_mask = ~np.isnan(heatmap_df.values)
+            normalized_heatmap[valid_mask] = normalized_scores
+        else:
+            normalized_heatmap = heatmap_df.values
+
         # Create heatmap using pcolormesh which creates a QuadMesh collection
         # First create a meshgrid for the x and y coordinates
         x = np.arange(len(heatmap_df.columns) + 1)
         y = np.arange(len(heatmap_df.index) + 1)
 
         # Create the heatmap using pcolormesh
-        mesh = ax.pcolormesh(x, y, heatmap_df.values, cmap=cmap)
+        mesh = ax.pcolormesh(x, y, normalized_heatmap, cmap=cmap, vmin=0, vmax=1)
 
         # Set x and y labels
         ax.set_xticks(np.arange(len(heatmap_df.columns)) + 0.5)
@@ -381,12 +510,14 @@ def _plot_heatmap_matplotlib(self) -> MatplotlibFigure:
         cbar = fig.colorbar(mesh, ax=ax)
         cbar.set_label(self.metric_name)
 
-        # Add text annotations with the values
+        # Add text annotations with the values (use original values, not normalized)
         for i in range(len(heatmap_df.index)):
             for j in range(len(heatmap_df.columns)):
                 value = heatmap_df.values[i, j]
                 if not pd.isna(value):
-                    text_color = "black" if 0.3 < value < 0.7 else "white"
+                    # Determine text color based on normalized value for better contrast
+                    normalized_value = normalized_heatmap[i, j] if not pd.isna(normalized_heatmap[i, j]) else 0.5
+                    text_color = "black" if 0.3 < normalized_value < 0.7 else "white"
                     ax.text(j + 0.5, i + 0.5, f"{value:.3f}", ha="center", va="center", color=text_color)
 
         # Set titles
diff --git a/tests/plotting/test_plot_segmentations.py b/tests/plotting/test_plot_segmentations.py
index c71920a..c0c95b2 100644
--- a/tests/plotting/test_plot_segmentations.py
+++ b/tests/plotting/test_plot_segmentations.py
@@ -1,6 +1,7 @@
 """Tests for the plot_segmentations module."""
 
 import matplotlib.pyplot as plt
+import numpy as np
 import pandas as pd
 import plotly.graph_objects as go
 import pytest
@@ -9,6 +10,7 @@
 
 from tab_right.plotting.plot_segmentations import (
     DoubleSegmPlotting,
+    normalize_scores,
     plot_single_segmentation,
     plot_single_segmentation_mp,
 )
@@ -145,3 +147,91 @@ def test_double_segm_plotting_mp_custom_metric(double_segmentation_df):
 
     # Close the figure to prevent memory leaks
     plt.close(fig)
+
+
+# Tests for the new scaling functionality
+def test_normalize_scores_minmax():
+    """Test normalize_scores with minmax method."""
+    scores = np.array([0.1, 0.2, 0.3, 0.4, 0.5])
+    normalized = normalize_scores(scores, method="minmax")
+
+    # Evenly spaced scores must map onto evenly spaced values spanning [0, 1]
+    assert normalized.shape == scores.shape
+    assert normalized.min() == 0.0 and normalized.max() == 1.0
+    assert np.allclose(normalized, [0.0, 0.25, 0.5, 0.75, 1.0])
+
+
+def test_normalize_scores_std():
+    """Test normalize_scores with std method on symmetric, outlier-free data."""
+    scores = np.array([0.1, 0.2, 0.3, 0.4, 0.5])
+    normalized = normalize_scores(scores, method="std", k=2)
+
+    # mean=0.3, std=sqrt(0.02): the range is mean ± 2*std, so the mean maps to 0.5
+    expected = [0.14644661, 0.32322330, 0.5, 0.67677670, 0.85355339]
+    assert normalized.shape == scores.shape
+    assert np.allclose(normalized, expected)
+
+
+def test_normalize_scores_std_with_outliers():
+    """Test normalize_scores with std method handling outliers."""
+    # mean=0.6, std~0.707: with k=1 the upper bound (~1.307) lies below the 2.0 outlier
+    scores = np.array([0.1, 0.2, 0.3, 0.4, 2.0])
+    normalized = normalize_scores(scores, method="std", k=1)
+
+    # The outlier is clipped to exactly 1.0 while the inliers keep distinct, lower values
+    assert normalized[-1] == 1.0
+    assert np.all(np.diff(normalized[:-1]) > 0) and normalized[-2] < 1.0
+
+
+def test_normalize_scores_zero_variance():
+    """Test normalize_scores with zero variance data."""
+    scores = np.array([0.5, 0.5, 0.5, 0.5])
+
+    # Both methods hit the zero-range guard and must return zeros, never NaN or inf
+    for method in ("minmax", "std"):
+        assert np.all(normalize_scores(scores, method=method) == 0.0)
+
+
+def test_normalize_scores_invalid_method():
+    """Check that an unsupported method name is rejected with ValueError."""
+    unsupported = "invalid"
+
+    with pytest.raises(ValueError, match="Unknown method"):
+        normalize_scores(np.array([0.1, 0.2, 0.3]), method=unsupported)
+
+
+def test_plot_single_segmentation_scaling_methods(single_segmentation_df):
+    """Check that the plotly backend returns a figure for every scaling method."""
+    figures = [
+        plot_single_segmentation(single_segmentation_df, scaling_method=method, backend="plotly")
+        for method in ("minmax", "std")
+    ]
+
+    # Each supported scaling method must yield a Plotly figure
+    assert all(isinstance(fig, go.Figure) for fig in figures)
+
+
+def test_plot_single_segmentation_mp_scaling_methods(single_segmentation_df):
+    """Check that the matplotlib wrapper returns a figure for every scaling method."""
+    scaling_methods = ("minmax", "std")
+
+    # Exercise the backward-compatible matplotlib entry point once per method
+    for method in scaling_methods:
+        fig = plot_single_segmentation_mp(single_segmentation_df, scaling_method=method)
+        assert isinstance(fig, MatplotlibFigure)
+        # Close the figure to prevent memory leaks
+        plt.close(fig)
+
+
+def test_double_segmentation_scaling(double_segmentation_df):
+    """Check that DoubleSegmPlotting draws heatmaps for both scaling methods."""
+    # "std" scaling rendered through the plotly backend
+    plotly_plotter = DoubleSegmPlotting(df=double_segmentation_df, scaling_method="std", backend="plotly")
+    assert isinstance(plotly_plotter.plot_heatmap(), go.Figure)
+
+    # "minmax" scaling rendered through the matplotlib backend
+    mpl_plotter = DoubleSegmPlotting(df=double_segmentation_df, scaling_method="minmax", backend="matplotlib")
+    mpl_fig = mpl_plotter.plot_heatmap()
+    assert isinstance(mpl_fig, MatplotlibFigure)
+    # Close the figure to prevent memory leaks
+    plt.close(mpl_fig)