Update final scoring method for BinaryClassifierEfficacy precision & recall metrics: rescale the score so that 0.5 is the threshold meaning no change from the real-data baseline (#725)

frances-h · web-flow · commit 69468353075d · 2025-02-19T11:39:49.000-05:00
diff --git a/sdmetrics/single_table/data_augmentation/base.py b/sdmetrics/single_table/data_augmentation/base.py
@@ -227,13 +227,9 @@ def compute_breakdown(
                 f'fixed_{metric_to_fix}_value': trainer.fixed_value,
             },
         }
-        result['score'] = max(
-            0,
-            (
-                result['augmented_data'][f'{cls.metric_name}_score_validation']
-                - result['real_data_baseline'][f'{cls.metric_name}_score_validation']
-            ),
-        )
+        augmented_score = result['augmented_data'][f'{cls.metric_name}_score_validation']
+        baseline_score = result['real_data_baseline'][f'{cls.metric_name}_score_validation']
+        result['score'] = (augmented_score - baseline_score) / 2 + 0.5
         return result
 
     @classmethod
diff --git a/sdmetrics/single_table/data_augmentation/binary_classifier_precision_efficacy.py b/sdmetrics/single_table/data_augmentation/binary_classifier_precision_efficacy.py
@@ -18,8 +18,8 @@ def compute_breakdown(
         metadata,
         prediction_column_name,
         minority_class_label,
-        classifier,
-        fixed_recall_value,
+        classifier='xgboost',
+        fixed_recall_value=0.9,
     ):
         """Compute the score breakdown of the metric."""
         return super().compute_breakdown(
@@ -42,8 +42,8 @@ def compute(
         metadata,
         prediction_column_name,
         minority_class_label,
-        classifier,
-        fixed_recall_value,
+        classifier='xgboost',
+        fixed_recall_value=0.9,
     ):
         """Compute the score of the metric.
 
diff --git a/tests/integration/single_table/data_augmentation/test_binary_classifier_precision_efficacy.py b/tests/integration/single_table/data_augmentation/test_binary_classifier_precision_efficacy.py
@@ -162,7 +162,7 @@ def test_with_nan_target_column(self):
                 'classifier': 'XGBoost',
                 'fixed_recall_value': 0.8,
             },
-            'score': 0,
+            'score': 0.48571428571428577,
         }
         assert result_breakdown == expected_result
 
@@ -244,6 +244,6 @@ def test_with_multi_class(self):
                 'classifier': 'XGBoost',
                 'fixed_recall_value': 0.8,
             },
-            'score': 0,
+            'score': 0.4944444444444444,
         }
         assert score_breakdown == expected_score_breakdown
diff --git a/tests/integration/single_table/data_augmentation/test_binary_classifier_recall_efficacy.py b/tests/integration/single_table/data_augmentation/test_binary_classifier_recall_efficacy.py
@@ -124,7 +124,7 @@ def test_with_nan_target_column(self):
         )
 
         # Assert
-        assert result_breakdown['score'] in (0, 0.07692307692307698)
+        assert result_breakdown['score'] in (0.5, 0.5384615384615385)
 
     def test_with_minority_being_majority(self):
         """Test the metric when the minority class is the majority class."""
@@ -148,7 +148,7 @@ def test_with_minority_being_majority(self):
         )
 
         # Assert
-        assert score == 0
+        assert score == 0.46153846153846156
 
     def test_with_multi_class(self):
         """Test the metric with multi-class classification.
@@ -175,4 +175,4 @@ def test_with_multi_class(self):
         )
 
         # Assert
-        assert score_breakdown['score'] in (0, 0.07692307692307687)
+        assert score_breakdown['score'] in (0.46153846153846156, 0.5384615384615384)
diff --git a/tests/unit/single_table/data_augmentation/test_base.py b/tests/unit/single_table/data_augmentation/test_base.py
@@ -357,7 +357,7 @@ def test_compute_breakdown(
 
         # Assert
         expected_result = {
-            'score': 0.19999999999999996,
+            'score': 0.6,
             'real_data_baseline': real_data_baseline,
             'augmented_data': augmented_table_result,
             'parameters': {

Original file line number	Diff line number	Diff line change
`@@ -124,7 +124,7 @@ def test_with_nan_target_column(self):`
`124`	`124`	`)`
`125`	`125`
`126`	`126`	`# Assert`
`127`		`- assert result_breakdown['score'] in (0, 0.07692307692307698)`
	`127`	`+ assert result_breakdown['score'] in (0.5, 0.5384615384615385)`
`128`	`128`
`129`	`129`	`def test_with_minority_being_majority(self):`
`130`	`130`	`"""Test the metric when the minority class is the majority class."""`
`@@ -148,7 +148,7 @@ def test_with_minority_being_majority(self):`
`148`	`148`	`)`
`149`	`149`
`150`	`150`	`# Assert`
`151`		`- assert score == 0`
	`151`	`+ assert score == 0.46153846153846156`
`152`	`152`
`153`	`153`	`def test_with_multi_class(self):`
`154`	`154`	`"""Test the metric with multi-class classification.`
`@@ -175,4 +175,4 @@ def test_with_multi_class(self):`
`175`	`175`	`)`
`176`	`176`
`177`	`177`	`# Assert`
`178`		`- assert score_breakdown['score'] in (0, 0.07692307692307687)`
	`178`	`+ assert score_breakdown['score'] in (0.46153846153846156, 0.5384615384615384)`