From d2ba8c429a93c9462afed5372a7d595f99bd2dfe Mon Sep 17 00:00:00 2001
From: Samuel Hoffman
Date: Wed, 21 Feb 2024 12:50:42 -0500
Subject: [PATCH] update sphinx requirement (#512)

* add missing try-except guards around optional imports

* clean up docstrings

* remove explicit __all__ from metrics.py

* drop mdss_bias_scan

* fix bug where parameter names were missing their trailing underscore
---
 aif360/metrics/ot_metric.py                | 25 +++++++++++--------
 aif360/sklearn/datasets/openml_datasets.py | 25 ++++++++++---------
 aif360/sklearn/inprocessing/infairness.py  | 14 ++++++++---
 aif360/sklearn/metrics/metrics.py          | 24 ------------------
 .../reject_option_classification.py        |  2 --
 docs/Makefile                              |  2 +-
 docs/requirements.txt                      |  4 +--
 docs/source/conf.py                        | 15 ++++++++---
 docs/source/modules/sklearn.rst            |  1 -
 docs/source/templates/class.rst            |  1 +
 requirements.txt                           |  4 +--
 setup.py                                   |  8 +++---
 12 files changed, 59 insertions(+), 66 deletions(-)

diff --git a/aif360/metrics/ot_metric.py b/aif360/metrics/ot_metric.py
index 5d07ed30..696b68f9 100644
--- a/aif360/metrics/ot_metric.py
+++ b/aif360/metrics/ot_metric.py
@@ -1,7 +1,12 @@
 from typing import Union
 import pandas as pd
 import numpy as np
-import ot
+try:
+    import ot
+except ImportError as error:
+    from logging import warning
+    warning("{}: ot_distance will be unavailable. To install, run:\n"
+            "pip install 'aif360[OptimalTransport]'".format(error))
 from sklearn.preprocessing import LabelEncoder
 
 def _normalize(distribution1, distribution2):
@@ -17,7 +22,7 @@
     extra = -np.minimum(np.min(distribution1), np.min(distribution2))
     distribution1 += extra
     distribution2 += extra
-    
+
     total_of_distribution1 = np.sum(distribution1)
     if total_of_distribution1 != 0:
         distribution1 /= total_of_distribution1
@@ -75,10 +80,10 @@ def _evaluate(
     if prot_attr is None:
         initial_distribution, required_distribution, matrix_distance = _transform(ground_truth, classifier, cost_matrix)
         return ot.emd2(a=initial_distribution, b=required_distribution, M=matrix_distance, numItermax=num_iters)
-    
+
     if not ground_truth.nunique() == 2:
         raise ValueError(f"Expected to have exactly 2 target values, got {ground_truth.nunique()}.")
-    
+
     # Calculate EMD between ground truth distribution and distribution of each group
     emds = {}
     for sa_val in sorted(prot_attr.unique()):
@@ -137,7 +142,7 @@
     # Assert correct mode passed
     if mode not in ['binary', 'continuous', 'nominal', 'ordinal']:
         raise ValueError(f"Expected one of {['binary', 'continuous', 'nominal', 'ordinal']}, got {mode}.")
-    
+
     # Assert correct types passed to ground_truth, classifier and prot_attr
     if not isinstance(ground_truth, (pd.Series, str)):
         raise TypeError(f"ground_truth: expected pd.Series or str, got {type(ground_truth)}")
@@ -148,17 +153,17 @@
         raise TypeError(f"classifier: expected pd.DataFrame for {mode} mode, got {type(classifier)}")
     if prot_attr is not None and not isinstance(prot_attr, (pd.Series, str)):
         raise TypeError(f"prot_attr: expected pd.Series or str, got {type(prot_attr)}")
-    
+
     # Assert correct type passed to cost_matrix
     if cost_matrix is not None and not isinstance(cost_matrix, np.ndarray):
         raise TypeError(f"cost_matrix: expected numpy.ndarray, got {type(cost_matrix)}")
-    
+
     # Assert scoring is "Wasserstein1"
     if not scoring == "Wasserstein1":
         raise ValueError(f"Scoring mode can only be \"Wasserstein1\", got {scoring}")
-    
+
     grt = ground_truth.copy()
-    
+
     if classifier is not None:
         cls = classifier.copy()
         if prot_attr is not None:
@@ -171,7 +176,7 @@
         sat.index = grt.index
     else:
         sat = None
-    
+
     uniques = list(grt.unique())
     if mode == "binary":
         if len(uniques) > 2:
diff --git a/aif360/sklearn/datasets/openml_datasets.py b/aif360/sklearn/datasets/openml_datasets.py
index 4525087d..a6a92c2e 100644
--- a/aif360/sklearn/datasets/openml_datasets.py
+++ b/aif360/sklearn/datasets/openml_datasets.py
@@ -168,19 +168,20 @@ def fetch_german(*, data_home=None, cache=True, binary_age=True, usecols=None,
                                dropcols=dropcols, numeric_only=numeric_only,
                                dropna=dropna)
 
-def fetch_bank(*, data_home=None, cache=True, binary_age=True, percent10=False, 
+def fetch_bank(*, data_home=None, cache=True, binary_age=True, percent10=False,
               usecols=None, dropcols=['duration'], numeric_only=False,
               dropna=False):
     """Load the Bank Marketing Dataset.
 
-    The protected attribute is 'age' (binarized by default as suggested by [#lequy22]:
-    age >= 25 and age <60 is considered privileged and age< 25 or age >= 60 unprivileged;
-    see the binary_age flag to keep this continuous). The outcome variable is 'deposit':
+    The protected attribute is 'age' (binarized by default as suggested by [#lequy22]_:
+    age >= 25 and age < 60 is considered privileged and age < 25 or age >= 60 unprivileged;
+    see the binary_age flag to keep this continuous). The outcome variable is 'deposit':
     'yes' or 'no'.
 
-    References:
-        .. [#lequy22] Le Quy, Tai, et al. "A survey on datasets for fairness‐aware machine
-            learning." Wiley Interdisciplinary Reviews: Data Mining and Knowledge
-            Discovery 12.3 (2022): e1452.
+    References:
+        .. [#lequy22] `Le Quy, Tai, et al. "A survey on datasets for fairness-
+            aware machine learning." Wiley Interdisciplinary Reviews: Data Mining
+            and Knowledge Discovery 12.3 (2022): e1452.
+            `_
 
     Note:
         By default, the data is downloaded from OpenML. See the `bank-marketing
@@ -235,15 +236,15 @@
             df[col] = df[col].cat.remove_categories('unknown')
     df.education = df.education.astype('category').cat.reorder_categories(
             ['primary', 'secondary', 'tertiary'], ordered=True)
-    
+
     # binarize protected attribute (but not corresponding feature)
     age = (pd.cut(df.age, [0, 24, 60, 100], ordered=False,
-                  labels=[0, 1, 0] if numeric_only 
+                  labels=[0, 1, 0] if numeric_only
                          else ['<25 or >=60', '25-60', '<25 or >=60'])
            if binary_age else 'age')
-    age = age.cat.reorder_categories([0, 1] if numeric_only 
+    age = age.cat.reorder_categories([0, 1] if numeric_only
                                      else ['<25 or >=60', '25-60'])
-    
+
     return standardize_dataset(df, prot_attr=[age], target='deposit',
                                usecols=usecols, dropcols=dropcols,
                                numeric_only=numeric_only, dropna=dropna)
diff --git a/aif360/sklearn/inprocessing/infairness.py b/aif360/sklearn/inprocessing/infairness.py
index 04963aa4..99d32eec 100644
--- a/aif360/sklearn/inprocessing/infairness.py
+++ b/aif360/sklearn/inprocessing/infairness.py
@@ -1,10 +1,16 @@
-from inFairness import fairalgo
+try:
+    from inFairness import fairalgo
+    from skorch import NeuralNet
+    from skorch.dataset import unpack_data, Dataset as Dataset_
+    from skorch.utils import is_pandas_ndframe
+except ImportError as error:
+    from logging import warning
+    warning("{}: SenSeI and SenSR will be unavailable. To install, run:\n"
+            "pip install 'aif360[inFairness]'".format(error))
+    Dataset_ = NeuralNet = object
 from sklearn.preprocessing import LabelBinarizer
 from sklearn.utils.multiclass import type_of_target
 from sklearn.exceptions import NotFittedError
-from skorch import NeuralNet
-from skorch.dataset import unpack_data, Dataset as Dataset_
-from skorch.utils import is_pandas_ndframe
 
 
 class Dataset(Dataset_):
diff --git a/aif360/sklearn/metrics/metrics.py b/aif360/sklearn/metrics/metrics.py
index bcbf9c16..80322b17 100644
--- a/aif360/sklearn/metrics/metrics.py
+++ b/aif360/sklearn/metrics/metrics.py
@@ -17,30 +17,6 @@
 from aif360.detectors.mdss.MDSS import MDSS
 
-__all__ = [
-    # meta-metrics
-    'difference', 'ratio', 'intersection', 'one_vs_rest',
-    # scorer factory
-    'make_scorer',
-    # helpers
-    'num_samples', 'num_pos_neg',
-    'specificity_score', 'base_rate', 'selection_rate', 'smoothed_base_rate',
-    'smoothed_selection_rate', 'generalized_fpr', 'generalized_fnr',
-    # group fairness
-    'ot_distance', 'statistical_parity_difference', 'disparate_impact_ratio',
-    'equal_opportunity_difference', 'average_odds_difference', 'average_predictive_value_difference',
-    'average_odds_error', 'class_imbalance', 'kl_divergence',
-    'conditional_demographic_disparity', 'smoothed_edf',
-    'df_bias_amplification', 'mdss_bias_score',
-    # individual fairness
-    'generalized_entropy_index', 'generalized_entropy_error',
-    'between_group_generalized_entropy_error', 'theil_index',
-    'coefficient_of_variation', 'consistency_score',
-    # aliases
-    'sensitivity_score', 'mean_difference', 'false_negative_rate_error',
-    'false_positive_rate_error'
-]
-
 
 # ============================= META-METRICS ===================================
 def difference(func, y_true, y_pred=None, prot_attr=None, priv_group=1,
                sample_weight=None, **kwargs):
diff --git a/aif360/sklearn/postprocessing/reject_option_classification.py b/aif360/sklearn/postprocessing/reject_option_classification.py
index 331f63e0..84d4a082 100644
--- a/aif360/sklearn/postprocessing/reject_option_classification.py
+++ b/aif360/sklearn/postprocessing/reject_option_classification.py
@@ -85,8 +85,6 @@ def __init__(self, prot_attr=None, threshold=0.5, margin=0.1):
             margin (scalar): Half width of the critical region. Estimates
                 within the critical region are "rejected" and assigned
                 according to their group. Must be between 0 and min(threshold, 1-threshold).
-            metric ('statistical_parity', 'average_odds', 'equal_opportunity',
-                or callable):
         """
         self.prot_attr = prot_attr
         self.threshold = threshold
diff --git a/docs/Makefile b/docs/Makefile
index f417938a..765e0cff 100644
--- a/docs/Makefile
+++ b/docs/Makefile
@@ -3,7 +3,7 @@
 # You can set these variables from the command line.
 SPHINXOPTS    =
-SPHINXBUILD   = python -msphinx
+SPHINXBUILD   ?= sphinx-build
 SPHINXPROJ    = aif360
 SOURCEDIR     = source
 BUILDDIR      = build
 
diff --git a/docs/requirements.txt b/docs/requirements.txt
index 02d6a583..7aae1e26 100644
--- a/docs/requirements.txt
+++ b/docs/requirements.txt
@@ -5,6 +5,6 @@ fairlearn>=0.7.0
 pytest>=3.5.0
 
 # docs
-sphinx==1.8.6
+sphinx==7.2.6
 jinja2==3.0.3
-sphinx_rtd_theme==0.4.3
+sphinx_rtd_theme==2.0.0
diff --git a/docs/source/conf.py b/docs/source/conf.py
index d834cf4b..c4714a2a 100644
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -41,12 +41,16 @@
     'sphinx.ext.intersphinx',
     'sphinx.ext.mathjax']
 
+flv = tuple(map(int, fairlearn.__version__.split('.')))
+if flv > (0, 7, 0) and flv[-1] == 0:
+    flv = flv[:-1]
+flv = '.'.join(map(str, flv))
 intersphinx_mapping = {
-    'numpy': ('https://docs.scipy.org/doc/numpy/', None),
-    'scipy': ('https://docs.scipy.org/doc/scipy/reference/', None),
+    'numpy': ('https://numpy.org/doc/stable/', None),
+    'scipy': ('https://docs.scipy.org/doc/scipy/', None),
     'pandas': ('https://pandas.pydata.org/pandas-docs/stable/', None),
     'sklearn': ('https://scikit-learn.org/stable/', None),
-    'fairlearn': (f'https://fairlearn.github.io/v{fairlearn.__version__}/', None),
+    'fairlearn': (f'https://fairlearn.org/v{flv}/', None),
     'python': ('https://docs.python.org/{}.{}'.format(*sys.version_info), None),
     'inFairness': ('https://ibm.github.io/inFairness/', None),
     'skorch': ('https://skorch.readthedocs.io/en/stable/', None),
@@ -97,7 +101,7 @@
 #
 # This is also used if you do content translation via gettext catalogs.
 # Usually you set "language" from the command line for these cases.
-language = None
+language = 'en'
 
 # List of patterns, relative to source directory, that match files and
 # directories to ignore when looking for source files.
@@ -117,6 +121,9 @@
 # If true, `todo` and `todoList` produce output, else they produce nothing.
 todo_include_todos = False
 
+# If true, parameters with trailing underscores will be properly escaped.
+strip_signature_backslash = True
+
 
 # -- Options for HTML output ----------------------------------------------
 
diff --git a/docs/source/modules/sklearn.rst b/docs/source/modules/sklearn.rst
index f92127d7..7fe8c8df 100644
--- a/docs/source/modules/sklearn.rst
+++ b/docs/source/modules/sklearn.rst
@@ -119,7 +119,6 @@ Group fairness metrics
     metrics.smoothed_edf
     metrics.df_bias_amplification
     metrics.between_group_generalized_entropy_error
-    metrics.mdss_bias_scan
     metrics.mdss_bias_score
 
 Individual fairness metrics
diff --git a/docs/source/templates/class.rst b/docs/source/templates/class.rst
index 9ce9f9e6..59cd39a1 100644
--- a/docs/source/templates/class.rst
+++ b/docs/source/templates/class.rst
@@ -4,6 +4,7 @@
 .. currentmodule:: {{ module }}
 
 .. autoclass:: {{ objname }}
+   :members:
 
 {% block methods %}
 {% if methods %}
diff --git a/requirements.txt b/requirements.txt
index d15a8e2f..42c6d0bd 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -24,6 +24,6 @@ pytest>=3.5.0
 pytest-cov>=2.8.1
 
 # docs
-sphinx==1.8.6
+sphinx==7.2.6
 jinja2==3.0.3
-sphinx_rtd_theme==0.4.3
+sphinx_rtd_theme==2.0.0
diff --git a/setup.py b/setup.py
index 216cf553..538c0488 100644
--- a/setup.py
+++ b/setup.py
@@ -1,5 +1,5 @@
 from setuptools import setup, find_packages
-from functools import reduce
+from itertools import chain
 
 long_description = """The AI Fairness 360 toolkit is an open-source library to help detect and mitigate bias in machine learning models.
 The AI Fairness 360 Python package includes a comprehensive set of metrics for datasets and models to
@@ -25,9 +25,9 @@
     'notebooks': ['jupyter', 'tqdm', 'igraph[plotting]', 'lightgbm', 'seaborn', 'ipympl'],
     'OptimalTransport': ['pot'],
 }
-extras['tests'] = reduce(lambda l1, l2: l1+l2, extras.values(), ['pytest>=3.5', 'pytest-cov>=2.8.1'])
-extras['docs'] = ['sphinx<2', 'jinja2<3.1.0', 'sphinx_rtd_theme']
-extras['all'] = list(reduce(lambda s, l: s.union(l), extras.values(), set()))
+extras['tests'] = list(chain(*extras.values(), ['pytest>=3.5', 'pytest-cov>=2.8.1']))
+extras['docs'] = ['sphinx', 'jinja2<3.1.0', 'sphinx_rtd_theme']
+extras['all'] = list(set(chain(*extras.values())))
 
 setup(name='aif360',
       version=version,
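
Two idioms in this patch may be worth spelling out for reviewers. The try-except guards added in aif360/metrics/ot_metric.py and aif360/sklearn/inprocessing/infairness.py keep a module importable when an optional dependency is absent: the ImportError is logged as a warning naming the pip extra to install, and any missing base classes are bound to object so the class definitions below them still execute. A minimal sketch of the same pattern (the names some_optional_dep, SomeBase, SomeEstimator, and the extra tag SomeExtra are hypothetical placeholders, not AIF360 code):

    try:
        from some_optional_dep import SomeBase  # optional heavy dependency
    except ImportError as error:
        from logging import warning
        warning("{}: SomeEstimator will be unavailable. To install, run:\n"
                "pip install 'aif360[SomeExtra]'".format(error))
        SomeBase = object  # placeholder base so the class below can still be defined

    class SomeEstimator(SomeBase):
        """Importable even without the dependency installed; only code that
        actually calls into some_optional_dep fails, and only at call time."""

In setup.py, functools.reduce is swapped for itertools.chain when aggregating the extras lists. A sketch with illustrative values showing what each expression produces:

    from itertools import chain

    extras = {'a': ['x', 'y'], 'b': ['y', 'z']}

    # 'tests': concatenation of every extra plus the test-only requirements;
    # duplicates are kept and order follows dict insertion order.
    tests = list(chain(*extras.values(), ['pytest>=3.5']))
    # -> ['x', 'y', 'y', 'z', 'pytest>=3.5']

    # 'all': passed through set() to deduplicate, so element order is arbitrary.
    alls = list(set(chain(*extras.values())))
    # -> the elements 'x', 'y', 'z' in arbitrary order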