Skip to content

Commit

Permalink
Add methods for dealing with fairness in rankings (#461)
Browse files Browse the repository at this point in the history
  • Loading branch information
andrewklayk authored Nov 10, 2023
1 parent 2572fcb commit 01b77d4
Show file tree
Hide file tree
Showing 8 changed files with 1,164 additions and 0 deletions.
1 change: 1 addition & 0 deletions aif360/algorithms/postprocessing/__init__.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,4 @@
from aif360.algorithms.postprocessing.calibrated_eq_odds_postprocessing import CalibratedEqOddsPostprocessing
from aif360.algorithms.postprocessing.eq_odds_postprocessing import EqOddsPostprocessing
from aif360.algorithms.postprocessing.reject_option_classification import RejectOptionClassification
from aif360.algorithms.postprocessing.deterministic_reranking import DeterministicReranking
208 changes: 208 additions & 0 deletions aif360/algorithms/postprocessing/deterministic_reranking.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,208 @@
import numpy as np
import pandas as pd

from aif360.algorithms import Transformer
from aif360.datasets import StructuredDataset, RegressionDataset

class DeterministicReranking(Transformer):
    """A collection of algorithms for construction of fair ranked candidate lists. [1]_ .

    References:
        .. [1] Sahin Cem Geyik, Stuart Ambler, and Krishnaram Kenthapadi,
            "Fairness-Aware Ranking in Search & Recommendation Systems with Application to LinkedIn Talent Search,"
            KDD '19: Proceedings of the 25th ACM SIGKDD International Conference
            on Knowledge Discovery & Data Mining, July 2019, Pages 2221-2231.
    """

    def __init__(self,
                 unprivileged_groups,
                 privileged_groups):
        """
        Args:
            unprivileged_groups (list(dict)): Representation for the unprivileged
                group.
            privileged_groups (list(dict)): Representation for the privileged
                group.
        """

        super(DeterministicReranking, self).__init__(
            unprivileged_groups=unprivileged_groups,
            privileged_groups=privileged_groups)

        self.unprivileged_groups = unprivileged_groups
        self.privileged_groups = privileged_groups
        # Groups are indexed 0 .. _n_groups-1 in the fixed order
        # `unprivileged_groups + privileged_groups` throughout this class.
        self._n_groups = len(unprivileged_groups) + len(privileged_groups)
        # Sensitive attribute name(s), and the union of sensitive values seen
        # in the first group spec of each list.
        self.s = set(unprivileged_groups[0].keys())
        self.s_vals = set(self.unprivileged_groups[0].values()).union(
            set(self.privileged_groups[0].values()))

    def fit(self, dataset: RegressionDataset):
        """Build per-group candidate pools, each sorted by score (descending).

        Args:
            dataset (RegressionDataset): Dataset containing the protected
                attribute column(s) named in the group specifications.

        Returns:
            DeterministicReranking: self.

        Raises:
            ValueError: If the privileged and unprivileged groups name
                different sensitive attributes, or the dataset is missing a
                protected attribute column.
        """
        if list(self.unprivileged_groups[0].keys())[0] != list(self.privileged_groups[0].keys())[0]:
            raise ValueError("Different sensitive attributes (not values) specified for unprivileged and privileged groups.")

        items = dataset.convert_to_dataframe()[0]
        items = items.sort_values(axis=0, by=dataset.label_names[0], ascending=False)

        if not self.s.issubset(items.columns):
            raise ValueError(f"The dataset must contain the protected attribute(s): '{self.s}'.")

        # One candidate pool per group, in the same index order used by
        # `group_counts` in predict(). (A dead `if ... and False:` branch for
        # the single-attribute case was removed; this general path handles it.)
        self._item_groups = []
        for group in self.unprivileged_groups + self.privileged_groups:
            query = ' & '.join(
                f'{s_i}=="{v_i}"' if isinstance(v_i, str) else f'{s_i}=={v_i}'
                for s_i, v_i in group.items())
            self._item_groups.append(items.query(query))

        return self

    def predict(self,
                dataset: RegressionDataset,
                rec_size: int,
                target_prop: list,
                rerank_type: str='Constrained',
                renormalize_scores: bool=False
                ) -> RegressionDataset:
        """Construct a ranking of candidates in the dataset according to specified proportions of groups.

        Args:
            dataset (RegressionDataset): Dataset to rerank.
            rec_size (int): Number of candidates in the output.
            target_prop (list): Desired proportion of each group in the output,
                indexed in the order ``unprivileged_groups + privileged_groups``.
            rerank_type: Greedy, Conservative, Relaxed, or Constrained. Determines the type of algorithm \
                as described in the original paper.
            renormalize_scores: renormalize label (score) values in the resulting ranking. If True, uses the default \
                behavior of RegressionDataset.

        Returns:
            RegressionDataset: The reranked dataset.

        Raises:
            ValueError: If ``rec_size`` is not positive, the dataset does not
                have exactly one label, or ``rerank_type`` is unrecognized.
        """
        if rec_size <= 0:
            raise ValueError(f"Output size should be greater than 0, got {rec_size}.")
        if len(dataset.label_names) != 1:
            raise ValueError(f"Dataset must have exactly one label, got {len(dataset.label_names)}.")
        if rerank_type not in ['Greedy', 'Conservative', 'Relaxed', 'Constrained']:
            raise ValueError(f'`rerank_type` must be one of `Greedy`, `Conservative`, `Relaxed`, `Constrained`; got {rerank_type}')

        # Number of already-ranked items taken from each group.
        group_counts = [0] * self._n_groups
        rankedItems = []
        score_label = dataset.label_names[0]

        if rerank_type != 'Constrained':
            for k in range(1, rec_size + 1):
                below_min, below_max = [], []
                # Best unranked candidate of each group (pools are pre-sorted
                # by score in fit()).
                # NOTE(review): raises IndexError if a group's pool is
                # exhausted before the list is full — confirm intended.
                candidates = [
                    pool.iloc[group_counts[g_i]]
                    for g_i, pool in enumerate(self._item_groups)
                ]
                for group_idx in range(self._n_groups):
                    # Classify each group by its current count vs. the
                    # floor/ceiling of its target share at list size k.
                    if group_counts[group_idx] < np.floor(k * target_prop[group_idx]):
                        below_min.append(group_idx)
                    elif group_counts[group_idx] < np.ceil(k * target_prop[group_idx]):
                        below_max.append(group_idx)
                # if some groups are currently underrepresented
                if len(below_min) != 0:
                    # Choose the best next item among the underrepresented
                    # groups. (Bug fix: `next_group` is now the true group
                    # index rather than the position within `below_min`, so
                    # the correct group's count is incremented below.)
                    next_group, next_item = max(
                        [(g, candidates[g]) for g in below_min],
                        key=lambda x: x[1][score_label])
                # if minimal representation requirements are satisfied
                else:
                    if rerank_type == 'Greedy':
                        # Highest-scoring candidate among groups still below
                        # their maximum. (Same index bug fixed as above.)
                        next_group, next_item = max(
                            [(g, candidates[g]) for g in below_max],
                            key=lambda x: x[1][score_label])
                    elif rerank_type == 'Conservative':
                        # Pick the group closest to violating its minimum
                        # constraint; break ties by best candidate score.
                        next_group = min(below_max, key=lambda group_idx:
                                        (np.ceil(k*target_prop[group_idx])/target_prop[group_idx],
                                        -candidates[group_idx][score_label]))
                        next_item = candidates[next_group]
                    elif rerank_type == 'Relaxed':
                        # Like Conservative, but the violation distance is
                        # rounded up, relaxing ties between close groups.
                        next_group = min(below_max, key=lambda group_idx:
                                        (np.ceil(np.ceil(k*target_prop[group_idx])/target_prop[group_idx]),
                                        -candidates[group_idx][score_label])
                                        )
                        next_item = candidates[next_group]

                rankedItems.append(next_item)
                group_counts[next_group] += 1

        elif rerank_type == 'Constrained':
            rankedItems, maxIndices = [], []
            group_counts, min_counts = [0] * self._n_groups, [0] * self._n_groups

            lastEmpty, k = 0, 0
            while lastEmpty < rec_size:
                k += 1
                # Minimum feasible count of each group at current list size k.
                min_counts_at_k = [np.floor(p_gi * k) for p_gi in target_prop]
                # Groups whose minimum count increased since the last k.
                changed_mins = []
                for group_idx in range(self._n_groups):
                    if min_counts_at_k[group_idx] > min_counts[group_idx]:
                        changed_mins.append(group_idx)

                if len(changed_mins) > 0:
                    # Candidates to insert, as (group index, item) pairs,
                    # sorted by descending score.
                    changed_items = []
                    for group_idx in changed_mins:
                        changed_items.append((group_idx, self._item_groups[group_idx].iloc[group_counts[group_idx]]))
                    changed_items.sort(key=lambda x: -x[1][score_label])

                    # Insert each candidate, then bubble it up as long as a
                    # swap does not push an item below its maximum allowed
                    # position (tracked in maxIndices).
                    for newitem in changed_items:
                        if len(rankedItems) == rec_size:
                            break
                        maxIndices.append(k - 1)
                        rankedItems.append(newitem[1])
                        swapInd = lastEmpty
                        while swapInd > 0 and maxIndices[swapInd-1] >= swapInd and rankedItems[swapInd-1][score_label] < rankedItems[swapInd][score_label]:
                            maxIndices[swapInd-1], maxIndices[swapInd] = maxIndices[swapInd], maxIndices[swapInd-1]
                            rankedItems[swapInd-1], rankedItems[swapInd] = rankedItems[swapInd], rankedItems[swapInd-1]
                            swapInd -= 1
                        lastEmpty += 1
                        group_counts[newitem[0]] += 1
                min_counts = min_counts_at_k

        res_df = pd.DataFrame(rankedItems, columns=dataset.feature_names + [score_label])
        res = RegressionDataset(res_df,
                                dep_var_name=dataset.label_names[0],
                                protected_attribute_names=dataset.protected_attribute_names,
                                privileged_classes=dataset.privileged_protected_attributes)
        if not renormalize_scores:
            # Keep the raw scores instead of RegressionDataset's normalization.
            res.labels = np.transpose([res_df[score_label]])
            res.scores = np.transpose([res_df[score_label]])
        return res


    def fit_predict(self,
                    dataset: RegressionDataset,
                    rec_size: int,
                    target_prop: list,
                    rerank_type: str='Constrained',
                    renormalize_scores: bool=False
                    ) -> RegressionDataset:
        """Run :meth:`fit` then :meth:`predict` on the same dataset.

        Annotation for ``target_prop`` aligned with :meth:`predict` (a list
        indexed by group, not a dict). See :meth:`predict` for parameter and
        return documentation.
        """
        self.fit(dataset=dataset)
        return self.predict(dataset=dataset,
                            rec_size=rec_size,
                            target_prop=target_prop,
                            rerank_type=rerank_type,
                            renormalize_scores=renormalize_scores)
1 change: 1 addition & 0 deletions aif360/metrics/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,3 +4,4 @@
from aif360.metrics.classification_metric import ClassificationMetric
from aif360.metrics.sample_distortion_metric import SampleDistortionMetric
from aif360.metrics.mdss_classification_metric import MDSSClassificationMetric
from aif360.metrics.regression_metric import RegressionDatasetMetric
100 changes: 100 additions & 0 deletions aif360/metrics/regression_metric.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
import numpy as np
from aif360.metrics import DatasetMetric
from aif360.datasets import RegressionDataset


class RegressionDatasetMetric(DatasetMetric):
    """Class for computing metrics based on a single
    :obj:`~aif360.datasets.RegressionDataset`.
    """

    def __init__(self, dataset, unprivileged_groups=None, privileged_groups=None):
        """
        Args:
            dataset (RegressionDataset): A RegressionDataset.
            privileged_groups (list(dict)): Privileged groups. Format is a list
                of `dicts` where the keys are `protected_attribute_names` and
                the values are values in `protected_attributes`. Each `dict`
                element describes a single group. See examples for more details.
            unprivileged_groups (list(dict)): Unprivileged groups in the same
                format as `privileged_groups`.

        Raises:
            TypeError: `dataset` must be a
                :obj:`~aif360.datasets.RegressionDataset` type.
        """
        if not isinstance(dataset, RegressionDataset):
            raise TypeError("'dataset' should be a RegressionDataset")

        # sets self.dataset, self.unprivileged_groups, self.privileged_groups
        super(RegressionDatasetMetric, self).__init__(dataset,
            unprivileged_groups=unprivileged_groups,
            privileged_groups=privileged_groups)

    def infeasible_index(self, target_prop: dict, r: int = None):
        """
        Infeasible Index metric, as described in [1]_.

        Args:
            target_prop (dict): desired proportion of groups, keyed by
                protected-attribute value.
            r (int): size of the candidate list over which the metric is calculated.
                Defaults to the size of the dataset.

        Returns:
            A tuple (int, list(int)): InfeasibleIndex and the positions at which the
            feasibility condition is violated.

        Raises:
            ValueError: if `target_prop` does not cover every value of the
                protected attribute.

        References:
            .. [1] Sahin Cem Geyik, Stuart Ambler, and Krishnaram Kenthapadi,
                "Fairness-Aware Ranking in Search & Recommendation Systems with Application to LinkedIn Talent Search,"
                KDD '19: Proceedings of the 25th ACM SIGKDD International Conference
                on Knowledge Discovery & Data Mining, July 2019, Pages 2221-2231.
        """
        pr_attr_values = np.ravel(
            self.dataset.unprivileged_protected_attributes + self.dataset.privileged_protected_attributes)
        if set(target_prop) != set(pr_attr_values):
            raise ValueError('Desired proportions must be specified for all values of the protected attributes!')

        # Column 0: score, column 1: protected-attribute value, in rank order.
        ranking = np.column_stack((self.dataset.scores, self.dataset.protected_attributes))
        if r is None:
            r = np.ravel(self.dataset.scores).shape[0]
        ii = 0
        k_viol = set()
        # NOTE(review): range(1, r) never examines the full-length prefix
        # k == r; confirm against the paper whether this should be r + 1.
        for k in range(1, r):
            rk = ranking[:k]
            for ai in pr_attr_values:
                # Count of group-`ai` items in the top-k prefix.
                count_ai = rk[rk[:, 1] == ai].shape[0]
                if count_ai < np.floor(target_prop[ai] * k):
                    ii += 1
                    k_viol.add(k - 1)
        return ii, list(k_viol)

    def discounted_cum_gain(self, r: int = None, full_dataset: RegressionDataset=None, normalized=False):
        """
        Discounted Cumulative Gain metric.

        Args:
            r (int): position up to which to calculate the DCG. If not specified, is set to the size of the dataset.
            full_dataset (RegressionDataset): full dataset providing the ideal
                ranking; required when `normalized` is True.
            normalized (bool): return normalized DCG.

        Returns:
            The calculated DCG.

        Raises:
            ValueError: if `r` is negative, or `normalized` is True without
                `full_dataset`.
            TypeError: if `full_dataset` is not a RegressionDataset.
        """
        if r is None:
            r = np.ravel(self.dataset.scores).shape[0]
        if r < 0:
            raise ValueError(f'r must be >= 0, got {r}')
        if normalized and full_dataset is None:
            raise ValueError('`normalized` is set to True, but `full_dataset` is not specified')
        if full_dataset is not None and not isinstance(full_dataset, RegressionDataset):
            # Typo in the original error message ("full_datset") fixed.
            raise TypeError(f'`full_dataset`: expected `RegressionDataset`, got {type(full_dataset)}')
        scores = np.ravel(self.dataset.scores)[:r]
        z = self._dcg(scores)
        if normalized:
            # Normalize by the DCG of the ideal (descending-score) top-r list.
            z /= self._dcg(np.sort(np.ravel(full_dataset.scores))[::-1][:r])
        return z

    def _dcg(self, scores):
        """Plain DCG: sum of scores discounted by log2(rank + 1), 1-based."""
        logs = np.log2(np.arange(2, len(scores) + 2))
        return np.sum(scores / logs)
1 change: 1 addition & 0 deletions docs/source/modules/algorithms.rst
Original file line number Diff line number Diff line change
Expand Up @@ -57,6 +57,7 @@ Algorithms
algorithms.postprocessing.CalibratedEqOddsPostprocessing
algorithms.postprocessing.EqOddsPostprocessing
algorithms.postprocessing.RejectOptionClassification
algorithms.postprocessing.DeterministicReranking

:mod:`aif360.algorithms`
========================
Expand Down
Loading

0 comments on commit 01b77d4

Please sign in to comment.