
Commit 0971b04

Merge branch 'main' into setup
2 parents 51c4375 + 495fdd5

18 files changed: +872 -20 lines

.github/workflows/ci.yml

Lines changed: 78 additions & 0 deletions

@@ -0,0 +1,78 @@
+name: Build
+
+on:
+  push:
+    branches: [ main ]
+  pull_request:
+    branches: [ main ]
+
+  workflow_dispatch:
+
+
+permissions:
+  contents: write
+
+jobs:
+  linting:
+    name: Linting
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@v2
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: 3.12
+          architecture: x64
+
+      - name: Install dependencies
+        run: |
+          pip install ".[tests]"
+
+      - name: Run code analysis (black, mypy, flake8, pylint)
+        run: |
+          make code-analysis
+
+  build:
+    strategy:
+      fail-fast: false
+      matrix:
+        # NOTE: macos-13 is a workaround for an issue with the latest version
+        os: [ubuntu-latest, macos-13, windows-latest]
+        python: [3.9, "3.10", 3.11, 3.12]
+    name: ${{ matrix.os }} Python ${{ matrix.python }}
+    runs-on: ${{ matrix.os }}
+    steps:
+      - uses: actions/checkout@v2
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: ${{ matrix.python }}
+          architecture: x64
+
+      - name: Install
+        run: |
+          # NOTE: pip, setuptools and wheel should be included with any python
+          # installation. It's being installed/upgraded here because the
+          # setup-python action is not including setuptools with Python 3.12
+          pip install --upgrade pip setuptools wheel
+          pip install .[tests,optional,docs]
+
+      - name: Test library
+        run: |
+          make test
+
+      - name: Upload coverage to codecov
+        uses: codecov/codecov-action@v4
+        with:
+          files: ./coverage.xml
+          fail_ci_if_error: false
+          token: ${{ secrets.CODECOV_TOKEN }}
+          slug: DataResponsibly/sharp
+
+      - name: Test Docs
+        run: |
+          cd doc
+          make html

xai_ranking/benchmarks/_hilw.py

Lines changed: 54 additions & 1 deletion

@@ -1,11 +1,40 @@
-import numpy as np
+"""
+Methods were adapted from the following paper:
+Jun Yuan and Aritra Dasgupta. 2023. A Human-in-the-loop Workflow for Multi-Factorial
+Sensitivity Analysis of Algorithmic Rankers. In Proceedings of the Workshop on
+Human-In-the-Loop Data Analytics (HILDA '23). Association for Computing Machinery,
+New York, NY, USA, Article 5, 1-5. https://doi.org/10.1145/3597465.3605221
+"""
 
+import numpy as np
 from xai_ranking.benchmarks.hilw import hilw_contributions, hilw_batch_contributions
 
 
 def human_in_the_loop_experiment(
     X, score_function, upper_bound=1, lower_bound=None, *args, **kwargs
 ):
+    """
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for the experiment.
+    score_function : callable
+        The function used to score the input data.
+    upper_bound : int, optional
+        The upper bound for the rank of the items (default is 1).
+    lower_bound : int, optional
+        The lower bound for the rank of the items. If None, it defaults to
+        the number of rows in X.
+    *args : tuple
+        Additional positional arguments to pass to the hilw_contributions function.
+    **kwargs : dict
+        Additional keyword arguments to pass to the hilw_contributions function.
+
+    Returns
+    -------
+    pandas.Series
+        The contributions of the features.
+    """
     if lower_bound is None:
         lower_bound = X.shape[0]
 
@@ -17,6 +46,30 @@ def human_in_the_loop_experiment(
 def human_in_the_loop_batch_experiment(
     X, score_function, upper_bound=1, lower_bound=None, random_state=42, *args, **kwargs
 ):
+    """
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for the experiment.
+    score_function : callable
+        The function used to score the input data.
+    upper_bound : int, optional
+        The upper bound for the rank of the items (default is 1).
+    lower_bound : int, optional
+        The lower bound for the rank of the items. If None, it defaults to
+        the number of rows in X.
+    random_state : int, optional
+        The seed used by the random number generator. Default is 42.
+    *args : tuple
+        Additional positional arguments to pass to the hilw_batch_contributions function.
+    **kwargs : dict
+        Additional keyword arguments to pass to the hilw_batch_contributions function.
+
+    Returns
+    -------
+    pandas.Series
+        The contributions of the features.
+    """
     batch_size = (
         np.ceil(0.1 * len(X)).astype(int)
         if "batch_size" not in kwargs

xai_ranking/benchmarks/_hre.py

Lines changed: 46 additions & 6 deletions

@@ -1,8 +1,4 @@
 """
-Local Explanations of Global Rankings: Insights for Competitive Rankings
-
-Hierarchical Ranking Explanation (HRE) framework.
-
 Anahideh, H., & Mohabbati-Kalejahi, N. (2022). Local explanations of global
 rankings: insights for competitive rankings. IEEE Access, 10, 30676-30693.
 
@@ -24,7 +20,28 @@ def hierarchical_ranking_explanation(
     X, score_function, model_type="OLS", s=5, *args, **kwargs
 ):
     """
-    `model_type` can be one of "DT", "LR", "OLS", "PLS".
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for which explanations are to be generated.
+    score_function : callable
+        A function that takes the input data X and returns scores.
+    model_type : str, optional
+        The type of model to use for feature importance calculation.
+        Can be one of "DT" (Decision Tree), "LR" (Logistic Regression),
+        "OLS" (Ordinary Least Squares), or "PLS" (Partial Least Squares).
+        Default is "OLS".
+    s : int, optional
+        A parameter for the feature importance function. Default is 5.
+    *args : tuple
+        Additional arguments to pass to the feature importance function.
+    **kwargs : dict
+        Additional keyword arguments to pass to the feature importance function.
+
+    Returns
+    -------
+    numpy.ndarray
+        An array of contributions for each observation in the input data.
     """
     # index = X.index
     X = X.copy().reset_index(drop=True)
@@ -52,7 +69,30 @@ def hierarchical_ranking_batch_explanation(
     **kwargs,
 ):
     """
-    `model_type` can be one of "DT", "LR", "OLS", "PLS".
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for which explanations are to be generated.
+    score_function : callable
+        A function that takes the input data X and returns scores.
+    model_type : str, optional
+        The type of model to use for feature importance calculation.
+        Can be one of "DT" (Decision Tree), "LR" (Logistic Regression),
+        "OLS" (Ordinary Least Squares), or "PLS" (Partial Least Squares).
+        Default is "OLS".
+    s : int, optional
+        A parameter for the feature importance function. Default is 5.
+    random_state : int, optional
+        The seed used by the random number generator. Default is 42.
+    *args : tuple
+        Additional arguments to pass to the feature importance function.
+    **kwargs : dict
+        Additional keyword arguments to pass to the feature importance function.
+
+    Returns
+    -------
+    numpy.ndarray
+        An array of contributions for each observation in the input data.
     """
     batch_size = (
         np.ceil(0.1 * len(X)).astype(int)
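
A hedged sketch of calling hierarchical_ranking_explanation (not from the commit): the data and scorer are invented, the private import path is an assumption, and `s` is left at its default since the diff documents it only as "a parameter for the feature importance function".

    import numpy as np
    import pandas as pd

    from xai_ranking.benchmarks._hre import hierarchical_ranking_explanation

    # Toy data: 40 observations with four features (invented for illustration).
    rng = np.random.default_rng(0)
    X = pd.DataFrame(rng.random((40, 4)), columns=["f1", "f2", "f3", "f4"])

    def score_function(data):
        # Hypothetical scorer: unweighted sum of the features, one score per row.
        return data.sum(axis=1)

    # model_type selects the surrogate: "DT", "LR", "OLS", or "PLS".
    contributions = hierarchical_ranking_explanation(X, score_function, model_type="OLS")
    print(contributions.shape)  # one row of feature contributions per observation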

xai_ranking/benchmarks/_lime.py

Lines changed: 32 additions & 2 deletions

@@ -5,7 +5,21 @@
 
 
 def lime_experiment(X, score_function, mode="regression", **kwargs):
     """
-    `mode` can be one of `[classification, regression]`.
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for which explanations are to be generated.
+    score_function : callable
+        The function used to score the data.
+    mode : str, default="regression"
+        The mode of the experiment. It can be either "classification" or "regression".
+    **kwargs : dict
+        Additional keyword arguments to be passed to the LIME explainer.
+
+    Returns
+    -------
+    lime_values : array-like
+        The LIME attributions for the input data `X`.
     """
     explainer = LimeTabular(
         score_function,
@@ -20,7 +34,23 @@ def lime_batch_experiment(
     X, score_function, mode="regression", random_state=42, **kwargs
 ):
     """
-    `mode` can be one of `[classification, regression]`.
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data for which explanations are to be generated.
+    score_function : callable
+        The function used to score the data.
+    mode : str, default="regression"
+        The mode of the experiment. It can be either "classification" or "regression".
+    random_state : int, optional
+        The seed used by the random number generator. Default is 42.
+    **kwargs : dict
+        Additional keyword arguments to be passed to the LIME explainer.
+
+    Returns
+    -------
+    lime_values : array-like
+        The LIME attributions for the input data `X`.
     """
     batch_size = (
         np.ceil(0.1 * len(X)).astype(int)
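
A sketch of lime_experiment usage under the same assumptions as above (invented data and scorer; private import path):

    import numpy as np
    import pandas as pd

    from xai_ranking.benchmarks._lime import lime_experiment

    # Toy data: 50 rows, three features (invented for illustration).
    rng = np.random.default_rng(0)
    X = pd.DataFrame(rng.random((50, 3)), columns=["a", "b", "c"])

    def score_function(data):
        # Hypothetical real-valued scorer, matching mode="regression".
        return np.asarray(data).mean(axis=1)

    lime_values = lime_experiment(X, score_function, mode="regression")

Per the docstring, mode="classification" would be used instead when the score function returns class probabilities.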

xai_ranking/benchmarks/_participation.py

Lines changed: 55 additions & 0 deletions

@@ -11,6 +11,23 @@
 
 
 def participation_score(X, ranks, top_k=10):
+    """
+    Computes the participation score for the top_k items.
+
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data.
+    ranks : pandas.Series
+        The ranks of the items.
+    top_k : int, optional
+        The number of top items to consider. Default is 10.
+
+    Returns
+    -------
+    pandas.Series
+        The participation score for each feature.
+    """
     mask = ranks <= top_k
     X_top = X[mask]
     # thresh = score_function(X_top).min()
@@ -20,6 +37,25 @@ def participation_score(X, ranks, top_k=10):
 
 
 def weighted_participation_score(X, ranks, weights, top_k=10):
+    """
+    Computes the weighted participation score for the top_k items.
+
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data.
+    ranks : pandas.Series
+        The ranks of the items.
+    weights : pandas.Series
+        The weights for each item.
+    top_k : int, optional
+        The number of top items to consider. Default is 10.
+
+    Returns
+    -------
+    pandas.Series
+        The weighted participation score for each feature.
+    """
     mask = ranks <= top_k
     X_top = X[mask].mul(weights)
     # thresh = score_function(X_top).min()
@@ -29,6 +65,25 @@ def weighted_participation_score(X, ranks, weights, top_k=10):
 
 
 def participation_experiment(X, score_function, top_k=10, weights=None):
+    """
+    Runs the participation score experiment.
+
+    Parameters
+    ----------
+    X : pandas.DataFrame
+        The input data.
+    score_function : callable
+        The function to compute scores.
+    top_k : int, optional
+        The number of top items to consider. Default is 10.
+    weights : pandas.Series, optional
+        The weights for each item. Default is None.
+
+    Returns
+    -------
+    pandas.Series
+        The participation score or weighted participation score for each feature.
+    """
     ranks = scores_to_ordering(score_function(X))
     if weights is not None:
         return weighted_participation_score(X, ranks, weights=weights, top_k=top_k)
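
A sketch of the documented experiment entry point (not from the commit); the data, scorer, and import path are assumptions for illustration:

    import numpy as np
    import pandas as pd

    from xai_ranking.benchmarks._participation import participation_experiment

    # Toy data: 50 items, three features (invented for illustration).
    rng = np.random.default_rng(0)
    X = pd.DataFrame(rng.random((50, 3)), columns=["a", "b", "c"])

    def score_function(data):
        # Hypothetical scorer: higher feature values rank an item higher.
        return data["a"] + data["b"] + data["c"]

    # Per-feature participation over the top-10 ranked items; passing a
    # `weights` argument would route to weighted_participation_score instead.
    scores = participation_experiment(X, score_function, top_k=10)
    print(scores)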

xai_ranking/benchmarks/_rank_lime.py

Lines changed: 16 additions & 0 deletions

@@ -4,6 +4,22 @@
 
 
 def rank_lime_experiment(X, score_function, **kwargs):
+    """
+    Parameters
+    ----------
+    X : array-like
+        The input data for which the attributions are to be computed.
+    score_function : callable
+        The model or function used to score the input data.
+    **kwargs : dict
+        Additional keyword arguments to be passed to the RankingLIME constructor.
+
+    Returns
+    -------
+    numpy.ndarray
+        A 2D array where each element represents the attribution score for
+        a specific feature in a specific document.
+    """
     xai = RankingLIME(
         background_data=np.array(X), original_model=score_function, **kwargs
     )
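
A sketch of rank_lime_experiment usage; the array shape, scorer, and import path are assumptions, and RankingLIME's constructor kwargs are left at their defaults since the diff does not show them:

    import numpy as np

    from xai_ranking.benchmarks._rank_lime import rank_lime_experiment

    # Toy data: 30 documents with 4 features each (invented for illustration).
    rng = np.random.default_rng(0)
    X = rng.random((30, 4))

    def score_function(data):
        # Hypothetical scorer producing one relevance score per document.
        return np.asarray(data).sum(axis=1)

    attributions = rank_lime_experiment(X, score_function)
    # attributions[i, j]: attribution of feature j for document i.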
