Add integration test #25

Merged · 7 commits · Oct 13, 2023
24 changes: 12 additions & 12 deletions .github/workflows/ci.yml
@@ -57,25 +57,25 @@ jobs:
       #----------------------------------------------
       # Install & configure poetry
       #----------------------------------------------
-      - name: Install Poetry
-        uses: snok/install-poetry@v1
-        with:
-          virtualenvs-create: true
-          virtualenvs-in-project: true
-          installer-parallel: true
+      - name: Install poetry
+        run: |
+          python -m pip install poetry==1.3.1
+
+      - name: Configure poetry
+        run: |
+          python -m poetry config virtualenvs.in-project true
       #----------------------------------------------
       # load cached venv if cache exists
       #----------------------------------------------
-      - name: Load cached venv
-        id: cached-poetry-dependencies
-        uses: actions/cache@v3
+      - name: Cache the virtualenv
+        uses: actions/cache@v2
         with:
-          path: .venv
-          key: venv-${{ runner.os }}-${{ steps.setup-python.outputs.python-version }}-${{ hashFiles('**/poetry.lock') }}
+          path: ./.venv
+          key: ${{ runner.os }}-venv-${{ hashFiles('**/poetry.lock') }}
       #----------------------------------------------
       # Install poetry dependencies
       #----------------------------------------------
-      - name: Install poetry dependencies
+      - name: Install dependencies
         run: |
           poetry install --with test
       #----------------------------------------------
4 changes: 2 additions & 2 deletions PyPI_README.md
@@ -132,14 +132,14 @@ https://github.com/EqualityAI/EqualityML.git
```
In the root directory of the project run the command:
```bash
-pip install -e '.[all]'
+poetry install
```

### Package Testing
To run the test suite for the EqualityML package, first install the test dependencies, then call pytest.

```sh
-pip install -e '.[tests]'
+poetry install --with test
pytest tests
```
### Quick Tour
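Whichever of the two install commands is used, a quick smoke check can confirm the package is importable before running the test suite. The snippet below is only illustrative and is not part of this PR:

```python
# Minimal post-install smoke check for the equalityml package.
import equalityml
from equalityml import FAIR  # FAIR is the only name exported via __all__

print(equalityml.__version__)  # expected to report 0.2.0 after this PR
print(FAIR)                    # confirms the fairness class resolves
```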
4 changes: 2 additions & 2 deletions README.md
@@ -123,14 +123,14 @@ https://github.com/EqualityAI/EqualityML.git
```
In the root directory of the project run the command:
```bash
-pip install -e '.[all]'
+poetry install
```

### Package Testing
To run the test suite for the EqualityML package, first install the test dependencies, then call pytest.

```sh
-pip install -e '.[tests]'
+poetry install --with test
pytest tests
```
### Quick Tour
3,678 changes: 3,678 additions & 0 deletions data/data_test.csv

Large diffs are not rendered by default.

8,582 changes: 8,582 additions & 0 deletions data/data_train.csv

Large diffs are not rendered by default.

2 changes: 1 addition & 1 deletion equalityml/__init__.py
@@ -6,5 +6,5 @@


__name__ = "equalityml"
-__version__ = '0.1.0a1'
+__version__ = '0.2.0'
__all__ = ["FAIR"]
397 changes: 188 additions & 209 deletions poetry.lock

Large diffs are not rendered by default.

4 changes: 2 additions & 2 deletions pyproject.toml
@@ -1,6 +1,6 @@
[tool.poetry]
name = "equalityml"
version = "0.1.9-a1"
version = "0.2.0"
description = "Algorithms for evaluating fairness metrics and mitigating unfairness in supervised machine learning"
authors = [
"Ben Brintz, Mark Zhang, James Ng, Janice Davis, Jared Hansen, Ji won Chang, João Granja, Rizwan Muhammad <support@equalityai.com>"
@@ -18,7 +18,7 @@ classifiers=[

[tool.poetry.dependencies]
python = "^3.8"
aif360 = "^0.5.0"
aif360-fork2 = "0.5.0"
BlackBoxAuditing = "^0.1.54"
dalex = "^1.5.0"
fairlearn = "^0.7.0"
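Because the dependency now points at the `aif360-fork2` distribution rather than upstream `aif360`, it can be worth verifying at runtime which distribution actually satisfied the pin. A minimal sketch using only the standard library; whether the fork still installs under the `aif360` import name is an assumption, not something the pin itself guarantees:

```python
from importlib import metadata

# The distribution name declared in pyproject.toml is "aif360-fork2".
print(metadata.version("aif360-fork2"))  # expected to match the 0.5.0 pin

try:
    import aif360  # assumption: the fork keeps the upstream import name
    print("aif360 imported from:", aif360.__file__)
except ImportError:
    print("no package importable as 'aif360'")
```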
17 changes: 0 additions & 17 deletions requirements.txt

This file was deleted.

50 changes: 0 additions & 50 deletions setup.py

This file was deleted.

183 changes: 183 additions & 0 deletions tests/integration_test_equalityml.py
@@ -0,0 +1,183 @@
import pandas as pd
import os
from sklearn.metrics import accuracy_score, roc_auc_score
from sklearn.ensemble import RandomForestClassifier

from equalityml.fair import FAIR
from equalityml.stats import paired_ttest
from equalityml.threshold import discrimination_threshold

CURRENT_PATH = os.path.dirname(os.path.abspath(__file__))
PACKAGE_PATH = os.path.abspath(os.path.join(CURRENT_PATH, os.pardir))

if __name__ == "__main__":

# First train a Machine Learning estimator with the training data
random_state = 42

# Read training and testing data.
target_var = "HOS"
protected_variable = 'RACERETH'
train_path = os.path.join(PACKAGE_PATH, 'data', 'data_train.csv')
training_data = pd.read_csv(train_path)
X_train = training_data.drop(columns=target_var)
y_train = training_data[target_var]
test_path = os.path.join(PACKAGE_PATH, 'data', 'data_test.csv')
testing_data = pd.read_csv(test_path)
X_test = testing_data.drop(columns=target_var)
y_test = testing_data[target_var]

# Train a machine learning estimator
mdl_clf_1 = RandomForestClassifier(random_state=random_state)
mdl_clf_1.fit(X_train, y_train)

# Compute Fairness score for "statistical_parity_ratio"
fair_object = FAIR(ml_model=mdl_clf_1,
training_data=training_data,
testing_data=testing_data,
target_variable=target_var,
protected_variable=protected_variable,
privileged_class=1,
random_seed=random_state)

fair_object.print_fairness_metrics()
for metric_name in fair_object.fairness_metrics_list:
print(f"{metric_name} - {fair_object.fairness_metric(metric_name)}")

metric_name = "statistical_parity_ratio"
prev_fairness_metric = fair_object.fairness_metric(metric_name)

# Compare bias mitigation results
comparison_df = fair_object.compare_mitigation_methods(show=False)
print(comparison_df)

fair_object.print_bias_mitigation_methods()
mitigation_method = "resampling-preferential"
# "resampling-uniform", "resampling", "resampling-preferential", "correlation-remover", "reweighing",
# "disparate-impact-remover"

# mitigation_res = fair_object.bias_mitigation(mitigation_method=mitigation_method)
mdl_clf_2 = fair_object.model_mitigation(mitigation_method)

# Estimate the prediction probabilities and predicted classes of the original model on the testing data
pred_class = mdl_clf_1.predict(X_test)
pred_prob = mdl_clf_1.predict_proba(X_test)
pred_prob = pred_prob[:, 1] # keep probabilities for positive outcomes only

# Evaluate some scores
prev_auc = roc_auc_score(y_test, pred_prob) # Area under a curve
prev_accuracy = accuracy_score(y_test, pred_class) # classification accuracy

pred_class = mdl_clf_2.predict(X_test)
pred_prob = mdl_clf_2.predict_proba(X_test)
pred_prob = pred_prob[:, 1] # keep probabilities for positive outcomes only

# re-evaluate the scores
new_auc = roc_auc_score(y_test, pred_prob) # Area under a curve
print(f"Previous AUC = {prev_auc} and New AUC = {new_auc}")

new_accuracy = accuracy_score(y_test, pred_class) # classification accuracy
print(f"Previous accuracy = {prev_accuracy} and New accuracy = {new_accuracy}")

fair_object.update_classifier(mdl_clf_2)
new_fairness_metric = fair_object.fairness_metric(metric_name)

print(
f"Previous Fairness Score = {prev_fairness_metric:.2f} and New Fairness Score = {new_fairness_metric:.2f}")

data = pd.concat([training_data, testing_data])
X = data.drop(columns=target_var)
y = data[target_var]
X_test = testing_data.drop(columns=target_var)
y_test = testing_data[target_var]

# Paired ttest
results = paired_ttest(mdl_clf_1,
X_test,
y_test,
model_2=mdl_clf_2,
method="mcnemar",
threshold=0.5)
print("Mcnemar result (chi2, p) = ", results)

results = paired_ttest(mdl_clf_1,
X,
y,
model_2=mdl_clf_2,
method="5x2cv",
random_seed=random_state)
print("5x2cv result (chi2, p) = ", results)

# Paired t test based on Fairness metric
results = paired_ttest(mdl_clf_1,
X,
y,
model_2=mdl_clf_2,
method="5x2cv",
fair_object=fair_object,
mitigation_method=mitigation_method,
scoring=metric_name,
random_seed=random_state)
print("5x2cv fairness result by scoring fairness metric (chi2, p) = ", results)

results = paired_ttest(mdl_clf_1,
X,
y,
method="5x2cv",
fair_object=fair_object,
mitigation_method=mitigation_method,
scoring=metric_name,
compute_discrimination_threshold=True,
decision_maker=(metric_name, 'max'),
random_seed=random_state)
print("5x2cv fairness result by scoring fairness metric (chi2, p) = ", results)

# Paired t test based on accuracy
results = paired_ttest(mdl_clf_1,
X,
y,
method="5x2cv",
fair_object=fair_object,
mitigation_method=mitigation_method,
scoring="accuracy",
compute_discrimination_threshold=True,
decision_maker=("accuracy", 'max'),
random_seed=random_state)
print("5x2cv fairness result by scoring accuracy (chi2, p) = ", results)

# Paired t test based on accuracy
results = paired_ttest(mdl_clf_1,
X,
y,
method="5x2cv",
fair_object=fair_object,
mitigation_method=mitigation_method,
scoring="accuracy",
random_seed=random_state)
print("5x2cv fairness result by scoring accuracy (chi2, p) = ", results)

# Discrimination Threshold
dt = discrimination_threshold(mdl_clf_1,
X,
y,
fair_object=fair_object,
decision_maker=['f1', 'max'],
metrics=['f1', 'cost', metric_name],
utility_costs=[1, -1, -0.1, 0.1],
show=True)
print(f"Discrimination Threshold {dt}")

X_test = testing_data.drop(columns=target_var)
y_test = testing_data[target_var]
# Discrimination Threshold
dt = discrimination_threshold(mdl_clf_2,
X_test,
y_test,
fair_object=fair_object,
decision_maker=['f1', 'max'],
metrics=['f1', 'cost', metric_name],
utility_costs=[1, -1, -0.1, 0.1],
show=True,
model_training=False)
print(f"Discrimination Threshold {dt}")