humancompatible
diff --git a/‎.github/workflows/setup.yml‎
Lines changed: 93 additions & 0 deletions b/‎.github/workflows/setup.yml‎
Lines changed: 93 additions & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 4 additions & 0 deletions b/‎.gitignore‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 68 additions & 11 deletions b/‎README.md‎
Lines changed: 68 additions & 11 deletions
diff --git a/‎constraint_demo.ipynb‎
Lines changed: 41 additions & 0 deletions b/‎constraint_demo.ipynb‎
Lines changed: 41 additions & 0 deletions
diff --git a/‎experiments/__init__.py‎ b/‎experiments/__init__.py‎
@@ -0,0 +1,93 @@
+# Runs on pushes and pull requests that target the main and neurips branches.
+name: Setup check
+
+on:
+  push:
+    branches:
+      - main
+      - neurips
+  pull_request:
+    branches:
+      - main
+      - neurips
+
+
+jobs:
+  # Installs the package on Ubuntu and invokes every algorithm once via
+  # experiments/run_folktables.py.
+  run-on-linux:
+    name: Setup on linux
+    runs-on: ubuntu-latest
+    strategy:
+      # Keep other matrix entries running if one fails.
+      fail-fast: false
+      matrix:
+        # Quoted so the version stays a string (an unquoted 3.10 would parse as 3.1).
+        python-version: ["3.11"]
+
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      # v5 runs on a supported Node runtime; v3 depended on the deprecated Node 16.
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        python -m pip install flake8 pytest
+        pip install -r requirements.txt
+        pip install -e .
+    - name: Run algorithms
+      # Small n_runs / run_maxtime overrides, presumably to keep the check quick.
+      run: |
+        python experiments/run_folktables.py alg=sslalm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=ghost n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=alm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=sgd n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=fairret n_runs=2 run_maxtime=2
+
+  # Installs the package on Windows and invokes every algorithm once via
+  # experiments/run_folktables.py.
+  run-on-windows:
+    name: Setup on windows
+    runs-on: windows-latest
+    # The default Windows shell (PowerShell) only reports the exit code of the
+    # last native command in a multi-line script, so a failing earlier command
+    # would be masked. Bash is started in fail-fast mode and aborts the step on
+    # the first failing command.
+    defaults:
+      run:
+        shell: bash
+    strategy:
+      # Keep other matrix entries running if one fails.
+      fail-fast: false
+      matrix:
+        # Quoted so the version stays a string (an unquoted 3.10 would parse as 3.1).
+        python-version: ["3.11"]
+
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      # v5 runs on a supported Node runtime; v3 depended on the deprecated Node 16.
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        python -m pip install flake8 pytest
+        pip install -r requirements.txt
+        pip install -e .
+    - name: Run algorithms
+      # Small n_runs / run_maxtime overrides, presumably to keep the check quick.
+      run: |
+        python experiments/run_folktables.py alg=sslalm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=ghost n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=alm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=sgd n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=fairret n_runs=2 run_maxtime=2
+
+  # Installs the package on macOS and invokes every algorithm once via
+  # experiments/run_folktables.py.
+  run-on-macos:
+    name: Setup on macos
+    runs-on: macos-latest
+    strategy:
+      # Keep other matrix entries running if one fails.
+      fail-fast: false
+      matrix:
+        # Quoted so the version stays a string (an unquoted 3.10 would parse as 3.1).
+        python-version: ["3.11"]
+
+    steps:
+    - uses: actions/checkout@v4
+    - name: Set up Python ${{ matrix.python-version }}
+      # v5 runs on a supported Node runtime; v3 depended on the deprecated Node 16.
+      uses: actions/setup-python@v5
+      with:
+        python-version: ${{ matrix.python-version }}
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        python -m pip install flake8 pytest
+        pip install -r requirements.txt
+        pip install -e .
+    - name: Run algorithms
+      # Small n_runs / run_maxtime overrides, presumably to keep the check quick.
+      run: |
+        python experiments/run_folktables.py alg=sslalm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=ghost n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=alm n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=sgd n_runs=2 run_maxtime=2
+        python experiments/run_folktables.py alg=fairret n_runs=2 run_maxtime=2
@@ -3,9 +3,13 @@
 experiments/utils/raw_data/
 experiments/utils/exp_results
 experiments/utils/saved_models
+experiments/outputs
 data/
+examples/data
+experiments/data
 .vscode/
 plots/
+outputs/
 
 
 # Byte-compiled / optimized / DLL files
 
@@ -1,6 +1,6 @@
 # Benchmarking Stochastic Approximation Algorithms for Fairness-Constrained Training of Deep Neural Networks
 
-[![License](https://img.shields.io/badge/License-Apache_2.0-blue.svg)](https://opensource.org/licenses/Apache-2.0)
+[![License](https://img.shields.io/badge/License-Apache_2.0-blue.svg)](https://opensource.org/licenses/Apache-2.0) [![Setup](https://github.com/humancompatible/train/actions/workflows/setup.yml/badge.svg)](https://github.com/humancompatible/train/actions/workflows/setup.yml)
 
 This repository provides a tool to compare stochastic-constrained stochastic optimization algorithms on a _fair learning_ task.
 
@@ -16,19 +16,33 @@ requests, please file a
 [Github issue](https://github.com/humancompatible/train/issues). 
 
 ## Basic installation instructions
-The code requires Python version ```3.10```.
+The code requires Python version ```3.11```.
 
 1. Create a virtual environment
+
+**bash** (Linux/macOS)
 ```
-python3.10 -m venv fairbenchenv
+python3.11 -m venv fairbenchenv
 source fairbenchenv/bin/activate
 ```
-2. Install from source.
+**cmd** (Windows)
+```
+python -m venv fairbenchenv
+fairbenchenv\Scripts\activate.bat
+```
+2. Install from source (*as an editable package*).
 ```
 git clone https://github.com/humancompatible/train.git
 cd train
 pip install -r requirements.txt
+pip install -e .
 ```
+__Warning__: it is recommended to use Stochastic Ghost with the MKL-accelerated version of the scipy package; to install it, run
+
+```pip install --force-reinstall -i https://software.repos.intel.com/python/pypi scipy```
+
+after installing the packages from `requirements.txt`; otherwise, the algorithm will run more slowly. However, this is not supported on macOS and may fail on some Windows devices.
+
 <!-- Install via pip -->
 <!-- ``` -->
 <!-- pip install folktables -->
@@ -37,24 +51,62 @@ pip install -r requirements.txt
 ## Reproducing the Benchmark
 
 ### Running the algorithms
-To reproduce the experiments in the paper, run ```experiments/run_folktables.py``` with the dataset name, algorithm name and hyperparameters as command line arguments, like below:
-```run_folktables.py --algorithm sslalm --state OK --task income --constraint loss --loss_bound 0.005 --num_exp 10 --time 30 --batch_size 8 -mu 2. -rho 1. -tau 0.01 -eta 5e-2 -beta 0.5```
-This will start 10 runs of the SSL-ALM algorithm, 30 seconds each, and save the model and the results in the ```experiments/utils/saved_models``` and ```experiments/utils/exp_results``` folders.
 
 The benchmark comprises the following algorithms:
 - Stochastic Ghost [[2]](#2),
 - SSL-ALM [[3]](#3),
 - Stochastic Switching Subgradient [[4]](#4).
 
+To reproduce the experiments of the paper, run the following:
+```bash
+cd experiments
+python run_folktables.py data=folktables alg=sslalm
+python run_folktables.py data=folktables alg=alm
+python run_folktables.py data=folktables alg=ghost
+python run_folktables.py data=folktables alg=ssg
+python run_folktables.py data=folktables alg=sgd     # baseline, no fairness
+python run_folktables.py data=folktables alg=fairret # baseline, fairness with regularizer
+```
+Each command will start 10 runs of the selected algorithm (`alg`), 30 seconds each.
+The results will be saved to `experiments/utils/saved_models` and `experiments/utils/exp_results`.
+<!-- In the repository, we include the configuration needed to reproduce the experiments in the paper. To do so, go to `experiments` and run `python run_folktables.py data=folktables alg=sslalm`. -->
+<!-- Repeat for the other algorithms by changing the `alg` parameter. -->
+
+This repository uses [Hydra](https://hydra.cc/) to manage parameters; see `experiments/conf` for configuration files. 
+* To change the parameters of the experiment, such as the number of runs for each algorithm, the run time, or the dataset used (*note: only Folktables is supported for now*), use `experiment.yaml`. 
+* To change the dataset settings - such as file location - or do dataset-specific adjustments, use `data/{dataset_name}.yaml`
+* To change algorithm hyperparameters, use `alg/{algorithm_name}.yaml`.
+* To change constraint hyperparameters, use `constraint/{constraint_name}.yaml`
+
+<!-- ; it is installed as one of the dependencies. -->
+<!-- To learn more about using Hydra, please check out the [official tutorial](https://hydra.cc/docs/tutorials/basic/your_first_app). -->
+
 ### Producing plots
 Plots and tables like the ones in the paper can be produced using two notebooks: `experiments/algo_plots.ipynb` contains the convergence plots, and `experiments/model_plots.ipynb` contains all the others.
 
-**Warning**: As of 16/05, Folktables seems to be unable to connect to the American census servers. This means that downloading the dataset through the code is not possible. Manual download requires two files: the .csv dataset, at https://www2.census.gov/programs-surveys/acs/data/pums/`{year}`/`{horizon}`, and the corresponding .csv description, at https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/; use the flag ```--no-download```. By default, the files will be placed in `experiments/utils/raw_data/{task}/{year}/{horizon}` (e.g. `experiments/utils/raw_data/income/2018/1-Year/{filename}.csv`). A custom path can be specified with the --data_path argument, but it has to have the form `*/{year}/{horizon}/`.
+## Extending the benchmark
 
-## Extending the benchmark 
+**To add a new algorithm**, you can subclass the ```Algorithm``` class. Before you can run it, you will need to follow these steps:
+1. In the `experiments/conf/alg` folder, add a `.yaml` file with `import_name: {ClassName}` (so the code knows which algorithm to import) and the desired keyword parameter values under `params`:
 
-To add a different constraint formulation, you can use the ```FairnessConstraint``` class by passing your callable function to the constructor as ```fn```.
-To add a new algorithm, you can subclass the ```Algorithm``` class.
+```
+import_name: ClassName
+
+params:
+  param_name_1: value
+  param_name_2: value
+```
+
+2. In `src/algorithms/__init__.py`, add `from .{filename} import {ClassName}` (so the code is able to import it).
+
+Now you can run the algorithm by executing `python run_folktables.py data=folktables alg={yaml_file_name}`, or by changing the experiment config files.
+
+**To add a different constraint formulation**, you can use the `FairnessConstraint` class by passing your callable function to the constructor as `fn`. If you use `run_folktables.py`, you can add a new constraint function by following these steps:
+
+1. Add a `.yaml` file with `import_name: {FunctionName}`, along with the desired batch size and bound (*to be reworked for more generality*), to the `experiments/conf/constraint` folder
+2. Import it in `src/constraints/__init__.py` as in step 2 above.
+
+Now, to run the code with your constraint, use the `constraint` field in the main config.
 
 ## License and terms of use
 
@@ -80,6 +132,11 @@ For more information, see https://www.census.gov/data/developers/about/terms-of-
 <!-- } -->
 <!-- ``` -->
 
+## Future work
+
+- Add support for fairness constraints with more than 2 subgroups (limitation of the code, not of the algorithms)
+- Add support for datasets besides Folktables
+- Move towards a more PyTorch-like API for optimizers
 
 ## References
 
 
@@ -0,0 +1,41 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "1efc20cc",
+   "metadata": {},
+   "source": [
+    "This notebook will demonstrate the `FairnessConstraint` class and how you can use it to **add a constraint formulation**."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "58feeb34",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "humancompatible",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.12"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}