JuliaTrustworthyAI
diff --git a/‎.github/workflows/CI.yml‎
Lines changed: 1 addition & 0 deletions b/‎.github/workflows/CI.yml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎.gitignore‎
Lines changed: 6 additions & 0 deletions b/‎.gitignore‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎Artifacts.toml‎
Lines changed: 7 additions & 7 deletions b/‎Artifacts.toml‎
Lines changed: 7 additions & 7 deletions
diff --git a/‎Project.toml‎
100755 → 100644
Lines changed: 9 additions & 17 deletions b/‎Project.toml‎
100755 → 100644
Lines changed: 9 additions & 17 deletions
diff --git a/‎README.md‎
Lines changed: 49 additions & 16 deletions b/‎README.md‎
Lines changed: 49 additions & 16 deletions
diff --git a/‎README.qmd‎
Lines changed: 22 additions & 32 deletions b/‎README.qmd‎
Lines changed: 22 additions & 32 deletions
@@ -20,6 +20,7 @@ jobs:
         version:
           - '1.6'
           - '1.7'
+          - '1.8'
           - 'nightly'
         os:
           - ubuntu-latest
 
@@ -28,10 +28,16 @@ docs/site/
 # committed for packages, but should be committed for applications that require a static
 # environment.
 Manifest.toml
+# ignore Artifacts.toml due to double-blind review:
+Artifacts.toml
 
 /.quarto/
 
 /dev/artifacts/upload
 /dev/python
 .DS_Store
 .Rproj.user
+
+.luarc.json
+
+/.luarc.json
@@ -1,31 +1,31 @@
 [".DS_Store"]
-git-tree-sha1 = "d2fe43d5d50dd19de3c047c6b8be8256c79b7f6d"
+git-tree-sha1 = "b700008b7e45ef6e33455876df46047d9db5080f"
 lazy = true
 
     [[".DS_Store".download]]
-    sha256 = "80caa50f9515c0ede96213ccfaf91fe77bb92e9a509541265410515f180a59f3"
+    sha256 = "adbcc22b0124d0f87d2f00d0af6c49f91c579cb00262605d46c64526c422b369"
     url = "https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/download/artifacts/.DS_Store.tar.gz"
 
 [data]
 git-tree-sha1 = "19e4434c5cec37c302c4fb8a6058b1a685a436ba"
 lazy = true
 
     [[data.download]]
-    sha256 = "a707dbee173dfae97387a0ef0cdf628992987bcd65c47a7e9116f8de9909e869"
+    sha256 = "eedef8395f29d70eb942f85e5ff4c8a3b2cfe9749aaec36c0c631666b1746b9b"
     url = "https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/download/artifacts/data.tar.gz"
 
 [output]
-git-tree-sha1 = "b7827b37cb256c6ed6a5168b235b814b934d91fd"
+git-tree-sha1 = "ac2d6dbcc081bc5b7a4c323c1a2176e7768a5080"
 lazy = true
 
     [[output.download]]
-    sha256 = "b000d10d55a9e6a83ca941a77c39e433ea1a77e688813dfb91d5eb0874cff31b"
+    sha256 = "0c226b114a1f67a065332d16c224e488ec35149f169a278afac2355ba7dac87d"
     url = "https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/download/artifacts/output.tar.gz"
 
 [www]
-git-tree-sha1 = "9a77a16ed5ef3cc433f8ea914fd3b4272f0788ff"
+git-tree-sha1 = "a156f4aeffd1921c2ba088d6b3ebdbb9bc9cf2ec"
 lazy = true
 
     [[www.download]]
-    sha256 = "0b0eb2ab3c946b96b93f90d9e8c3104d3c6cf3d88f2ee344d4656fd693d4dced"
+    sha256 = "8b2f9eb919fa7690fdc31c042419c9b04313edc0616444328b3dcf3243a767e3"
     url = "https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/download/artifacts/www.tar.gz"
@@ -1,54 +1,46 @@
 name = "AlgorithmicRecourseDynamics"
 uuid = "3d1ede72-abb8-4340-bf8e-2ae06849b5ec"
-authors = ["Anonymous"]
+authors = ["Patrick Altmeyer"]
 version = "0.1.0"
 
 [deps]
 CSV = "336ed68f-0bac-5ca0-87d4-7b16caf5d00b"
 CounterfactualExplanations = "2f13d31b-18db-44c1-bc43-ebaf2cff0be0"
 DataFrames = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0"
 Distances = "b4f34e82-e78d-54a5-968a-f98e89d6e8f7"
-FileIO = "5789e2e9-d7fb-5bc7-8068-2c6fae9b9549"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
 Images = "916415d5-f1e6-5110-898d-aaa5f9f070e0"
 KernelFunctions = "ec8451be-7e33-11e9-00cf-bbf324bd1392"
-LaplaceRedux = "c52c1a26-f7c5-402b-80be-ba1e638ad478"
+LazyArtifacts = "4af54fe1-eca0-43a8-85a7-787d91b784e3"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
 Logging = "56ddb016-857b-54e1-b83d-db4d58db5568"
-MLJ = "add582a8-e3ab-11e8-2d5e-e98b27df1bc7"
+MLJBase = "a7f614a8-145f-11e9-1d2a-a57a1082229d"
 MLUtils = "f1d291b0-491e-4a28-83b9-f70985020b54"
 Parameters = "d96e819e-fc66-5662-9728-84c9c7592b0a"
-Pkg = "44cfe95a-1eb2-52ea-b672-e2afdf69b78f"
-PlotThemes = "ccf2f8ad-2431-5c83-bf29-c5338b663b6a"
 Plots = "91a5bcdd-55d7-5caf-9e0b-520d859cae80"
 ProgressMeter = "92933f4c-e287-5a05-a399-4b506db050ca"
 RCall = "6f49c342-dc21-5d91-9882-a32aef131414"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 Serialization = "9e88b42a-f829-5b0c-bbe9-9e923198166b"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
-Zygote = "e88e6eb3-aa80-5325-afca-941959d7151f"
 
 [compat]
+CounterfactualExplanations = "0.1.4"
 CSV = "0.10"
-CounterfactualExplanations = "0.1"
 DataFrames = "1"
 Distances = "0.10"
-FileIO = "1"
 Flux = "0.13"
 Images = "0.25"
 KernelFunctions = "0.10"
-LaplaceRedux = "0.1"
-MLJ = "0.18, 0.19"
-MLUtils = "0.2, 0.3"
+MLJBase = "0.21.3"
+MLUtils = "0.3.1"
 Parameters = "0.12"
-PlotThemes = "3"
-Plots = "1"
+Plots = "1.37.2"
 ProgressMeter = "1"
-RCall = "0.13"
+RCall = "0.13.14"
 StatsBase = "0.33"
-Zygote = "0.6"
-julia = "1.6"
+julia = "1.6, 1.7, 1.8"
 
 [extras]
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 
@@ -1,30 +1,63 @@
 
+[![Stable](https://img.shields.io/badge/docs-stable-blue.svg)](https://pat-alt.github.io/AlgorithmicRecourseDynamics.jl/stable) [![Dev](https://img.shields.io/badge/docs-dev-blue.svg)](https://pat-alt.github.io/AlgorithmicRecourseDynamics.jl/dev) [![Build Status](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/actions/workflows/CI.yml?query=branch%3Amain) [![Coverage](https://codecov.io/gh/pat-alt/AlgorithmicRecourseDynamics.jl/branch/main/graph/badge.svg)](https://codecov.io/gh/pat-alt/AlgorithmicRecourseDynamics.jl) [![Code Style: Blue](https://img.shields.io/badge/code%20style-blue-4495d1.svg)](https://github.com/invenia/BlueStyle) [![ColPrac: Contributor’s Guide on Collaborative Practices for Community Packages](https://img.shields.io/badge/ColPrac-Contributor's%20Guide-blueviolet.png)](https://github.com/SciML/ColPrac) [![Twitter Badge](https://img.shields.io/twitter/url/https/twitter.com/paltmey.svg?style=social&label=Follow%20%40paltmey)](https://twitter.com/paltmey)
+
 # AlgorithmicRecourseDynamics
 
-<!-- [![Stable](https://img.shields.io/badge/docs-stable-blue.svg)](https://pat-alt.github.io/CounterfactualExplanations.jl/stable) -->
-<!-- [![Dev](https://img.shields.io/badge/docs-dev-blue.svg)](https://pat-alt.github.io/CounterfactualExplanations.jl/dev) -->
+`AlgorithmicRecourseDynamics.jl` is a small package for modeling Algorithmic Recourse Dynamics. It builds on `CounterfactualExplanations`, a package for generating counterfactual explanations.
+
+## Basic Usage
+
+### Data and Model
+
+``` julia
+N = 1000
+xmax = 2
+X, ys = make_blobs(
+    N, 2; 
+    centers=2, as_table=false, center_box=(-xmax => xmax), cluster_std=0.1
+)
+ys .= ys.==2
+X = X'
+counterfactual_data = CounterfactualData(X,ys')
+```
 
-[![Build Status](https://github.com/pat-alt/CounterfactualExplanations.jl/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/pat-alt/CounterfactualExplanations.jl/actions/workflows/CI.yml?query=branch%3Amain) <!-- [![Coverage](https://codecov.io/gh/pat-alt/CounterfactualExplanations.jl/branch/main/graph/badge.svg)](https://codecov.io/gh/pat-alt/CounterfactualExplanations.jl) -->
+``` julia
+n_epochs = 100
+model = Chain(Dense(2,1))
+mod = FluxModel(model)
 
-`AlgorithmicRecourseDynamics.jl` is a Julia package for modelling Algorithmic Recourse Dynamics.
+generator = GenericGenerator()
+```
 
-## Research Paper 📝
+``` julia
+data_train, data_test = Data.train_test_split(counterfactual_data)
+Models.train(mod, data_train; n_epochs=n_epochs)
+plt_original = plot(mod, counterfactual_data; zoom=0, colorbar=false)
+display(plt_original)
+```
 
-**Note** ⚠: You are on the `#original-paper` branch of `AlgorithmicRecourseDynamics.jl`. This branch is a static artifact corresponding to the state of the package at the time the paper was first published. It can be used to replicate the original findings of the paper. For an up-to-date version of the package, please switch to the [`#main`](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl) branch.
+![](README_files/figure-commonmark/cell-5-output-1.svg)
 
-## At a Glance
+### Simulation
 
-The paper titled **Endogenous Macrodynamics in Algorithmic Recourse** is currently under review and not yet published. You can find a preprint along with other resources right here on this branch of the repository:
+``` julia
+models = Dict(:mymodel => mod)
+generators = Dict(:wachter => generator)
+experiment = set_up_experiment(data_train, data_test, models, generators)
+```
 
--   [Paper](paper/paper.pdf)
--   [Notebooks](dev/notebooks/)
--   [Supplementary Appendix](build/dev/notebooks/appendix.html) (download the HTML and view in browser)
--   [Artifacts](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/tag/artifacts) (including data and experimental results)
+``` julia
+run!(experiment)
+```
 
-In this work we investigate what happens if Algorithmic Recourse is actually implemented by a large number of individuals. The chart below illustrates what we mean by Endogenous Macrodynamics in Algorithmic Recourse: (a) we have a simple linear classifier trained for binary classification where samples from the negative class ($y=0$) are marked in blue and samples of the positive class ($y=1$) are marked in orange; (b) the implementation of AR for a random subset of individuals leads to a noticeable domain shift; (c) as the classifier is retrained we observe a corresponding model shift; (d) as this process is repeated, the decision boundary moves away from the target class.
+``` julia
+new_data = experiment.recourse_systems[1][1].data
+new_model = experiment.recourse_systems[1][1].model
+plt_original = plot(new_model, new_data; zoom=0, colorbar=false)
+```
 
-![](paper/www/poc.png)
+![](README_files/figure-commonmark/cell-8-output-1.svg)
 
-## Paper Abstract
+## Related Research Paper 📝
 
-Existing work on Counterfactual Explanations (CE) and Algorithmic Recourse (AR) has largely been limited to the static setting and focused on single individuals: given some estimated model the goal is to find valid counterfactuals for individual instances that fulfill various desiderata. The ability of such counterfactuals to handle dynamics like data and model drift remains a largely unexplored research challenge at this point. There has also been surprisingly little work on the related question of how the actual implementation of recourse by one individual may affect other individuals. Through this work we aim to close that gap by systematizing and extending existing knowledge. We first show that many of the existing methodologies can be collectively described by a generalized framework. We then argue that the existing framework fails to account for a hidden external cost of recourse, that only reveals itself when studying the endogenous dynamics of recourse at the group level. Through simulation experiments involving various state-of-the-art counterfactual generators and several benchmark datasets, we generate large numbers of counterfactuals and study the resulting domain and model shifts. We find that the induced shifts are substantial enough to likely impede the applicability of Algorithmic Recourse in situations that involve competition for scarce resources. Fortunately, we find various potential mitigation strategies that can be used in combination with existing approaches. Our simulation framework for studying recourse dynamics is fast and open-sourced.
+The package was developed for a research project that investigates the dynamics of various counterfactual generators.
@@ -1,38 +1,28 @@
 ---
 format: 
-    gfm:
-        wrap: none
+  commonmark:
+    variant: -raw_html
+    wrap: none
+execute: 
+  freeze: auto
+  echo: true
+  eval: true
+  output: false
+crossref:
+  fig-prefix: Figure
+  tbl-prefix: Table
+bibliography: bib.bib
+jupyter: julia-1.8
 ---
 
-# AlgorithmicRecourseDynamics
-
-<!-- [![Stable](https://img.shields.io/badge/docs-stable-blue.svg)](https://pat-alt.github.io/CounterfactualExplanations.jl/stable) -->
-<!-- [![Dev](https://img.shields.io/badge/docs-dev-blue.svg)](https://pat-alt.github.io/CounterfactualExplanations.jl/dev) -->
-[![Build Status](https://github.com/pat-alt/CounterfactualExplanations.jl/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/pat-alt/CounterfactualExplanations.jl/actions/workflows/CI.yml?query=branch%3Amain)
-<!-- [![Coverage](https://codecov.io/gh/pat-alt/CounterfactualExplanations.jl/branch/main/graph/badge.svg)](https://codecov.io/gh/pat-alt/CounterfactualExplanations.jl) -->
-
-`AlgorithmicRecourseDynamics.jl` is a Julia package for modelling Algorithmic Recourse Dynamics.
-
-## Research Paper 📝
-
-**Note** ⚠: You are on the `#original-paper` branch of `AlgorithmicRecourseDynamics.jl`. This branch is a static artifact corresponding to the state of the package at the time the paper was first published. It can be used to replicate the original findings of the paper. For an up-to-date version of the package, please switch to the [`#main`](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl) branch.
-
-## At a Glance
+[![Stable](https://img.shields.io/badge/docs-stable-blue.svg)](https://pat-alt.github.io/AlgorithmicRecourseDynamics.jl/stable) 
+[![Dev](https://img.shields.io/badge/docs-dev-blue.svg)](https://pat-alt.github.io/AlgorithmicRecourseDynamics.jl/dev) 
+[![Build Status](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/actions/workflows/CI.yml/badge.svg?branch=main)](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/actions/workflows/CI.yml?query=branch%3Amain) 
+[![Coverage](https://codecov.io/gh/pat-alt/AlgorithmicRecourseDynamics.jl/branch/main/graph/badge.svg)](https://codecov.io/gh/pat-alt/AlgorithmicRecourseDynamics.jl) 
+[![Code Style: Blue](https://img.shields.io/badge/code%20style-blue-4495d1.svg)](https://github.com/invenia/BlueStyle) 
+[![ColPrac: Contributor’s Guide on Collaborative Practices for Community Packages](https://img.shields.io/badge/ColPrac-Contributor's%20Guide-blueviolet.png)](https://github.com/SciML/ColPrac) 
+[![Twitter Badge](https://img.shields.io/twitter/url/https/twitter.com/paltmey.svg?style=social&label=Follow%20%40paltmey)](https://twitter.com/paltmey)
 
-The paper titled **Endogenous Macrodynamics in Algorithmic Recourse** is currently under review and not yet published. You can find
-a preprint along with other resources right here on this branch of the
-repository:
-
-- [Paper](paper/paper.pdf)
-- [Notebooks](dev/notebooks/)
-- [Supplementary Appendix](build/dev/notebooks/appendix.html) (download the HTML and view in browser)
-- [Artifacts](https://github.com/pat-alt/AlgorithmicRecourseDynamics.jl/releases/tag/artifacts) (including data and experimental results)
-
-In this work we investigate what happens if Algorithmic Recourse is actually implemented by a large number of individuals. The chart below illustrates what we mean by Endogenous Macrodynamics in Algorithmic Recourse: (a) we have a simple linear classifier trained for binary classification where samples from the negative class ($y=0$) are marked in blue and samples of the positive class ($y=1$) are marked in orange; (b) the implementation of AR for a random subset of individuals leads to a noticeable domain shift; (c) as the classifier is retrained we observe a corresponding model shift; (d) as this process is repeated, the decision boundary moves away from the target class.
-
-![](paper/www/poc.png)
-
-## Paper Abstract
-
-Existing work on Counterfactual Explanations (CE) and Algorithmic Recourse (AR) has largely been limited to the static setting and focused on single individuals: given some estimated model the goal is to find valid counterfactuals for individual instances that fulfill various desiderata. The ability of such counterfactuals to handle dynamics like data and model drift remains a largely unexplored research challenge at this point. There has also been surprisingly little work on the related question of how the actual implementation of recourse by one individual may affect other individuals. Through this work we aim to close that gap by systematizing and extending existing knowledge. We first show that many of the existing methodologies can be collectively described by a generalized framework. We then argue that the existing framework fails to account for a hidden external cost of recourse, that only reveals itself when studying the endogenous dynamics of recourse at the group level. Through simulation experiments involving various state-of-the-art counterfactual generators and several benchmark datasets, we generate large numbers of counterfactuals and study the resulting domain and model shifts. We find that the induced shifts are substantial enough to likely impede the applicability of Algorithmic Recourse in situations that involve competition for scarce resources. Fortunately, we find various potential mitigation strategies that can be used in combination with existing approaches. Our simulation framework for studying recourse dynamics is fast and open-sourced.
+# AlgorithmicRecourseDynamics
 
+{{< include docs/src/_intro.qmd >}}