</p >
<p >
- CausalELM enables estimation of causal effects in settings where a randomized control trial
- or traditional statistical models would be infeasible or unacceptable. It enables estimation
- of the average treatment effect (ATE)/intent-to-treat effect (ITT) with interrupted time
- series analysis, G-computation, and double machine learning; average treatment effect on the
- treated (ATT) with G-computation; cumulative treatment effect with interrupted time series
- analysis; and the conditional average treatment effect (CATE) via S-learning, T-learning,
- X-learning, R-learning, and doubly robust estimation. Underlying all of these estimators are
- ensembles of extreme learning machines, a simple neural network that uses randomized weights
- and least squares optimization instead of gradient descent. Once a model has been estimated,
- CausalELM can summarize the model and conduct sensitivity analysis to validate the
- plausibility of modeling assumptions. Furthermore, all of this can be done in four lines of
- code.
+ CausalELM provides easy-to-use implementations of modern causal inference methods. While
+ CausalELM implements a variety of estimators, they all have one thing in common: the use of
+ machine learning models to flexibly estimate causal effects. This is where the ELM in
+ CausalELM comes from: the machine learning model underlying all of the estimators is an
+ extreme learning machine (ELM). ELMs are simple neural networks that use randomized weights
+ and least squares optimization instead of gradient descent, offering a good tradeoff between
+ learning non-linear dependencies and simplicity. Furthermore, CausalELM implements bagged
+ ensembles of ELMs to reduce the variance that results from the randomized weights.
</p >
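+
+ <p >
+ To make this concrete, below is a minimal sketch of a single ELM and a bagged ensemble. It
+ is an illustration of the technique, not CausalELM's internal implementation; the function
+ names and the sigmoid activation are assumptions made for the example.
+ </p >
+
+ <pre >
+ using Statistics
+
+ # Illustrative sketch only, not CausalELM's internals: the hidden weights are
+ # randomized and never trained; only the output weights are fit, by least squares.
+ sigmoid(z) = 1 / (1 + exp(-z))
+
+ function fit_elm(X, y; hidden=32)
+     W = randn(size(X, 2), hidden)   # randomized hidden weights, left untrained
+     H = sigmoid.(X * W)             # hidden-layer activations
+     return W, H \ y                 # backslash = least squares solve for output weights
+ end
+
+ predict_elm((W, beta), X) = sigmoid.(X * W) * beta
+
+ # Bagging: fit each ELM on a bootstrap resample and average the predictions,
+ # reducing the variance introduced by the randomized hidden weights.
+ function bagged_elms(X, y; n_models=10, hidden=32)
+     n = size(X, 1)
+     samples = (rand(1:n, n) for _ in 1:n_models)    # bootstrap indices
+     return [fit_elm(X[idx, :], y[idx]; hidden) for idx in samples]
+ end
+
+ predict_bagged(models, X) = mean(predict_elm(m, X) for m in models)
+ </pre >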
- <h2 >Extreme Learning Machines and Causal Inference </h2 >
+ <h2 >Estimators </h2 >
<p >
- In some cases we would like to know the causal effect of some intervention but we do not
- have the counterfactual, making conventional methods of statistical analysis infeasible.
- However, it may still be possible to get an unbiased estimate of the causal effect (ATE,
- ATT, or ITT) by predicting the counterfactual and comparing it to the observed outcomes.
- This is the approach CausalELM takes to conduct interrupted time series analysis,
- G-computation, double machine learning, and metalearning via S-learners, T-learners,
- X-learners, R-learners, and doubly robust estimation. In interrupted time series analysis,
- we want to estimate the effect of some intervention on the outcome of a single unit that we
- observe during multiple time periods. For example, we might want to know how the
- announcement of a merger affected the price of stock A. To do this, we need to know what the
- price of stock A would have been if the merger had not been announced, which we can predict
- with machine learning methods. Then, we can compare this predicted counterfactual to the
- observed price data to estimate the effect of the merger announcement. In another case, we
- might want to know the effect of medicine X on disease Y, but the administration of X was
- not random and it might also have been administered at multiple time periods, which would
- produce biased estimates. To overcome this, G-computation models the observed data, uses the
- model to predict the outcomes if all patients received the treatment, and compares it to the
- predictions of the outcomes if none of the patients received the treatment. Double machine
- learning (DML) takes a similar approach but also models the treatment mechanism and uses it
- to adjust the initial estimates, which is more efficient with high dimensional data than
- conventional methods. Metalearners take a similar approach to estimate the CATE. While all
- of these models are different, they have one thing in common: how well they perform depends
- on the underlying model they fit to the data. To that end, CausalELM uses bagged ensembles
- of extreme learning machines because they are simple yet flexible enough to be universal
- function approximators with lower variance than single extreme learning machines.
+ CausalELM implements estimators for aggregate quantities of interest, e.g. the average
+ treatment effect (ATE), and individualized quantities of interest, e.g. the conditional
+ average treatment effect (CATE), as listed below; a usage sketch follows the lists.
</p >
- <h2 >CausalELM Features</h2 >
+ <h3 >Estimators for Aggregate Effects</h3 >
+ <ul >
+ <li>Interrupted Time Series Estimator</li>
+ <li>G-computation</li>
+ <li>Double Machine Learning</li>
+ </ul >
+
+ <h3 >Individualized Treatment Effect (CATE) Estimators</h3 >
+ <ul >
+ <li>S-learner</li>
+ <li>T-learner</li>
+ <li>X-learner</li>
+ <li>R-learner</li>
+ <li>Doubly Robust Estimator</li>
+ </ul >
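+
+ <p >
+ Every estimator is intended to follow the same four-line workflow: construct a model,
+ estimate the effect, summarize it, and validate the assumptions. The sketch below assumes
+ the constructor name GComputation and the functions estimate_causal_effect!, summarize, and
+ validate; treat the exact names and signatures as assumptions for illustration rather than
+ a definitive API reference.
+ </p >
+
+ <pre >
+ using CausalELM
+
+ # Toy data: covariate matrix, binary treatment vector, and outcome vector.
+ X, T, Y = rand(1000, 5), rand(0:1, 1000), rand(1000)
+
+ m = GComputation(X, T, Y)    # any estimator above should follow the same pattern
+ estimate_causal_effect!(m)   # fit the bagged ELM ensembles and estimate the effect
+ summarize(m)                 # set the inference argument to true for randomization inference
+ validate(m)                  # sensitivity analysis for the modeling assumptions
+ </pre >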
+
+ <h2 >Features</h2 >
<ul >
<li >Estimate a causal effect, get a summary, and validate assumptions in just four lines of code</li >
<li >Bagging improves performance and reduces variance without the need to tune a regularization parameter</li >
@@ -87,25 +75,28 @@ single extreme learning machines.
<li >Most inference and validation tests do not assume functional or distributional forms</li >
<li >Implements the latest techniques from statistics, econometrics, and biostatistics</li >
- <li >Works out of the box with arrays or any data structure that implements the Tables.jl interface</li >
+ <li >Works out of the box with AbstractArrays or any data structure that implements the Tables.jl interface (see the sketch after this list)</li >
+ <li >Works with CuArrays, ROCArrays, and any other GPU-specific arrays that are AbstractArrays</li >
+ <li >CausalELM is lightweight: its only dependency is Tables.jl</li >
<li >Codebase is high-quality, well tested, and regularly updated</li >
</ul >
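+
+ <p >
+ Because inputs only need to be AbstractArrays or Tables.jl-compatible, the same estimators
+ should accept, for example, a DataFrame or a GPU array directly. The sketch below reuses the
+ assumed constructor and function names from the example above; DataFrames.jl stands in for
+ any Tables.jl source.
+ </p >
+
+ <pre >
+ using CausalELM, DataFrames
+
+ # Covariates as a Tables.jl-compatible table instead of a raw matrix.
+ covariates = DataFrame(age=rand(18:90, 500), income=randn(500))
+ t, y = rand(0:1, 500), randn(500)
+
+ m = DoubleMachineLearning(covariates, t, y)   # assumed constructor, as above
+ estimate_causal_effect!(m)
+
+ # With CUDA.jl installed, CuArrays are AbstractArrays, so per the feature list
+ # GPU data should work the same way (untested assumption):
+ # using CUDA
+ # m_gpu = DoubleMachineLearning(CuArray(randn(500, 2)), CuArray(t), CuArray(y))
+ </pre >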
<h2 >What's New?</h2 >
<ul >
- <li >Now includes doubly robust estimator for CATE estimation</li >
- <li >All estimators now implement bagging to improve predictive performance and reduce variance</li >
- <li >Counterfactual consistency validation simulates more realistic violations of the counterfactual consistency assumption</li >
+ <li >See the JuliaCon 2024 CausalELM demonstration <a href="https://www.youtube.com/watch?v=hh_cyj8feu8&t=26s">here</a>.</li >
+ <li >Includes support for GPU-specific arrays and data structures that implement the Tables.jl API</li >
+ <li >Only performs randomization inference when the inference argument is set to true in summarize methods</li >
+ <li >Summaries support calculating marginal effects and confidence intervals</li >
+ <li >Randomization inference now uses multithreading</li >
+ <li >Refactored code to be easier to extend and understand</li >
<li >Uses a simple heuristic to choose the number of neurons, which reduces training time and still works well in practice</li >
<li >Probability clipping for classifier predictions and residuals is no longer necessary due to the bagging procedure</li >
- <li >CausalELM talk has been accepted to JuliaCon 2024!</li >
</ul >
<h2 >What's Next?</h2 >
<p >
- Newer versions of CausalELM will hopefully support using GPUs and provide interpretations of
- the results of calling validate on a model that has been estimated. In addition, some
- estimators will also support using instrumental variables. However, these priorities could
- also change depending on feedback received at JuliaCon.
+ Efforts for the next version of CausalELM will focus on providing interpretations of the
+ results of calling validate, as well as fixing any bugs and eliciting feedback.
</p >
<h2 >Disclaimer</h2 >