diff --git a/404.html b/404.html
index d06d117..eea4a84 100644
--- a/404.html
+++ b/404.html
@@ -39,6 +39,12 @@
+
+
+
+
+
+
@@ -272,7 +278,7 @@
Amazon's AZCausal library provides the
functionality to fit synthetic control and difference-in-differences models to your
data. Integrating the synthetic data generating process of causal_validation
with
AZCausal is trivial, as we show in this notebook. To start, we'll simulate a toy
dataset.
from azcausal.estimators.panel.sdid import SDID
import scipy.stats as st
@@ -469,6 +515,14 @@ AZCausal Integration
)
from causal_validation.transforms.parameter import UnitVaryingParameter
+
+
+cfg = Config(
n_control_units=10,
n_pre_intervention_timepoints=60,
@@ -480,18 +534,65 @@ AZCausal Integration
data = linear_trend(simulate(cfg))
plot(data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+will inflate the treated group's observations in the post-intervention window.
+TRUE_EFFECT = 0.05
effect = StaticEffect(effect=TRUE_EFFECT)
inflated_data = effect(data)
plot(inflated_data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
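For intuition, and reading the static effect as a multiplicative lift (an assumption on our part, though it is consistent with the percentage summary printed further below, where Observed is 105.00 against a Counter Factual of 100.00): with effect=0.05, a treated-unit observation of 20.0 in the post-intervention window is inflated to roughly 20.0 × 1.05 = 21.0, while the pre-intervention window and all control units are left unchanged.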
We now have some very toy data on which we may apply a model. For this demonstration we shall use the Synthetic Difference-in-Differences model implemented in AZCausal;
@@ -500,13 +601,28 @@
.to_azcausal()
method implemented here, this is
straightforward to achieve. Once we have an AZCausal-compatible dataset, the modelling
is very simple by virtue of the clean design of AZCausal.
+panel = inflated_data.to_azcausal()
model = SDID()
result = model.fit(panel)
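# Delta below compares the true 5% lift with the model's estimated percentage effect, rescaled to a fraction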
print(f"Delta: {TRUE_EFFECT - result.effect.percentage().value / 100}")
print(result.summary(title="Synthetic Data Experiment"))
-Delta: -2.3592239273284576e-16
+
+
+
effect. However, given the simplicity of the data, this is not surprising. With the functionality within this package, though, we can easily construct more complex datasets in an effort to fully stress-test any new model and identify its limitations.
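As a minimal sketch of such a stress test — reusing only the objects defined earlier in this notebook (effect, linear_trend, TRUE_EFFECT) and the calls shown above, with the particular seeds being an arbitrary choice — one could refit the same model across several freshly simulated datasets and inspect the spread of the recovered deltas:
# Illustrative stress test: refit SDID on several simulated datasets and collect the deltas
deltas = []
for seed in [1, 2, 3, 4, 5]:
    stress_cfg = Config(
        n_control_units=10,
        n_pre_intervention_timepoints=60,
        n_post_intervention_timepoints=30,
        seed=seed,
    )
    stress_data = effect(linear_trend(simulate(stress_cfg)))
    stress_result = SDID().fit(stress_data.to_azcausal())
    deltas.append(TRUE_EFFECT - stress_result.effect.percentage().value / 100)
print(deltas)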
@@ -545,6 +670,13 @@
cfg = Config(
n_control_units=10,
n_pre_intervention_timepoints=60,
@@ -565,18 +697,53 @@ Fitting a model
data = effect(periodic(linear_trend(simulate(cfg))))
plot(data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+time we see that the delta between the estimated and true effect is much larger than before.
+panel = data.to_azcausal()
model = SDID()
result = model.fit(panel)
print(f"Delta: {100*(TRUE_EFFECT - result.effect.percentage().value / 100): .2f}%")
print(result.summary(title="Synthetic Data Experiment"))
-Delta: 1.71%
+
+
+
In this notebook we'll demonstrate how causal-validation
can be used to simulate
synthetic datasets. We'll start with very simple data to which a static treatment
effect may be applied. From there, we'll build up to complex datasets. Along the way,
we'll show how reproducibility can be ensured, plots can be generated, and unit-level
parameters may be specified.
from itertools import product
import matplotlib.pyplot as plt
@@ -597,9 +643,29 @@ Data Synthesis
)
from causal_validation.transforms.parameter import UnitVaryingParameter
+
+
+then invoking the simulate
function. Once simulated, we may visualise the data
through the plot
function.
cfg = Config(
n_control_units=10,
n_pre_intervention_timepoints=60,
@@ -610,14 +676,41 @@ Simulating a Dataset
data = simulate(cfg)
plot(data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+We observe that we have 10 control units, each of which was sampled from a Gaussian distribution with mean 20 and scale 0.2. Had we wished for our underlying observations to have more or less noise, or to have a different global mean, then we can simply specify that through the config file.
+means = [10, 50]
scales = [0.1, 0.5]
@@ -633,12 +726,34 @@ Controlling baseline behaviour
data = simulate(cfg)
plot(data, ax=ax, title=f"Mean: {m}, Scale: {s}")
-
+
+
+In the above four panels, we can see that whilst the mean and scale of the underlying data generating process are varying, the functional form of the data is the same. This is by design to ensure that data sampling is reproducible. To sample a new dataset, you may either change the underlying seed in the config file.
+cfg = Config(
n_control_units=10,
n_pre_intervention_timepoints=60,
@@ -646,14 +761,50 @@ Reproducibility
seed=42,
)
+
+
+Reusing the same config file across simulations
+fig, axes = plt.subplots(ncols=2, figsize=(10, 3))
for ax in axes:
data = simulate(cfg)
plot(data, ax=ax)
-
+
+
+Or manually specifying and passing your own pseudorandom number generator key
+
rng = np.random.RandomState(42)
@@ -662,67 +813,232 @@ Reproducibility
data = simulate(cfg, key=rng)
plot(data, ax=ax)
-
+
+
+In the data we have seen up until now, the treated unit has been drawn from the same
data generating process as the control units. However, it can be helpful to also
inflate the treated unit to observe how well our model can recover the true
treatment effect. To do this, we simply compose our dataset with an Effect
object.
In the below, we shall inflate our data by 2%.
effect = StaticEffect(effect=0.02)
inflated_data = effect(data)
fig, (ax0, ax1) = plt.subplots(ncols=2, figsize=(10, 3))
plot(data, ax=ax0, title="Original data")
plot(inflated_data, ax=ax1, title="Inflated data")
-<Axes: title={'center': 'Inflated data'}, xlabel='Time', ylabel='Observed'>
-
-
+
+
+The example presented above shows a very simple stationary data generation process. However, we may make our example more complex by adding a non-stationary trend to the data.
+trend_term = Trend(degree=1, coefficient=0.1)
data_with_trend = effect(trend_term(data))
plot(data_with_trend)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+trend_term = Trend(degree=2, coefficient=0.0025)
data_with_trend = effect(trend_term(data))
plot(data_with_trend)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+We may also include periodic components in our data.
+periodicity = Periodic(amplitude=2, frequency=6)
perioidic_data = effect(periodicity(trend_term(data)))
plot(perioidic_data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+sampling_dist = norm(0.0, 1.0)
intercept = UnitVaryingParameter(sampling_dist=sampling_dist)
trend_term = Trend(degree=1, intercept=intercept, coefficient=0.1)
data_with_trend = effect(trend_term(data))
plot(data_with_trend)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+sampling_dist = poisson(2)
frequency = UnitVaryingParameter(sampling_dist=sampling_dist)
p = Periodic(frequency=frequency)
plot(p(data))
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+In this notebook we have shown how one can define their model's true underlying data generating process, starting from simple white-noise samples through to more complex
@@ -731,6 +1047,9 @@
A placebo test is an approach to assess the validity of a causal model by checking if the effect can truly be attributed to the treatment, or to other spurious factors. A
@@ -518,6 +557,13 @@
causal-validation
.
+from azcausal.core.error import JackKnife
from azcausal.estimators.panel.did import DID
from azcausal.estimators.panel.sdid import SDID
@@ -531,13 +577,37 @@ Placebo Testing
from causal_validation.plotters import plot
from causal_validation.validation.placebo import PlaceboTest
-/home/runner/.local/share/hatch/env/virtual/causal-validation/CYBYs5D-/docs/lib/python3.10/site-packages/pandera/engines/pandas_engine.py:67: UserWarning: Using typeguard < 3. Generic types like List[TYPE], Dict[TYPE, TYPE] will only validate the first element in the collection.
+
+
+
To demonstrate a placebo test, we must first simulate some data. For the purposes of illustration, we'll simulate a very simple dataset containing 10 control units where each unit has 60 pre-intervention observations, and 30 post-intervention observations.
+cfg = Config(
n_control_units=10,
n_pre_intervention_timepoints=60,
@@ -550,16 +620,50 @@ Data simulation
data = effect(simulate(cfg))
plot(data)
-<Axes: xlabel='Time', ylabel='Observed'>
-
-
+
+
+We'll now define our model. To do this, we'll use the synthetic
difference-in-differences implementation of AZCausal. This implementation, along with
any other model from AZCausal, can be neatly wrapped up in our AZCausalWrapper
to
make fitting and effect estimation simpler.
model = AZCausalWrapper(model=SDID(), error_estimator=JackKnife())
+
+
+Now that we have a dataset and model defined, we may conduct our placebo test. With 10 control units, the test will estimate 10 individual effects; 1 per control unit when
@@ -571,32 +675,91 @@
result = PlaceboTest(model, data).execute()
result.summary()
-Output()
-
-
+
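For intuition, the statistics in the summary above (mean effect, standard deviation, standard error, and p-value for the null hypothesis of zero effect) can be reproduced from raw per-unit placebo estimates roughly as follows. This is an illustrative sketch of the aggregation described above rather than the library's internal implementation, and the placebo_estimates values are made up:
import numpy as np
from scipy.stats import ttest_1samp

# Hypothetical per-unit placebo effects, one per control unit mocked as the treated group
placebo_estimates = np.array([0.21, -0.35, 0.40, 0.05, -0.12, 0.30, -0.28, 0.44, 0.11, 0.09])

mean_effect = placebo_estimates.mean()
std_dev = placebo_estimates.std(ddof=1)
std_err = std_dev / np.sqrt(len(placebo_estimates))
# Two-sided one-sample t-test of the null hypothesis that the mean placebo effect is zero
p_value = ttest_1samp(placebo_estimates, popmean=0.0).pvalue
print(mean_effect, std_dev, std_err, p_value)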
+We can also use the results of a placebo test to compare two or more models. Using
causal-validation
, this is as simple as supplying a series of models to the placebo
test and comparing their outputs. To demonstrate this, we will compare the previously
used synthetic difference-in-differences model with regular difference-in-differences.
did_model = AZCausalWrapper(model=DID())
PlaceboTest([model, did_model], data).execute().summary()
-Output()
-
-
+
Causal Validation is a library designed to validate and test your causal models. To achieve this, we provide functionality to simulate causal data, and validate your model through a placebo test.
"},{"location":"#data-synthesis","title":"Data Synthesis","text":"Data Synthesis in Causal Validation is a fully composable process whereby a set of functions are sequentially applied to a dataset. At some point in this process we also induce a treatment effect. Any of these functions can be parameterised to either have constant parameter values across all control units, or a value that varies across parameters. To see this, consider the below example where we simulate a dataset whose trend varies across each of the 10 control units.
from causal_validation import Config, simulate\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import Trend, Periodic\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\nfrom scipy.stats import norm\n\ncfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n)\n\n# Simulate the base observation\nbase_data = simulate(cfg)\n\n# Apply a linear trend with unit-varying intercept\nintercept = UnitVaryingParameter(sampling_dist = norm(0, 1))\ntrend_component = Trend(degree=1, coefficient=0.1, intercept=intercept)\ntrended_data = trend_component(base_data)\n\n# Simulate a 5% lift in the treated unit's post-intervention data\neffect = StaticEffect(0.05)\ninflated_data = effect(trended_data)\n
"},{"location":"#model-validation","title":"Model Validation","text":"Once a dataset has been synthesised, we may wish to validate our model using a placebo test. In Causal Validation this is straightforward and can be accomplished in combination with AZCausal by the following.
from azcausal.estimators.panel.sdid import SDID\nfrom causal_validation.validation.placebo import PlaceboTest\n\nmodel = AZCausalWrapper(model=SDID())\nresult = PlaceboTest(model, inflated_data).execute()\nresult.summary()\n
"},{"location":"_examples/azcausal/","title":"AZCausal Integration","text":"Amazon's AZCausal library provides the functionality to fit synthetic control and difference-in-difference models to your data. Integrating the synthetic data generating process of causal_validation
with AZCausal is trivial, as we show in this notebook. To start, we'll simulate a toy dataset.
from azcausal.estimators.panel.sdid import SDID\nimport scipy.stats as st\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import (\n Periodic,\n Trend,\n)\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\n
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\nlinear_trend = Trend(degree=1, coefficient=0.05)\ndata = linear_trend(simulate(cfg))\nplot(data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
will inflate the treated group's observations in the post-intervention window.
TRUE_EFFECT = 0.05\neffect = StaticEffect(effect=TRUE_EFFECT)\ninflated_data = effect(data)\nplot(inflated_data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/azcausal/#fitting-a-model","title":"Fitting a model","text":"We now have some very toy data on which we may apply a model. For this demonstration we shall use the Synthetic Difference-in-Differences model implemented in AZCausal; however, the approach shown here will work for any model implemented in AZCausal. To achieve this, we must first coerce the data into a format that is digestible for AZCausal. Through the .to_azcausal()
method implemented here, this is straightforward to achieve. Once we have an AZCausal-compatible dataset, the modelling is very simple by virtue of the clean design of AZCausal.
panel = inflated_data.to_azcausal()\nmodel = SDID()\nresult = model.fit(panel)\nprint(f\"Delta: {TRUE_EFFECT - result.effect.percentage().value / 100}\")\nprint(result.summary(title=\"Synthetic Data Experiment\"))\n
Delta: -2.3592239273284576e-16\n\u256d\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256e\n| Synthetic Data Experiment |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Panel |\n| Time Periods: 90 (60/30) total (pre/post) |\n| Units: 11 (10/1) total (contr/treat) |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| ATT |\n| Effect: 1.1858 |\n| Observed: 24.90 |\n| Counter Factual: 23.72 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Percentage |\n| Effect: 5.0000 |\n| Observed: 105.00 |\n| Counter Factual: 100.00 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Cumulative |\n| Effect: 35.57 |\n| Observed: 747.03 |\n| Counter Factual: 711.46 |\n\u2570\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256f\n
effect. However, given the simplicity of the data, this is not surprising. With the functionality within this package though we can easily construct more complex datasets in effort to fully stress-test any new model and identify its limitations.
To achieve this, we'll simulate 10 control units, 60 pre-intervention time points, and 30 post-intervention time points according to the following process: $$ \\begin{align} \\mu_{n, t} & \\sim\\mathcal{N}(20, 0.5^2)\\ \\alpha_{n} & \\sim \\mathcal{N}(0, 1^2)\\ \\beta_{n} & \\sim \\mathcal{N}(0.05, 0.01^2)\\ \\nu_n & \\sim \\mathcal{N}(1, 1^2)\\ \\gamma_n & \\sim \\operatorname{Student-t}{10}(1, 1^2)\\ \\mathbf{Y}{n, t} & = \\mu_{n, t} + \\alpha_{n} + \\beta_{n}t + \\nu_n\\sin\\left(3\\times 2\\pi t + \\gamma\\right) + \\delta_{t, n} \\end{align} $$ where the true treatment effect $\\delta_{t, n}$ is 5% when $n=1$ and $t\\geq 60$ and 0 otherwise. Meanwhile, $\\mathbf{Y}$ is the matrix of observations, long in the number of time points and wide in the number of units.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n global_mean=20,\n global_scale=1,\n seed=123,\n)\n\nintercept = UnitVaryingParameter(sampling_dist=st.norm(loc=0.0, scale=1))\ncoefficient = UnitVaryingParameter(sampling_dist=st.norm(loc=0.05, scale=0.01))\nlinear_trend = Trend(degree=1, coefficient=coefficient, intercept=intercept)\n\namplitude = UnitVaryingParameter(sampling_dist=st.norm(loc=1.0, scale=2))\nshift = UnitVaryingParameter(sampling_dist=st.t(df=10))\nperiodic = Periodic(amplitude=amplitude, shift=shift, frequency=3)\n\ndata = effect(periodic(linear_trend(simulate(cfg))))\nplot(data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
time we see that the delta between the estimated and true effect is much larger than before.
panel = data.to_azcausal()\nmodel = SDID()\nresult = model.fit(panel)\nprint(f\"Delta: {100*(TRUE_EFFECT - result.effect.percentage().value / 100): .2f}%\")\nprint(result.summary(title=\"Synthetic Data Experiment\"))\n
Delta: 1.71%\n\u256d\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256e\n| Synthetic Data Experiment |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Panel |\n| Time Periods: 90 (60/30) total (pre/post) |\n| Units: 11 (10/1) total (contr/treat) |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| ATT |\n| Effect: 0.728265 |\n| Observed: 22.88 |\n| Counter Factual: 22.15 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Percentage |\n| Effect: 3.2874 |\n| Observed: 103.29 |\n| Counter Factual: 100.00 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Cumulative |\n| Effect: 21.85 |\n| Observed: 686.44 |\n| Counter Factual: 664.59 |\n\u2570\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256f\n
"},{"location":"_examples/basic/","title":"Data Synthesis","text":"In this notebook we'll demonstrate how causal-validation
can be used to simulate synthetic datasets. We'll start with very simple data to which a static treatment effect may be applied. From there, we'll build up to complex datasets. Along the way, we'll show how reproducibility can be ensured, plots can be generated, and unit-level parameters may be specified.
from itertools import product\n\nimport matplotlib.pyplot as plt\nimport numpy as np\nfrom scipy.stats import (\n norm,\n poisson,\n)\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import (\n Periodic,\n Trend,\n)\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\n
"},{"location":"_examples/basic/#simulating-a-dataset","title":"Simulating a Dataset","text":"then invoking the simulate
function. Once simulated, we may visualise the data through the plot
function.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\ndata = simulate(cfg)\nplot(data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/basic/#controlling-baseline-behaviour","title":"Controlling baseline behaviour","text":"We observe that we have 10 control units, each of which were sampled from a Gaussian distribution with mean 20 and scale 0.2. Had we wished for our underlying observations to have more or less noise, or to have a different global mean, then we can simply specify that through the config file.
means = [10, 50]\nscales = [0.1, 0.5]\n\nfig, axes = plt.subplots(ncols=2, nrows=2, figsize=(10, 6), tight_layout=True)\nfor (m, s), ax in zip(product(means, scales), axes.ravel(), strict=False):\n cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n global_mean=m,\n global_scale=s,\n )\n data = simulate(cfg)\n plot(data, ax=ax, title=f\"Mean: {m}, Scale: {s}\")\n
"},{"location":"_examples/basic/#reproducibility","title":"Reproducibility","text":"In the above four panels, we can see that whilst the mean and scale of the underlying data generating process is varying, the functional form of the data is the same. This is by design to ensure that data sampling is reproducible. To sample a new dataset, you may either change the underlying seed in the config file.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=42,\n)\n
Reusing the same config file across simulations
fig, axes = plt.subplots(ncols=2, figsize=(10, 3))\nfor ax in axes:\n data = simulate(cfg)\n plot(data, ax=ax)\n
Or manually specifying and passing your own pseudorandom number generator key
\nrng = np.random.RandomState(42)\n\nfig, axes = plt.subplots(ncols=2, figsize=(10, 3))\nfor ax in axes:\n data = simulate(cfg, key=rng)\n plot(data, ax=ax)\n
"},{"location":"_examples/basic/#simulating-an-effect","title":"Simulating an effect","text":"In the data we have seen up until now, the treated unit has been drawn from the same data generating process as the control units. However, it can be helpful to also inflate the treated unit to observe how well our model can recover the the true treatment effect. To do this, we simply compose our dataset with an Effect
object. In the below, we shall inflate our data by 2%.
effect = StaticEffect(effect=0.02)\ninflated_data = effect(data)\nfig, (ax0, ax1) = plt.subplots(ncols=2, figsize=(10, 3))\nplot(data, ax=ax0, title=\"Original data\")\nplot(inflated_data, ax=ax1, title=\"Inflated data\")\n
<Axes: title={'center': 'Inflated data'}, xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/basic/#more-complex-generation-processes","title":"More complex generation processes","text":"The example presented above shows a very simple stationary data generation process. However, we may make our example more complex by including a non-stationary trend to the data.
trend_term = Trend(degree=1, coefficient=0.1)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
trend_term = Trend(degree=2, coefficient=0.0025)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
We may also include periodic components in our data
periodicity = Periodic(amplitude=2, frequency=6)\nperioidic_data = effect(periodicity(trend_term(data)))\nplot(perioidic_data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/basic/#unit-level-parameterisation","title":"Unit-level parameterisation","text":"sampling_dist = norm(0.0, 1.0)\nintercept = UnitVaryingParameter(sampling_dist=sampling_dist)\ntrend_term = Trend(degree=1, intercept=intercept, coefficient=0.1)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
sampling_dist = poisson(2)\nfrequency = UnitVaryingParameter(sampling_dist=sampling_dist)\n\np = Periodic(frequency=frequency)\nplot(p(data))\n
<Axes: xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/basic/#conclusions","title":"Conclusions","text":"In this notebook we have shown how one can define their model's true underlying data generating process, starting from simple white-noise samples through to more complex example with periodic and temporal components, perhaps containing unit-level variation. In a follow-up notebook, we show how these datasets may be integrated with Amazon's own AZCausal library to compare the effect estimated by a model with the true effect of the underlying data generating process. A link to this notebook is here.
"},{"location":"_examples/placebo_test/","title":"Placebo Testing","text":"A placebo test is an approach to assess the validity of a causal model by checking if the effect can truly be attributed to the treatment, or to other spurious factors. A placebo test is conducted by iterating through the set of control units and at each iteration, replacing the treated unit by one of the control units and measuring the effect. If the model detects a significant effect, then it suggests potential bias or omitted variables in the analysis, indicating that the causal inference is flawed.
A successful placebo test will show no statistically significant results and we may then conclude that the estimated effect can be attributed to the treatment and not driven by confounding factors. Conversely, a failed placebo test, which shows significant results, suggests that the identified treatment effect may not be reliable. Placebo testing is thus a critical step to ensure the robustness of findings in RCTs. In this notebook, we demonstrate how a placebo test can be conducted in causal-validation
.
from azcausal.core.error import JackKnife\nfrom azcausal.estimators.panel.did import DID\nfrom azcausal.estimators.panel.sdid import SDID\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.models import AZCausalWrapper\nfrom causal_validation.plotters import plot\nfrom causal_validation.validation.placebo import PlaceboTest\n
/home/runner/.local/share/hatch/env/virtual/causal-validation/CYBYs5D-/docs/lib/python3.10/site-packages/pandera/engines/pandas_engine.py:67: UserWarning: Using typeguard < 3. Generic types like List[TYPE], Dict[TYPE, TYPE] will only validate the first element in the collection.\n warnings.warn(\n
"},{"location":"_examples/placebo_test/#data-simulation","title":"Data simulation","text":"To demonstrate a placebo test, we must first simulate some data. For the purposes of illustration, we'll simulate a very simple dataset containing 10 control units where each unit has 60 pre-intervention observations, and 30 post-intervention observations.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\nTRUE_EFFECT = 0.05\neffect = StaticEffect(effect=TRUE_EFFECT)\ndata = effect(simulate(cfg))\nplot(data)\n
<Axes: xlabel='Time', ylabel='Observed'>\n
"},{"location":"_examples/placebo_test/#model","title":"Model","text":"We'll now define our model. To do this, we'll use the synthetic difference-in-differences implementation of AZCausal. This implementation, along with any other model from AZCausal, can be neatly wrapped up in our AZCausalWrapper
to make fitting and effect estimation simpler.
model = AZCausalWrapper(model=SDID(), error_estimator=JackKnife())\n
"},{"location":"_examples/placebo_test/#placebo-test-results","title":"Placebo Test Results","text":"Now that we have a dataset and model defined, we may conduct our placebo test. With 10 control units, the test will estimate 10 individual effects; 1 per control unit when it is mocked as the treated group. With those 10 effects, the routine will then produce the mean estimated effect, along with the standard deviation across the estimated effect, the effect's standard error, and the p-value that corresponds to the null-hypothesis test that the effect is 0.
In the below, we see that expected estimated effect is small at just 0.08. Accordingly, the p-value attains a value of 0.5, indicating that we have insufficient evidence to reject the null hypothesis and we, therefore, have no evidence to suggest that there is bias within this particular setup.
result = PlaceboTest(model, data).execute()\nresult.summary()\n
Output()\n
\n| Model | Effect | Standard Deviation | Standard Error | p-value |\n|-------|--------|--------------------|----------------|---------|\n| SDID | 0.0851 | 0.4079 | 0.129 | 0.5472 |\n\n"},{"location":"_examples/placebo_test/#model-comparison","title":"Model Comparison","text":"
We can also use the results of a placebo test to compare two or more models. Using causal-validation
, this is as simple as supplying a series of models to the placebo test and comparing their outputs. To demonstrate this, we will compare the previously used synthetic difference-in-differences model with regular difference-in-differences.
did_model = AZCausalWrapper(model=DID())\nPlaceboTest([model, did_model], data).execute().summary()\n
Output()\n
\n| Model | Effect | Standard Deviation | Standard Error | p-value |\n|-------|--------|--------------------|----------------|---------|\n| SDID | 0.0851 | 0.4079 | 0.129 | 0.5472 |\n| DID | 0.0002 | 0.2818 | 0.0891 | 0.9982 |\n\n"}]}
\ No newline at end of file
+{"config":{"lang":["en"],"separator":"[\\s\\-]+","pipeline":["stopWordFilter"]},"docs":[{"location":"","title":"Welcome to Causal Validation","text":"
Causal Validation is a library designed to validate and test your causal models. To achieve this, we provide functionality to simulate causal data, and validate your model through a placebo test.
"},{"location":"#data-synthesis","title":"Data Synthesis","text":"Data Synthesis in Causal Validation is a fully composable process whereby a set of functions are sequentially applied to a dataset. At some point in this process we also induce a treatment effect. Any of these functions can be parameterised to either have constant parameter values across all control units, or a value that varies across parameters. To see this, consider the below example where we simulate a dataset whose trend varies across each of the 10 control units.
from causal_validation import Config, simulate\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import Trend, Periodic\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\nfrom scipy.stats import norm\n\ncfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n)\n\n# Simulate the base observation\nbase_data = simulate(cfg)\n\n# Apply a linear trend with unit-varying intercept\nintercept = UnitVaryingParameter(sampling_dist = norm(0, 1))\ntrend_component = Trend(degree=1, coefficient=0.1, intercept=intercept)\ntrended_data = trend_component(base_data)\n\n# Simulate a 5% lift in the treated unit's post-intervention data\neffect = StaticEffect(0.05)\ninflated_data = effect(trended_data)\n
"},{"location":"#model-validation","title":"Model Validation","text":"Once a dataset has been synthesised, we may wish to validate our model using a placebo test. In Causal Validation this is straightforward and can be accomplished in combination with AZCausal by the following.
from azcausal.estimators.panel.sdid import SDID\nfrom causal_validation.validation.placebo import PlaceboTest\n\nmodel = AZCausalWrapper(model=SDID())\nresult = PlaceboTest(model, inflated_data).execute()\nresult.summary()\n
"},{"location":"examples/azcausal/","title":"AZCausal Integration","text":"from azcausal.estimators.panel.sdid import SDID\nimport scipy.stats as st\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import (\n Periodic,\n Trend,\n)\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\n
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\nlinear_trend = Trend(degree=1, coefficient=0.05)\ndata = linear_trend(simulate(cfg))\nplot(data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
will inflate the treated group's observations in the post-intervention window.
TRUE_EFFECT = 0.05\neffect = StaticEffect(effect=TRUE_EFFECT)\ninflated_data = effect(data)\nplot(inflated_data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
panel = inflated_data.to_azcausal()\nmodel = SDID()\nresult = model.fit(panel)\nprint(f\"Delta: {TRUE_EFFECT - result.effect.percentage().value / 100}\")\nprint(result.summary(title=\"Synthetic Data Experiment\"))\n
\nDelta: -2.3592239273284576e-16\n\u256d\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256e\n| Synthetic Data Experiment |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Panel |\n| Time Periods: 90 (60/30) total (pre/post) |\n| Units: 11 (10/1) total (contr/treat) |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| ATT |\n| Effect: 1.1858 |\n| Observed: 24.90 |\n| Counter Factual: 23.72 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Percentage |\n| Effect: 5.0000 |\n| Observed: 105.00 |\n| Counter Factual: 100.00 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Cumulative |\n| Effect: 35.57 |\n| Observed: 747.03 |\n| Counter Factual: 711.46 |\n\u2570\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256f\n
\n
effect. However, given the simplicity of the data, this is not surprising. With the functionality within this package though we can easily construct more complex datasets in effort to fully stress-test any new model and identify its limitations.
To achieve this, we'll simulate 10 control units, 60 pre-intervention time points, and 30 post-intervention time points according to the following process: $$ \\begin{align} \\mu_{n, t} & \\sim\\mathcal{N}(20, 0.5^2)\\ \\alpha_{n} & \\sim \\mathcal{N}(0, 1^2)\\ \\beta_{n} & \\sim \\mathcal{N}(0.05, 0.01^2)\\ \\nu_n & \\sim \\mathcal{N}(1, 1^2)\\ \\gamma_n & \\sim \\operatorname{Student-t}{10}(1, 1^2)\\ \\mathbf{Y}{n, t} & = \\mu_{n, t} + \\alpha_{n} + \\beta_{n}t + \\nu_n\\sin\\left(3\\times 2\\pi t + \\gamma\\right) + \\delta_{t, n} \\end{align} $$ where the true treatment effect $\\delta_{t, n}$ is 5% when $n=1$ and $t\\geq 60$ and 0 otherwise. Meanwhile, $\\mathbf{Y}$ is the matrix of observations, long in the number of time points and wide in the number of units.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n global_mean=20,\n global_scale=1,\n seed=123,\n)\n\nintercept = UnitVaryingParameter(sampling_dist=st.norm(loc=0.0, scale=1))\ncoefficient = UnitVaryingParameter(sampling_dist=st.norm(loc=0.05, scale=0.01))\nlinear_trend = Trend(degree=1, coefficient=coefficient, intercept=intercept)\n\namplitude = UnitVaryingParameter(sampling_dist=st.norm(loc=1.0, scale=2))\nshift = UnitVaryingParameter(sampling_dist=st.t(df=10))\nperiodic = Periodic(amplitude=amplitude, shift=shift, frequency=3)\n\ndata = effect(periodic(linear_trend(simulate(cfg))))\nplot(data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
time we see that the delta between the estimated and true effect is much larger than before.
panel = data.to_azcausal()\nmodel = SDID()\nresult = model.fit(panel)\nprint(f\"Delta: {100*(TRUE_EFFECT - result.effect.percentage().value / 100): .2f}%\")\nprint(result.summary(title=\"Synthetic Data Experiment\"))\n
\nDelta: 1.71%\n\u256d\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256e\n| Synthetic Data Experiment |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Panel |\n| Time Periods: 90 (60/30) total (pre/post) |\n| Units: 11 (10/1) total (contr/treat) |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| ATT |\n| Effect: 0.728265 |\n| Observed: 22.88 |\n| Counter Factual: 22.15 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Percentage |\n| Effect: 3.2874 |\n| Observed: 103.29 |\n| Counter Factual: 100.00 |\n\u251c\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2524\n| Cumulative |\n| Effect: 21.85 |\n| Observed: 686.44 |\n| Counter Factual: 664.59 |\n\u2570\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u2500\u256f\n
\n
"},{"location":"examples/azcausal/#azcausal-integration","title":"AZCausal Integration","text":"Amazon's AZCausal library provides the functionality to fit synthetic control and difference-in-difference models to your data. Integrating the synthetic data generating process of causal_validation
with AZCausal is trivial, as we show in this notebook. To start, we'll simulate a toy dataset.
We now have some very toy data on which we may apply a model. For this demonstration we shall use the Synthetic Difference-in-Differences model implemented in AZCausal; however, the approach shown here will work for any model implemented in AZCausal. To achieve this, we must first coerce the data into a format that is digestible for AZCausal. Through the .to_azcausal()
method implemented here, this is straightforward to achieve. Once we have an AZCausal-compatible dataset, the modelling is very simple by virtue of the clean design of AZCausal.
from itertools import product\n\nimport matplotlib.pyplot as plt\nimport numpy as np\nfrom scipy.stats import (\n norm,\n poisson,\n)\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.plotters import plot\nfrom causal_validation.transforms import (\n Periodic,\n Trend,\n)\nfrom causal_validation.transforms.parameter import UnitVaryingParameter\n
then invoking the simulate
function. Once simulated, we may visualise the data through the plot
function.
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\ndata = simulate(cfg)\nplot(data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
means = [10, 50]\nscales = [0.1, 0.5]\n\nfig, axes = plt.subplots(ncols=2, nrows=2, figsize=(10, 6), tight_layout=True)\nfor (m, s), ax in zip(product(means, scales), axes.ravel(), strict=False):\n cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n global_mean=m,\n global_scale=s,\n )\n data = simulate(cfg)\n plot(data, ax=ax, title=f\"Mean: {m}, Scale: {s}\")\n
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=42,\n)\n
Reusing the same config file across simulations
fig, axes = plt.subplots(ncols=2, figsize=(10, 3))\nfor ax in axes:\n data = simulate(cfg)\n plot(data, ax=ax)\n
Or manually specifying and passing your own pseudorandom number generator key
\nrng = np.random.RandomState(42)\n\nfig, axes = plt.subplots(ncols=2, figsize=(10, 3))\nfor ax in axes:\n data = simulate(cfg, key=rng)\n plot(data, ax=ax)\n
effect = StaticEffect(effect=0.02)\ninflated_data = effect(data)\nfig, (ax0, ax1) = plt.subplots(ncols=2, figsize=(10, 3))\nplot(data, ax=ax0, title=\"Original data\")\nplot(inflated_data, ax=ax1, title=\"Inflated data\")\n
\n<Axes: title={'center': 'Inflated data'}, xlabel='Time', ylabel='Observed'>
\n
trend_term = Trend(degree=1, coefficient=0.1)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
trend_term = Trend(degree=2, coefficient=0.0025)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
We may also include periodic components in our data
periodicity = Periodic(amplitude=2, frequency=6)\nperioidic_data = effect(periodicity(trend_term(data)))\nplot(perioidic_data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
sampling_dist = norm(0.0, 1.0)\nintercept = UnitVaryingParameter(sampling_dist=sampling_dist)\ntrend_term = Trend(degree=1, intercept=intercept, coefficient=0.1)\ndata_with_trend = effect(trend_term(data))\nplot(data_with_trend)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
sampling_dist = poisson(2)\nfrequency = UnitVaryingParameter(sampling_dist=sampling_dist)\n\np = Periodic(frequency=frequency)\nplot(p(data))\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
"},{"location":"examples/basic/#data-synthesis","title":"Data Synthesis","text":"In this notebook we'll demonstrate how causal-validation
can be used to simulate synthetic datasets. We'll start with very simple data to which a static treatment effect may be applied. From there, we'll build up to complex datasets. Along the way, we'll show how reproducibility can be ensured, plots can be generated, and unit-level parameters may be specified.
We observe that we have 10 control units, each of which were sampled from a Gaussian distribution with mean 20 and scale 0.2. Had we wished for our underlying observations to have more or less noise, or to have a different global mean, then we can simply specify that through the config file.
"},{"location":"examples/basic/#reproducibility","title":"Reproducibility","text":"In the above four panels, we can see that whilst the mean and scale of the underlying data generating process is varying, the functional form of the data is the same. This is by design to ensure that data sampling is reproducible. To sample a new dataset, you may either change the underlying seed in the config file.
"},{"location":"examples/basic/#simulating-an-effect","title":"Simulating an effect","text":"In the data we have seen up until now, the treated unit has been drawn from the same data generating process as the control units. However, it can be helpful to also inflate the treated unit to observe how well our model can recover the the true treatment effect. To do this, we simply compose our dataset with an Effect
object. In the below, we shall inflate our data by 2%.
The example presented above shows a very simple stationary data generation process. However, we may make our example more complex by including a non-stationary trend to the data.
"},{"location":"examples/basic/#unit-level-parameterisation","title":"Unit-level parameterisation","text":""},{"location":"examples/basic/#conclusions","title":"Conclusions","text":"In this notebook we have shown how one can define their model's true underlying data generating process, starting from simple white-noise samples through to more complex example with periodic and temporal components, perhaps containing unit-level variation. In a follow-up notebook, we show how these datasets may be integrated with Amazon's own AZCausal library to compare the effect estimated by a model with the true effect of the underlying data generating process. A link to this notebook is here.
"},{"location":"examples/placebo_test/","title":"Placebo Testing","text":"from azcausal.core.error import JackKnife\nfrom azcausal.estimators.panel.did import DID\nfrom azcausal.estimators.panel.sdid import SDID\n\nfrom causal_validation import (\n Config,\n simulate,\n)\nfrom causal_validation.effects import StaticEffect\nfrom causal_validation.models import AZCausalWrapper\nfrom causal_validation.plotters import plot\nfrom causal_validation.validation.placebo import PlaceboTest\n
\n/home/runner/.local/share/hatch/env/virtual/causal-validation/CYBYs5D-/docs/lib/python3.10/site-packages/pandera/engines/pandas_engine.py:67: UserWarning: Using typeguard < 3. Generic types like List[TYPE], Dict[TYPE, TYPE] will only validate the first element in the collection.\n warnings.warn(\n
\n
cfg = Config(\n n_control_units=10,\n n_pre_intervention_timepoints=60,\n n_post_intervention_timepoints=30,\n seed=123,\n)\n\nTRUE_EFFECT = 0.05\neffect = StaticEffect(effect=TRUE_EFFECT)\ndata = effect(simulate(cfg))\nplot(data)\n
\n<Axes: xlabel='Time', ylabel='Observed'>
\n
model = AZCausalWrapper(model=SDID(), error_estimator=JackKnife())\n
result = PlaceboTest(model, data).execute()\nresult.summary()\n
\n| Model | Effect | Standard Deviation | Standard Error | p-value |\n|-------|--------|--------------------|----------------|---------|\n| SDID | 0.0851 | 0.4079 | 0.129 | 0.5472 |\n\n
did_model = AZCausalWrapper(model=DID())\nPlaceboTest([model, did_model], data).execute().summary()\n
\n| Model | Effect | Standard Deviation | Standard Error | p-value |\n|-------|--------|--------------------|----------------|---------|\n| SDID | 0.0851 | 0.4079 | 0.129 | 0.5472 |\n| DID | 0.0002 | 0.2818 | 0.0891 | 0.9982 |\n\n"},{"location":"examples/placebo_test/#placebo-testing","title":"Placebo Testing","text":"
A placebo test is an approach to assess the validity of a causal model by checking if the effect can truly be attributed to the treatment, or to other spurious factors. A placebo test is conducted by iterating through the set of control units and at each iteration, replacing the treated unit by one of the control units and measuring the effect. If the model detects a significant effect, then it suggests potential bias or omitted variables in the analysis, indicating that the causal inference is flawed.
A successful placebo test will show no statistically significant results and we may then conclude that the estimated effect can be attributed to the treatment and not driven by confounding factors. Conversely, a failed placebo test, which shows significant results, suggests that the identified treatment effect may not be reliable. Placebo testing is thus a critical step to ensure the robustness of findings in RCTs. In this notebook, we demonstrate how a placebo test can be conducted in causal-validation
.
To demonstrate a placebo test, we must first simulate some data. For the purposes of illustration, we'll simulate a very simple dataset containing 10 control units where each unit has 60 pre-intervention observations, and 30 post-intervention observations.
"},{"location":"examples/placebo_test/#model","title":"Model","text":"We'll now define our model. To do this, we'll use the synthetic difference-in-differences implementation of AZCausal. This implementation, along with any other model from AZCausal, can be neatly wrapped up in our AZCausalWrapper
to make fitting and effect estimation simpler.
Now that we have a dataset and model defined, we may conduct our placebo test. With 10 control units, the test will estimate 10 individual effects; 1 per control unit when it is mocked as the treated group. With those 10 effects, the routine will then produce the mean estimated effect, along with the standard deviation across the estimated effect, the effect's standard error, and the p-value that corresponds to the null-hypothesis test that the effect is 0.
In the below, we see that expected estimated effect is small at just 0.08. Accordingly, the p-value attains a value of 0.5, indicating that we have insufficient evidence to reject the null hypothesis and we, therefore, have no evidence to suggest that there is bias within this particular setup.
"},{"location":"examples/placebo_test/#model-comparison","title":"Model Comparison","text":"We can also use the results of a placebo test to compare two or more models. Using causal-validation
, this is as simple as supplying a series of models to the placebo test and comparing their outputs. To demonstrate this, we will compare the previously used synthetic difference-in-differences model with regular difference-in-differences.