From 2772f727d42cd08e93f81048d5b01877b34d1bb1 Mon Sep 17 00:00:00 2001
From: GitHub Actions
Date: Mon, 16 Sep 2024 13:04:55 +0000
Subject: [PATCH] Update documentation

---
 docs/attacks/all_attacks.html     |  151 +---
 docs/attacks/attack_utils.html    |  350 +-------
 docs/attacks/gradnorm.html        |   80 +-
 docs/attacks/index.html           |   36 +-
 docs/attacks/loss.html            |   53 +-
 docs/attacks/min_k.html           |   71 +-
 docs/attacks/min_k_plus_plus.html |   71 +-
 docs/attacks/neighborhood.html    | 1134 +------------------------
 docs/attacks/quantile.html        |  193 +----
 docs/attacks/reference.html       |   59 +-
 docs/attacks/utils.html           |   78 +-
 docs/attacks/zlib.html            |   68 +-
 docs/config.html                  |  251 +-----
 docs/custom_datasets.html         |  418 +--
 docs/data_utils.html              |  688 +--------------
 docs/index.html                   |   28 +-
 docs/models.html                  | 1314 +----------------------------
 docs/plot_utils.html              |  288 +------
 docs/utils.html                   |  139 +--
 19 files changed, 291 insertions(+), 5179 deletions(-)

diff --git a/docs/attacks/all_attacks.html b/docs/attacks/all_attacks.html
index a6a4391..8157e78 100644
--- a/docs/attacks/all_attacks.html
+++ b/docs/attacks/all_attacks.html
@@ -2,18 +2,21 @@
 mimir.attacks.all_attacks API documentation
@@ -23,81 +26,6 @@

Module mimir.attacks.all_attacks

Enum class for attacks. Also contains the base attack class.

-
- -Expand source code - -
"""
-    Enum class for attacks. Also contains the base attack class.
-"""
-
-from enum import Enum
-from mimir.models import Model
-
-
-# Attack definitions
-class AllAttacks(str, Enum):
-    LOSS = "loss" # Done
-    REFERENCE_BASED = "ref" # Done
-    ZLIB = "zlib" # Done
-    MIN_K = "min_k" # Done
-    MIN_K_PLUS_PLUS = "min_k++" # Done
-    NEIGHBOR = "ne" # Done
-    GRADNORM = "gradnorm" # Done
-    # QUANTILE = "quantile" # Uncomment when tested implementation is available
-
-
-# Base attack class
-class Attack:
-    def __init__(self, config, target_model: Model, ref_model: Model = None, is_blackbox: bool = True):
-        self.config = config
-        self.target_model = target_model
-        self.ref_model = ref_model
-        self.is_loaded = False
-        self.is_blackbox = is_blackbox
-
-    def load(self):
-        """
-        Any attack-specific steps (one-time) preparation
-        """
-        if self.ref_model is not None:
-            self.ref_model.load()
-            self.is_loaded = True
-
-    def unload(self):
-        if self.ref_model is not None:
-            self.ref_model.unload()
-            self.is_loaded = False
-
-    def _attack(self, document, probs, tokens=None, **kwargs):
-        """
-        Actual logic for attack. 
-        """
-        raise NotImplementedError("Attack must implement attack()")
-
-    def attack(self, document, probs, **kwargs):
-        """
-        Score a document using the attack's scoring function. Calls self._attack
-        """
-        # Load attack if not loaded yet
-        if not self.is_loaded:
-            self.load()
-            self.is_loaded = True
-
-        detokenized_sample = kwargs.get("detokenized_sample", None)
-        if self.config.pretokenized and detokenized_sample is None:
-            raise ValueError("detokenized_sample must be provided")
-
-        score = (
-            self._attack(document, probs=probs, **kwargs)
-            if not self.config.pretokenized
-            else self._attack(
-                detokenized_sample, tokens=document, probs=probs, **kwargs
-            )
-        )
-
-        return score
-
@@ -243,66 +171,18 @@

Methods

Score a document using the attack's scoring function. Calls self._attack

-
- -Expand source code - -
def attack(self, document, probs, **kwargs):
-    """
-    Score a document using the attack's scoring function. Calls self._attack
-    """
-    # Load attack if not loaded yet
-    if not self.is_loaded:
-        self.load()
-        self.is_loaded = True
-
-    detokenized_sample = kwargs.get("detokenized_sample", None)
-    if self.config.pretokenized and detokenized_sample is None:
-        raise ValueError("detokenized_sample must be provided")
-
-    score = (
-        self._attack(document, probs=probs, **kwargs)
-        if not self.config.pretokenized
-        else self._attack(
-            detokenized_sample, tokens=document, probs=probs, **kwargs
-        )
-    )
-
-    return score
-
def load(self)

Any attack-specific steps (one-time) preparation

-
- -Expand source code - -
def load(self):
-    """
-    Any attack-specific steps (one-time) preparation
-    """
-    if self.ref_model is not None:
-        self.ref_model.load()
-        self.is_loaded = True
-
def unload(self)
-
- -Expand source code - -
def unload(self):
-    if self.ref_model is not None:
-        self.ref_model.unload()
-        self.is_loaded = False
-
@@ -315,7 +195,6 @@

Methods

MIMIR -

Index

    @@ -353,7 +232,7 @@

    -

    Generated by pdoc 0.10.0.

    +

    Generated by pdoc 0.11.1.
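The removed source above defines the contract every attack follows: subclass Attack, implement _attack(), and let attack() handle one-time loading and the pretokenized/detokenized dispatch. Below is a minimal sketch of a custom attack written against that contract; the class name and scoring rule are illustrative, and only the Attack, Model, and ExperimentConfig interfaces are taken from the modules documented here.

import numpy as np

from mimir.attacks.all_attacks import Attack
from mimir.config import ExperimentConfig
from mimir.models import Model


class AverageLogProbAttack(Attack):
    # Illustrative attack: score a document by its negated mean token log-probability.
    def __init__(self, config: ExperimentConfig, target_model: Model):
        # No reference model needed, so this stays a black-box attack.
        super().__init__(config, target_model, ref_model=None)

    def _attack(self, document, probs, tokens=None, **kwargs):
        # `probs` holds per-token log-probabilities when the harness pre-computes them;
        # otherwise, query the target model directly.
        all_prob = (
            probs
            if probs is not None
            else self.target_model.get_probabilities(document, tokens=tokens)
        )
        return -np.mean(all_prob)


# Hypothetical usage, assuming `config` and `target_model` are already constructed:
#   attack = AverageLogProbAttack(config, target_model)
#   score = attack.attack(document, probs=None)  # lower scores are expected for members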

\ No newline at end of file

diff --git a/docs/attacks/attack_utils.html b/docs/attacks/attack_utils.html
index cadafca..31682a8 100644
--- a/docs/attacks/attack_utils.html
+++ b/docs/attacks/attack_utils.html
@@ -2,18 +2,21 @@
 mimir.attacks.attack_utils API documentation
    @@ -23,164 +26,6 @@

    Module mimir.attacks.attack_utils

    Utility functions for attacks

    -
    - -Expand source code - -
    """
    -    Utility functions for attacks
    -"""
    -from typing import List
    -import torch
    -from collections import Counter
    -import math
    -import numpy as np
    -from sklearn.metrics import roc_curve, auc, precision_recall_curve
    -from scipy.stats import bootstrap
    -
    -
    -def count_masks(texts):
    -    return [
    -        len([x for x in text.split() if x.startswith("<extra_id_")]) for text in texts
    -    ]
    -
    -
    -def apply_extracted_fills(masked_texts: List[str], extracted_fills):
    -    # split masked text into tokens, only splitting on spaces (not newlines)
    -    tokens = [x.split(" ") for x in masked_texts]
    -
    -    n_expected = count_masks(masked_texts)
    -
    -    # replace each mask token with the corresponding fill
    -    for idx, (text, fills, n) in enumerate(zip(tokens, extracted_fills, n_expected)):
    -        if len(fills) < n:
    -            tokens[idx] = []
    -        else:
    -            for fill_idx in range(n):
    -                text[text.index(f"<extra_id_{fill_idx}>")] = fills[fill_idx]
    -
    -    # join tokens back into text
    -    texts = [" ".join(x) for x in tokens]
    -    return texts
    -
    -
    -def f1_score(prediction, ground_truth):
    -    """
    -        Compute F1 score for given prediction and ground truth.
    -    """
    -    common = Counter(prediction) & Counter(ground_truth)
    -    num_same = sum(common.values())
    -    if num_same == 0:
    -        return 0, 0, 0
    -    precision = 1.0 * num_same / len(prediction)
    -    recall = 1.0 * num_same / len(ground_truth)
    -    f1 = (2 * precision * recall) / (precision + recall)
    -    print(num_same, f1, precision, recall)
    -    return f1, precision, recall
    -
    -
    -def get_auc_from_thresholds(preds_member, preds_nonmember, thresholds):
    -    """
    -    Compute FPRs and TPRs corresponding to given thresholds
    -    """
    -    tpr, fpr = [], []
    -    for threshold in thresholds:
    -        tp = np.sum(preds_nonmember >= threshold)
    -        fn = np.sum(preds_nonmember < threshold)
    -        fp = np.sum(preds_member >= threshold)
    -        tn = np.sum(preds_member < threshold)
    -
    -        tpr.append(tp / (tp + fn))
    -        fpr.append(fp / (fp + tn))
    -    
    -    tpr = np.array(tpr)
    -    fpr = np.array(fpr)
    -    roc_auc = auc(fpr, tpr)
    -    return roc_auc
    -
    -
    -def get_roc_metrics(
    -    preds_member,
    -    preds_nonmember,
    -    perform_bootstrap: bool = False,
    -    return_thresholds: bool = False,
    -):  # fpr_list,
    -    preds_member_ = filter_out_nan(preds_member)
    -    preds_nonmember_ = filter_out_nan(preds_nonmember)
    -    total_preds = preds_member_ + preds_nonmember_
    -    # While roc_auc is unaffected by which class we consider
    -    # positive/negative, the TPR@lowFPR calculation is.
    -    # Make sure the members are positive class (larger values, so negate the raw MIA scores)
    -    total_preds = np.array(total_preds) * -1
    -    # Assign label '0' to members for computation, since sklearn
-    # expects label '0' data to have lower values to get assigned that label
    -    # which is true for our attacks (lower loss for members, e.g.)
    -    total_labels = [1] * len(preds_member_) + [0] * len(preds_nonmember_)
    -    fpr, tpr, thresholds = roc_curve(total_labels, total_preds)
    -
    -    roc_auc = auc(fpr, tpr)
    -    # tpr_at_low_fpr = {upper_bound: tpr[np.where(np.array(fpr) < upper_bound)[0][-1]] for upper_bound in fpr_list}
    -
    -    if perform_bootstrap:
    -
    -        def roc_auc_statistic(preds, labels):
    -            in_preds = [pred for pred, label in zip(preds, labels) if label == 1]
    -            out_preds = [pred for pred, label in zip(preds, labels) if label == 0]
    -            _, _, roc_auc = get_roc_metrics(in_preds, out_preds)
    -            return roc_auc
    -
    -        auc_roc_res = bootstrap(
    -            (total_preds, total_labels),
    -            roc_auc_statistic,
    -            n_resamples=1000,
    -            paired=True,
    -        )
    -
    -        # tpr_at_low_fpr_res = {}
    -        # for ub in fpr_list:
    -        #     def tpr_at_fpr_statistic(preds, labels):
    -        #         in_preds = [pred for pred, label in zip(preds, labels) if label == 1]
    -        #         out_preds = [pred for pred, label in zip(preds, labels) if label == 0]
    -        #         _, _, _, tpr_at_low_fpr = get_roc_metrics(in_preds, out_preds, [ub])
    -        #         return tpr_at_low_fpr[ub]
    -
    -        #     tpr_at_low_fpr_res[ub] = bootstrap((total_preds, total_labels), tpr_at_fpr_statistic, n_resamples=1000, paired=True)
    -
    -        if return_thresholds:
    -            return (
    -                fpr.tolist(),
    -                tpr.tolist(),
    -                float(roc_auc),
    -                auc_roc_res,
    -                thresholds.tolist(),
    -            )
    -        return (
    -            fpr.tolist(),
    -            tpr.tolist(),
    -            float(roc_auc),
    -            auc_roc_res,
    -        )  # tpr_at_low_fpr, tpr_at_low_fpr_res
    -
    -    if return_thresholds:
    -        return fpr.tolist(), tpr.tolist(), float(roc_auc), thresholds.tolist()
    -    return fpr.tolist(), tpr.tolist(), float(roc_auc)  # , tpr_at_low_fpr
    -
    -
    -def get_precision_recall_metrics(preds_member, preds_nonmember):
    -    preds_member_ = filter_out_nan(preds_member)
    -    preds_nonmember_ = filter_out_nan(preds_nonmember)
    -    total_preds = preds_member_ + preds_nonmember_
    -
    -    total_labels = [0] * len(preds_member_) + [1] * len(preds_nonmember_)
    -
    -    precision, recall, _ = precision_recall_curve(total_labels, total_preds)
    -    pr_auc = auc(recall, precision)
    -    return precision.tolist(), recall.tolist(), float(pr_auc)
    -
    -
    -def filter_out_nan(x):
    -    return [element for element in x if not math.isnan(element)]
    -
    @@ -194,206 +39,42 @@

    Functions

    -
    - -Expand source code - -
    def apply_extracted_fills(masked_texts: List[str], extracted_fills):
    -    # split masked text into tokens, only splitting on spaces (not newlines)
    -    tokens = [x.split(" ") for x in masked_texts]
    -
    -    n_expected = count_masks(masked_texts)
    -
    -    # replace each mask token with the corresponding fill
    -    for idx, (text, fills, n) in enumerate(zip(tokens, extracted_fills, n_expected)):
    -        if len(fills) < n:
    -            tokens[idx] = []
    -        else:
    -            for fill_idx in range(n):
    -                text[text.index(f"<extra_id_{fill_idx}>")] = fills[fill_idx]
    -
    -    # join tokens back into text
    -    texts = [" ".join(x) for x in tokens]
    -    return texts
    -
    def count_masks(texts)
    -
    - -Expand source code - -
    def count_masks(texts):
    -    return [
    -        len([x for x in text.split() if x.startswith("<extra_id_")]) for text in texts
    -    ]
    -
    def f1_score(prediction, ground_truth)

    Compute F1 score for given prediction and ground truth.

    -
    - -Expand source code - -
    def f1_score(prediction, ground_truth):
    -    """
    -        Compute F1 score for given prediction and ground truth.
    -    """
    -    common = Counter(prediction) & Counter(ground_truth)
    -    num_same = sum(common.values())
    -    if num_same == 0:
    -        return 0, 0, 0
    -    precision = 1.0 * num_same / len(prediction)
    -    recall = 1.0 * num_same / len(ground_truth)
    -    f1 = (2 * precision * recall) / (precision + recall)
    -    print(num_same, f1, precision, recall)
    -    return f1, precision, recall
    -
    def filter_out_nan(x)
    -
    - -Expand source code - -
    def filter_out_nan(x):
    -    return [element for element in x if not math.isnan(element)]
    -
    def get_auc_from_thresholds(preds_member, preds_nonmember, thresholds)

    Compute FPRs and TPRs corresponding to given thresholds

    -
    - -Expand source code - -
    def get_auc_from_thresholds(preds_member, preds_nonmember, thresholds):
    -    """
    -    Compute FPRs and TPRs corresponding to given thresholds
    -    """
    -    tpr, fpr = [], []
    -    for threshold in thresholds:
    -        tp = np.sum(preds_nonmember >= threshold)
    -        fn = np.sum(preds_nonmember < threshold)
    -        fp = np.sum(preds_member >= threshold)
    -        tn = np.sum(preds_member < threshold)
    -
    -        tpr.append(tp / (tp + fn))
    -        fpr.append(fp / (fp + tn))
    -    
    -    tpr = np.array(tpr)
    -    fpr = np.array(fpr)
    -    roc_auc = auc(fpr, tpr)
    -    return roc_auc
    -
    def get_precision_recall_metrics(preds_member, preds_nonmember)
    -
    - -Expand source code - -
    def get_precision_recall_metrics(preds_member, preds_nonmember):
    -    preds_member_ = filter_out_nan(preds_member)
    -    preds_nonmember_ = filter_out_nan(preds_nonmember)
    -    total_preds = preds_member_ + preds_nonmember_
    -
    -    total_labels = [0] * len(preds_member_) + [1] * len(preds_nonmember_)
    -
    -    precision, recall, _ = precision_recall_curve(total_labels, total_preds)
    -    pr_auc = auc(recall, precision)
    -    return precision.tolist(), recall.tolist(), float(pr_auc)
    -
    def get_roc_metrics(preds_member, preds_nonmember, perform_bootstrap: bool = False, return_thresholds: bool = False)
    -
    - -Expand source code - -
    def get_roc_metrics(
    -    preds_member,
    -    preds_nonmember,
    -    perform_bootstrap: bool = False,
    -    return_thresholds: bool = False,
    -):  # fpr_list,
    -    preds_member_ = filter_out_nan(preds_member)
    -    preds_nonmember_ = filter_out_nan(preds_nonmember)
    -    total_preds = preds_member_ + preds_nonmember_
    -    # While roc_auc is unaffected by which class we consider
    -    # positive/negative, the TPR@lowFPR calculation is.
    -    # Make sure the members are positive class (larger values, so negate the raw MIA scores)
    -    total_preds = np.array(total_preds) * -1
    -    # Assign label '0' to members for computation, since sklearn
-    # expects label '0' data to have lower values to get assigned that label
    -    # which is true for our attacks (lower loss for members, e.g.)
    -    total_labels = [1] * len(preds_member_) + [0] * len(preds_nonmember_)
    -    fpr, tpr, thresholds = roc_curve(total_labels, total_preds)
    -
    -    roc_auc = auc(fpr, tpr)
    -    # tpr_at_low_fpr = {upper_bound: tpr[np.where(np.array(fpr) < upper_bound)[0][-1]] for upper_bound in fpr_list}
    -
    -    if perform_bootstrap:
    -
    -        def roc_auc_statistic(preds, labels):
    -            in_preds = [pred for pred, label in zip(preds, labels) if label == 1]
    -            out_preds = [pred for pred, label in zip(preds, labels) if label == 0]
    -            _, _, roc_auc = get_roc_metrics(in_preds, out_preds)
    -            return roc_auc
    -
    -        auc_roc_res = bootstrap(
    -            (total_preds, total_labels),
    -            roc_auc_statistic,
    -            n_resamples=1000,
    -            paired=True,
    -        )
    -
    -        # tpr_at_low_fpr_res = {}
    -        # for ub in fpr_list:
    -        #     def tpr_at_fpr_statistic(preds, labels):
    -        #         in_preds = [pred for pred, label in zip(preds, labels) if label == 1]
    -        #         out_preds = [pred for pred, label in zip(preds, labels) if label == 0]
    -        #         _, _, _, tpr_at_low_fpr = get_roc_metrics(in_preds, out_preds, [ub])
    -        #         return tpr_at_low_fpr[ub]
    -
    -        #     tpr_at_low_fpr_res[ub] = bootstrap((total_preds, total_labels), tpr_at_fpr_statistic, n_resamples=1000, paired=True)
    -
    -        if return_thresholds:
    -            return (
    -                fpr.tolist(),
    -                tpr.tolist(),
    -                float(roc_auc),
    -                auc_roc_res,
    -                thresholds.tolist(),
    -            )
    -        return (
    -            fpr.tolist(),
    -            tpr.tolist(),
    -            float(roc_auc),
    -            auc_roc_res,
    -        )  # tpr_at_low_fpr, tpr_at_low_fpr_res
    -
    -    if return_thresholds:
    -        return fpr.tolist(), tpr.tolist(), float(roc_auc), thresholds.tolist()
    -    return fpr.tolist(), tpr.tolist(), float(roc_auc)  # , tpr_at_low_fpr
    -
    @@ -406,7 +87,6 @@

    Functions

    MIMIR -

    Index

      @@ -431,7 +111,7 @@

      Index
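A small usage sketch for the scoring utilities documented above; the score arrays are fabricated, and only get_roc_metrics and get_precision_recall_metrics come from this module. Note that get_roc_metrics negates the raw scores internally, so lower raw scores (e.g. lower loss) should correspond to members.

import numpy as np

from mimir.attacks.attack_utils import get_precision_recall_metrics, get_roc_metrics

# Fabricated raw MIA scores (e.g. per-document loss); members tend to score lower.
rng = np.random.default_rng(0)
member_scores = rng.normal(loc=2.0, scale=0.5, size=200).tolist()
nonmember_scores = rng.normal(loc=2.5, scale=0.5, size=200).tolist()

fpr, tpr, roc_auc = get_roc_metrics(member_scores, nonmember_scores)
precision, recall, pr_auc = get_precision_recall_metrics(member_scores, nonmember_scores)
print(f"ROC AUC: {roc_auc:.3f}  PR AUC: {pr_auc:.3f}")

# With perform_bootstrap=True, a scipy bootstrap result for the AUC is returned as well:
#   fpr, tpr, roc_auc, auc_res = get_roc_metrics(member_scores, nonmember_scores,
#                                                perform_bootstrap=True)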

\ No newline at end of file

diff --git a/docs/attacks/gradnorm.html b/docs/attacks/gradnorm.html
index 73ee0ae..2a4ef60 100644
--- a/docs/attacks/gradnorm.html
+++ b/docs/attacks/gradnorm.html
@@ -2,18 +2,21 @@
 mimir.attacks.gradnorm API documentation
      @@ -23,58 +26,6 @@

      Module mimir.attacks.gradnorm

      Gradient-norm attack. Proposed for MIA in multiple settings, and particularly experimented for pre-training data and LLMs in https://arxiv.org/abs/2402.17012

      -
      - -Expand source code - -
      """
      -    Gradient-norm attack. Proposed for MIA in multiple settings, and particularly experimented for pre-training data and LLMs in https://arxiv.org/abs/2402.17012
      -"""
      -
      -import torch as ch
      -import numpy as np
      -from mimir.attacks.all_attacks import Attack
      -from mimir.models import Model
      -from mimir.config import ExperimentConfig
      -
      -
      -class GradNormAttack(Attack):
      -    def __init__(self, config: ExperimentConfig, model: Model):
      -        super().__init__(config, model, ref_model=None, is_blackbox=False)
      -
      -    def _attack(self, document, probs, tokens=None, **kwargs):
      -        """
      -        Gradient Norm Attack. Computes p-norm of gradients w.r.t. model parameters.
      -        """
      -        # We ignore probs here since they are computed in the general case without gradient-tracking (to save memory)
      -
-        # Hyper-params specific to the gradient-norm attack
      -        p: float = kwargs.get("p", np.inf)
      -        if p not in [1, 2, np.inf]:
      -            raise ValueError(f"Invalid p-norm value: {p}.")
      -
      -        # Make sure model params require gradients
      -        # for name, param in self.target_model.model.named_parameters():
      -        #    param.requires_grad = True
      -
      -        # Get gradients for model parameters
      -        self.target_model.model.zero_grad()
      -        all_prob = self.target_model.get_probabilities(document, tokens=tokens, no_grads=False)
      -        loss = - ch.mean(all_prob)
      -        loss.backward()
      -
      -        # Compute p-norm of gradients (for all model params where grad exists)
      -        grad_norms = []
      -        for param in self.target_model.model.parameters():
      -            if param.grad is not None:
      -                grad_norms.append(param.grad.detach().norm(p))
      -        grad_norm = ch.stack(grad_norms).mean()
      -
      -        # Zero out gradients again
      -        self.target_model.model.zero_grad()
      -
      -        return -grad_norm.cpu().numpy()
      -
      @@ -155,7 +106,6 @@

      Inherited members

      MIMIR -

      Index

        @@ -176,7 +126,7 @@

        -

        Generated by pdoc 0.10.0.

        +

        Generated by pdoc 0.11.1.

\ No newline at end of file

diff --git a/docs/attacks/index.html b/docs/attacks/index.html
index 7d97cc6..a9ed6de 100644
--- a/docs/attacks/index.html
+++ b/docs/attacks/index.html
@@ -2,18 +2,21 @@
 mimir.attacks API documentation
        @@ -23,14 +26,6 @@

        Module mimir.attacks

        Attack implementations.

        -
        - -Expand source code - -
        """
        -    Attack implementations.
        -"""
        -

        Sub-modules

        @@ -95,7 +90,6 @@

        Sub-modules

        MIMIR -

        Index

          @@ -124,7 +118,7 @@

          Index

\ No newline at end of file

diff --git a/docs/attacks/loss.html b/docs/attacks/loss.html
index 9e2b6e0..f37d75e 100644
--- a/docs/attacks/loss.html
+++ b/docs/attacks/loss.html
@@ -2,18 +2,21 @@
 mimir.attacks.loss API documentation
          @@ -23,31 +26,6 @@

          Module mimir.attacks.loss

          Straight-forward LOSS attack, as described in https://ieeexplore.ieee.org/abstract/document/8429311

          -
          - -Expand source code - -
          """
          -    Straight-forward LOSS attack, as described in https://ieeexplore.ieee.org/abstract/document/8429311
          -"""
          -import torch as ch
          -from mimir.attacks.all_attacks import Attack
          -from mimir.models import Model
          -from mimir.config import ExperimentConfig
          -
          -
          -class LOSSAttack(Attack):
          -
          -    def __init__(self, config: ExperimentConfig, model: Model):
          -        super().__init__(config, model, ref_model=None)
          -
          -    @ch.no_grad()
          -    def _attack(self, document, probs, tokens=None, **kwargs):
          -        """
          -            LOSS-score. Use log-likelihood from model.
          -        """
          -        return self.target_model.get_ll(document, probs=probs, tokens=tokens)
          -
          @@ -103,7 +81,6 @@

          Inherited members

          MIMIR -

          Index

            @@ -124,7 +101,7 @@

            -

            Generated by pdoc 0.10.0.

            +

            Generated by pdoc 0.11.1.

\ No newline at end of file

diff --git a/docs/attacks/min_k.html b/docs/attacks/min_k.html
index 375ac50..841311a 100644
--- a/docs/attacks/min_k.html
+++ b/docs/attacks/min_k.html
@@ -2,18 +2,21 @@
 mimir.attacks.min_k API documentation
            @@ -23,49 +26,6 @@

            Module mimir.attacks.min_k

            Min-k % Prob Attack: https://arxiv.org/pdf/2310.16789.pdf

            -
            - -Expand source code - -
            """
            -    Min-k % Prob Attack: https://arxiv.org/pdf/2310.16789.pdf
            -"""
            -import torch as ch
            -import numpy as np
            -from mimir.attacks.all_attacks import Attack
            -from mimir.models import Model
            -from mimir.config import ExperimentConfig
            -
            -
            -class MinKProbAttack(Attack):
            -
            -    def __init__(self, config: ExperimentConfig, model: Model):
            -        super().__init__(config, model, ref_model=None)
            -
            -    @ch.no_grad()
            -    def _attack(self, document, probs, tokens=None, **kwargs):
            -        """
            -        Min-k % Prob Attack. Gets model probabilities and returns likelihood when computed over top k% of ngrams.
            -        """
            -        # Hyper-params specific to min-k attack
            -        k: float = kwargs.get("k", 0.2)
            -        window: int = kwargs.get("window", 1)
            -        stride: int = kwargs.get("stride", 1)
            -
            -        all_prob = (
            -            probs
            -            if probs is not None
            -            else self.target_model.get_probabilities(document, tokens=tokens)
            -        )
            -        # iterate through probabilities by ngram defined by window size at given stride
            -        ngram_probs = []
            -        for i in range(0, len(all_prob) - window + 1, stride):
            -            ngram_prob = all_prob[i : i + window]
            -            ngram_probs.append(np.mean(ngram_prob))
            -        min_k_probs = sorted(ngram_probs)[: int(len(ngram_probs) * k)]
            -
            -        return -np.mean(min_k_probs)
            -
            @@ -138,7 +98,6 @@

            Inherited members

            MIMIR -

            Index

              @@ -159,7 +118,7 @@

              -

              Generated by pdoc 0.10.0.

              +

              Generated by pdoc 0.11.1.

\ No newline at end of file

diff --git a/docs/attacks/min_k_plus_plus.html b/docs/attacks/min_k_plus_plus.html
index cb4bd9f..bced522 100644
--- a/docs/attacks/min_k_plus_plus.html
+++ b/docs/attacks/min_k_plus_plus.html
@@ -2,18 +2,21 @@
 mimir.attacks.min_k_plus_plus API documentation
              @@ -23,49 +26,6 @@

              Module mimir.attacks.min_k_plus_plus

              Min-K%++ Attack: https://github.com/zjysteven/mink-plus-plus

              -
              - -Expand source code - -
              """
              -    Min-K%++ Attack: https://github.com/zjysteven/mink-plus-plus
              -"""
              -import torch as ch
              -import numpy as np
              -from mimir.attacks.all_attacks import Attack
              -from mimir.models import Model
              -from mimir.config import ExperimentConfig
              -
              -
              -class MinKPlusPlusAttack(Attack):
              -
              -    def __init__(self, config: ExperimentConfig, model: Model):
              -        super().__init__(config, model, ref_model=None)
              -
              -    @ch.no_grad()
              -    def _attack(self, document, probs, tokens=None, **kwargs):
              -        """
              -        Min-K%++ Attack. 
-        Gets token probabilities, normalizes them with the mean and std over the whole categorical distribution,
              -        and returns normalized likelihood when computed over top k% of ngrams.
              -        """
              -        # Hyper-params specific to min-k attack
              -        k: float = kwargs.get("k", 0.2)
              -        all_probs = kwargs.get("all_probs", None)
              -
-        # these are all log probabilities
              -        target_prob, all_probs = (
              -            (probs, all_probs)
              -            if (probs is not None and all_probs is not None)
              -            else self.model.get_probabilities(document, tokens=tokens, return_all_probs=True)
              -        )
              -        
              -        mu = (ch.exp(all_probs) * all_probs).sum(-1)
              -        sigma = (ch.exp(all_probs) * ch.square(all_probs)).sum(-1) - ch.square(mu)
              -        scores = (np.array(target_prob) - mu.numpy()) / sigma.sqrt().numpy()
              -        
              -        return -np.mean(sorted(scores)[:int(len(scores) * k)])
              -
              @@ -138,7 +98,6 @@

              Inherited members

              MIMIR -

              Index

                @@ -159,7 +118,7 @@

                -

                Generated by pdoc 0.10.0.

                +

                Generated by pdoc 0.11.1.

\ No newline at end of file

diff --git a/docs/attacks/neighborhood.html b/docs/attacks/neighborhood.html
index 211105d..031a422 100644
--- a/docs/attacks/neighborhood.html
+++ b/docs/attacks/neighborhood.html
@@ -2,18 +2,21 @@
 mimir.attacks.neighborhood API documentation
                @@ -23,586 +26,6 @@

                Module mimir.attacks.neighborhood

                Neighborhood-MIA attack https://arxiv.org/pdf/2305.18462.pdf
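In short, a document is scored by how its likelihood under the target model compares with the average likelihood of slightly perturbed "neighbor" versions of it, which the implementation below generates with a mask-filling model (T5 or a BERT-family model). A sketch of just the final score computation, with the per-text scores assumed to be already available:

import numpy as np


def neighborhood_score(target_score: float, neighbor_scores) -> float:
    # Score for the original document minus the mean score of its neighbors.
    return target_score - float(np.mean(neighbor_scores))


# Fabricated scores; within mimir these would come from target_model.get_ll and
# target_model.get_lls on the neighbors produced by NeighborhoodAttack.get_neighbors.
print(neighborhood_score(2.1, [2.9, 3.0, 2.8, 3.1]))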

                -
                - -Expand source code - -
                """
                -    Neighborhood-MIA attack https://arxiv.org/pdf/2305.18462.pdf
                -"""
                -
                -from heapq import nlargest
                -import torch
                -import re
                -import numpy as np
                -from tqdm import tqdm
                -import random
                -import transformers
                -from typing import List
                -
                -from mimir.config import ExperimentConfig
                -from mimir.attacks.attack_utils import count_masks, apply_extracted_fills
                -from mimir.models import Model, ReferenceModel
                -from mimir.attacks.all_attacks import Attack
                -
                -
                -class NeighborhoodAttack(Attack):
                -
                -    def __init__(
                -        self,
                -        config: ExperimentConfig,
                -        target_model: Model,
                -        ref_model: ReferenceModel = None,
                -        **kwargs,
                -    ):
                -        super().__init__(config, target_model, ref_model=None)
                -        self.ref_model = self._pick_neighbor_model()
                -        assert issubclass(type(self.ref_model), MaskFillingModel), "ref_model must be MaskFillingModel for neighborhood attack"
                -
                -    def get_mask_model(self):
                -        """
                -            Return the mask filling model.
                -        """
                -        return self.ref_model
                -
                -    def create_fill_dictionary(self, data):
                -        """
-            (Only valid for T5 model) Create fill-dictionary used for random_fills
                -        """
                -        neigh_config = self.config.neighborhood_config
                -        if "t5" in neigh_config.model and neigh_config.random_fills:
                -            if not self.config.pretokenized:
                -                # TODO: maybe can be done if detokenized, but currently not supported
                -                self.ref_model.create_fill_dictionary(data)
                -
                -    def _pick_neighbor_model(self):
                -        """
                -            Select and load the mask filling model requested in the config.
                -        """
                -        # mask filling t5 model
                -        mask_model = None
                -        neigh_config = self.config.neighborhood_config
                -        env_config = self.config.env_config
                -
                -        model_kwargs = dict()
                -        if not neigh_config.random_fills:
                -            if env_config.int8:
                -                model_kwargs = dict(
                -                    load_in_8bit=True, device_map="auto", torch_dtype=torch.bfloat16
                -                )
                -            elif env_config.half:
                -                model_kwargs = dict(torch_dtype=torch.bfloat16)
                -            try:
                -                n_positions = (
                -                    512  # Should fix later, but for T-5 this is 512 indeed
                -                )
                -                # mask_model.config.n_positions
                -            except AttributeError:
                -                n_positions = self.config.max_tokens
                -        else:
                -            n_positions = self.config.max_tokens
                -        tokenizer_kwargs = {
                -            "model_max_length": n_positions,
                -        }
                -
                -        print(f"Loading mask filling model {neigh_config.model}...")
                -        if "t5" in neigh_config.model:
                -            mask_model = T5Model(
                -                self.config,
                -                model_kwargs=model_kwargs,
                -                tokenizer_kwargs=tokenizer_kwargs,
                -            )
                -        elif "bert" in neigh_config.model:
                -            mask_model = BertModel(self.config)
                -        else:
                -            raise ValueError(f"Unknown model {neigh_config.model}")
                -        # if config.dataset_member in ['english', 'german']:
                -        #     preproc_tokenizer = mask_tokenizer
                -        return mask_model
                -
                -    def load(self):
                -        """
                -        Any attack-specific steps (one-time) preparation
                -        """
                -        print("MOVING MASK MODEL TO GPU...", end="", flush=True)
                -        self.ref_model.load()
                -
                -    def get_neighbors(self, documents, **kwargs):
                -        """
                -            Generate neighbors for given documents.
                -        """
                -        n_perturbations = kwargs.get("n_perturbations", 1)
                -        span_length = kwargs.get("span_length", 10)
                -        neigh_config = self.config.neighborhood_config
                -        ceil_pct = neigh_config.ceil_pct
                -        kwargs = {}
                -        if type(self.ref_model) == T5Model:
                -            kwargs = {
                -                "span_length": span_length,
                -                "pct": neigh_config.pct_words_masked,
                -                "chunk_size": self.config.chunk_size,
                -                "ceil_pct": ceil_pct,
                -            }
                -        kwargs["n_perturbations"] = n_perturbations
                -
                -        # Generate neighbors
                -        neighbors = self.ref_model.generate_neighbors(documents, **kwargs)
                -        return neighbors
                -
                -    def _attack(self, document, probs, tokens=None, **kwargs):
                -        """
                -        Neighborhood attack score. Looks at difference in likelihood for given document and average likelihood of its neighbors
                -        """
                -        # documents here are actually neighbors
                -        batch_size = kwargs.get("batch_size", 4)
                -        substr_neighbors = kwargs.get("substr_neighbors", None)
                -        loss = kwargs.get("loss", None)
                -        if loss is None:
                -            loss = self.target_model.get_ll(document, probs=probs, tokens=tokens)
                -
                -        # Only evaluate neighborhood attack when not caching neighbors
                -        mean_substr_score = self.target_model.get_lls(
                -            substr_neighbors, batch_size=batch_size
                -        )
                -        d_based_score = loss - mean_substr_score
                -        return d_based_score
                -
                -
                -class MaskFillingModel(Model):
                -    def __init__(self, config: ExperimentConfig, **kwargs):
                -        super(MaskFillingModel, self).__init__(config, **kwargs)
                -        self.device = self.config.env_config.device_aux
                -        self.name = self.config.neighborhood_config.model
                -
                -    def generate_neighbors(self, texts, **kwargs) -> List[str]:
                -        raise NotImplementedError("generate_neighbors not implemented")
                -
                -
                -class T5Model(MaskFillingModel):
                -    def __init__(self, config: ExperimentConfig, **kwargs):
                -        super().__init__(config, **kwargs)
                -        model_kwargs = self.kwargs.get("model_kwargs", {})
                -        tokenizer_kwargs = self.kwargs.get("tokenizer_kwargs", {})
                -
                -        self.model = transformers.AutoModelForSeq2SeqLM.from_pretrained(
                -            self.name, **model_kwargs, cache_dir=self.cache_dir
                -        )
                -        self.tokenizer = transformers.AutoTokenizer.from_pretrained(
                -            self.name, **tokenizer_kwargs, cache_dir=self.cache_dir
                -        )
                -
                -        # define regex to match all <extra_id_*> tokens, where * is an integer
                -        self.pattern = re.compile(r"<extra_id_\d+>")
                -
                -    def create_fill_dictionary(self, data):
                -        self.FILL_DICTIONARY = set()
                -        for texts in data.values():
                -            for text in texts:
                -                self.FILL_DICTIONARY.update(text.split())
                -        self.FILL_DICTIONARY = sorted(list(self.FILL_DICTIONARY))
                -
                -    def tokenize_and_mask(
                -        self, text: str, span_length: int, pct: float, ceil_pct: bool = False
                -    ):
                -        buffer_size = self.config.neighborhood_config.buffer_size
                -
                -        tokens = text.split(" ")
                -        mask_string = "<<<mask>>>"
                -
                -        span_length = min(int(pct * len(tokens)), span_length)
                -        # avoid div zero:
                -
                -        span_length = max(1, span_length)
                -
                -        n_spans = pct * len(tokens) / (span_length + buffer_size * 2)
                -        if ceil_pct:
                -            n_spans = np.ceil(n_spans)
                -        n_spans = int(n_spans)
                -
                -        n_masks = 0
                -        while n_masks < n_spans:
                -            start = np.random.randint(0, max(1, len(tokens) - span_length))
                -            end = start + span_length
                -            search_start = max(0, start - buffer_size)
                -            search_end = min(len(tokens), end + buffer_size)
                -            if mask_string not in tokens[search_start:search_end]:
                -                tokens[start:end] = [mask_string]
                -                n_masks += 1
                -
                -        # replace each occurrence of mask_string with <extra_id_NUM>, where NUM increments
                -        num_filled = 0
                -        for idx, token in enumerate(tokens):
                -            if token == mask_string:
                -                tokens[idx] = f"<extra_id_{num_filled}>"
                -                num_filled += 1
                -        assert num_filled == n_masks, f"num_filled {num_filled} != n_masks {n_masks}"
                -        text = " ".join(tokens)
                -        return text
                -
                -    def extract_fills(self, texts):
                -        # remove <pad> from beginning of each text
                -        texts = [x.replace("<pad>", "").replace("</s>", "").strip() for x in texts]
                -
                -        # return the text in between each matched mask token
                -        extracted_fills = [self.pattern.split(x)[1:-1] for x in texts]
                -
                -        # remove whitespace around each fill
                -        extracted_fills = [[y.strip() for y in x] for x in extracted_fills]
                -
                -        return extracted_fills
                -
                -    def replace_masks(self, texts: List[str]):
                -        """
                -        Replace each masked span with a sample from T5 mask_model
                -        """
                -        mask_top_p = self.config.neighborhood_config.top_p
                -        n_expected = count_masks(texts)
                -        stop_id = self.tokenizer.encode(f"<extra_id_{max(n_expected)}>")[0]
                -        tokens = self.tokenizer(texts, return_tensors="pt", padding=True).to(
                -            self.device
                -        )
                -        outputs = self.model.generate(
                -            **tokens,
                -            max_length=150,
                -            do_sample=True,
                -            top_p=mask_top_p,
                -            num_return_sequences=1,
                -            eos_token_id=stop_id,
                -        )
                -        return self.tokenizer.batch_decode(outputs, skip_special_tokens=False)
                -
                -    def generate_neighbors_(self, texts: List[str], **kwargs):
                -        span_length: int = kwargs.get("span_length")
                -        pct: float = kwargs.get("pct")
                -        ceil_pct: bool = kwargs.get("ceil_pct", False)
                -        base_tokenizer = kwargs.get("base_tokenizer", None)
                -        neigh_config = self.config.neighborhood_config
                -
                -        if not neigh_config.random_fills:
                -            masked_texts = [
                -                self.tokenize_and_mask(x, span_length, pct, ceil_pct) for x in texts
                -            ]
                -            raw_fills = self.replace_masks(masked_texts)
                -            extracted_fills = self.extract_fills(raw_fills)
                -            perturbed_texts = apply_extracted_fills(masked_texts, extracted_fills)
                -            idxs = [idx for idx, x in enumerate(perturbed_texts) if x == ""]
                -
                -            # Handle the fact that sometimes the model doesn't generate the right number of fills and we have to try again
                -            attempts = 1
                -            break_out_of_loop: bool = False
                -            while "" in perturbed_texts:
                -                if attempts > neigh_config.max_tries:
                -                    for idx in idxs:
                -                        perturbed_texts[idx] = texts[idx]
                -                    break_out_of_loop = True
                -                    break
                -                if break_out_of_loop:
                -                    break
                -                idxs = [idx for idx, x in enumerate(perturbed_texts) if x == ""]
                -                print(
                -                    f"WARNING: {len(idxs)} texts have no fills. Trying again [attempt {attempts}]."
                -                )
                -                masked_texts = [
                -                    self.tokenize_and_mask(x, span_length, pct, ceil_pct)
                -                    for idx, x in enumerate(texts)
                -                    if idx in idxs
                -                ]
                -                raw_fills = self.replace_masks(masked_texts)
                -                extracted_fills = self.extract_fills(raw_fills)
                -                new_perturbed_texts = apply_extracted_fills(
                -                    masked_texts, extracted_fills
                -                )
                -                for idx, x in zip(idxs, new_perturbed_texts):
                -                    perturbed_texts[idx] = x
                -                attempts += 1
                -        else:
                -            if neigh_config.random_fills_tokens:
                -                if base_tokenizer is None:
                -                    raise ValueError(
                -                        "base_tokenizer must be provided if random_fills and random_fills_tokens are True"
                -                    )
                -
                -                # tokenize base_tokenizer
                -                tokens = base_tokenizer(texts, return_tensors="pt", padding=True).to(
                -                    self.device
                -                )
                -                valid_tokens = tokens.input_ids != base_tokenizer.pad_token_id
                -                replace_pct = neigh_config.pct_words_masked * (
                -                    neigh_config.span_length
                -                    / (neigh_config.span_length + 2 * neigh_config.buffer_size)
                -                )
                -
                -                # replace replace_pct of input_ids with random tokens
                -                random_mask = (
                -                    torch.rand(tokens.input_ids.shape, device=self.device) < replace_pct
                -                )
                -                random_mask &= valid_tokens
                -                random_tokens = torch.randint(
                -                    0,
                -                    base_tokenizer.vocab_size,
                -                    (random_mask.sum(),),
                -                    device=self.device,
                -                )
                -                # while any of the random tokens are special tokens, replace them with random non-special tokens
                -                while any(
                -                    base_tokenizer.decode(x) in base_tokenizer.all_special_tokens
                -                    for x in random_tokens
                -                ):
                -                    random_tokens = torch.randint(
                -                        0,
                -                        base_tokenizer.vocab_size,
                -                        (random_mask.sum(),),
                -                        device=self.device,
                -                    )
                -                tokens.input_ids[random_mask] = random_tokens
                -                perturbed_texts = base_tokenizer.batch_decode(
                -                    tokens.input_ids, skip_special_tokens=True
                -                )
                -            else:
                -                masked_texts = [
                -                    self.tokenize_and_mask(x, span_length, pct, ceil_pct) for x in texts
                -                ]
                -                perturbed_texts = masked_texts
                -                # replace each <extra_id_*> with neigh_config.span_length random words from FILL_DICTIONARY
                -                for idx, text in enumerate(perturbed_texts):
                -                    filled_text = text
                -                    for fill_idx in range(count_masks([text])[0]):
                -                        fill = random.sample(self.FILL_DICTIONARY, span_length)
                -                        filled_text = filled_text.replace(
                -                            f"<extra_id_{fill_idx}>", " ".join(fill)
                -                        )
                -                    assert (
                -                        count_masks([filled_text])[0] == 0
                -                    ), "Failed to replace all masks"
                -                    perturbed_texts[idx] = filled_text
                -
                -        return perturbed_texts
                -
                -    def generate_neighbors(self, texts, **kwargs) -> List[str]:
                -        n_neighbors = kwargs.get("n_perturbations", 25)
                -        # Repeat text if T-5 model
                -        texts_use = [x for x in texts for _ in range(n_neighbors)]
                -
                -        chunk_size = self.config.chunk_size
                -        if "11b" in self.config.neighborhood_config.model:
                -            chunk_size //= 2
                -
                -        outputs = []
                -        for i in tqdm(
                -            range(0, len(texts_use), chunk_size), desc="Applying perturbations"
                -        ):
                -            outputs.extend(
                -                self.generate_neighbors_(texts_use[i : i + chunk_size], **kwargs)
                -            )
                -        return outputs
                -
                -
                -class BertModel(MaskFillingModel):
                -    def __init__(self, config: ExperimentConfig, **kwargs):
                -        super().__init__(config, **kwargs)
                -        self.token_dropout = torch.nn.Dropout(p=0.7)
                -        if self.name == "bert":
                -            self.tokenizer = transformers.BertTokenizerFast.from_pretrained(
                -                "bert-base-uncased", cache_dir=self.cache_dir
                -            )
                -            self.model = transformers.BertForMaskedLM.from_pretrained(
                -                "bert-base-uncased", cache_dir=self.cache_dir
                -            )
                -        elif self.name == "distilbert":
                -            self.tokenizer = transformers.DistilBertTokenizer.from_pretrained(
                -                "distilbert-base-uncased", cache_dir=self.cache_dir
                -            )
                -            self.model = transformers.DistilBertForMaskedLM.from_pretrained(
                -                "distilbert-base-uncased", cache_dir=self.cache_dir
                -            )
                -        elif self.name == "roberta":
                -            self.tokenizer = transformers.RobertaTokenizer.from_pretrained(
                -                "roberta-base", cache_dir=self.cache_dir
                -            )
                -            self.model = transformers.RobertaForMaskedLM.from_pretrained(
                -                "roberta-base", cache_dir=self.cache_dir
                -            )
                -        else:
                -            raise ValueError(f"Invalid model name {self.name}")
                -
                -    def generate_neighbors(self, texts, **kwargs) -> List[str]:
                -        neighbors = []
                -        for text in tqdm(texts, desc="Generating neighbors"):
                -            neighbors.extend(self.generate_neighbors_(text, **kwargs))
                -        return neighbors
                -
                -    def generate_neighbors_(self, text: str, **kwargs):
                -        in_place_swap = self.config.neighborhood_config.original_tokenization_swap
                -
                -        tokenizer_output = self.tokenizer(
                -            text,
                -            padding=True,
                -            truncation=True,
                -            return_offsets_mapping=in_place_swap,
                -            max_length=self.config.max_tokens,
                -            return_tensors="pt",
                -        )
                -        text_tokenized = tokenizer_output.input_ids.to(self.device)
                -        n_neighbors = kwargs.get("n_perturbations", 25)
                -        num_tokens = len(text_tokenized[0, :])
                -        n_swap = int(num_tokens * self.config.neighborhood_config.pct_swap_bert)
                -
                -        if in_place_swap:
                -            token_positions = tokenizer_output.offset_mapping[0]
                -
                -        replacements = dict()
                -
                -        target_token_indices = range(1, num_tokens)
                -        for target_token_index in target_token_indices:
                -            target_token = text_tokenized[0, target_token_index]
                -            if self.name == "bert":
                -                embeds = self.model.bert.embeddings(text_tokenized)
                -            elif self.name == "distilbert":
                -                embeds = self.model.distilbert.embeddings(text_tokenized)
                -            elif self.name == "roberta":
                -                embeds = self.model.roberta.embeddings(text_tokenized)
                -
                -            embeds = torch.cat(
                -                (
                -                    embeds[:, :target_token_index, :],
                -                    self.token_dropout(embeds[:, target_token_index, :]).unsqueeze(
                -                        dim=0
                -                    ),
                -                    embeds[:, target_token_index + 1 :, :],
                -                ),
                -                dim=1,
                -            )
                -
                -            token_probs = torch.softmax(self.model(inputs_embeds=embeds).logits, dim=2)
                -
                -            original_prob = token_probs[0, target_token_index, target_token]
                -
                -            top_probabilities, top_candidates = torch.topk(
                -                token_probs[:, target_token_index, :], 6, dim=1
                -            )
                -
                -            for cand, prob in zip(top_candidates[0], top_probabilities[0]):
                -                if not cand == target_token:
                -                    # alt = torch.cat((text_tokenized[:,:target_token_index], torch.LongTensor([cand]).unsqueeze(0).to(device), text_tokenized[:,target_token_index+1:]), dim=1)
                -                    # alt_text = search_tokenizer.batch_decode(alt)[0]
                -                    if original_prob.item() == 1:
                -                        replacements[(target_token_index, cand)] = prob.item() / (
                -                            1 - 0.9
                -                        )
                -                    else:
                -                        replacements[(target_token_index, cand)] = prob.item() / (
                -                            1 - original_prob.item()
                -                        )
                -
                -        if self.config.neighborhood_config.neighbor_strategy == "deterministic":
                -            replacement_keys = nlargest(n_neighbors, replacements, key=replacements.get)
                -            replacements_new = dict()
                -            for rk in replacement_keys:
                -                replacements_new[rk] = replacements[rk]
                -
                -            replacements = replacements_new
                -
                -            # TODO: Not sure if this is needed (perhaps making sure we never take >= 100)? Consider removing later
                -            highest_scored = nlargest(100, replacements, key=replacements.get)
                -
                -            neighbors = []
                -            for single in highest_scored:
                -                target_token_index, cand = single
                -
                -                if in_place_swap:
                -                    # Get indices of original text that we want to swap out
                -                    start, end = token_positions[target_token_index]
                -                    # Get text corresponding to cand token
                -                    fill_in_text = self.tokenizer.decode(cand)
                -                    # Remove any '##' from prefix (since we're doing a plug back into text)
                -                    fill_in_text = fill_in_text.replace("##", "")
                -                    alt_text = text[:start] + fill_in_text + text[end:]
                -                else:
                -                    alt = text_tokenized
                -                    alt = torch.cat(
                -                        (
                -                            alt[:, :target_token_index],
                -                            torch.LongTensor([cand]).unsqueeze(0).to(self.device),
                -                            alt[:, target_token_index + 1 :],
                -                        ),
                -                        dim=1,
                -                    )
                -                    alt_text = self.tokenizer.batch_decode(alt)[0]
                -                    # Remove [CLS] and [SEP] tokens
                -                    alt_text = alt_text.replace("[CLS]", "").replace("[SEP]", "")
                -                    # texts.append((alt_text, replacements[single]))
                -                neighbors.append(alt_text)
                -
                -        elif self.config.neighborhood_config.neighbor_strategy == "random":
                -            if not in_place_swap:
                -                raise ValueError(
                -                    "Random neighbor strategy only works with in_place_swap=True right now"
                -                )
                -
                -            # Make new dict replacements_new with structure [key[0]]: (key[1], value) for all keys in replacements
                -            replacements_new = dict()
                -            for k, v in replacements.items():
                -                if k[0] not in replacements_new:
                -                    replacements_new[k[0]] = []
                -                replacements_new[k[0]].append((k[1].item(), v))
                -            # Sort each entry by score
                -            for k, v in replacements_new.items():
                -                replacements_new[k] = sorted(v, key=lambda x: x[1], reverse=True)
                -
                -            num_trials = int(1e3)
                -            replacements, scores = [], []
                -            for _ in range(num_trials):
                -                # Pick n_swap random positions
                -                swap_positions = np.random.choice(
                -                    list(replacements_new.keys()), n_swap, replace=False
                -                )
                -                # Out of all replacements, pick keys where target_token_index is in swap_positions
                -                picked = [replacements_new[x][0] for x in swap_positions]
                -                # Compute score (sum)
                -                score = sum([x[1] for x in picked])
                -                scores.append(score)
                -                # Also keep track of replacements (position, candidate)
                -                replacements.append(
                -                    [(i, replacements_new[i][0][0]) for i in swap_positions]
                -                )
                -
                -            # Out of all trials, pick n_neighbors combinations (highest scores)
                -            highest_scored = nlargest(
                -                n_neighbors, zip(scores, replacements), key=lambda x: x[0]
                -            )
                -
                -            neighbors = []
                -            for _, single in highest_scored:
                -                # Sort according to target_token_index
                -                single = sorted(single, key=lambda x: x[0])
                -                # Get corresponding positions in text
                -                single = [
                -                    (token_positions[target_token_index], cand)
                -                    for target_token_index, cand in single
                -                ]
                -                # Add start of text (before first swap)
                -                end_prev = 0
                -                alt_text = ""
                -                for (start, end), cand in single:
                -                    # Get text corresponding to cand token
                -                    fill_in_text = self.tokenizer.decode(cand)
                -                    # Remove any '##' from prefix (since we're doing a plug back into text)
                -                    fill_in_text = fill_in_text.replace("##", "")
                -                    alt_text += text[end_prev:start] + fill_in_text
                -                    end_prev = end
                -                # Add remainder text (after last swap)
                -                start, end = single[-1][0]
                -                alt_text += text[end:]
                -                neighbors.append(alt_text)
                -
                -        else:
                -            raise NotImplementedError(
                -                f"Invalid neighbor strategy {self.config.neighborhood_config.neighbor_strategy}"
                -            )
                -
                -        # return texts
                -        return neighbors
                -
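A minimal sketch of the candidate-scoring heuristic used in the listing above; the function name and variables are illustrative, not from the source:

    def score_replacement(candidate_prob: float, original_prob: float) -> float:
        # Candidates are ranked by p(candidate) / (1 - p(original)); the 1 - 0.9
        # fallback mirrors the guard above against dividing by zero when the
        # original token has probability 1 under the masked LM.
        denom = (1.0 - original_prob) if original_prob < 1.0 else (1.0 - 0.9)
        return candidate_prob / denom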
                @@ -836,21 +259,6 @@

                Ancestors

              • Model
              • torch.nn.modules.module.Module
              • -

                Class variables

                -
                -
                var call_super_init : bool
                -
                -
                -
                -
                var dump_patches : bool
                -
                -
                -
                -
                var training : bool
                -
                -
                -
                -

                Methods

                @@ -858,205 +266,18 @@

                Methods

                -
                - -Expand source code - -
                def generate_neighbors(self, texts, **kwargs) -> List[str]:
                -    neighbors = []
                -    for text in tqdm(texts, desc="Generating neighbors"):
                -        neighbors.extend(self.generate_neighbors_(text, **kwargs))
                -    return neighbors
                -
                def generate_neighbors_(self, text: str, **kwargs)
                -
                - -Expand source code - -
                def generate_neighbors_(self, text: str, **kwargs):
                -    in_place_swap = self.config.neighborhood_config.original_tokenization_swap
                -
                -    tokenizer_output = self.tokenizer(
                -        text,
                -        padding=True,
                -        truncation=True,
                -        return_offsets_mapping=in_place_swap,
                -        max_length=self.config.max_tokens,
                -        return_tensors="pt",
                -    )
                -    text_tokenized = tokenizer_output.input_ids.to(self.device)
                -    n_neighbors = kwargs.get("n_perturbations", 25)
                -    num_tokens = len(text_tokenized[0, :])
                -    n_swap = int(num_tokens * self.config.neighborhood_config.pct_swap_bert)
                -
                -    if in_place_swap:
                -        token_positions = tokenizer_output.offset_mapping[0]
                -
                -    replacements = dict()
                -
                -    target_token_indices = range(1, num_tokens)
                -    for target_token_index in target_token_indices:
                -        target_token = text_tokenized[0, target_token_index]
                -        if self.name == "bert":
                -            embeds = self.model.bert.embeddings(text_tokenized)
                -        elif self.name == "distilbert":
                -            embeds = self.model.distilbert.embeddings(text_tokenized)
                -        elif self.name == "roberta":
                -            embeds = self.model.roberta.embeddings(text_tokenized)
                -
                -        embeds = torch.cat(
                -            (
                -                embeds[:, :target_token_index, :],
                -                self.token_dropout(embeds[:, target_token_index, :]).unsqueeze(
                -                    dim=0
                -                ),
                -                embeds[:, target_token_index + 1 :, :],
                -            ),
                -            dim=1,
                -        )
                -
                -        token_probs = torch.softmax(self.model(inputs_embeds=embeds).logits, dim=2)
                -
                -        original_prob = token_probs[0, target_token_index, target_token]
                -
                -        top_probabilities, top_candidates = torch.topk(
                -            token_probs[:, target_token_index, :], 6, dim=1
                -        )
                -
                -        for cand, prob in zip(top_candidates[0], top_probabilities[0]):
                -            if not cand == target_token:
                -                # alt = torch.cat((text_tokenized[:,:target_token_index], torch.LongTensor([cand]).unsqueeze(0).to(device), text_tokenized[:,target_token_index+1:]), dim=1)
                -                # alt_text = search_tokenizer.batch_decode(alt)[0]
                -                if original_prob.item() == 1:
                -                    replacements[(target_token_index, cand)] = prob.item() / (
                -                        1 - 0.9
                -                    )
                -                else:
                -                    replacements[(target_token_index, cand)] = prob.item() / (
                -                        1 - original_prob.item()
                -                    )
                -
                -    if self.config.neighborhood_config.neighbor_strategy == "deterministic":
                -        replacement_keys = nlargest(n_neighbors, replacements, key=replacements.get)
                -        replacements_new = dict()
                -        for rk in replacement_keys:
                -            replacements_new[rk] = replacements[rk]
                -
                -        replacements = replacements_new
                -
                -        # TODO: Not sure if this is needed (perhaps making sure we never take >= 100)? Consider removing later
                -        highest_scored = nlargest(100, replacements, key=replacements.get)
                -
                -        neighbors = []
                -        for single in highest_scored:
                -            target_token_index, cand = single
                -
                -            if in_place_swap:
                -                # Get indices of original text that we want to swap out
                -                start, end = token_positions[target_token_index]
                -                # Get text corresponding to cand token
                -                fill_in_text = self.tokenizer.decode(cand)
                -                # Remove any '##' from prefix (since we're doing a plug back into text)
                -                fill_in_text = fill_in_text.replace("##", "")
                -                alt_text = text[:start] + fill_in_text + text[end:]
                -            else:
                -                alt = text_tokenized
                -                alt = torch.cat(
                -                    (
                -                        alt[:, :target_token_index],
                -                        torch.LongTensor([cand]).unsqueeze(0).to(self.device),
                -                        alt[:, target_token_index + 1 :],
                -                    ),
                -                    dim=1,
                -                )
                -                alt_text = self.tokenizer.batch_decode(alt)[0]
                -                # Remove [CLS] and [SEP] tokens
                -                alt_text = alt_text.replace("[CLS]", "").replace("[SEP]", "")
                -                # texts.append((alt_text, replacements[single]))
                -            neighbors.append(alt_text)
                -
                -    elif self.config.neighborhood_config.neighbor_strategy == "random":
                -        if not in_place_swap:
                -            raise ValueError(
                -                "Random neighbor strategy only works with in_place_swap=True right now"
                -            )
                -
                -        # Make new dict replacements_new with structure [key[0]]: (key[1], value) for all keys in replacements
                -        replacements_new = dict()
                -        for k, v in replacements.items():
                -            if k[0] not in replacements_new:
                -                replacements_new[k[0]] = []
                -            replacements_new[k[0]].append((k[1].item(), v))
                -        # Sort each entry by score
                -        for k, v in replacements_new.items():
                -            replacements_new[k] = sorted(v, key=lambda x: x[1], reverse=True)
                -
                -        num_trials = int(1e3)
                -        replacements, scores = [], []
                -        for _ in range(num_trials):
                -            # Pick n_swap random positions
                -            swap_positions = np.random.choice(
                -                list(replacements_new.keys()), n_swap, replace=False
                -            )
                -            # Out of all replacements, pick keys where target_token_index is in swap_positions
                -            picked = [replacements_new[x][0] for x in swap_positions]
                -            # Compute score (sum)
                -            score = sum([x[1] for x in picked])
                -            scores.append(score)
                -            # Also keep track of replacements (position, candidate)
                -            replacements.append(
                -                [(i, replacements_new[i][0][0]) for i in swap_positions]
                -            )
                -
                -        # Out of all trials, pick n_neighbors combinations (highest scores)
                -        highest_scored = nlargest(
                -            n_neighbors, zip(scores, replacements), key=lambda x: x[0]
                -        )
                -
                -        neighbors = []
                -        for _, single in highest_scored:
                -            # Sort according to target_token_index
                -            single = sorted(single, key=lambda x: x[0])
                -            # Get corresponding positions in text
                -            single = [
                -                (token_positions[target_token_index], cand)
                -                for target_token_index, cand in single
                -            ]
                -            # Add start of text (before first swap)
                -            end_prev = 0
                -            alt_text = ""
                -            for (start, end), cand in single:
                -                # Get text corresponding to cand token
                -                fill_in_text = self.tokenizer.decode(cand)
                -                # Remove any '##' from prefix (since we're doing a plug back into text)
                -                fill_in_text = fill_in_text.replace("##", "")
                -                alt_text += text[end_prev:start] + fill_in_text
                -                end_prev = end
                -            # Add remainder text (after last swap)
                -            start, end = single[-1][0]
                -            alt_text += text[end:]
                -            neighbors.append(alt_text)
                -
                -    else:
                -        raise NotImplementedError(
                -            f"Invalid neighbor strategy {self.config.neighborhood_config.neighbor_strategy}"
                -        )
                -
                -    # return texts
                -    return neighbors
                -

                Inherited members

                • MaskFillingModel: -

                  Class variables

                  -
                  -
                  var call_super_init : bool
                  -
                  -
                  -
                  -
                  var dump_patches : bool
                  -
                  -
                  -
                  -
                  var training : bool
                  -
                  -
                  -
                  -

                  Methods

                  @@ -1120,20 +326,12 @@

                  Methods

                  -
                  - -Expand source code - -
                  def generate_neighbors(self, texts, **kwargs) -> List[str]:
                  -    raise NotImplementedError("generate_neighbors not implemented")
                  -

                  Inherited members

                  • Model:
                      -
                    • forward
                    • get_ll
                    • get_probabilities
                    • load
                    • @@ -1287,68 +485,18 @@

                      Methods

(Only valid for T5 model) Create fill-dictionary used for random_fills

                      -
                      - -Expand source code - -
                      def create_fill_dictionary(self, data):
                      -    """
-        (Only valid for T5 model) Create fill-dictionary used for random_fills
                      -    """
                      -    neigh_config = self.config.neighborhood_config
                      -    if "t5" in neigh_config.model and neigh_config.random_fills:
                      -        if not self.config.pretokenized:
                      -            # TODO: maybe can be done if detokenized, but currently not supported
                      -            self.ref_model.create_fill_dictionary(data)
                      -
                      def get_mask_model(self)

                      Return the mask filling model.

                      -
                      - -Expand source code - -
                      def get_mask_model(self):
                      -    """
                      -        Return the mask filling model.
                      -    """
                      -    return self.ref_model
                      -
                      def get_neighbors(self, documents, **kwargs)

                      Generate neighbors for given documents.

                      -
                      - -Expand source code - -
                      def get_neighbors(self, documents, **kwargs):
                      -    """
                      -        Generate neighbors for given documents.
                      -    """
                      -    n_perturbations = kwargs.get("n_perturbations", 1)
                      -    span_length = kwargs.get("span_length", 10)
                      -    neigh_config = self.config.neighborhood_config
                      -    ceil_pct = neigh_config.ceil_pct
                      -    kwargs = {}
                      -    if type(self.ref_model) == T5Model:
                      -        kwargs = {
                      -            "span_length": span_length,
                      -            "pct": neigh_config.pct_words_masked,
                      -            "chunk_size": self.config.chunk_size,
                      -            "ceil_pct": ceil_pct,
                      -        }
                      -    kwargs["n_perturbations"] = n_perturbations
                      -
                      -    # Generate neighbors
                      -    neighbors = self.ref_model.generate_neighbors(documents, **kwargs)
                      -    return neighbors
                      -
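For orientation, a minimal usage sketch of the method above, assuming an already-constructed NeighborhoodAttack instance named attack and a list of strings named documents (both names are illustrative):

    # Each document gets n_perturbations neighbors from the loaded
    # mask-filling reference model (BERT-style or T5, per the config).
    neighbors = attack.get_neighbors(documents, n_perturbations=25, span_length=10)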

                      Inherited members

                      @@ -1596,21 +744,6 @@

                      Ancestors

                    • Model
                    • torch.nn.modules.module.Module
                    -

                    Class variables

                    -
                    -
                    var call_super_init : bool
                    -
                    -
                    -
                    -
                    var dump_patches : bool
                    -
                    -
                    -
                    -
                    var training : bool
                    -
                    -
                    -
                    -

                    Methods

                    @@ -1618,269 +751,42 @@

                    Methods

                    -
                    - -Expand source code - -
                    def create_fill_dictionary(self, data):
                    -    self.FILL_DICTIONARY = set()
                    -    for texts in data.values():
                    -        for text in texts:
                    -            self.FILL_DICTIONARY.update(text.split())
                    -    self.FILL_DICTIONARY = sorted(list(self.FILL_DICTIONARY))
                    -
                    def extract_fills(self, texts)
                    -
                    - -Expand source code - -
                    def extract_fills(self, texts):
                    -    # remove <pad> from beginning of each text
                    -    texts = [x.replace("<pad>", "").replace("</s>", "").strip() for x in texts]
                    -
                    -    # return the text in between each matched mask token
                    -    extracted_fills = [self.pattern.split(x)[1:-1] for x in texts]
                    -
                    -    # remove whitespace around each fill
                    -    extracted_fills = [[y.strip() for y in x] for x in extracted_fills]
                    -
                    -    return extracted_fills
                    -
                    def generate_neighbors(self, texts, **kwargs) ‑> List[str]
                    -
                    - -Expand source code - -
                    def generate_neighbors(self, texts, **kwargs) -> List[str]:
                    -    n_neighbors = kwargs.get("n_perturbations", 25)
-    # Repeat each text n_neighbors times (one T5 perturbation is produced per copy)
                    -    texts_use = [x for x in texts for _ in range(n_neighbors)]
                    -
                    -    chunk_size = self.config.chunk_size
                    -    if "11b" in self.config.neighborhood_config.model:
                    -        chunk_size //= 2
                    -
                    -    outputs = []
                    -    for i in tqdm(
                    -        range(0, len(texts_use), chunk_size), desc="Applying perturbations"
                    -    ):
                    -        outputs.extend(
                    -            self.generate_neighbors_(texts_use[i : i + chunk_size], **kwargs)
                    -        )
                    -    return outputs
                    -
                    def generate_neighbors_(self, texts: List[str], **kwargs)
                    -
                    - -Expand source code - -
                    def generate_neighbors_(self, texts: List[str], **kwargs):
                    -    span_length: int = kwargs.get("span_length")
                    -    pct: float = kwargs.get("pct")
                    -    ceil_pct: bool = kwargs.get("ceil_pct", False)
                    -    base_tokenizer = kwargs.get("base_tokenizer", None)
                    -    neigh_config = self.config.neighborhood_config
                    -
                    -    if not neigh_config.random_fills:
                    -        masked_texts = [
                    -            self.tokenize_and_mask(x, span_length, pct, ceil_pct) for x in texts
                    -        ]
                    -        raw_fills = self.replace_masks(masked_texts)
                    -        extracted_fills = self.extract_fills(raw_fills)
                    -        perturbed_texts = apply_extracted_fills(masked_texts, extracted_fills)
                    -        idxs = [idx for idx, x in enumerate(perturbed_texts) if x == ""]
                    -
                    -        # Handle the fact that sometimes the model doesn't generate the right number of fills and we have to try again
                    -        attempts = 1
                    -        break_out_of_loop: bool = False
                    -        while "" in perturbed_texts:
                    -            if attempts > neigh_config.max_tries:
                    -                for idx in idxs:
                    -                    perturbed_texts[idx] = texts[idx]
                    -                break_out_of_loop = True
                    -                break
                    -            if break_out_of_loop:
                    -                break
                    -            idxs = [idx for idx, x in enumerate(perturbed_texts) if x == ""]
                    -            print(
                    -                f"WARNING: {len(idxs)} texts have no fills. Trying again [attempt {attempts}]."
                    -            )
                    -            masked_texts = [
                    -                self.tokenize_and_mask(x, span_length, pct, ceil_pct)
                    -                for idx, x in enumerate(texts)
                    -                if idx in idxs
                    -            ]
                    -            raw_fills = self.replace_masks(masked_texts)
                    -            extracted_fills = self.extract_fills(raw_fills)
                    -            new_perturbed_texts = apply_extracted_fills(
                    -                masked_texts, extracted_fills
                    -            )
                    -            for idx, x in zip(idxs, new_perturbed_texts):
                    -                perturbed_texts[idx] = x
                    -            attempts += 1
                    -    else:
                    -        if neigh_config.random_fills_tokens:
                    -            if base_tokenizer is None:
                    -                raise ValueError(
                    -                    "base_tokenizer must be provided if random_fills and random_fills_tokens are True"
                    -                )
                    -
                    -            # tokenize base_tokenizer
                    -            tokens = base_tokenizer(texts, return_tensors="pt", padding=True).to(
                    -                self.device
                    -            )
                    -            valid_tokens = tokens.input_ids != base_tokenizer.pad_token_id
                    -            replace_pct = neigh_config.pct_words_masked * (
                    -                neigh_config.span_length
                    -                / (neigh_config.span_length + 2 * neigh_config.buffer_size)
                    -            )
                    -
                    -            # replace replace_pct of input_ids with random tokens
                    -            random_mask = (
                    -                torch.rand(tokens.input_ids.shape, device=self.device) < replace_pct
                    -            )
                    -            random_mask &= valid_tokens
                    -            random_tokens = torch.randint(
                    -                0,
                    -                base_tokenizer.vocab_size,
                    -                (random_mask.sum(),),
                    -                device=self.device,
                    -            )
                    -            # while any of the random tokens are special tokens, replace them with random non-special tokens
                    -            while any(
                    -                base_tokenizer.decode(x) in base_tokenizer.all_special_tokens
                    -                for x in random_tokens
                    -            ):
                    -                random_tokens = torch.randint(
                    -                    0,
                    -                    base_tokenizer.vocab_size,
                    -                    (random_mask.sum(),),
                    -                    device=self.device,
                    -                )
                    -            tokens.input_ids[random_mask] = random_tokens
                    -            perturbed_texts = base_tokenizer.batch_decode(
                    -                tokens.input_ids, skip_special_tokens=True
                    -            )
                    -        else:
                    -            masked_texts = [
                    -                self.tokenize_and_mask(x, span_length, pct, ceil_pct) for x in texts
                    -            ]
                    -            perturbed_texts = masked_texts
                    -            # replace each <extra_id_*> with neigh_config.span_length random words from FILL_DICTIONARY
                    -            for idx, text in enumerate(perturbed_texts):
                    -                filled_text = text
                    -                for fill_idx in range(count_masks([text])[0]):
                    -                    fill = random.sample(self.FILL_DICTIONARY, span_length)
                    -                    filled_text = filled_text.replace(
                    -                        f"<extra_id_{fill_idx}>", " ".join(fill)
                    -                    )
                    -                assert (
                    -                    count_masks([filled_text])[0] == 0
                    -                ), "Failed to replace all masks"
                    -                perturbed_texts[idx] = filled_text
                    -
                    -    return perturbed_texts
                    -
                    def replace_masks(self, texts: List[str])

                    Replace each masked span with a sample from T5 mask_model

                    -
                    - -Expand source code - -
                    def replace_masks(self, texts: List[str]):
                    -    """
                    -    Replace each masked span with a sample from T5 mask_model
                    -    """
                    -    mask_top_p = self.config.neighborhood_config.top_p
                    -    n_expected = count_masks(texts)
                    -    stop_id = self.tokenizer.encode(f"<extra_id_{max(n_expected)}>")[0]
                    -    tokens = self.tokenizer(texts, return_tensors="pt", padding=True).to(
                    -        self.device
                    -    )
                    -    outputs = self.model.generate(
                    -        **tokens,
                    -        max_length=150,
                    -        do_sample=True,
                    -        top_p=mask_top_p,
                    -        num_return_sequences=1,
                    -        eos_token_id=stop_id,
                    -    )
                    -    return self.tokenizer.batch_decode(outputs, skip_special_tokens=False)
                    -
                    def tokenize_and_mask(self, text: str, span_length: int, pct: float, ceil_pct: bool = False)
                    -
                    - -Expand source code - -
                    def tokenize_and_mask(
                    -    self, text: str, span_length: int, pct: float, ceil_pct: bool = False
                    -):
                    -    buffer_size = self.config.neighborhood_config.buffer_size
                    -
                    -    tokens = text.split(" ")
                    -    mask_string = "<<<mask>>>"
                    -
                    -    span_length = min(int(pct * len(tokens)), span_length)
                    -    # avoid div zero:
                    -
                    -    span_length = max(1, span_length)
                    -
                    -    n_spans = pct * len(tokens) / (span_length + buffer_size * 2)
                    -    if ceil_pct:
                    -        n_spans = np.ceil(n_spans)
                    -    n_spans = int(n_spans)
                    -
                    -    n_masks = 0
                    -    while n_masks < n_spans:
                    -        start = np.random.randint(0, max(1, len(tokens) - span_length))
                    -        end = start + span_length
                    -        search_start = max(0, start - buffer_size)
                    -        search_end = min(len(tokens), end + buffer_size)
                    -        if mask_string not in tokens[search_start:search_end]:
                    -            tokens[start:end] = [mask_string]
                    -            n_masks += 1
                    -
                    -    # replace each occurrence of mask_string with <extra_id_NUM>, where NUM increments
                    -    num_filled = 0
                    -    for idx, token in enumerate(tokens):
                    -        if token == mask_string:
                    -            tokens[idx] = f"<extra_id_{num_filled}>"
                    -            num_filled += 1
                    -    assert num_filled == n_masks, f"num_filled {num_filled} != n_masks {n_masks}"
                    -    text = " ".join(tokens)
                    -    return text
                    -
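Taken together, tokenize_and_mask, replace_masks, and extract_fills implement T5-style span corruption and refilling. A rough sketch of the flow, assuming a loaded T5Model instance named mask_model; the example sentence and the sampled fills are purely illustrative:

    masked = mask_model.tokenize_and_mask(
        "the quick brown fox jumps over the lazy dog", span_length=2, pct=0.3
    )
    # e.g. "the quick <extra_id_0> jumps over the <extra_id_1> dog"
    raw_fills = mask_model.replace_masks([masked])  # T5 samples text for each <extra_id_*> sentinel
    fills = mask_model.extract_fills(raw_fills)     # e.g. [["brown fox", "lazy"]]
    # The module-level helper apply_extracted_fills then splices the fills back into the masked texts.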

                    Inherited members

                    • MaskFillingModel: @@ -1960,7 +856,7 @@

                      -

                      Generated by pdoc 0.10.0.

                      +

                      Generated by pdoc 0.11.1.

-
\ No newline at end of file
+
diff --git a/docs/attacks/quantile.html b/docs/attacks/quantile.html
index c03cb29..1a9e564 100644
--- a/docs/attacks/quantile.html
+++ b/docs/attacks/quantile.html
@@ -2,19 +2,22 @@
mimir.attacks.quantile API documentation
                      @@ -25,127 +28,6 @@

                      Module mimir.attacks.quantile

                      Implementation of the attack proposed in 'Scalable Membership Inference Attacks via Quantile Regression' https://arxiv.org/pdf/2307.03694.pdf

                      -
                      - -Expand source code - -
                      """
                      -    Implementation of the attack proposed in 'Scalable Membership Inference Attacks via Quantile Regression'
                      -    https://arxiv.org/pdf/2307.03694.pdf
                      -"""
                      -import torch as ch
                      -from mimir.models import QuantileReferenceModel, Model
                      -from transformers import TrainingArguments
                      -from sklearn.metrics import mean_squared_error
                      -from transformers import TrainingArguments, Trainer
                      -from datasets import Dataset
                      -
                      -from mimir.attacks.all_attacks import Attack
                      -
                      -
                      -class CustomTrainer(Trainer):
                      -    def __init__(
                      -        self,
                      -        alpha_fpr,
                      -        **kwargs,
                      -    ):
                      -        super().__init__(**kwargs)
                      -        self.alpha_fpr = alpha_fpr
                      -
                      -    def compute_loss(self, model, inputs, return_outputs=False):
                      -        labels = inputs.pop("labels")
                      -        # forward pass
                      -        outputs = model(**inputs)
                      -        logits = outputs.get("logits")
                      -        loss = ch.mean(
                      -            ch.max(
                      -                self.alpha_fpr * (logits - labels),
                      -                (1 - self.alpha_fpr) * (labels - logits),
                      -            )
                      -        )
                      -        return (loss, outputs) if return_outputs else loss
                      -
                      -
                      -class QuantileAttack(Attack):
                      -    """
                      -    Implementation of the attack proposed in 'Scalable Membership Inference Attacks via Quantile Regression'
                      -    https://arxiv.org/pdf/2307.03694.pdf
                      -    """
                      -
                      -    def __init__(self, config, model: Model, alpha: float):
                      -        """
                      -        alpha (float): Desired FPR
                      -        """
                      -        ref_model = QuantileReferenceModel(
                      -            config, name="Sreevishnu/funnel-transformer-small-imdb"
                      -        )
-        super().__init__(config, model, ref_model)
                      -        self.alpha = alpha
                      -
                      -    def _train_quantile_model(self, dataset):
                      -        def tokenize_function(examples):
                      -            return self.ref_model.tokenizer(
                      -                examples["text"], padding="max_length", truncation=True
                      -            )
                      -
                      -        tokenized_dataset = dataset.map(tokenize_function, batched=True)
                      -        training_args = TrainingArguments(
                      -            output_dir="quantile_ref_model",
                      -            evaluation_strategy="epoch",
                      -            num_train_epochs=1,
                      -        )
                      -
                      -        def compute_metrics(eval_pred):
                      -            predictions, labels = eval_pred
                      -            rmse = mean_squared_error(labels, predictions, squared=False)
                      -            return {"rmse": rmse}
                      -
                      -        trainer = CustomTrainer(
                      -            alpha_fpr=self.alpha,
                      -            model=self.ref_model.model,
                      -            args=training_args,
                      -            train_dataset=tokenized_dataset,
                      -            eval_dataset=tokenized_dataset,
                      -            compute_metrics=compute_metrics,
                      -        )
                      -        # Train quantile model
                      -        trainer.train()
                      -
                      -    def prepare(self, known_non_members):
                      -        """
                      -        Step 1: Use non-member dataset, collect confidence scores for correct label.
                      -        Step 2: Train a quantile regression model that takes X as input and predicts quantile. Use pinball loss
                      -        Step 3: Test by checking if member: score is higher than output of quantile regression model.
                      -        """
                      -
                      -        # Step 1: Use non-member dataset, collect confidence scores for correct label.
                      -        # Get likelihood scores from target model for known_non_members
                      -        # Note that these non-members should be different from the ones in testing
                      -        scores = [self.target_model.get_ll(x) for x in known_non_members]
                      -        # Construct a dataset out of this to be used in Huggingface, with
                      -        # "text" containing the actual data, and "labels" containing the scores
                      -        dataset = Dataset.from_dict({"text": known_non_members, "labels": scores})
                      -
                      -        # Step 2: Train a quantile regression model that takes X as input and predicts quantile. Use pinball loss
                      -        self._train_quantile_model(dataset)
                      -
                      -    def attack(self, document, **kwargs):
                      -        # Step 3: Test by checking if member: score is higher than output of quantile regression model.
                      -
                      -        # Get likelihood score from target model for doc
                      -        ll = self.target_model.get_ll(document)
                      -
                      -        # Return ll - quantile_model(doc)
                      -        tokenized = self.ref_model.tokenizer(document, return_tensors="pt")
                      -        # Shift items in the dictionary to the correct device
                      -        tokenized = {k: v.to(self.ref_model.model.device, non_blocking=True) for k, v in tokenized.items()}
                      -        quantile_score = self.ref_model.model(**tokenized)
                      -        print(quantile_score)
                      -        quantile_score = quantile_score.logits.item()
                      -
                      -        # We want higher score to be non-member
                      -        return quantile_score - ll
                      -
                      @@ -206,7 +88,10 @@

                      Args

                      compute_metrics (Callable[[EvalPrediction], Dict], optional): The function that will be used to compute metrics at evaluation. Must take a [EvalPrediction] and return -a dictionary string to metric values. +a dictionary string to metric values. Note When passing TrainingArgs with batch_eval_metrics set to +True, your compute_metrics function must take a boolean compute_result argument. This will be triggered +after the last eval batch to signal that the function needs to calculate and return the global summary +statistics rather than accumulating the batch-level statistics. callbacks (List of [TrainerCallback], optional): A list of callbacks to customize the training loop. Will add those to the list of default callbacks detailed in here.

                      @@ -274,23 +159,6 @@

                      Methods

                      How the loss is computed by Trainer. By default, all models return the loss in the first element.

                      Subclass and override for custom behavior.

                      -
                      - -Expand source code - -
                      def compute_loss(self, model, inputs, return_outputs=False):
                      -    labels = inputs.pop("labels")
                      -    # forward pass
                      -    outputs = model(**inputs)
                      -    logits = outputs.get("logits")
                      -    loss = ch.mean(
                      -        ch.max(
                      -            self.alpha_fpr * (logits - labels),
                      -            (1 - self.alpha_fpr) * (labels - logits),
                      -        )
                      -    )
                      -    return (loss, outputs) if return_outputs else loss
                      -
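The expression above is the pinball (quantile) loss with prediction y_hat = logits and label y = labels:

    loss = mean( max( alpha * (y_hat - y), (1 - alpha) * (y - y_hat) ) )

Under-prediction is weighted by (1 - alpha) and over-prediction by alpha, so with alpha set to the desired false-positive rate the minimizer sits near the (1 - alpha) quantile of the non-member score distribution, which, on this reading, gives a per-example threshold calibrated to FPR alpha.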
                      @@ -399,28 +267,6 @@

                      Methods

Step 1: Use non-member dataset, collect confidence scores for correct label. Step 2: Train a quantile regression model that takes X as input and predicts quantile, using the pinball loss. Step 3: Test by checking if member: score is higher than output of quantile regression model.

                      -
                      - -Expand source code - -
                      def prepare(self, known_non_members):
                      -    """
                      -    Step 1: Use non-member dataset, collect confidence scores for correct label.
                      -    Step 2: Train a quantile regression model that takes X as input and predicts quantile. Use pinball loss
                      -    Step 3: Test by checking if member: score is higher than output of quantile regression model.
                      -    """
                      -
                      -    # Step 1: Use non-member dataset, collect confidence scores for correct label.
                      -    # Get likelihood scores from target model for known_non_members
                      -    # Note that these non-members should be different from the ones in testing
                      -    scores = [self.target_model.get_ll(x) for x in known_non_members]
                      -    # Construct a dataset out of this to be used in Huggingface, with
                      -    # "text" containing the actual data, and "labels" containing the scores
                      -    dataset = Dataset.from_dict({"text": known_non_members, "labels": scores})
                      -
                      -    # Step 2: Train a quantile regression model that takes X as input and predicts quantile. Use pinball loss
                      -    self._train_quantile_model(dataset)
                      -
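A rough end-to-end sketch of the calibrate-then-score flow described above; config, target_model, known_non_members, and candidate_text are assumed to exist and are not defined in these docs:

    # alpha is the desired false-positive rate for the quantile regressor.
    quantile_attack = QuantileAttack(config, target_model, alpha=0.05)
    quantile_attack.prepare(known_non_members)      # Steps 1-2: collect scores, train regressor
    score = quantile_attack.attack(candidate_text)  # Step 3: quantile prediction minus target loss
    # Higher scores suggest non-members; lower scores suggest members.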

                      Inherited members

                      @@ -442,7 +288,6 @@

                      Inherited members

                      MIMIR -

                      Index

                        @@ -472,7 +317,7 @@

                        -

                        Generated by pdoc 0.10.0.

                        +

                        Generated by pdoc 0.11.1.

-
\ No newline at end of file
+
diff --git a/docs/attacks/reference.html b/docs/attacks/reference.html
index 7d1dd6d..f8e4029 100644
--- a/docs/attacks/reference.html
+++ b/docs/attacks/reference.html
@@ -2,18 +2,21 @@
mimir.attacks.reference API documentation
                        @@ -23,37 +26,6 @@

                        Module mimir.attacks.reference

                        Reference-based attacks.

                        -
                        - -Expand source code - -
                        """
                        -    Reference-based attacks.
                        -"""
                        -from mimir.attacks.all_attacks import Attack
                        -from mimir.models import Model, ReferenceModel
                        -from mimir.config import ExperimentConfig
                        -
                        -
                        -class ReferenceAttack(Attack):
                        -
                        -    def __init__(
                        -        self, config: ExperimentConfig,
                        -        model: Model,
                        -        reference_model: ReferenceModel
                        -    ):
                        -        super().__init__(config, model, reference_model)
                        -
                        -    def _attack(self, document, probs, tokens=None, **kwargs):
                        -        """
                        -        Reference-based attack score. Performs difficulty calibration in model likelihood using a reference model.
                        -        """
                        -        loss = kwargs.get('loss', None)
                        -        if loss is None:
                        -            loss = self.target_model.get_ll(document, probs=probs, tokens=tokens)
                        -        ref_loss = self.ref_model.get_ll(document, probs=probs, tokens=tokens)
                        -        return loss - ref_loss
                        -
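The score returned above is a simple difficulty calibration: the target model's get_ll value (treated as a loss in the code) minus the same quantity from a reference model, so text that every model finds easy or hard is discounted. A minimal illustration with assumed, already-loaded models and an illustrative document:

    doc = "some candidate passage"
    score = target_model.get_ll(doc) - reference_model.get_ll(doc)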
                        @@ -116,7 +88,6 @@

                        Inherited members

                        MIMIR -

                        Index

                          @@ -137,7 +108,7 @@

                          -

                          Generated by pdoc 0.10.0.

                          +

                          Generated by pdoc 0.11.1.

-
\ No newline at end of file
+
diff --git a/docs/attacks/utils.html b/docs/attacks/utils.html
index 264ee55..3366e73 100644
--- a/docs/attacks/utils.html
+++ b/docs/attacks/utils.html
@@ -2,18 +2,21 @@
mimir.attacks.utils API documentation
                          @@ -22,37 +25,6 @@

                          Module mimir.attacks.utils

                          -
                          - -Expand source code - -
                          from mimir.attacks.all_attacks import AllAttacks
                          -
                          -from mimir.attacks.loss import LOSSAttack
                          -from mimir.attacks.reference import ReferenceAttack
                          -from mimir.attacks.zlib import ZLIBAttack
                          -from mimir.attacks.min_k import MinKProbAttack
                          -from mimir.attacks.min_k_plus_plus import MinKPlusPlusAttack
                          -from mimir.attacks.neighborhood import NeighborhoodAttack
                          -from mimir.attacks.gradnorm import GradNormAttack
                          -
                          -
                          -# TODO Use decorators to link attack implementations with enum above
                          -def get_attacker(attack: str):
                          -    mapping = {
                          -        AllAttacks.LOSS: LOSSAttack,
                          -        AllAttacks.REFERENCE_BASED: ReferenceAttack,
                          -        AllAttacks.ZLIB: ZLIBAttack,
                          -        AllAttacks.MIN_K: MinKProbAttack,
                          -        AllAttacks.MIN_K_PLUS_PLUS: MinKPlusPlusAttack,
                          -        AllAttacks.NEIGHBOR: NeighborhoodAttack,
                          -        AllAttacks.GRADNORM: GradNormAttack,
                          -    }
                          -    attack_cls = mapping.get(attack, None)
                          -    if attack_cls is None:
                          -        raise ValueError(f"Attack {attack} not found")
                          -    return attack_cls
                          -
                          @@ -66,25 +38,6 @@

                          Functions

                          -
                          - -Expand source code - -
                          def get_attacker(attack: str):
                          -    mapping = {
                          -        AllAttacks.LOSS: LOSSAttack,
                          -        AllAttacks.REFERENCE_BASED: ReferenceAttack,
                          -        AllAttacks.ZLIB: ZLIBAttack,
                          -        AllAttacks.MIN_K: MinKProbAttack,
                          -        AllAttacks.MIN_K_PLUS_PLUS: MinKPlusPlusAttack,
                          -        AllAttacks.NEIGHBOR: NeighborhoodAttack,
                          -        AllAttacks.GRADNORM: GradNormAttack,
                          -    }
                          -    attack_cls = mapping.get(attack, None)
                          -    if attack_cls is None:
                          -        raise ValueError(f"Attack {attack} not found")
                          -    return attack_cls
                          -
                          @@ -97,7 +50,6 @@

                          Functions

                          MIMIR -

                          Index

                            @@ -116,7 +68,7 @@

                            Index

-
\ No newline at end of file
+
diff --git a/docs/attacks/zlib.html b/docs/attacks/zlib.html
index fda63ec..50b24da 100644
--- a/docs/attacks/zlib.html
+++ b/docs/attacks/zlib.html
@@ -2,18 +2,21 @@
mimir.attacks.zlib API documentation
                            @@ -23,46 +26,6 @@

                            Module mimir.attacks.zlib

                            zlib-normalization Attack: https://www.usenix.org/system/files/sec21-carlini-extracting.pdf

                            -
                            - -Expand source code - -
                            """
                            -    zlib-normalization Attack: https://www.usenix.org/system/files/sec21-carlini-extracting.pdf
                            -"""
                            -
                            -import torch as ch
                            -import zlib
                            -
                            -from mimir.attacks.all_attacks import Attack
                            -from mimir.models import Model
                            -from mimir.config import ExperimentConfig
                            -
                            -
                            -class ZLIBAttack(Attack):
                            -
                            -    def __init__(self,
                            -                 config: ExperimentConfig,
                            -                 model: Model):
                            -        super().__init__(config, model, ref_model=None)
                            -
                            -    @ch.no_grad()
                            -    def _attack(
                            -        self,
                            -        document,
                            -        probs,
                            -        tokens=None,
                            -        **kwargs
                            -    ):
                            -        """
                            -        zlib-based attack score. Performs difficulty calibration in model likelihood by normalizing with zlib entropy.
                            -        """
                            -        loss = kwargs.get("loss", None)
                            -        if loss is None:
                            -            loss = self.target_model.get_ll(document, probs=probs, tokens=tokens)
                            -        zlib_entropy = len(zlib.compress(bytes(document, "utf-8")))
                            -        return loss / zlib_entropy
                            -
                            @@ -130,7 +93,6 @@

                            Inherited members

                            MIMIR -

                            Index

                              @@ -151,7 +113,7 @@

                              -

                              Generated by pdoc 0.10.0.

                              +

                              Generated by pdoc 0.11.1.

-
\ No newline at end of file
+
diff --git a/docs/config.html b/docs/config.html
index 9c1fb4f..e2cb034 100644
--- a/docs/config.html
+++ b/docs/config.html
@@ -2,18 +2,21 @@
mimir.config API documentation
                              @@ -23,229 +26,6 @@

                              Module mimir.config

                              Definitions for configurations.

                              -
                              - -Expand source code - -
                              """
                              -    Definitions for configurations.
                              -"""
                              -
                              -from dataclasses import dataclass
                              -from typing import Optional, List
                              -from simple_parsing.helpers import Serializable, field
                              -from mimir.utils import get_cache_path, get_data_source
                              -
                              -
                              -@dataclass
                              -class ReferenceConfig(Serializable):
                              -    """
                              -    Config for attacks that use reference models.
                              -    """
                              -    models: List[str]
                              -    """Reference model names"""
                              -
                              -
                              -@dataclass
                              -class NeighborhoodConfig(Serializable):
                              -    """
                              -    Config for neighborhood attack
                              -    """
                              -    model: str
                              -    """Mask-filling model"""
                              -    n_perturbation_list: List[int] = field(default_factory=lambda: [1, 10])
                              -    """List of n_neighbors to try."""
                              -    dump_cache: Optional[bool] = False
                              -    "Dump neighbors data to cache? Exits program after dumping"
                              -    load_from_cache: Optional[bool] = False
                              -    """Load neighbors data from cache?"""
                              -    # BERT-specific param
                              -    original_tokenization_swap: Optional[bool] = True
                              -    """Swap out token in original text with neighbor token, instead of re-generating text"""
                              -    pct_swap_bert: Optional[float] = 0.05
                              -    """Percentage of tokens per neighbor that are different from the original text"""
                              -    neighbor_strategy: Optional[str] = "deterministic"
                              -    """Strategy for generating neighbors. One of ['deterministic', 'random']. Deterministic uses only one-word neighbors"""
                              -    # T-5 specific hyper-parameters
                              -    span_length: Optional[int] = 2
                              -    """Span length for neighborhood attack"""
                              -    random_fills_tokens: Optional[bool] = False
                              -    """Randomly fill tokens?"""
                              -    random_fills: Optional[bool] = False
                              -    """Randomly fill?"""
                              -    pct_words_masked: Optional[float] = 0.3
                              -    """Percentage masked is actually pct_words_masked * (span_length / (span_length + 2 * buffer_size))"""
                              -    buffer_size: Optional[int] = 1
                              -    """Buffer size"""
                              -    top_p: Optional[float] = 1.0
                              -    """Use tokens (minimal set) with cumulative probability of <=top_p"""
                              -    max_tries: Optional[int] = 100
                              -    """Maximum number of trials in finding replacements for masked tokens"""
                              -    ceil_pct: Optional[bool] = False
                              -    """Apply ceil operation on span length calculation?"""
                              -
                              -    def __post_init__(self):
                              -        if self.dump_cache and self.load_from_cache:
                              -            raise ValueError("Cannot dump and load cache at the same time")
                              -
                              -
                              -@dataclass
                              -class EnvironmentConfig(Serializable):
                              -    """
                              -    Config for environment-specific parameters
                              -    """
                              -    cache_dir: Optional[str] = None
                              -    """Path to cache directory"""
                              -    data_source: Optional[str] = None
                              -    """Path where data is stored"""
                              -    device: Optional[str] = 'cuda:0'
                              -    """Device (GPU) to load main model on"""
                              -    device_map: Optional[str] = None
                              -    """Configuration for device map if needing to split model across gpus"""
                              -    device_aux: Optional[str] = "cuda:1"
                              -    """Device (GPU) to load any auxiliary model(s) on"""
                              -    compile: Optional[bool] = True
                              -    """Compile models?"""
                              -    int8: Optional[bool] = False
                              -    """Use int8 quantization?"""
                              -    half: Optional[bool] = False
                              -    """Use half precision?"""
                              -    results: Optional[str] = "results"
                              -    """Path for saving final results"""
                              -    tmp_results: Optional[str] = "tmp_results"
                              -
                              -    def __post_init__(self):
                              -        if self.cache_dir is None:
                              -            self.cache_dir = get_cache_path()
                              -        if self.data_source is None:
                              -            self.data_source = get_data_source()
                              -
                              -
                              -@dataclass
                              -class OpenAIConfig(Serializable):
                              -    """
                              -    Config for OpenAI calls
                              -    """
                              -    key: str
                              -    """OpenAI API key"""
                              -    model: str
                              -    """Model name"""
                              -
                              -
                              -@dataclass
                              -class ExperimentConfig(Serializable):
                              -    """
                              -    Config for attacks
                              -    """
                              -    experiment_name: str
                              -    """Name for the experiment"""
                              -    base_model: str
                              -    """Base model name"""
                              -    dataset_member: str
                              -    """Dataset source for members"""
                              -    dataset_nonmember: str
                              -    """Dataset source for nonmembers"""
                              -    output_name: str = None
                              -    """Output name for sub-directory."""
                              -    dataset_nonmember_other_sources: Optional[List[str]] = field(
                              -        default_factory=lambda: None
                              -    )
                              -    """Dataset sources for nonmembers for which metrics will be computed, using the thresholds derived from the main member/nonmember datasets"""
                              -    pretokenized: Optional[bool] = False
                              -    """Is the data already pretokenized"""
                              -    revision: Optional[str] = None
                              -    """Model revision to use"""
                              -    presampled_dataset_member: Optional[str] = None
                              -    """Path to presampled dataset source for members"""
                              -    presampled_dataset_nonmember: Optional[str] = None
                              -    """Path to presampled dataset source for non-members"""
                              -    token_frequency_map: Optional[
                              -        str
                              -    ] = None  # TODO: Handling auxiliary data structures
                              -    """Path to a pre-computed token frequency map"""
                              -    dataset_key: Optional[str] = None
                              -    """Dataset key"""
                              -    specific_source: Optional[str] = None
                              -    """Specific sub-source to focus on. Only valid for the_pile"""
                              -    full_doc: Optional[bool] = False  # TODO: refactor full_doc design?
                              -    """Determines whether MIA will be performed over entire doc or not"""
                              -    max_substrs: Optional[int] = 20
                              -    """If full_doc, determines the maximum number of sample substrs to evaluate on"""
                              -    dump_cache: Optional[bool] = False
                              -    """Dump data to cache? Exits program after dumping"""
                              -    load_from_cache: Optional[bool] = False
                              -    """Load data from cache?"""
                              -    load_from_hf: Optional[bool] = True
                              -    """Load data from HuggingFace?"""
                              -    blackbox_attacks: Optional[List[str]] = field(
                              -        default_factory=lambda: None
                              -    )  # Can replace with "default" attacks if we want
                              -    """List of attacks to evaluate"""
                              -    tokenization_attack: Optional[bool] = False
                              -    """Run tokenization attack?"""
                              -    quantile_attack: Optional[bool] = False
                              -    """Run quantile attack?"""
                              -    n_samples: Optional[int] = 200
                              -    """Number of records (member and non-member each) to run the attack(s) for"""
                              -    max_tokens: Optional[int] = 512
                              -    """Consider samples with at most these many tokens"""
                              -    max_data: Optional[int] = 5_000
                              -    """Maximum samples to load from data before processing. Helps with efficiency"""
                              -    min_words: Optional[int] = 100
                              -    """Consider documents with at least these many words"""
                              -    max_words: Optional[int] = 200
                              -    """Consider documents with at most these many words"""
                              -    max_words_cutoff: Optional[bool] = True
                              -    """Is max_words a selection criteria (False), or a cutoff added on text (True)?"""
                              -    batch_size: Optional[int] = 50
                              -    """Batch size"""
                              -    chunk_size: Optional[int] = 20
                              -    """Chunk size"""
                              -    scoring_model_name: Optional[str] = None
                              -    """Scoring model (if different from base model)"""
                              -    top_k: Optional[int] = 40
                              -    """Consider only top-k tokens"""
                              -    do_top_k: Optional[bool] = False
                              -    """Use top-k sampling?"""
                              -    top_p: Optional[float] = 0.96
                              -    """Use tokens (minimal set) with cumulative probability of <=top_p"""
                              -    do_top_p: Optional[bool] = False
                              -    """Use top-p sampling?"""
                              -    pre_perturb_pct: Optional[float] = 0.0
                              -    """Percentage of tokens to perturb before attack"""
                              -    pre_perturb_span_length: Optional[int] = 5
                              -    """Span length for pre-perturbation"""
                              -    tok_by_tok: Optional[bool] = False
                              -    """Process data token-wise?"""
                              -    fpr_list: Optional[List[float]] = field(default_factory=lambda: [0.001, 0.01])
                              -    """FPRs at which to compute TPR"""
                              -    random_seed: Optional[int] = 0
                              -    """Random seed"""
                              -    ref_config: Optional[ReferenceConfig] = None
                              -    """Reference model config"""
                              -    neighborhood_config: Optional[NeighborhoodConfig] = None
                              -    """Neighborhood attack config"""
                              -    env_config: Optional[EnvironmentConfig] = None
                              -    """Environment config"""
                              -    openai_config: Optional[OpenAIConfig] = None
                              -    """OpenAI config"""
                              -
                              -    def __post_init__(self):
                              -        if self.dump_cache and (self.load_from_cache or self.load_from_hf):
                              -            raise ValueError("Cannot dump and load cache at the same time")
                              -
                              -        if self.neighborhood_config:
                              -            if (
                              -                self.neighborhood_config.dump_cache
                              -                or self.neighborhood_config.load_from_cache
                              -            ) and not (self.load_from_cache or self.dump_cache or self.load_from_hf):
                              -                raise ValueError(
                              -                    "Using dump/load for neighborhood cache without dumping/loading main cache does not make sense"
                              -                )
                              -
                              -            if self.neighborhood_config.dump_cache and (self.neighborhood_config.load_from_cache or self.load_from_hf):
                              -                raise ValueError("Cannot dump and load neighborhood cache at the same time")    
                              -
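As a usage sketch (not part of this patch), the dataclasses above can be instantiated directly with the fields shown; the model and dataset names below are placeholders, and the example assumes the cache/data environment used by get_cache_path and get_data_source is configured:

from mimir.config import (
    ExperimentConfig,
    ReferenceConfig,
    NeighborhoodConfig,
    EnvironmentConfig,
)

config = ExperimentConfig(
    experiment_name="demo_run",                  # placeholder name
    base_model="EleutherAI/pythia-160m",         # placeholder target model
    dataset_member="the_pile",
    dataset_nonmember="the_pile",
    n_samples=200,
    ref_config=ReferenceConfig(models=["EleutherAI/pythia-70m"]),
    neighborhood_config=NeighborhoodConfig(model="bert-base-uncased"),
    env_config=EnvironmentConfig(device="cuda:0"),
)

# Worked example of the documented masking rate for NeighborhoodConfig:
# pct_words_masked * span_length / (span_length + 2 * buffer_size)
nc = config.neighborhood_config
print(nc.pct_words_masked * nc.span_length / (nc.span_length + 2 * nc.buffer_size))
# With the defaults (0.3, 2, 1): 0.3 * 2 / 4 = 0.15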
@@ -869,7 +649,6 @@

Class variables

@@ -988,7 +767,7 @@

-Generated by pdoc 0.10.0.
+Generated by pdoc 0.11.1.

\ No newline at end of file
diff --git a/docs/custom_datasets.html b/docs/custom_datasets.html
index e82f863..39ac586 100644
--- a/docs/custom_datasets.html
+++ b/docs/custom_datasets.html
@@ -2,18 +2,21 @@

mimir.custom_datasets API documentation
                                @@ -23,199 +26,6 @@

                                Module mimir.custom_datasets

                                Helper functions for processing of data (ultimately used for membership inference evaluation)

                                """
                                -    Helper functions for processing of data (ultimately used for membership inference evaluation)
                                -"""
                                -import random
                                -import datasets
                                -import os
                                -import json
                                -from typing import List
                                -
                                -
                                -SEPARATOR = '<<<SEP>>>'
                                -
                                -DATASETS = ['writing', 'english', 'german', 'pubmed']
                                -
                                -SOURCES_UPLOADED = [
                                -    "arxiv",
                                -    "dm_mathematics",
                                -    "github",
                                -    "hackernews",
                                -    "pile_cc",
                                -    "pubmed_central",
                                -    "wikipedia_(en)",
                                -    "full_pile",
                                -    "c4",
                                -    "temporal_arxiv",
                                -    "temporal_wiki"
                                -]
                                -
                                -
                                -def load_pubmed(cache_dir):
                                -    data = datasets.load_dataset('pubmed_qa', 'pqa_labeled', split='train', cache_dir=cache_dir)
                                -    
                                -    # combine question and long_answer
                                -    data = [f'Question: {q} Answer:{SEPARATOR}{a}' for q, a in zip(data['question'], data['long_answer'])]
                                -
                                -    return data
                                -
                                -
                                -def load_cached(cache_dir,
                                -                data_split: str,
                                -                filename: str,
                                -                min_length: int,
                                -                max_length: int,
                                -                n_samples: int,
                                -                max_tokens: int,
                                -                load_from_hf: bool = False):
-    """
-        Read from cache if available. Used for certain pile sources and xsum
-        to ensure fairness in comparison across attack runs.
                                -    """
                                -    if load_from_hf:
                                -        print("Loading from HuggingFace!")
                                -        data_split = data_split.replace("train", "member")
                                -        data_split = data_split.replace("test", "nonmember")
                                -        if not filename.startswith("the_pile"):
-            raise ValueError("HuggingFace data only available for The Pile.")
                                -
                                -        for source in SOURCES_UPLOADED:
                                -            # Got a match
                                -            if source in filename and filename.startswith(f"the_pile_{source}"):
                                -                split = filename.split(f"the_pile_{source}")[1]
                                -                if split == "":
                                -                    # The way HF data is uploaded, no split is recorded as "none"
                                -                    split = "none"
                                -                else:
                                -                    # remove the first underscore
                                -                    split = split[1:]
                                -                    # remove '<' , '>'
                                -                    split = split.replace("<", "").replace(">", "")
                                -                    # Remove "_truncated" from the end, if present
                                -                    split = split.rsplit("_truncated", 1)[0]
                                -
                                -                # Load corresponding dataset
                                -                ds = datasets.load_dataset("iamgroot42/mimir", name=source, split=split)
                                -                data = ds[data_split]
                                -                # Check if the number of samples is correct
                                -                if len(data) != n_samples:
                                -                    raise ValueError(f"Requested {n_samples} samples, but only {len(data)} samples available. Potential mismatch in HuggingFace data and requested data.")
                                -                return data
                                -        # If got here, matching source was not found
                                -        raise ValueError(f"Requested source {filename} not found in HuggingFace data.")
                                -    else:
                                -        file_path = os.path.join(cache_dir, f"cache_{min_length}_{max_length}_{n_samples}_{max_tokens}", data_split, filename + ".jsonl")
                                -        if not os.path.exists(file_path):
                                -            raise ValueError(f"Requested cache file {file_path} does not exist")
                                -        data = load_data(file_path)
                                -    return data
                                -
                                -
                                -def load_data(file_path):
                                -    """
                                -        Load data from a given filepath (.jsonl)
                                -    """
                                -    with open(file_path, 'r') as f:
                                -        data = [json.loads(line) for line in f.readlines()]
                                -    return data
                                -
                                -
                                -def dump_to_cache(data: List, cache_dir, path, filename: str, min_length: int, max_length: int, n_samples: int, max_tokens: int):
                                -    """
                                -        Cache a file (one sample per line)
                                -    """
                                -    # Make sure path directory exists
                                -    subdir = os.path.join(cache_dir, f"cache_{min_length}_{max_length}_{n_samples}_{max_tokens}", path)
                                -    os.makedirs(subdir, exist_ok=True)
                                -    # Dump to file
                                -    # Since each datum has newlines in it potentially, use jsonl format
                                -    save_data(os.path.join(subdir, filename + ".jsonl"), data)
                                -
                                -
                                -def save_data(file_path, data):
                                -    # Since each datum has newlines in it potentially, use jsonl format
                                -    with open(file_path, 'w') as f:
                                -        for datum in data:
                                -            f.write(json.dumps(datum) + "\n")
                                -
                                -
                                -def process_prompt(prompt):
                                -    return prompt.replace('[ WP ]', '').replace('[ OT ]', '')
                                -
                                -
                                -def process_spaces(story):
                                -    return story.replace(
                                -        ' ,', ',').replace(
                                -        ' .', '.').replace(
                                -        ' ?', '?').replace(
                                -        ' !', '!').replace(
                                -        ' ;', ';').replace(
                                -        ' \'', '\'').replace(
                                -        ' ’ ', '\'').replace(
                                -        ' :', ':').replace(
                                -        '<newline>', '\n').replace(
                                -        '`` ', '"').replace(
                                -        ' \'\'', '"').replace(
                                -        '\'\'', '"').replace(
                                -        '.. ', '... ').replace(
                                -        ' )', ')').replace(
                                -        '( ', '(').replace(
                                -        ' n\'t', 'n\'t').replace(
                                -        ' i ', ' I ').replace(
                                -        ' i\'', ' I\'').replace(
                                -        '\\\'', '\'').replace(
                                -        '\n ', '\n').strip()
                                -
                                -
                                -def load_writing(cache_dir=None):
                                -    writing_path = 'data/writingPrompts'
                                -    
                                -    with open(f'{writing_path}/valid.wp_source', 'r') as f:
                                -        prompts = f.readlines()
                                -    with open(f'{writing_path}/valid.wp_target', 'r') as f:
                                -        stories = f.readlines()
                                -    
                                -    prompts = [process_prompt(prompt) for prompt in prompts]
                                -    joined = [process_spaces(prompt + " " + story) for prompt, story in zip(prompts, stories)]
                                -    filtered = [story for story in joined if 'nsfw' not in story and 'NSFW' not in story]
                                -
                                -    random.seed(0)
                                -    random.shuffle(filtered)
                                -
                                -    return filtered
                                -
                                -
                                -def load_language(language, cache_dir):
                                -    # load either the english or german portion of the wmt16 dataset
                                -    assert language in ['en', 'de']
                                -    d = datasets.load_dataset('wmt16', 'de-en', split='train', cache_dir=cache_dir)
                                -    docs = d['translation']
                                -    desired_language_docs = [d[language] for d in docs]
                                -    lens = [len(d.split()) for d in desired_language_docs]
                                -    sub = [d for d, l in zip(desired_language_docs, lens) if l > 100 and l < 150]
                                -    return sub
                                -
                                -
                                -def load_german(cache_dir):
                                -    return load_language('de', cache_dir)
                                -
                                -
                                -def load_english(cache_dir):
                                -    return load_language('en', cache_dir)
                                -
                                -
                                -def load(name, cache_dir, **kwargs):
                                -    if name in DATASETS:
                                -        load_fn = globals()[f'load_{name}']
                                -        return load_fn(cache_dir=cache_dir, **kwargs)
                                -    else:
                                -        raise ValueError(f'Unknown dataset {name}')
                                -
                                @@ -229,38 +39,12 @@

                                Functions

                                Cache a file (one sample per line)

                                def dump_to_cache(data: List, cache_dir, path, filename: str, min_length: int, max_length: int, n_samples: int, max_tokens: int):
                                -    """
                                -        Cache a file (one sample per line)
                                -    """
                                -    # Make sure path directory exists
                                -    subdir = os.path.join(cache_dir, f"cache_{min_length}_{max_length}_{n_samples}_{max_tokens}", path)
                                -    os.makedirs(subdir, exist_ok=True)
                                -    # Dump to file
                                -    # Since each datum has newlines in it potentially, use jsonl format
                                -    save_data(os.path.join(subdir, filename + ".jsonl"), data)
                                -
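To make the cache layout concrete, here is a small sketch of the path that dump_to_cache writes and load_cached later reads, following the f-string in the source; the cache root and filename below are illustrative:

import os

cache_dir = "/tmp/mimir_cache"                     # illustrative cache root
min_length, max_length, n_samples, max_tokens = 100, 200, 200, 512
path, filename = "train", "the_pile_wikipedia_(en)"

subdir = os.path.join(
    cache_dir, f"cache_{min_length}_{max_length}_{n_samples}_{max_tokens}", path
)
print(os.path.join(subdir, filename + ".jsonl"))
# /tmp/mimir_cache/cache_100_200_200_512/train/the_pile_wikipedia_(en).jsonl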
                                def load(name, cache_dir, **kwargs)
                                def load(name, cache_dir, **kwargs):
                                -    if name in DATASETS:
                                -        load_fn = globals()[f'load_{name}']
                                -        return load_fn(cache_dir=cache_dir, **kwargs)
                                -    else:
                                -        raise ValueError(f'Unknown dataset {name}')
                                -
def load_cached(cache_dir, data_split: str, filename: str, min_length: int, max_length: int, n_samples: int, max_tokens: int, load_from_hf: bool = False)
@@ -269,231 +53,60 @@

Functions

Read from cache if available. Used for certain pile sources and xsum to ensure fairness in comparison across attack runs.

                                def load_cached(cache_dir,
                                -                data_split: str,
                                -                filename: str,
                                -                min_length: int,
                                -                max_length: int,
                                -                n_samples: int,
                                -                max_tokens: int,
                                -                load_from_hf: bool = False):
-    """
-        Read from cache if available. Used for certain pile sources and xsum
-        to ensure fairness in comparison across attack runs.
                                -    """
                                -    if load_from_hf:
                                -        print("Loading from HuggingFace!")
                                -        data_split = data_split.replace("train", "member")
                                -        data_split = data_split.replace("test", "nonmember")
                                -        if not filename.startswith("the_pile"):
-            raise ValueError("HuggingFace data only available for The Pile.")
                                -
                                -        for source in SOURCES_UPLOADED:
                                -            # Got a match
                                -            if source in filename and filename.startswith(f"the_pile_{source}"):
                                -                split = filename.split(f"the_pile_{source}")[1]
                                -                if split == "":
                                -                    # The way HF data is uploaded, no split is recorded as "none"
                                -                    split = "none"
                                -                else:
                                -                    # remove the first underscore
                                -                    split = split[1:]
                                -                    # remove '<' , '>'
                                -                    split = split.replace("<", "").replace(">", "")
                                -                    # Remove "_truncated" from the end, if present
                                -                    split = split.rsplit("_truncated", 1)[0]
                                -
                                -                # Load corresponding dataset
                                -                ds = datasets.load_dataset("iamgroot42/mimir", name=source, split=split)
                                -                data = ds[data_split]
                                -                # Check if the number of samples is correct
                                -                if len(data) != n_samples:
                                -                    raise ValueError(f"Requested {n_samples} samples, but only {len(data)} samples available. Potential mismatch in HuggingFace data and requested data.")
                                -                return data
                                -        # If got here, matching source was not found
                                -        raise ValueError(f"Requested source {filename} not found in HuggingFace data.")
                                -    else:
                                -        file_path = os.path.join(cache_dir, f"cache_{min_length}_{max_length}_{n_samples}_{max_tokens}", data_split, filename + ".jsonl")
                                -        if not os.path.exists(file_path):
                                -            raise ValueError(f"Requested cache file {file_path} does not exist")
                                -        data = load_data(file_path)
                                -    return data
                                -
                                def load_data(file_path)

                                Load data from a given filepath (.jsonl)

                                def load_data(file_path):
                                -    """
                                -        Load data from a given filepath (.jsonl)
                                -    """
                                -    with open(file_path, 'r') as f:
                                -        data = [json.loads(line) for line in f.readlines()]
                                -    return data
                                -
                                def load_english(cache_dir)
                                def load_english(cache_dir):
                                -    return load_language('en', cache_dir)
                                -
                                def load_german(cache_dir)
                                def load_german(cache_dir):
                                -    return load_language('de', cache_dir)
                                -
                                def load_language(language, cache_dir)
                                def load_language(language, cache_dir):
                                -    # load either the english or german portion of the wmt16 dataset
                                -    assert language in ['en', 'de']
                                -    d = datasets.load_dataset('wmt16', 'de-en', split='train', cache_dir=cache_dir)
                                -    docs = d['translation']
                                -    desired_language_docs = [d[language] for d in docs]
                                -    lens = [len(d.split()) for d in desired_language_docs]
                                -    sub = [d for d, l in zip(desired_language_docs, lens) if l > 100 and l < 150]
                                -    return sub
                                -
                                def load_pubmed(cache_dir)
                                def load_pubmed(cache_dir):
                                -    data = datasets.load_dataset('pubmed_qa', 'pqa_labeled', split='train', cache_dir=cache_dir)
                                -    
                                -    # combine question and long_answer
                                -    data = [f'Question: {q} Answer:{SEPARATOR}{a}' for q, a in zip(data['question'], data['long_answer'])]
                                -
                                -    return data
                                -
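Each record returned by load_pubmed is a single string with the question and the long answer joined around the SEPARATOR token; for example (the question/answer text is made up):

SEPARATOR = '<<<SEP>>>'
q, a = "Is treatment X effective?", "Yes, in the studied cohort."
print(f'Question: {q} Answer:{SEPARATOR}{a}')
# Question: Is treatment X effective? Answer:<<<SEP>>>Yes, in the studied cohort.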
                                def load_writing(cache_dir=None)
                                def load_writing(cache_dir=None):
                                -    writing_path = 'data/writingPrompts'
                                -    
                                -    with open(f'{writing_path}/valid.wp_source', 'r') as f:
                                -        prompts = f.readlines()
                                -    with open(f'{writing_path}/valid.wp_target', 'r') as f:
                                -        stories = f.readlines()
                                -    
                                -    prompts = [process_prompt(prompt) for prompt in prompts]
                                -    joined = [process_spaces(prompt + " " + story) for prompt, story in zip(prompts, stories)]
                                -    filtered = [story for story in joined if 'nsfw' not in story and 'NSFW' not in story]
                                -
                                -    random.seed(0)
                                -    random.shuffle(filtered)
                                -
                                -    return filtered
                                -
                                def process_prompt(prompt)
                                def process_prompt(prompt):
                                -    return prompt.replace('[ WP ]', '').replace('[ OT ]', '')
                                -
                                def process_spaces(story)
                                def process_spaces(story):
                                -    return story.replace(
                                -        ' ,', ',').replace(
                                -        ' .', '.').replace(
                                -        ' ?', '?').replace(
                                -        ' !', '!').replace(
                                -        ' ;', ';').replace(
                                -        ' \'', '\'').replace(
                                -        ' ’ ', '\'').replace(
                                -        ' :', ':').replace(
                                -        '<newline>', '\n').replace(
                                -        '`` ', '"').replace(
                                -        ' \'\'', '"').replace(
                                -        '\'\'', '"').replace(
                                -        '.. ', '... ').replace(
                                -        ' )', ')').replace(
                                -        '( ', '(').replace(
                                -        ' n\'t', 'n\'t').replace(
                                -        ' i ', ' I ').replace(
                                -        ' i\'', ' I\'').replace(
                                -        '\\\'', '\'').replace(
                                -        '\n ', '\n').strip()
                                -
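A quick before/after of the detokenization clean-up that process_spaces performs (the input string is invented for illustration):

from mimir.custom_datasets import process_spaces

raw = "`` Hello , world ! '' he said .<newline>It was n't late ."
print(process_spaces(raw))
# "Hello, world!" he said.
# It wasn't late.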
                                def save_data(file_path, data)
                                def save_data(file_path, data):
                                -    # Since each datum has newlines in it potentially, use jsonl format
                                -    with open(file_path, 'w') as f:
                                -        for datum in data:
                                -            f.write(json.dumps(datum) + "\n")
                                -
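A minimal round trip through save_data and load_data (the file path and records are hypothetical); because each record is serialized as one JSON object per line, embedded newlines inside a sample are preserved safely:

from mimir.custom_datasets import save_data, load_data

records = ["first sample\nwith an embedded newline", "second sample"]
save_data("/tmp/demo.jsonl", records)   # hypothetical path
assert load_data("/tmp/demo.jsonl") == records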
@@ -506,7 +119,6 @@

Functions

@@ -536,7 +148,7 @@

\ No newline at end of file
diff --git a/docs/data_utils.html b/docs/data_utils.html
index 16ddbc6..27b719f 100644
--- a/docs/data_utils.html
+++ b/docs/data_utils.html
@@ -2,18 +2,21 @@

mimir.data_utils API documentation
                                  @@ -23,342 +26,6 @@

                                  Module mimir.data_utils

                                  Datasets and data-processing utilities

                                  """
                                  -    Datasets and data-processing utilities
                                  -"""
                                  -import datasets
                                  -import numpy as np
                                  -import os
                                  -import mimir.custom_datasets as custom_datasets
                                  -from mimir.config import ExperimentConfig
                                  -from nltk.tokenize import WhitespaceTokenizer
                                  -
                                  -
                                  -class Data:
                                  -    """
                                  -    Data class to load and cache datasets.
                                  -    """
                                  -    def __init__(self, name,
                                  -                 config: ExperimentConfig,
                                  -                 presampled: str = None,
                                  -                 name_key_mapping: dict = {"the_pile": "text", "xsum": "document"}):
                                  -        self.name_key_mapping = name_key_mapping
                                  -        self.config = config
                                  -        self.name = name
                                  -        self.presampled = presampled
                                  -        self.key = (
                                  -            config.dataset_key
                                  -            if config.dataset_key
                                  -            else self.name_key_mapping.get(name, None)
                                  -        )
                                  -        if self.key is None:
                                  -            raise ValueError(
-                f"Key for dataset {name} not provided or found in name_key_mapping"
                                  -            )
                                  -        self.cache_dir = self.config.env_config.cache_dir
                                  -
                                  -    def load_neighbors(
                                  -        self,
                                  -        train: bool,
                                  -        num_neighbors: int,
                                  -        model: str = "bert",
                                  -        in_place_swap: bool = False,
                                  -    ):
                                  -        """
                                  -        Load neighbors from cache (local or from HF)
                                  -        """
                                  -        data_split = "train" if train else "test"
                                  -        data_split += "_neighbors"
                                  -        filename = self._get_name_to_save() + "_neighbors_{}_{}".format(
                                  -            num_neighbors, model
                                  -        )
                                  -        if in_place_swap:
                                  -            filename += "_in_place_swap"
                                  -        data = custom_datasets.load_cached(
                                  -            self.cache_dir,
                                  -            data_split,
                                  -            filename,
                                  -            min_length=self.config.min_words,
                                  -            max_length=self.config.max_words,
                                  -            n_samples=self.config.n_samples,
                                  -            max_tokens=self.config.max_tokens,
                                  -            load_from_hf=self.config.load_from_hf
                                  -        )
                                  -        return data
                                  -
                                  -    def dump_neighbors(
                                  -        self,
                                  -        data,
                                  -        train: bool,
                                  -        num_neighbors: int,
                                  -        model: str = "bert",
                                  -        in_place_swap: bool = False,
                                  -    ):
                                  -        """
-        Dump neighbors to local cache.
                                  -        """
                                  -        data_split = "train" if train else "test"
                                  -        data_split += "_neighbors"
                                  -        filename = self._get_name_to_save() + "_neighbors_{}_{}".format(
                                  -            num_neighbors, model
                                  -        )
                                  -        if in_place_swap:
                                  -            filename += "_in_place_swap"
                                  -        custom_datasets.dump_to_cache(
                                  -            data,
                                  -            self.cache_dir,
                                  -            data_split,
                                  -            filename,
                                  -            min_length=self.config.min_words,
                                  -            max_length=self.config.max_words,
                                  -            n_samples=self.config.n_samples,
                                  -            max_tokens=self.config.max_tokens,
                                  -        )
                                  -
                                  -    def load(self, train: bool, mask_tokenizer=None, specific_source: str = None):
                                  -        data_split = "train" if train else "test"
                                  -        n_samples = self.config.n_samples
                                  -
                                  -        # Load from numpy file storing pretokenized sample in a 2d array of shape (num_samples, num_tokens_per_sample)
                                  -        if self.config.pretokenized:
                                  -            assert self.presampled
                                  -            # TODO: Pretokenized full documents (split into substrs) is not currently supported
                                  -            assert not self.config.full_doc
                                  -            data = np.load(self.presampled)
                                  -            return data
                                  -        elif (self.config.load_from_cache or self.config.load_from_hf):
                                  -            # Load from cache, if requested
                                  -            filename = self._get_name_to_save()
                                  -            data = custom_datasets.load_cached(
                                  -                self.cache_dir,
                                  -                data_split,
                                  -                filename,
                                  -                min_length=self.config.min_words,
                                  -                max_length=self.config.max_words,
                                  -                n_samples=self.config.n_samples,
                                  -                max_tokens=self.config.max_tokens,
                                  -                load_from_hf=self.config.load_from_hf
                                  -            )
                                  -            return data
                                  -        else:
                                  -            if self.presampled or self.config.full_doc:
                                  -                print("using presampled data")
                                  -                data = datasets.load_dataset(
                                  -                    "json",
                                  -                    data_files=self.presampled,
                                  -                    split=f"train",
                                  -                    cache_dir=self.cache_dir,
                                  -                )[self.key]
                                  -            elif self.name in custom_datasets.DATASETS:
-                data = custom_datasets.load(self.name, cache_dir=self.cache_dir)
                                  -            elif self.name == "the_pile":
                                  -                min_load = max(10000, self.config.max_data)
                                  -                data = datasets.load_dataset(
                                  -                    "json",
                                  -                    data_files=os.path.join(
                                  -                        self.config.env_config.data_source,
                                  -                        "pile/00.jsonl.zst" if train else "pile/test.jsonl.zst",
                                  -                    ),
                                  -                    cache_dir=self.cache_dir,
                                  -                    split=f"train[:{min_load}]",
                                  -                )
                                  -                specific_source_use = (
                                  -                    self.config.specific_source
                                  -                    if specific_source is None
                                  -                    else specific_source
                                  -                )
                                  -                data = pile_selection_utility(
                                  -                    data, self.key, wanted_source=specific_source_use
                                  -                )
                                  -            elif "human" in self.name:
                                  -                data = datasets.load_dataset(
                                  -                    self.name, split=f"train[:100]", cache_dir=self.cache_dir
                                  -                )[self.key]
                                  -            elif "nthngdy" in self.name:
                                  -                data = datasets.load_dataset(
                                  -                    self.name, split="test", cache_dir=self.cache_dir
                                  -                )[self.key]
                                  -            else:
                                  -                data = datasets.load_dataset(
                                  -                    self.name, split=f"train", cache_dir=self.cache_dir
                                  -                )[self.key]
                                  -
                                  -        if not self.config.full_doc:
                                  -            # get unique examples
                                  -            # then take just the long examples, shuffle, take the first 5,000 to tokenize to save time
                                  -            # then take just the examples that are <= 512 tokens (for the mask model)
                                  -            # then generate n_samples samples
                                  -            wsp_tokenizer = WhitespaceTokenizer()
                                  -
                                  -            # remove duplicates from the data
                                  -            data = list(dict.fromkeys(data))  # deterministic, as opposed to set()
                                  -
                                  -            whitespace_tokenized_spans = [
                                  -                (x, list(wsp_tokenizer.span_tokenize(x))) for x in data
                                  -            ]
                                  -
                                  -            # Pick samples with at least self.config.min_words words
                                  -            whitespace_tokenized_spans = [
                                  -                x
                                  -                for x in whitespace_tokenized_spans
                                  -                if len(x[1]) >= self.config.min_words
                                  -            ]
                                  -            if len(whitespace_tokenized_spans) == 0:
                                  -                raise ValueError("No examples with length >= min_words")
                                  -
                                  -            if self.config.max_words_cutoff:
                                  -                last_spans = [
                                  -                    x[1][min(self.config.max_words, len(x[1])) - 1][1]
                                  -                    for x in whitespace_tokenized_spans
                                  -                ]
                                  -                data = [
                                  -                    x[0][:y] for x, y in zip(whitespace_tokenized_spans, last_spans)
                                  -                ]
                                  -            else:
                                  -                data = [
                                  -                    x[0]
                                  -                    for x in whitespace_tokenized_spans
                                  -                    if len(x[1]) < self.config.max_words
                                  -                ]
                                  -                if len(data) == 0:
                                  -                    raise ValueError("No examples with length < max_words")
                                  -
                                  -            # TODO: why shuffle
                                  -            # random.seed(0)
                                  -            # random.shuffle(data)
                                  -
                                  -            data = data[: self.config.max_data]
                                  -
                                  -            # If there is mask tokenizer, keep only examples with <= 512 tokens according to mask_tokenizer
                                  -            # this step has the extra effect of removing examples with low-quality/garbage content
                                  -            if mask_tokenizer:
                                  -                tokenized_data = mask_tokenizer(data)
                                  -                new_data = []
                                  -                for i, (x, y) in enumerate(zip(data, tokenized_data["input_ids"])):
                                  -                    if len(y) <= self.config.max_tokens:
                                  -                        new_data.append(x)
                                  -                    else:
                                  -                        print(
                                  -                            "Trimming text to nearest word that fits within mask tokenizer window"
                                  -                        )
                                  -                        max_token_char_span = tokenized_data.token_to_chars(
                                  -                            i, self.config.max_tokens - 1
                                  -                        )
                                  -                        x = x[: max_token_char_span.end]
                                  -                        token_truncated_word_spans = list(
                                  -                            wsp_tokenizer.span_tokenize(x)
                                  -                        )
                                  -
                                  -                        # Pop off the last "word" since it may be a word piece
                                  -                        second_last_span = token_truncated_word_spans[-2]
                                  -                        x = x[: second_last_span[1]]
                                  -
                                  -                        new_len = len(mask_tokenizer(x)["input_ids"])
                                  -                        assert new_len <= self.config.max_tokens
                                  -                        new_data.append(x)
                                  -                data = new_data
                                  -
-            # print stats about remaining data
                                  -            print(f"Total number of samples: {len(data)}")
                                  -            print(f"Average number of words: {np.mean([len(x.split()) for x in data])}")
                                  -
                                  -            if n_samples > len(data):
                                  -                print(f"WARNING: n_samples ({n_samples}) > len(data) ({len(data)})")
                                  -
                                  -        # Sample 'n_samples' examples
                                  -        data = data[:n_samples]
                                  -
                                  -        # Save to cache (if requested)
                                  -        if self.config.dump_cache:
                                  -            self.dump_to_cache(data, data_split)
                                  -
                                  -        return data
                                  -
                                  -    def dump_to_cache(self, data, data_split):
                                  -        filename = self._get_name_to_save()
                                  -        custom_datasets.dump_to_cache(
                                  -            data,
                                  -            self.cache_dir,
                                  -            data_split,
                                  -            filename,
                                  -            min_length=self.config.min_words,
                                  -            max_length=self.config.max_words,
                                  -            n_samples=self.config.n_samples,
                                  -            max_tokens=self.config.max_tokens,
                                  -        )
                                  -
                                  -    def _get_name_to_save(self):
                                  -        if self.config.specific_source and self.name == "the_pile":
                                  -            processed_source = sourcename_process(self.config.specific_source)
                                  -            filename = f"{self.name}_{processed_source}"
                                  -        else:
                                  -            filename = self.name
                                  -        return filename
                                  -
                                  -
                                  -def strip_newlines(text):
                                  -    """
                                  -    Strip newlines from each example; replace one or more newlines with a single space
                                  -    """
                                  -    return " ".join(text.split())
                                  -
                                  -
                                  -def trim_to_shorter_length(text_a: str, text_b: str, max_length: int = None):
                                  -    """
-    Truncate both texts to the word count of the shorter one (optionally capped at max_length)
                                  -    """
                                  -    shorter_length = min(len(text_a.split(" ")), len(text_b.split(" ")))
                                  -    if max_length is not None:
                                  -        shorter_length = min(shorter_length, max_length)
                                  -    text_a = " ".join(text_a.split(" ")[:shorter_length])
                                  -    text_b = " ".join(text_b.split(" ")[:shorter_length])
                                  -    return text_a, text_b
                                  -
                                  -
                                  -def truncate_to_substring(text: str, substring: str, idx_occurrence: int):
                                  -    """
                                  -    Truncate everything after the idx_occurrence occurrence of substring
                                  -    """
                                  -    assert idx_occurrence > 0, "idx_occurrence must be > 0"
                                  -    idx = -1
                                  -    for _ in range(idx_occurrence):
                                  -        idx = text.find(substring, idx + 1)
                                  -        if idx == -1:
                                  -            return text
                                  -    return text[:idx]
                                  -
                                  -
                                  -def pile_selection_utility(data, key: str, wanted_source: str = None):
                                  -    """
                                  -    Filter and select data corresponding to source, if requested.
                                  -    """
                                  -    if wanted_source is None:
                                  -        return data[key]
                                  -    wanted_data = []
                                  -    # Pick sources that match requested source
                                  -    for datum in data:
                                  -        if datum["meta"]["pile_set_name"] == wanted_source:
                                  -            wanted_data.append(datum[key])
                                  -    return wanted_data
                                  -
                                  -
                                  -def sourcename_process(x: str):
                                  -    """
                                  -        Helper function to process source name.
                                  -    """
                                  -    return x.replace(" ", "_").replace("-", "_").lower()
                                  -
                                  -
                                  -def drop_last_word(text):
                                  -    """
                                  -        Drop the last word from a given text.
                                  -    """
                                  -    return " ".join(text.split(" ")[:-1])
                                  -
                                  @@ -372,114 +39,36 @@

                                  Functions

                                  Drop the last word from a given text.

                                  -
                                  - -Expand source code - -
                                  def drop_last_word(text):
                                  -    """
                                  -        Drop the last word from a given text.
                                  -    """
                                  -    return " ".join(text.split(" ")[:-1])
                                  -
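For illustration, a minimal, self-contained check of the behaviour described above (words are split on single spaces and the trailing word is dropped):

from mimir.data_utils import drop_last_word

assert drop_last_word("membership inference attack") == "membership inference"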
                                  def pile_selection_utility(data, key: str, wanted_source: str = None)

                                  Filter and select data corresponding to source, if requested.

                                  -
                                  - -Expand source code - -
                                  def pile_selection_utility(data, key: str, wanted_source: str = None):
                                  -    """
                                  -    Filter and select data corresponding to source, if requested.
                                  -    """
                                  -    if wanted_source is None:
                                  -        return data[key]
                                  -    wanted_data = []
                                  -    # Pick sources that match requested source
                                  -    for datum in data:
                                  -        if datum["meta"]["pile_set_name"] == wanted_source:
                                  -            wanted_data.append(datum[key])
                                  -    return wanted_data
                                  -
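A minimal sketch of the filtering described above, assuming Pile-style records in which each entry carries a meta.pile_set_name field (the toy records below are illustrative, not real data):

from mimir.data_utils import pile_selection_utility

records = [
    {"text": "a github readme", "meta": {"pile_set_name": "Github"}},
    {"text": "a wiki article", "meta": {"pile_set_name": "Wikipedia (en)"}},
]
assert pile_selection_utility(records, key="text", wanted_source="Github") == ["a github readme"]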
                                  def sourcename_process(x: str)

                                  Helper function to process source name.

                                  -
                                  - -Expand source code - -
                                  def sourcename_process(x: str):
                                  -    """
                                  -        Helper function to process source name.
                                  -    """
                                  -    return x.replace(" ", "_").replace("-", "_").lower()
                                  -
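The normalisation replaces spaces and hyphens with underscores and lowercases the result, which is handy when building cache filenames; for example:

from mimir.data_utils import sourcename_process

assert sourcename_process("Wikipedia (en)") == "wikipedia_(en)"
assert sourcename_process("USPTO-Backgrounds") == "uspto_backgrounds"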
                                  def strip_newlines(text)

                                  Strip newlines from each example; replace one or more newlines with a single space

                                  -
                                  - -Expand source code - -
                                  def strip_newlines(text):
                                  -    """
                                  -    Strip newlines from each example; replace one or more newlines with a single space
                                  -    """
                                  -    return " ".join(text.split())
                                  -
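Note that, as implemented, this collapses any run of whitespace (not only newlines) into a single space; a quick check:

from mimir.data_utils import strip_newlines

assert strip_newlines("first line\n\nsecond line\n") == "first line second line"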
                                  def trim_to_shorter_length(text_a: str, text_b: str, max_length: int = None)

Truncate both texts to the word count of the shorter one (optionally capped at max_length)

                                  -
                                  - -Expand source code - -
                                  def trim_to_shorter_length(text_a: str, text_b: str, max_length: int = None):
                                  -    """
-    Truncate both texts to the word count of the shorter one (optionally capped at max_length)
                                  -    """
                                  -    shorter_length = min(len(text_a.split(" ")), len(text_b.split(" ")))
                                  -    if max_length is not None:
                                  -        shorter_length = min(shorter_length, max_length)
                                  -    text_a = " ".join(text_a.split(" ")[:shorter_length])
                                  -    text_b = " ".join(text_b.split(" ")[:shorter_length])
                                  -    return text_a, text_b
                                  -
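Both texts are cut to the word count of the shorter one, optionally capped by max_length; for example:

from mimir.data_utils import trim_to_shorter_length

assert trim_to_shorter_length("one two three four", "uno dos tres") == ("one two three", "uno dos tres")
assert trim_to_shorter_length("one two three four", "uno dos tres", max_length=2) == ("one two", "uno dos")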
                                  def truncate_to_substring(text: str, substring: str, idx_occurrence: int)

                                  Truncate everything after the idx_occurrence occurrence of substring

                                  -
                                  - -Expand source code - -
                                  def truncate_to_substring(text: str, substring: str, idx_occurrence: int):
                                  -    """
                                  -    Truncate everything after the idx_occurrence occurrence of substring
                                  -    """
                                  -    assert idx_occurrence > 0, "idx_occurrence must be > 0"
                                  -    idx = -1
                                  -    for _ in range(idx_occurrence):
                                  -        idx = text.find(substring, idx + 1)
                                  -        if idx == -1:
                                  -            return text
                                  -    return text[:idx]
                                  -
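Occurrences are 1-indexed, and the text is returned unchanged when there are fewer than idx_occurrence matches; for example:

from mimir.data_utils import truncate_to_substring

text = "q: first question a: first answer q: second question"
assert truncate_to_substring(text, "q:", 2) == "q: first question a: first answer "
assert truncate_to_substring(text, "q:", 5) == text  # only two occurrences, so nothing is cut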
                                  @@ -764,270 +353,24 @@

                                  Methods

Dump neighbors to the local cache.

                                  -
                                  - -Expand source code - -
                                  def dump_neighbors(
                                  -    self,
                                  -    data,
                                  -    train: bool,
                                  -    num_neighbors: int,
                                  -    model: str = "bert",
                                  -    in_place_swap: bool = False,
                                  -):
                                  -    """
-    Dump neighbors to the local cache.
                                  -    """
                                  -    data_split = "train" if train else "test"
                                  -    data_split += "_neighbors"
                                  -    filename = self._get_name_to_save() + "_neighbors_{}_{}".format(
                                  -        num_neighbors, model
                                  -    )
                                  -    if in_place_swap:
                                  -        filename += "_in_place_swap"
                                  -    custom_datasets.dump_to_cache(
                                  -        data,
                                  -        self.cache_dir,
                                  -        data_split,
                                  -        filename,
                                  -        min_length=self.config.min_words,
                                  -        max_length=self.config.max_words,
                                  -        n_samples=self.config.n_samples,
                                  -        max_tokens=self.config.max_tokens,
                                  -    )
                                  -
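A hypothetical usage sketch (ds is assumed to be an instance of the dataset wrapper documented here and neighbors a list of generated neighbor texts; the names are illustrative, not verified API). Neighbors for the neighborhood attack are cached under a filename that encodes the neighbor count, the perturbation model, and whether in-place swapping was used:

ds.dump_neighbors(neighbors, train=True, num_neighbors=25, model="bert", in_place_swap=True)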
                                  def dump_to_cache(self, data, data_split)
                                  -
                                  - -Expand source code - -
                                  def dump_to_cache(self, data, data_split):
                                  -    filename = self._get_name_to_save()
                                  -    custom_datasets.dump_to_cache(
                                  -        data,
                                  -        self.cache_dir,
                                  -        data_split,
                                  -        filename,
                                  -        min_length=self.config.min_words,
                                  -        max_length=self.config.max_words,
                                  -        n_samples=self.config.n_samples,
                                  -        max_tokens=self.config.max_tokens,
                                  -    )
                                  -
                                  def load(self, train: bool, mask_tokenizer=None, specific_source: str = None)
                                  -
                                  - -Expand source code - -
                                  def load(self, train: bool, mask_tokenizer=None, specific_source: str = None):
                                  -    data_split = "train" if train else "test"
                                  -    n_samples = self.config.n_samples
                                  -
-    # Load from a numpy file storing pretokenized samples in a 2D array of shape (num_samples, num_tokens_per_sample)
                                  -    if self.config.pretokenized:
                                  -        assert self.presampled
                                  -        # TODO: Pretokenized full documents (split into substrs) is not currently supported
                                  -        assert not self.config.full_doc
                                  -        data = np.load(self.presampled)
                                  -        return data
                                  -    elif (self.config.load_from_cache or self.config.load_from_hf):
                                  -        # Load from cache, if requested
                                  -        filename = self._get_name_to_save()
                                  -        data = custom_datasets.load_cached(
                                  -            self.cache_dir,
                                  -            data_split,
                                  -            filename,
                                  -            min_length=self.config.min_words,
                                  -            max_length=self.config.max_words,
                                  -            n_samples=self.config.n_samples,
                                  -            max_tokens=self.config.max_tokens,
                                  -            load_from_hf=self.config.load_from_hf
                                  -        )
                                  -        return data
                                  -    else:
                                  -        if self.presampled or self.config.full_doc:
                                  -            print("using presampled data")
                                  -            data = datasets.load_dataset(
                                  -                "json",
                                  -                data_files=self.presampled,
                                  -                split=f"train",
                                  -                cache_dir=self.cache_dir,
                                  -            )[self.key]
                                  -        elif self.name in custom_datasets.DATASETS:
                                  -            data = custom_datasets.load(self.name)
                                  -        elif self.name == "the_pile":
                                  -            min_load = max(10000, self.config.max_data)
                                  -            data = datasets.load_dataset(
                                  -                "json",
                                  -                data_files=os.path.join(
                                  -                    self.config.env_config.data_source,
                                  -                    "pile/00.jsonl.zst" if train else "pile/test.jsonl.zst",
                                  -                ),
                                  -                cache_dir=self.cache_dir,
                                  -                split=f"train[:{min_load}]",
                                  -            )
                                  -            specific_source_use = (
                                  -                self.config.specific_source
                                  -                if specific_source is None
                                  -                else specific_source
                                  -            )
                                  -            data = pile_selection_utility(
                                  -                data, self.key, wanted_source=specific_source_use
                                  -            )
                                  -        elif "human" in self.name:
                                  -            data = datasets.load_dataset(
                                  -                self.name, split=f"train[:100]", cache_dir=self.cache_dir
                                  -            )[self.key]
                                  -        elif "nthngdy" in self.name:
                                  -            data = datasets.load_dataset(
                                  -                self.name, split="test", cache_dir=self.cache_dir
                                  -            )[self.key]
                                  -        else:
                                  -            data = datasets.load_dataset(
                                  -                self.name, split=f"train", cache_dir=self.cache_dir
                                  -            )[self.key]
                                  -
                                  -    if not self.config.full_doc:
                                  -        # get unique examples
-        # then keep only the sufficiently long examples and take the first max_data of them to tokenize, to save time
                                  -        # then take just the examples that are <= 512 tokens (for the mask model)
                                  -        # then generate n_samples samples
                                  -        wsp_tokenizer = WhitespaceTokenizer()
                                  -
                                  -        # remove duplicates from the data
                                  -        data = list(dict.fromkeys(data))  # deterministic, as opposed to set()
                                  -
                                  -        whitespace_tokenized_spans = [
                                  -            (x, list(wsp_tokenizer.span_tokenize(x))) for x in data
                                  -        ]
                                  -
                                  -        # Pick samples with at least self.config.min_words words
                                  -        whitespace_tokenized_spans = [
                                  -            x
                                  -            for x in whitespace_tokenized_spans
                                  -            if len(x[1]) >= self.config.min_words
                                  -        ]
                                  -        if len(whitespace_tokenized_spans) == 0:
                                  -            raise ValueError("No examples with length >= min_words")
                                  -
                                  -        if self.config.max_words_cutoff:
                                  -            last_spans = [
                                  -                x[1][min(self.config.max_words, len(x[1])) - 1][1]
                                  -                for x in whitespace_tokenized_spans
                                  -            ]
                                  -            data = [
                                  -                x[0][:y] for x, y in zip(whitespace_tokenized_spans, last_spans)
                                  -            ]
                                  -        else:
                                  -            data = [
                                  -                x[0]
                                  -                for x in whitespace_tokenized_spans
                                  -                if len(x[1]) < self.config.max_words
                                  -            ]
                                  -            if len(data) == 0:
                                  -                raise ValueError("No examples with length < max_words")
                                  -
                                  -        # TODO: why shuffle
                                  -        # random.seed(0)
                                  -        # random.shuffle(data)
                                  -
                                  -        data = data[: self.config.max_data]
                                  -
                                  -        # If there is mask tokenizer, keep only examples with <= 512 tokens according to mask_tokenizer
                                  -        # this step has the extra effect of removing examples with low-quality/garbage content
                                  -        if mask_tokenizer:
                                  -            tokenized_data = mask_tokenizer(data)
                                  -            new_data = []
                                  -            for i, (x, y) in enumerate(zip(data, tokenized_data["input_ids"])):
                                  -                if len(y) <= self.config.max_tokens:
                                  -                    new_data.append(x)
                                  -                else:
                                  -                    print(
                                  -                        "Trimming text to nearest word that fits within mask tokenizer window"
                                  -                    )
                                  -                    max_token_char_span = tokenized_data.token_to_chars(
                                  -                        i, self.config.max_tokens - 1
                                  -                    )
                                  -                    x = x[: max_token_char_span.end]
                                  -                    token_truncated_word_spans = list(
                                  -                        wsp_tokenizer.span_tokenize(x)
                                  -                    )
                                  -
                                  -                    # Pop off the last "word" since it may be a word piece
                                  -                    second_last_span = token_truncated_word_spans[-2]
                                  -                    x = x[: second_last_span[1]]
                                  -
                                  -                    new_len = len(mask_tokenizer(x)["input_ids"])
                                  -                    assert new_len <= self.config.max_tokens
                                  -                    new_data.append(x)
                                  -            data = new_data
                                  -
-        # print stats about remaining data
                                  -        print(f"Total number of samples: {len(data)}")
                                  -        print(f"Average number of words: {np.mean([len(x.split()) for x in data])}")
                                  -
                                  -        if n_samples > len(data):
                                  -            print(f"WARNING: n_samples ({n_samples}) > len(data) ({len(data)})")
                                  -
                                  -    # Sample 'n_samples' examples
                                  -    data = data[:n_samples]
                                  -
                                  -    # Save to cache (if requested)
                                  -    if self.config.dump_cache:
                                  -        self.dump_to_cache(data, data_split)
                                  -
                                  -    return data
                                  -
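A hypothetical call sequence for the loader above (ds is assumed to be an instance of the dataset wrapper documented here, built from an ExperimentConfig; the source name is illustrative). With dump_cache set in the config, the filtered samples are also written to the local cache:

members = ds.load(train=True, mask_tokenizer=mask_tokenizer)
nonmembers = ds.load(train=False, specific_source="Wikipedia (en)")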
                                  def load_neighbors(self, train: bool, num_neighbors: int, model: str = 'bert', in_place_swap: bool = False)

                                  Load neighbors from cache (local or from HF)

                                  -
                                  - -Expand source code - -
                                  def load_neighbors(
                                  -    self,
                                  -    train: bool,
                                  -    num_neighbors: int,
                                  -    model: str = "bert",
                                  -    in_place_swap: bool = False,
                                  -):
                                  -    """
                                  -    Load neighbors from cache (local or from HF)
                                  -    """
                                  -    data_split = "train" if train else "test"
                                  -    data_split += "_neighbors"
                                  -    filename = self._get_name_to_save() + "_neighbors_{}_{}".format(
                                  -        num_neighbors, model
                                  -    )
                                  -    if in_place_swap:
                                  -        filename += "_in_place_swap"
                                  -    data = custom_datasets.load_cached(
                                  -        self.cache_dir,
                                  -        data_split,
                                  -        filename,
                                  -        min_length=self.config.min_words,
                                  -        max_length=self.config.max_words,
                                  -        n_samples=self.config.n_samples,
                                  -        max_tokens=self.config.max_tokens,
                                  -        load_from_hf=self.config.load_from_hf
                                  -    )
                                  -    return data
                                  -
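And the matching hypothetical reload (arguments must mirror those used when the neighbors were dumped; with load_from_hf set, the cached file is fetched from the HF Hub instead of the local cache):

neighbors = ds.load_neighbors(train=True, num_neighbors=25, model="bert", in_place_swap=True)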
                                  @@ -1040,7 +383,6 @@

                                  Methods

                                  MIMIR -

                                  Index

                                    @@ -1077,7 +419,7 @@

                                    Data

                                    - \ No newline at end of file + diff --git a/docs/index.html b/docs/index.html index bf42f4f..78d7a60 100644 --- a/docs/index.html +++ b/docs/index.html @@ -2,18 +2,21 @@ - - + + mimir API documentation - - - - - - + + + + + + - - + +
                                    @@ -70,7 +73,6 @@

                                    Sub-modules

                                    MIMIR -

                                    Index

                                      @@ -90,7 +92,7 @@

                                      Index

                                      - \ No newline at end of file + diff --git a/docs/models.html b/docs/models.html index 568f229..9985c38 100644 --- a/docs/models.html +++ b/docs/models.html @@ -2,18 +2,21 @@ - - + + mimir.models API documentation - - - - - - + + + + + + - - + +
                                      @@ -23,635 +26,6 @@

                                      Module mimir.models

                                      Model definitions, with basic helper functions. Supports any model as long as it supports the functions specified in Model.
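As a rough sketch of what "supports the functions specified in Model" means in practice: a subclass only needs to set the model, tokenizer, device and name attributes and call load_model_properties(). The snippet below is an assumption-laden illustration (the class and model names are hypothetical), not part of the library:

import transformers
from mimir.models import Model

class MyCausalLM(Model):
    # Hypothetical wrapper around an arbitrary HF causal LM, usable as a target or scoring model.
    def __init__(self, config, name: str = "gpt2"):
        super().__init__(config)
        self.device = config.env_config.device
        self.name = name
        self.model = transformers.AutoModelForCausalLM.from_pretrained(name, cache_dir=self.cache_dir)
        self.tokenizer = transformers.AutoTokenizer.from_pretrained(name, cache_dir=self.cache_dir)
        self.load_model_properties()  # sets self.max_length and self.stride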

                                      -
                                      - -Expand source code - -
                                      """
                                      -    Model definitions, with basic helper functions. Supports any model as long as it supports the functions specified in Model.
                                      -"""
                                      -import torch
                                      -import torch.nn as nn
                                      -import openai
                                      -from typing import List
                                      -import numpy as np
                                      -import transformers
                                      -import time
                                      -from collections import defaultdict
                                      -from multiprocessing.pool import ThreadPool
                                      -import torch.nn.functional as F
                                      -from transformers import AutoTokenizer, AutoModelForSequenceClassification
                                      -from hf_olmo import *
                                      -
                                      -from mimir.config import ExperimentConfig
                                      -from mimir.custom_datasets import SEPARATOR
                                      -from mimir.data_utils import drop_last_word
                                      -
                                      -
                                      -class Model(nn.Module):
                                      -    """
                                      -        Base class (for LLMs).
                                      -    """
                                      -    def __init__(self, config: ExperimentConfig, **kwargs):
                                      -        super().__init__()
                                      -        self.model = None # Set by child class
                                      -        self.tokenizer = None # Set by child class
                                      -        self.config = config
                                      -        self.device = None
                                      -        self.device_map = None
                                      -        self.name = None
                                      -        self.kwargs = kwargs
                                      -        self.cache_dir = self.config.env_config.cache_dir
                                      -
                                      -    def to(self, device):
                                      -        """
                                      -            Shift model to a particular device.
                                      -        """
                                      -        self.model.to(device, non_blocking=True)
                                      -
                                      -    def load(self):
                                      -        """
                                      -            Load model onto GPU (and compile, if requested) if not already loaded with device map.
                                      -        """
                                      -        if not self.device_map:
                                      -            start = time.time()
                                      -            try:
                                      -                self.model.cpu()
                                      -            except NameError:
                                      -                pass
                                      -            if self.config.openai_config is None:
                                      -                self.model.to(self.device, non_blocking=True)
                                      -            if self.config.env_config.compile:
-                self.model = torch.compile(self.model)
                                      -            print(f'DONE ({time.time() - start:.2f}s)')
                                      -
                                      -    def unload(self):
                                      -        """
                                      -            Unload model from GPU
                                      -        """
                                      -        start = time.time()
                                      -        try:
                                      -            self.model.cpu()
                                      -        except NameError:
                                      -            pass
                                      -        print(f'DONE ({time.time() - start:.2f}s)')
                                      -
                                      -    def get_probabilities(self,
                                      -                          text: str,
                                      -                          tokens: np.ndarray = None,
                                      -                          no_grads: bool = True,
                                      -                          return_all_probs: bool = False):
                                      -        """
                                      -            Get the probabilities or log-softmaxed logits for a text under the current model.
                                      -            Args:
                                      -                text (str): The input text for which to calculate probabilities.
                                      -                tokens (numpy.ndarray, optional): An optional array of token ids. If provided, these tokens
                                      -                are used instead of tokenizing the input text. Defaults to None.
                                      -
                                      -            Raises:
                                      -                ValueError: If the device or name attributes of the instance are not set.
                                      -
                                      -            Returns:
                                      -                list: A list of probabilities.
                                      -        """
                                      -        with torch.set_grad_enabled(not no_grads):
                                      -            if self.device is None or self.name is None:
                                      -                raise ValueError("Please set self.device and self.name in child class")
                                      -
                                      -            if tokens is not None:
                                      -                labels = torch.from_numpy(tokens.astype(np.int64)).type(torch.LongTensor)
                                      -                if labels.shape[0] != 1:
                                      -                    # expand first dimension
                                      -                    labels = labels.unsqueeze(0)
                                      -            else:
                                      -                tokenized = self.tokenizer(
                                      -                    text, return_tensors="pt")
                                      -                labels = tokenized.input_ids
                                      -
                                      -            target_token_log_prob = []
                                      -            all_token_log_prob = []
                                      -            for i in range(0, labels.size(1), self.stride):
                                      -                begin_loc = max(i + self.stride - self.max_length, 0)
                                      -                end_loc = min(i + self.stride, labels.size(1))
                                      -                trg_len = end_loc - i  # may be different from stride on last loop
                                      -                input_ids = labels[:, begin_loc:end_loc].to(self.device)
                                      -                target_ids = input_ids.clone()
                                      -                target_ids[:, :-trg_len] = -100
                                      -
                                      -                logits = self.model(input_ids, labels=target_ids).logits
                                      -                if no_grads:
                                      -                    logits = logits.cpu()
                                      -                shift_logits = logits[..., :-1, :].contiguous()
                                      -                log_probabilities = torch.nn.functional.log_softmax(shift_logits, dim=-1)
                                      -                shift_labels = target_ids[..., 1:]
                                      -                if no_grads:
                                      -                    shift_labels = shift_labels.cpu()
                                      -                shift_labels = shift_labels.contiguous()
                                      -                labels_processed = shift_labels[0]
                                      -
                                      -                del input_ids
                                      -                del target_ids
                                      -
                                      -                for i, token_id in enumerate(labels_processed):
                                      -                    if token_id != -100:
                                      -                        log_probability = log_probabilities[0, i, token_id]
                                      -                        if no_grads:
                                      -                            log_probability = log_probability.item()
                                      -                        target_token_log_prob.append(log_probability)
                                      -                        all_token_log_prob.append(log_probabilities[0, i])
                                      -            
                                      -            # Should be equal to # of tokens - 1 to account for shift
                                      -            assert len(target_token_log_prob) == labels.size(1) - 1
                                      -            all_token_log_prob = torch.stack(all_token_log_prob, dim=0)
                                      -            assert len(target_token_log_prob) == len(all_token_log_prob)
                                      -
                                      -        if not no_grads:
                                      -            target_token_log_prob = torch.stack(target_token_log_prob)
                                      -
                                      -        if not return_all_probs:
                                      -            return target_token_log_prob
                                      -        return target_token_log_prob, all_token_log_prob
                                      -
                                      -    @torch.no_grad()
                                      -    def get_ll(self,
                                      -               text: str,
                                      -               tokens: np.ndarray=None,
                                      -               probs = None):
                                      -        """
                                      -            Get the log likelihood of each text under the base_model.
                                      -
                                      -            Args:
                                      -                text (str): The input text for which to calculate the log likelihood.
                                      -                tokens (numpy.ndarray, optional): An optional array of token ids. If provided, these tokens
                                      -                are used instead of tokenizing the input text. Defaults to None.
                                      -                probs (list, optional): An optional list of probabilities. If provided, these probabilities
                                      -                are used instead of calling the `get_probabilities` method. Defaults to None.
                                      -        """
                                      -        all_prob = probs if probs is not None else self.get_probabilities(text, tokens=tokens)
                                      -        return -np.mean(all_prob)
                                      -
                                      -    def load_base_model_and_tokenizer(self, model_kwargs):
                                      -        """
                                      -            Load the base model and tokenizer for a given model name.
                                      -        """
                                      -        if self.device is None or self.name is None:
                                      -            raise ValueError("Please set self.device and self.name in child class")
                                      -
                                      -        if self.config.openai_config is None:
                                      -            print(f'Loading BASE model {self.name}...')
                                      -            device_map = self.device_map # if self.device_map else 'cpu'
                                      -            if "silo" in self.name or "balanced" in self.name:
                                      -                from utils.transformers.model import OpenLMforCausalLM
                                      -                model = OpenLMforCausalLM.from_pretrained(
                                      -                    self.name, **model_kwargs, device_map=self.device, cache_dir=self.cache_dir)
-                # Extract the model from the model wrapper so we don't need to call model.model
                                      -            elif "llama" in self.name or "alpaca" in self.name:
                                      -                # TODO: This should be smth specified in config in case user has
                                      -                # llama is too big, gotta use device map
                                      -                model = transformers.AutoModelForCausalLM.from_pretrained(self.name, **model_kwargs, device_map="balanced_low_0", cache_dir=self.cache_dir)
                                      -                self.device = 'cuda:1'
                                      -            elif "stablelm" in self.name.lower():  # models requiring custom code
                                      -                model = transformers.AutoModelForCausalLM.from_pretrained(
                                      -                    self.name, **model_kwargs, trust_remote_code=True, device_map=device_map, cache_dir=self.cache_dir)
                                      -            elif "olmo" in self.name.lower():
                                      -                model = transformers.AutoModelForCausalLM.from_pretrained(
                                      -                    self.name, **model_kwargs, trust_remote_code=True, cache_dir=self.cache_dir)
                                      -            else:
                                      -                model = transformers.AutoModelForCausalLM.from_pretrained(
                                      -                    self.name, **model_kwargs, device_map=device_map, cache_dir=self.cache_dir)
                                      -        else:
                                      -            model = None
                                      -
                                      -        optional_tok_kwargs = {}
                                      -        if "facebook/opt-" in self.name:
                                      -            print("Using non-fast tokenizer for OPT")
                                      -            optional_tok_kwargs['fast'] = False
                                      -        if self.config.dataset_member in ['pubmed'] or self.config.dataset_nonmember in ['pubmed']:
                                      -            optional_tok_kwargs['padding_side'] = 'left'
                                      -            self.pad_token = self.tokenizer.eos_token_id
                                      -        if "silo" in self.name or "balanced" in self.name:
                                      -            tokenizer = transformers.GPTNeoXTokenizerFast.from_pretrained(
                                      -                "EleutherAI/gpt-neox-20b", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                      -        elif "datablations" in self.name:
                                      -            tokenizer = transformers.AutoTokenizer.from_pretrained(
                                      -                "gpt2", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                      -        elif "llama" in self.name or "alpaca" in self.name:
                                      -            tokenizer = transformers.LlamaTokenizer.from_pretrained(
                                      -                self.name, **optional_tok_kwargs, cache_dir=self.cache_dir)
                                      -        elif "pubmedgpt" in self.name:
                                      -            tokenizer = transformers.AutoTokenizer.from_pretrained(
                                      -                "stanford-crfm/BioMedLM", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                      -        else:
                                      -            tokenizer = transformers.AutoTokenizer.from_pretrained(
                                      -                self.name, **optional_tok_kwargs, cache_dir=self.cache_dir,
                                      -                trust_remote_code=True if "olmo" in self.name.lower() else False)
                                      -        tokenizer.add_special_tokens({'pad_token': '[PAD]'})
                                      -
                                      -        return model, tokenizer
                                      -
                                      -    def load_model_properties(self):
                                      -        """
                                      -            Load model properties, such as max length and stride.
                                      -        """
                                      -        # TODO: getting max_length of input could be more generic
                                      -        if "silo" in self.name or "balanced" in self.name:
                                      -            self.max_length = self.model.model.seq_len
                                      -        elif hasattr(self.model.config, 'max_position_embeddings'):
                                      -            self.max_length = self.model.config.max_position_embeddings
                                      -        elif hasattr(self.model.config, 'n_positions'):
                                      -            self.max_length = self.model.config.n_positions
                                      -        else:
                                      -            # Default window size
                                      -            self.max_length = 1024
                                      -        self.stride = self.max_length // 2
                                      -
                                      -
                                      -class ReferenceModel(Model):
                                      -    """
                                      -        Wrapper for reference model
                                      -    """
                                      -    def __init__(self, config: ExperimentConfig, name: str):
                                      -        super().__init__(config)
                                      -        self.device = self.config.env_config.device_aux
                                      -        self.name = name
                                      -        base_model_kwargs = {'revision': 'main'}
                                      -        if 'gpt-j' in self.name or 'neox' in self.name or 'llama' in self.name or 'alpaca' in self.name:
                                      -            base_model_kwargs.update(dict(torch_dtype=torch.float16))
                                      -        if 'gpt-j' in self.name:
                                      -            base_model_kwargs.update(dict(revision='float16'))
                                      -        if ':' in self.name:
                                      -            print("Applying ref model revision")
                                      -            # Allow them to provide revisions as part of model name, then parse accordingly
                                      -            split = self.name.split(':')
                                      -            self.name = split[0]
                                      -            base_model_kwargs.update(dict(revision=split[-1]))
                                      -        self.model, self.tokenizer = self.load_base_model_and_tokenizer(
                                      -            model_kwargs=base_model_kwargs)
                                      -        self.load_model_properties()
                                      -
                                      -    def load(self):
                                      -        """
-        Load reference model onto GPU(s)
                                      -        """
                                      -        if "llama" not in self.name and "alpaca" not in self.name:
                                      -            super().load()
                                      -
                                      -    def unload(self):
                                      -        """
                                      -        Unload reference model from GPU(s)
                                      -        """
                                      -        if "llama" not in self.name and "alpaca" not in self.name:
                                      -            super().unload()
                                      -
                                      -
                                      -class QuantileReferenceModel(Model):
                                      -    """
-        Wrapper for reference model, specifically used for quantile regression
                                      -    """
                                      -    def __init__(self, config: ExperimentConfig, name: str):
                                      -        super().__init__(config)
                                      -        self.device = self.config.env_config.device_aux
                                      -        self.name = name
                                      -        self.tokenizer = AutoTokenizer.from_pretrained(
                                      -            name, use_fast=False)
                                      -        self.model = AutoModelForSequenceClassification.from_pretrained(
                                      -            name,
                                      -            num_labels=2,
                                      -            max_position_embeddings=1024)
                                      -        # Modify model's last linear layer to have only 1 output
                                      -        self.model.classifier.linear_out = nn.Linear(self.model.classifier.linear_out.in_features, 1)
                                      -        self.load_model_properties()
                                      -
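# Illustrative sketch (editor addition, not part of the module source): the class above
# replaces the 2-label classification head with a single linear output, so the sequence
# classifier predicts one scalar quantile per text. A minimal standalone version of that
# head surgery with a hypothetical backbone (the attribute name depends on the
# architecture; the class above uses `classifier.linear_out`):
#
#   from transformers import AutoModelForSequenceClassification
#   import torch.nn as nn
#   m = AutoModelForSequenceClassification.from_pretrained("roberta-base", num_labels=2)
#   m.classifier.out_proj = nn.Linear(m.classifier.out_proj.in_features, 1)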
                                      -
                                      -class LanguageModel(Model):
                                      -    """
-        Generic LM -- used most often for target model
                                      -    """
                                      -    def __init__(self, config: ExperimentConfig, **kwargs):
                                      -        super().__init__(config, **kwargs)
                                      -        self.device = self.config.env_config.device
                                      -        self.device_map = self.config.env_config.device_map
                                      -        # Use provided name (if provided)
                                      -        # Relevant for scoring-model scenario
                                      -        self.name = self.kwargs.get('name', self.config.base_model)
                                      -
                                      -        base_model_kwargs = {}
                                      -        if config.revision:
                                      -            base_model_kwargs.update(dict(revision=config.revision))
                                      -        if 'gpt-j' in self.name or 'neox' in self.name:
                                      -            base_model_kwargs.update(dict(torch_dtype=torch.float16))
                                      -        if 'gpt-j' in self.name:
                                      -            base_model_kwargs.update(dict(revision='float16'))
                                      -        self.model, self.tokenizer = self.load_base_model_and_tokenizer(
                                      -            model_kwargs=base_model_kwargs)
                                      -        self.load_model_properties()
                                      -
                                      -    @torch.no_grad()
                                      -    def get_ref(self, text: str, ref_model: ReferenceModel, tokens=None, probs=None):
                                      -        """
                                      -            Compute the loss of a given text calibrated against the text's loss under a reference model -- MIA baseline
                                      -        """
                                      -        lls = self.get_ll(text, tokens=tokens, probs=probs)
                                      -        lls_ref = ref_model.get_ll(text)
                                      -
                                      -        return lls - lls_ref
                                      -
                                      -    @torch.no_grad()
                                      -    def get_rank(self, text: str, log: bool=False):
                                      -        """
                                      -            Get the average rank of each observed token sorted by model likelihood
                                      -        """
                                      -        openai_config = self.config.openai_config
                                      -        assert openai_config is None, "get_rank not implemented for OpenAI models"
                                      -
                                      -        tokenized = self.tokenizer(text, return_tensors="pt").to(self.device)
                                      -        logits = self.model(**tokenized).logits[:,:-1]
                                      -        labels = tokenized.input_ids[:,1:]
                                      -
                                      -        # get rank of each label token in the model's likelihood ordering
                                      -        matches = (logits.argsort(-1, descending=True) == labels.unsqueeze(-1)).nonzero()
                                      -
                                      -        assert matches.shape[1] == 3, f"Expected 3 dimensions in matches tensor, got {matches.shape}"
                                      -
                                      -        ranks, timesteps = matches[:,-1], matches[:,-2]
                                      -
                                      -        # make sure we got exactly one match for each timestep in the sequence
                                      -        assert (timesteps == torch.arange(len(timesteps)).to(timesteps.device)).all(), "Expected one match per timestep"
                                      -
                                      -        ranks = ranks.float() + 1 # convert to 1-indexed rank
                                      -        if log:
                                      -            ranks = torch.log(ranks)
                                      -
                                      -        return ranks.float().mean().item()
                                      -
                                      -    # TODO extend for longer sequences
                                      -    @torch.no_grad()
                                      -    def get_lls(self, texts: List[str], batch_size: int = 6):
                                      -        #return [self.get_ll(text) for text in texts] # -np.mean([self.get_ll(text) for text in texts])
                                      -        # tokenized = self.tokenizer(texts, return_tensors="pt", padding=True)
                                      -        # labels = tokenized.input_ids
                                      -        total_size = len(texts)
                                      -        losses = []
                                      -        for i in range(0, total_size, batch_size):
                                      -            # Delegate batches and tokenize
                                      -            batch = texts[i:i+batch_size]
                                      -            tokenized = self.tokenizer(batch, return_tensors="pt", padding=True, return_attention_mask=True)
                                      -            label_batch = tokenized.input_ids
                                      -            
                                      -            # # mask out padding tokens
                                      -            attention_mask = tokenized.attention_mask
                                      -            assert attention_mask.size() == label_batch.size()
                                      -
                                      -            needs_sliding = label_batch.size(1) > self.max_length // 2
                                      -            if not needs_sliding:
                                      -                label_batch = label_batch.to(self.device)
                                      -                attention_mask = attention_mask.to(self.device)
                                      -
                                      -            # Collect token probabilities per sample in batch
                                      -            all_prob = defaultdict(list)
                                      -            for i in range(0, label_batch.size(1), self.stride):
                                      -                begin_loc = max(i + self.stride - self.max_length, 0)
                                      -                end_loc = min(i + self.stride, label_batch.size(1))
                                      -                trg_len = end_loc - i  # may be different from stride on last loop
                                      -                input_ids = label_batch[:, begin_loc:end_loc]
                                      -                mask = attention_mask[:, begin_loc:end_loc]
                                      -                if needs_sliding:
                                      -                    input_ids = input_ids.to(self.device)
                                      -                    mask = mask.to(self.device)
                                      -                    
                                      -                target_ids = input_ids.clone()
                                      -                # Don't count padded tokens or tokens that already have computed probabilities
                                      -                target_ids[:, :-trg_len] = -100
                                      -                # target_ids[attention_mask == 0] = -100
                                      -                
                                      -                logits = self.model(input_ids, labels=target_ids, attention_mask=mask).logits.cpu()
                                      -                target_ids = target_ids.cpu()
                                      -                shift_logits = logits[..., :-1, :].contiguous()
                                      -                probabilities = torch.nn.functional.log_softmax(shift_logits, dim=-1)
                                      -                shift_labels = target_ids[..., 1:].contiguous()
                                      -
                                      -                for i, sample in enumerate(shift_labels):
                                      -                    for j, token_id in enumerate(sample):
                                      -                        if token_id != -100 and token_id != self.tokenizer.pad_token_id:
                                      -                            probability = probabilities[i, j, token_id].item()
                                      -                            all_prob[i].append(probability)
                                      -
                                      -                del input_ids
                                      -                del mask
                                      -            
                                      -            # average over each sample to get losses
                                      -            batch_losses = [-np.mean(all_prob[idx]) for idx in range(label_batch.size(0))]
                                      -            # print(batch_losses)
                                      -            losses.extend(batch_losses)
                                      -            del label_batch
                                      -            del attention_mask
                                      -        return losses #np.mean(losses)
                                      -
                                      -    def sample_from_model(self, texts: List[str], **kwargs):
                                      -        """
                                      -            Sample from base_model using ****only**** the first 30 tokens in each example as context
                                      -        """
                                      -        min_words = kwargs.get('min_words', 55)
                                      -        max_words = kwargs.get('max_words', 200)
                                      -        prompt_tokens = kwargs.get('prompt_tokens', 30)
                                      -
                                      -        # encode each text as a list of token ids
                                      -        if self.config.dataset_member == 'pubmed':
                                      -            texts = [t[:t.index(SEPARATOR)] for t in texts]
                                      -            all_encoded = self.tokenizer(texts, return_tensors="pt", padding=True).to(self.device, non_blocking=True)
                                      -        else:
                                      -            all_encoded = self.tokenizer(texts, return_tensors="pt", padding=True).to(self.device, non_blocking=True)
                                      -            all_encoded = {key: value[:, :prompt_tokens] for key, value in all_encoded.items()}
                                      -
                                      -        decoded = ['' for _ in range(len(texts))]
                                      -
                                      -        # sample from the model until we get a sample with at least min_words words for each example
                                      -        # this is an inefficient way to do this (since we regenerate for all inputs if just one is too short), but it works
                                      -        tries = 0
                                      -        while (m := min(len(x.split()) for x in decoded)) < min_words and tries <  self.config.neighborhood_config.top_p:
                                      -            if tries != 0:
                                      -                print()
                                      -                print(f"min words: {m}, needed {min_words}, regenerating (try {tries})")
                                      -
                                      -            sampling_kwargs = {}
                                      -            if self.config.do_top_p:
                                      -                sampling_kwargs['top_p'] = self.config.top_p
                                      -            elif self.config.do_top_k:
                                      -                sampling_kwargs['top_k'] = self.config.top_k
                                      -            #min_length = 50 if config.dataset_member in ['pubmed'] else 150
                                      -
                                      -            #outputs = base_model.generate(**all_encoded, min_length=min_length, max_length=max_length, do_sample=True, **sampling_kwargs, pad_token_id=base_tokenizer.eos_token_id, eos_token_id=base_tokenizer.eos_token_id)
                                      -            #removed minlen and attention mask min_length=min_length, max_length=200, do_sample=True,pad_token_id=base_tokenizer.eos_token_id,
                                      -            outputs = self.model.generate(**all_encoded, min_length=min_words*2, max_length=max_words*3,  **sampling_kwargs,  eos_token_id=self.tokenizer.eos_token_id)
                                      -            decoded = self.tokenizer.batch_decode(outputs, skip_special_tokens=True)
                                      -            tries += 1
                                      -
                                      -        return decoded
                                      -
                                      -    @torch.no_grad()
                                      -    def get_entropy(self, text: str):
                                      -        """
                                      -            Get average entropy of each token in the text
                                      -        """
                                      -        # raise NotImplementedError("get_entropy not implemented for OpenAI models")
                                      -        
                                      -        tokenized = self.tokenizer(text, return_tensors="pt").to(self.device)
                                      -        logits = self.model(**tokenized).logits[:,:-1]
                                      -        neg_entropy = F.softmax(logits, dim=-1) * F.log_softmax(logits, dim=-1)
                                      -        return -neg_entropy.sum(-1).mean().item()
                                      -    
                                      -    @torch.no_grad()
                                      -    def get_max_norm(self, text: str, context_len=None, tk_freq_map=None):
                                      -        # TODO: update like other attacks
                                      -        tokenized = self.tokenizer(
                                      -            text, return_tensors="pt").to(self.device)
                                      -        labels = tokenized.input_ids
                                      -
                                      -        max_length = context_len if context_len is not None else self.max_length
                                      -        stride = max_length // 2 #self.stride
                                      -        all_prob = []
                                      -        for i in range(0, labels.size(1), stride):
                                      -            begin_loc = max(i + stride - max_length, 0)
                                      -            end_loc = min(i + stride, labels.size(1))
                                      -            trg_len = end_loc - i  # may be different from stride on last loop
                                      -            input_ids = labels[:, begin_loc:end_loc]
                                      -            target_ids = input_ids.clone()
                                      -            target_ids[:, :-trg_len] = -100
                                      -
                                      -            outputs = self.model(input_ids, labels=target_ids)
                                      -            logits = outputs.logits
                                      -            # Shift so that tokens < n predict n
                                      -            # print(logits.shape)
                                      -            shift_logits = logits[..., :-1, :].contiguous()
                                      -            # shift_logits = torch.transpose(shift_logits, 1, 2)
                                      -            probabilities = torch.nn.functional.log_softmax(shift_logits, dim=-1)
                                      -            shift_labels = target_ids[..., 1:].contiguous()
                                      -            labels_processed = shift_labels[0]
                                      -
                                      -            for i, token_id in enumerate(labels_processed):
                                      -                if token_id != -100:
                                      -                    probability = probabilities[0, i, token_id].item()
                                      -                    max_tk_prob = torch.max(probabilities[0, i]).item()
                                      -                    tk_weight = max(tk_freq_map[token_id.item()], 1) / sum(tk_freq_map.values()) if tk_freq_map is not None else 1
                                      -                    if tk_weight == 0:
                                      -                        print("0 count token", token_id.item())
                                      -                    tk_norm = tk_weight
                                      -                    all_prob.append((1 - (max_tk_prob - probability)) / tk_norm)
                                      -
                                      -        # Should be equal to # of tokens - 1 to account for shift
                                      -        assert len(all_prob) == labels.size(1) - 1
                                      -        return -np.mean(all_prob)
                                      -
                                      -
                                      -class OpenAI_APIModel(LanguageModel):
                                      -    """
                                      -        Wrapper for OpenAI API calls
                                      -    """
                                      -    def __init__(self, config: ExperimentConfig, **kwargs):
                                      -        super().__init__(config, **kwargs)
                                      -        self.model = None
                                      -        self.tokenizer = transformers.GPT2Tokenizer.from_pretrained('gpt2', cache_dir=self.cache_dir)
                                      -        self.API_TOKEN_COUNTER = 0
                                      -    
                                      -    @property
                                      -    def api_calls(self):
                                      -        """
                                      -            Get the number of tokens used in API calls
                                      -        """
                                      -        return self.API_TOKEN_COUNTER
                                      -
                                      -    @torch.no_grad()
                                      -    def get_ll(self, text: str):
                                      -        """
-            Get the log likelihood of the given text under the base_model
                                      -        """
                                      -        openai_config = self.config.openai_config
                                      -
                                      -        kwargs = {"engine": openai_config.model, "temperature": 0, "max_tokens": 0, "echo": True, "logprobs": 0}
                                      -        r = openai.Completion.create(prompt=f"<|endoftext|>{text}", **kwargs)
                                      -        result = r['choices'][0]
                                      -        tokens, logprobs = result["logprobs"]["tokens"][1:], result["logprobs"]["token_logprobs"][1:]
                                      -
                                      -        assert len(tokens) == len(logprobs), f"Expected {len(tokens)} logprobs, got {len(logprobs)}"
                                      -
                                      -        return np.mean(logprobs)
                                      -
                                      -    @torch.no_grad()
                                      -    def get_ref(self, text: str, ref_model: ReferenceModel):
                                      -        """
-            Get the likelihood ratio of the given text under the base_model -- MIA baseline
                                      -        """
                                      -        raise NotImplementedError("OpenAI model not implemented for LIRA")
                                      -        openai_config = self.config.openai_config
                                      -        kwargs = {"engine": openai_config.model, "temperature": 0,
                                      -                    "max_tokens": 0, "echo": True, "logprobs": 0}
                                      -        r = openai.Completion.create(prompt=f"<|endoftext|>{text}", **kwargs)
                                      -        result = r['choices'][0]
                                      -        tokens, logprobs = result["logprobs"]["tokens"][1:], result["logprobs"]["token_logprobs"][1:]
                                      -
                                      -        assert len(tokens) == len(logprobs), f"Expected {len(tokens)} logprobs, got {len(logprobs)}"
                                      -
                                      -        return np.mean(logprobs)
                                      -
                                      -    def get_lls(self, texts: str):
                                      -
                                      -        # use GPT2_TOKENIZER to get total number of tokens
                                      -        total_tokens = sum(len(self.tokenizer.encode(text)) for text in texts)
                                      -        self.API_TOKEN_COUNTER += total_tokens * 2  # multiply by two because OpenAI double-counts echo_prompt tokens
                                      -
                                      -        pool = ThreadPool(self.config.batch_size)
                                      -        return pool.map(self.get_ll, texts)
                                      -
                                      -    def _openai_sample(self, p: str):
                                      -        openai_config = self.config.openai_config
                                      -        if self.config.dataset_member != 'pubmed':  # keep Answer: prefix for pubmed
                                      -            p = drop_last_word(p)
                                      -
                                      -        # sample from the openai model
                                      -        kwargs = { "engine": openai_config.model, "max_tokens": 200 }
                                      -        if self.config.do_top_p:
                                      -            kwargs['top_p'] = self.config.top_p
                                      -    
                                      -        r = openai.Completion.create(prompt=f"{p}", **kwargs)
                                      -        return p + r['choices'][0].text
                                      -
                                      -
                                      -    def sample_from_model(self, texts: List[str], **kwargs):
                                      -        """
                                      -            Sample from base_model using ****only**** the first 30 tokens in each example as context
                                      -        """
                                      -        prompt_tokens = kwargs.get('prompt_tokens', 30)
                                      -        base_tokenizer = kwargs.get('base_tokenizer', None)
                                      -        if base_tokenizer is None:
                                      -            raise ValueError("Please provide base_tokenizer")
                                      -
                                      -        # encode each text as a list of token ids
                                      -        if self.config.dataset_member == 'pubmed':
                                      -            texts = [t[:t.index(SEPARATOR)] for t in texts]
                                      -            all_encoded = base_tokenizer(texts, return_tensors="pt", padding=True).to(self.device)
                                      -        else:
                                      -            all_encoded = base_tokenizer(texts, return_tensors="pt", padding=True).to(self.device)
                                      -            all_encoded = {key: value[:, :prompt_tokens] for key, value in all_encoded.items()}
                                      -
                                      -        # decode the prefixes back into text
                                      -        prefixes = base_tokenizer.batch_decode(all_encoded['input_ids'], skip_special_tokens=True)
                                      -        pool = ThreadPool(self.config.batch_size)
                                      -
                                      -        decoded = pool.map(self._openai_sample, prefixes)
                                      -
                                      -        # count total number of tokens with GPT2_TOKENIZER
                                      -        total_tokens = sum(len(self.tokenizer.encode(x)) for x in decoded)
                                      -        self.API_TOKEN_COUNTER += total_tokens
                                      -
                                      -        return decoded
                                      -    
                                      -    @torch.no_grad()
                                      -    def get_entropy(self, text: str):
                                      -        """
                                      -            Get average entropy of each token in the text
                                      -        """
                                      -        raise NotImplementedError("get_entropy not implemented for OpenAI models")
                                      -
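# Illustrative sketch (editor addition): the token accounting that get_lls above performs
# before issuing API requests -- count GPT-2 tokens and double them, since the API
# double-counts echoed prompt tokens. Only the tokenizer is needed, so this runs offline;
# the texts are made up.
from transformers import GPT2Tokenizer

texts = [
    "Membership inference asks whether a sample was part of the training data.",
    "Reference models are used to calibrate the target model's loss.",
]
tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
total_tokens = sum(len(tokenizer.encode(t)) for t in texts)
print(f"{total_tokens} prompt tokens -> ~{total_tokens * 2} tokens counted against the API")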
                                      @@ -901,21 +275,6 @@

                                      Subclasses

                                      -

                                      Class variables

                                      -
                                      -
                                      var call_super_init : bool
                                      -
                                      -
                                      -
                                      -
                                      var dump_patches : bool
                                      -
                                      -
                                      -
                                      -
                                      var training : bool
                                      -
                                      -
                                      -
                                      -

                                      Methods

                                      @@ -923,262 +282,42 @@

                                      Methods

                                      Get average entropy of each token in the text

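A minimal standalone sketch of the entropy computation documented above, using random logits instead of a loaded model (shapes are illustrative):

import torch
import torch.nn.functional as F

logits = torch.randn(1, 16, 50257)   # (batch, seq_len, vocab); 50257 is the GPT-2 vocab size
neg_entropy = F.softmax(logits, dim=-1) * F.log_softmax(logits, dim=-1)
avg_entropy = -neg_entropy.sum(-1).mean().item()   # average per-token entropy in nats
print(avg_entropy)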
                                      def get_lls(self, texts: List[str], batch_size: int = 6)
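Each entry returned by get_lls is the negative mean per-token log-likelihood of a text. A standalone sketch for a single short text with GPT-2 (model choice and text are illustrative; the method above additionally batches texts and slides a window over long inputs):

import torch
from transformers import GPT2LMHeadModel, GPT2Tokenizer

tokenizer = GPT2Tokenizer.from_pretrained("gpt2")
model = GPT2LMHeadModel.from_pretrained("gpt2").eval()

text = "Membership inference attacks score how familiar a model is with a text."
ids = tokenizer(text, return_tensors="pt").input_ids
with torch.no_grad():
    log_probs = torch.log_softmax(model(ids).logits[:, :-1], dim=-1)
token_lls = log_probs.gather(-1, ids[:, 1:].unsqueeze(-1)).squeeze(-1)
print(-token_lls.mean().item())   # the per-text loss that get_lls would append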
                                      def get_max_norm(self, text: str, context_len=None, tk_freq_map=None)
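A standalone sketch of the per-token quantity get_max_norm accumulates: the gap between the most likely token's log-probability and the observed token's log-probability, optionally divided by a token-frequency weight (random values here, purely illustrative):

import numpy as np
import torch

log_probs = torch.log_softmax(torch.randn(8, 100), dim=-1)   # 8 positions, toy vocab of 100
labels = torch.randint(0, 100, (8,))                          # observed token ids

scores = []
for i, token_id in enumerate(labels):
    p = log_probs[i, token_id].item()
    max_p = log_probs[i].max().item()
    tk_weight = 1.0                                           # stand-in for the tk_freq_map weight
    scores.append((1 - (max_p - p)) / tk_weight)
print(-np.mean(scores))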
                                      def get_rank(self, text: str, log: bool = False)

                                      Get the average rank of each observed token sorted by model likelihood

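A standalone sketch of the rank computation described above, on random logits (the real method tokenizes the text and uses the target model's logits):

import torch

logits = torch.randn(1, 10, 1000)            # (batch, seq_len, vocab)
labels = torch.randint(0, 1000, (1, 10))     # observed next tokens

matches = (logits.argsort(-1, descending=True) == labels.unsqueeze(-1)).nonzero()
ranks = matches[:, -1].float() + 1           # 1-indexed rank of each observed token
print(ranks.mean().item())                   # lower average rank = model finds the text likelier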
                                      def get_ref(self, text: str, ref_model: ReferenceModel, tokens=None, probs=None)

                                      Compute the loss of a given text calibrated against the text's loss under a reference model – MIA baseline

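The calibrated score returned by get_ref is simply the difference between two losses, each a negative mean token log-likelihood as returned by get_ll. A tiny illustration with made-up numbers:

target_loss = 2.1   # get_ll of the text under the target model
ref_loss = 3.4      # get_ll of the same text under the reference model
score = target_loss - ref_loss   # more negative => target fits the text unusually well
print(score)        # ~ -1.3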
                                      def sample_from_model(self, texts: List[str], **kwargs)

                                      Sample from base_model using *only* the first 30 tokens in each example as context

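A standalone sketch of the regenerate-until-long-enough loop used above, with a stub in place of model.generate (the real method keeps only the first 30 tokens of each text as the prompt and re-samples the whole batch whenever any output is still too short):

import random

def fake_generate(prompts):
    # Stand-in for model.generate + batch_decode: one continuation per prompt.
    return [p + " " + " ".join("word" for _ in range(random.randint(20, 80))) for p in prompts]

prompts = ["Once upon a time", "In a recent study"]
min_words, max_tries = 55, 10

decoded = ["" for _ in prompts]
tries = 0
while min(len(x.split()) for x in decoded) < min_words and tries < max_tries:
    decoded = fake_generate(prompts)   # regenerate every prompt if any output is too short
    tries += 1
print([len(x.split()) for x in decoded])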

                                      Inherited members

                                      • Model: -


                                        Methods

                                        -
                                        -def forward(self, *input: Any) ‑> None -
                                        -
                                        -

                                        Define the computation performed at every call.

                                        -

                                        Should be overridden by all subclasses.

                                        -
                                        -

                                        Note

                                        -

Although the recipe for forward pass needs to be defined within this function, one should call the :class:`Module` instance afterwards instead of this since the former takes care of running the registered hooks while the latter silently ignores them.

                                        -
                                        -
                                        - -Expand source code - -
                                        def _forward_unimplemented(self, *input: Any) -> None:
                                        -    r"""Define the computation performed at every call.
                                        -
                                        -    Should be overridden by all subclasses.
                                        -
                                        -    .. note::
                                        -        Although the recipe for forward pass needs to be defined within
                                        -        this function, one should call the :class:`Module` instance afterwards
                                        -        instead of this since the former takes care of running the
                                        -        registered hooks while the latter silently ignores them.
                                        -    """
                                        -    raise NotImplementedError(f"Module [{type(self).__name__}] is missing the required \"forward\" function")
                                        -
                                        -
                                        def get_ll(self, text: str, tokens: numpy.ndarray = None, probs=None)
                                        @@ -1493,28 +586,6 @@

                                        Args

                                        An optional list of probabilities. If provided, these probabilities

                                        are used instead of calling the get_probabilities method. Defaults to None.

                                        -
- Expand source code
                                        @torch.no_grad()
                                        -def get_ll(self,
                                        -           text: str,
                                        -           tokens: np.ndarray=None,
                                        -           probs = None):
                                        -    """
-        Get the log likelihood of the given text under the base_model.
                                        -
                                        -        Args:
                                        -            text (str): The input text for which to calculate the log likelihood.
                                        -            tokens (numpy.ndarray, optional): An optional array of token ids. If provided, these tokens
                                        -            are used instead of tokenizing the input text. Defaults to None.
                                        -            probs (list, optional): An optional list of probabilities. If provided, these probabilities
                                        -            are used instead of calling the `get_probabilities` method. Defaults to None.
                                        -    """
                                        -    all_prob = probs if probs is not None else self.get_probabilities(text, tokens=tokens)
                                        -    return -np.mean(all_prob)
                                        -
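get_ll averages the per-token log-probabilities (computed by get_probabilities, or taken from the probs argument if supplied) and negates the result. A minimal sketch of that final step with illustrative numbers:

import numpy as np

token_log_probs = [-3.2, -0.8, -1.5, -2.9]   # illustrative per-token log-likelihoods
print(-np.mean(token_log_probs))             # ~2.1 -- the value get_ll returns for this text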
def get_probabilities(self, text: str, tokens: numpy.ndarray = None, no_grads: bool = True, return_all_probs: bool = False)
@@ -1539,244 +610,36 @@

                                        Returns

                                        list
                                        A list of probabilities.
                                        -
- Expand source code
                                        def get_probabilities(self,
                                        -                      text: str,
                                        -                      tokens: np.ndarray = None,
                                        -                      no_grads: bool = True,
                                        -                      return_all_probs: bool = False):
                                        -    """
                                        -        Get the probabilities or log-softmaxed logits for a text under the current model.
                                        -        Args:
                                        -            text (str): The input text for which to calculate probabilities.
                                        -            tokens (numpy.ndarray, optional): An optional array of token ids. If provided, these tokens
                                        -            are used instead of tokenizing the input text. Defaults to None.
                                        -
                                        -        Raises:
                                        -            ValueError: If the device or name attributes of the instance are not set.
                                        -
                                        -        Returns:
                                        -            list: A list of probabilities.
                                        -    """
                                        -    with torch.set_grad_enabled(not no_grads):
                                        -        if self.device is None or self.name is None:
                                        -            raise ValueError("Please set self.device and self.name in child class")
                                        -
                                        -        if tokens is not None:
                                        -            labels = torch.from_numpy(tokens.astype(np.int64)).type(torch.LongTensor)
                                        -            if labels.shape[0] != 1:
                                        -                # expand first dimension
                                        -                labels = labels.unsqueeze(0)
                                        -        else:
                                        -            tokenized = self.tokenizer(
                                        -                text, return_tensors="pt")
                                        -            labels = tokenized.input_ids
                                        -
                                        -        target_token_log_prob = []
                                        -        all_token_log_prob = []
                                        -        for i in range(0, labels.size(1), self.stride):
                                        -            begin_loc = max(i + self.stride - self.max_length, 0)
                                        -            end_loc = min(i + self.stride, labels.size(1))
                                        -            trg_len = end_loc - i  # may be different from stride on last loop
                                        -            input_ids = labels[:, begin_loc:end_loc].to(self.device)
                                        -            target_ids = input_ids.clone()
                                        -            target_ids[:, :-trg_len] = -100
                                        -
                                        -            logits = self.model(input_ids, labels=target_ids).logits
                                        -            if no_grads:
                                        -                logits = logits.cpu()
                                        -            shift_logits = logits[..., :-1, :].contiguous()
                                        -            log_probabilities = torch.nn.functional.log_softmax(shift_logits, dim=-1)
                                        -            shift_labels = target_ids[..., 1:]
                                        -            if no_grads:
                                        -                shift_labels = shift_labels.cpu()
                                        -            shift_labels = shift_labels.contiguous()
                                        -            labels_processed = shift_labels[0]
                                        -
                                        -            del input_ids
                                        -            del target_ids
                                        -
-            # use a separate index name so the window index i above is not shadowed
-            for idx, token_id in enumerate(labels_processed):
-                if token_id != -100:
-                    log_probability = log_probabilities[0, idx, token_id]
-                    if no_grads:
-                        log_probability = log_probability.item()
-                    target_token_log_prob.append(log_probability)
-                    all_token_log_prob.append(log_probabilities[0, idx])
                                        -        
                                        -        # Should be equal to # of tokens - 1 to account for shift
                                        -        assert len(target_token_log_prob) == labels.size(1) - 1
                                        -        all_token_log_prob = torch.stack(all_token_log_prob, dim=0)
                                        -        assert len(target_token_log_prob) == len(all_token_log_prob)
                                        -
                                        -    if not no_grads:
                                        -        target_token_log_prob = torch.stack(target_token_log_prob)
                                        -
                                        -    if not return_all_probs:
                                        -        return target_token_log_prob
                                        -    return target_token_log_prob, all_token_log_prob
                                        -
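For reference, the scoring above is a sliding-window log-softmax over shifted logits. A minimal self-contained sketch of the same idea (single window, no striding; the model name and text are placeholders, and this is not the mimir API itself):

# Sketch: per-token log-probabilities with plain transformers, mirroring the logic removed above.
import torch
import torch.nn.functional as F
from transformers import AutoModelForCausalLM, AutoTokenizer

name = "gpt2"  # placeholder model
tokenizer = AutoTokenizer.from_pretrained(name)
model = AutoModelForCausalLM.from_pretrained(name).eval()

text = "The quick brown fox jumps over the lazy dog."
ids = tokenizer(text, return_tensors="pt").input_ids

with torch.no_grad():
    logits = model(ids).logits                 # shape [1, T, V]
shift_logits = logits[:, :-1, :]               # position t predicts token t+1
shift_labels = ids[:, 1:]
log_probs = F.log_softmax(shift_logits, dim=-1)
token_log_probs = log_probs.gather(-1, shift_labels.unsqueeze(-1)).squeeze(-1)[0]
# len(token_log_probs) == ids.size(1) - 1, matching the assertion in the original code.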
                                        def load(self)

                                        Load model onto GPU (and compile, if requested) if not already loaded with device map.

                                        -
                                        def load(self):
                                        -    """
                                        -        Load model onto GPU (and compile, if requested) if not already loaded with device map.
                                        -    """
                                        -    if not self.device_map:
                                        -        start = time.time()
                                        -        try:
                                        -            self.model.cpu()
                                        -        except NameError:
                                        -            pass
                                        -        if self.config.openai_config is None:
                                        -            self.model.to(self.device, non_blocking=True)
                                        -        if self.config.env_config.compile:
-            self.model = torch.compile(self.model)  # torch.compile returns the optimized module; keep it
                                        -        print(f'DONE ({time.time() - start:.2f}s)')
                                        -
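The load step above amounts to a device move plus optional compilation. A standalone sketch under those assumptions (placeholder model; note that torch.compile returns the optimized module, so its return value should be kept):

# Sketch: move a model to GPU (if available) and optionally compile it.
import time
import torch
from transformers import AutoModelForCausalLM

model = AutoModelForCausalLM.from_pretrained("gpt2")  # placeholder model
device = "cuda" if torch.cuda.is_available() else "cpu"

start = time.time()
model.to(device, non_blocking=True)
if hasattr(torch, "compile"):        # torch >= 2.0
    model = torch.compile(model)     # keep the returned optimized module
print(f"DONE ({time.time() - start:.2f}s)")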
                                        def load_base_model_and_tokenizer(self, model_kwargs)

                                        Load the base model and tokenizer for a given model name.

                                        -
                                        def load_base_model_and_tokenizer(self, model_kwargs):
                                        -    """
                                        -        Load the base model and tokenizer for a given model name.
                                        -    """
                                        -    if self.device is None or self.name is None:
                                        -        raise ValueError("Please set self.device and self.name in child class")
                                        -
                                        -    if self.config.openai_config is None:
                                        -        print(f'Loading BASE model {self.name}...')
                                        -        device_map = self.device_map # if self.device_map else 'cpu'
                                        -        if "silo" in self.name or "balanced" in self.name:
                                        -            from utils.transformers.model import OpenLMforCausalLM
                                        -            model = OpenLMforCausalLM.from_pretrained(
                                        -                self.name, **model_kwargs, device_map=self.device, cache_dir=self.cache_dir)
-            # Extract the model from the model wrapper so we don't need to call model.model
                                        -        elif "llama" in self.name or "alpaca" in self.name:
-            # TODO: this should be specified in the config, depending on the user's hardware setup
-            # llama is too big for a single device, so a device map is used here
                                        -            model = transformers.AutoModelForCausalLM.from_pretrained(self.name, **model_kwargs, device_map="balanced_low_0", cache_dir=self.cache_dir)
                                        -            self.device = 'cuda:1'
                                        -        elif "stablelm" in self.name.lower():  # models requiring custom code
                                        -            model = transformers.AutoModelForCausalLM.from_pretrained(
                                        -                self.name, **model_kwargs, trust_remote_code=True, device_map=device_map, cache_dir=self.cache_dir)
                                        -        elif "olmo" in self.name.lower():
                                        -            model = transformers.AutoModelForCausalLM.from_pretrained(
                                        -                self.name, **model_kwargs, trust_remote_code=True, cache_dir=self.cache_dir)
                                        -        else:
                                        -            model = transformers.AutoModelForCausalLM.from_pretrained(
                                        -                self.name, **model_kwargs, device_map=device_map, cache_dir=self.cache_dir)
                                        -    else:
                                        -        model = None
                                        -
                                        -    optional_tok_kwargs = {}
                                        -    if "facebook/opt-" in self.name:
                                        -        print("Using non-fast tokenizer for OPT")
                                        -        optional_tok_kwargs['fast'] = False
                                        -    if self.config.dataset_member in ['pubmed'] or self.config.dataset_nonmember in ['pubmed']:
                                        -        optional_tok_kwargs['padding_side'] = 'left'
                                        -        self.pad_token = self.tokenizer.eos_token_id
                                        -    if "silo" in self.name or "balanced" in self.name:
                                        -        tokenizer = transformers.GPTNeoXTokenizerFast.from_pretrained(
                                        -            "EleutherAI/gpt-neox-20b", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                        -    elif "datablations" in self.name:
                                        -        tokenizer = transformers.AutoTokenizer.from_pretrained(
                                        -            "gpt2", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                        -    elif "llama" in self.name or "alpaca" in self.name:
                                        -        tokenizer = transformers.LlamaTokenizer.from_pretrained(
                                        -            self.name, **optional_tok_kwargs, cache_dir=self.cache_dir)
                                        -    elif "pubmedgpt" in self.name:
                                        -        tokenizer = transformers.AutoTokenizer.from_pretrained(
                                        -            "stanford-crfm/BioMedLM", **optional_tok_kwargs, cache_dir=self.cache_dir)
                                        -    else:
                                        -        tokenizer = transformers.AutoTokenizer.from_pretrained(
                                        -            self.name, **optional_tok_kwargs, cache_dir=self.cache_dir,
                                        -            trust_remote_code=True if "olmo" in self.name.lower() else False)
                                        -    tokenizer.add_special_tokens({'pad_token': '[PAD]'})
                                        -
                                        -    return model, tokenizer
                                        -
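Outside the special-cased model families, the method above reduces to a standard transformers load plus pad-token registration. A minimal sketch of that generic branch (model name and cache directory are placeholders):

# Sketch: generic causal-LM + tokenizer load with a [PAD] token, as in the non-special-cased branch.
import transformers

name = "gpt2"                 # placeholder model name
cache_dir = "/tmp/hf_cache"   # placeholder cache directory
model = transformers.AutoModelForCausalLM.from_pretrained(name, cache_dir=cache_dir)
tokenizer = transformers.AutoTokenizer.from_pretrained(name, cache_dir=cache_dir)
tokenizer.add_special_tokens({"pad_token": "[PAD]"})
# If the added [PAD] token is new to the vocabulary, the embeddings may need resizing:
model.resize_token_embeddings(len(tokenizer))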
                                        def load_model_properties(self)

                                        Load model properties, such as max length and stride.

                                        -
                                        def load_model_properties(self):
                                        -    """
                                        -        Load model properties, such as max length and stride.
                                        -    """
                                        -    # TODO: getting max_length of input could be more generic
                                        -    if "silo" in self.name or "balanced" in self.name:
                                        -        self.max_length = self.model.model.seq_len
                                        -    elif hasattr(self.model.config, 'max_position_embeddings'):
                                        -        self.max_length = self.model.config.max_position_embeddings
                                        -    elif hasattr(self.model.config, 'n_positions'):
                                        -        self.max_length = self.model.config.n_positions
                                        -    else:
                                        -        # Default window size
                                        -        self.max_length = 1024
                                        -    self.stride = self.max_length // 2
                                        -
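The same max-length lookup can be done from a Hugging Face config alone; a small sketch (placeholder model name, with 1024 as the fallback window, matching the method above):

# Sketch: derive max_length and stride from a model config.
from transformers import AutoConfig

cfg = AutoConfig.from_pretrained("gpt2")   # placeholder model name
max_length = getattr(cfg, "max_position_embeddings",
                     getattr(cfg, "n_positions", 1024))  # fall back to a 1024-token window
stride = max_length // 2                                  # half-window stride, as above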
                                        def to(self, device)

                                        Shift model to a particular device.

                                        -
                                        def to(self, device):
                                        -    """
                                        -        Shift model to a particular device.
                                        -    """
                                        -    self.model.to(device, non_blocking=True)
                                        -
                                        def unload(self)

                                        Unload model from GPU

                                        -
                                        def unload(self):
                                        -    """
                                        -        Unload model from GPU
                                        -    """
                                        -    start = time.time()
                                        -    try:
                                        -        self.model.cpu()
                                        -    except NameError:
                                        -        pass
                                        -    print(f'DONE ({time.time() - start:.2f}s)')
                                        -
                                        @@ -1906,24 +769,9 @@

                                        Ancestors

                                      • Model
                                      • torch.nn.modules.module.Module
                                      -

                                      Class variables

                                      -
                                      -
                                      var call_super_init : bool
                                      -
                                      -
                                      -
                                      -
                                      var dump_patches : bool
                                      -
                                      -
                                      -
                                      -
                                      var training : bool
                                      -
                                      -
                                      -
                                      -

                                      Instance variables

                                      -
                                      var api_calls
                                      +
                                      prop api_calls

                                      Get the number of tokens used in API calls

                                      @@ -1946,45 +794,12 @@

                                      Methods

                                      Get the log likelihood of each text under the base_model

                                      -
                                      @torch.no_grad()
                                      -def get_ll(self, text: str):
                                      -    """
                                      -        Get the log likelihood of each text under the base_model
                                      -    """
                                      -    openai_config = self.config.openai_config
                                      -
                                      -    kwargs = {"engine": openai_config.model, "temperature": 0, "max_tokens": 0, "echo": True, "logprobs": 0}
                                      -    r = openai.Completion.create(prompt=f"<|endoftext|>{text}", **kwargs)
                                      -    result = r['choices'][0]
                                      -    tokens, logprobs = result["logprobs"]["tokens"][1:], result["logprobs"]["token_logprobs"][1:]
                                      -
                                      -    assert len(tokens) == len(logprobs), f"Expected {len(tokens)} logprobs, got {len(logprobs)}"
                                      -
                                      -    return np.mean(logprobs)
                                      -
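The call above assumes the legacy (pre-1.0) openai SDK, where echoed completions return per-token logprobs. A sketch of just the post-processing step, applied to a hand-written response-shaped dict (not real API output):

# Sketch: mean token log-likelihood from a legacy Completion-style response.
import numpy as np

response = {
    "choices": [{
        "logprobs": {
            "tokens": ["<|endoftext|>", "Hello", " world"],
            "token_logprobs": [None, -3.2, -1.1],
        }
    }]
}
result = response["choices"][0]
# Drop the first position: the prepended <|endoftext|> prompt token has no logprob.
tokens = result["logprobs"]["tokens"][1:]
logprobs = result["logprobs"]["token_logprobs"][1:]
assert len(tokens) == len(logprobs)
print(np.mean(logprobs))   # mean token log-likelihood, as get_ll returns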
                                      def get_lls(self, texts: str)
                                      -
                                      def get_lls(self, texts: str):
                                      -
-    # use the model's tokenizer to estimate the total number of tokens
                                      -    total_tokens = sum(len(self.tokenizer.encode(text)) for text in texts)
                                      -    self.API_TOKEN_COUNTER += total_tokens * 2  # multiply by two because OpenAI double-counts echo_prompt tokens
                                      -
                                      -    pool = ThreadPool(self.config.batch_size)
                                      -    return pool.map(self.get_ll, texts)
                                      -
                                      def get_ref(self, text: str, ref_model: ReferenceModel) @@ -1992,34 +807,12 @@

                                      Methods

                                      Get the likelihood ratio of each text under the base_model – MIA baseline

                                      -
                                      @torch.no_grad()
                                      -def get_ref(self, text: str, ref_model: ReferenceModel):
                                      -    """
-        Get the likelihood ratio of each text under the base_model -- MIA baseline
-    """
-    raise NotImplementedError("OpenAI model not implemented for LIRA")
-    # NOTE: the code below is unreachable until the NotImplementedError above is removed
                                      -    openai_config = self.config.openai_config
                                      -    kwargs = {"engine": openai_config.model, "temperature": 0,
                                      -                "max_tokens": 0, "echo": True, "logprobs": 0}
                                      -    r = openai.Completion.create(prompt=f"<|endoftext|>{text}", **kwargs)
                                      -    result = r['choices'][0]
                                      -    tokens, logprobs = result["logprobs"]["tokens"][1:], result["logprobs"]["token_logprobs"][1:]
                                      -
                                      -    assert len(tokens) == len(logprobs), f"Expected {len(tokens)} logprobs, got {len(logprobs)}"
                                      -
                                      -    return np.mean(logprobs)
                                      -

                                      Inherited members

                                      • LanguageModel: -

                                        Class variables

                                        -
                                        -
                                        var call_super_init : bool
                                        -
                                        -
                                        -
                                        -
                                        var dump_patches : bool
                                        -
                                        -
                                        -
                                        -
                                        var training : bool
                                        -
                                        -
                                        -
                                        -

                                        Inherited members

                                        • Model: -

                                          Class variables

                                          -
                                          -
                                          var call_super_init : bool
                                          -
                                          -
                                          -
                                          -
                                          var dump_patches : bool
                                          -
                                          -
                                          -
                                          -
                                          var training : bool
                                          -
                                          -
                                          -
                                          -

                                          Methods

                                          @@ -2173,41 +935,18 @@

                                          Methods

Load reference model onto GPU(s)

                                          -
                                          def load(self):
                                          -    """
-    Load reference model onto GPU(s)
                                          -    """
                                          -    if "llama" not in self.name and "alpaca" not in self.name:
                                          -        super().load()
                                          -
                                          def unload(self)

                                          Unload reference model from GPU(s)

                                          -
                                          def unload(self):
                                          -    """
                                          -    Unload reference model from GPU(s)
                                          -    """
                                          -    if "llama" not in self.name and "alpaca" not in self.name:
                                          -        super().unload()
                                          -

                                          Inherited members

                                          • Model:
                                              -
                                            • forward
                                            • get_ll
                                            • get_probabilities
                                            • load_base_model_and_tokenizer
                                            • @@ -2226,7 +965,6 @@

                                              Inherited members

                                              MIMIR -

                                              Index

                                                @@ -2241,60 +979,42 @@

                                                Index

                                              • LanguageModel

                                              • Model

                                              • OpenAI_APIModel

                                                -
                                                  +
                                                • QuantileReferenceModel

                                                  -
                                                • ReferenceModel

                                                • @@ -2304,7 +1024,7 @@

                                                  -

                                                  Generated by pdoc 0.10.0.

                                                  +

                                                  Generated by pdoc 0.11.1.

                                                  - \ No newline at end of file + diff --git a/docs/plot_utils.html b/docs/plot_utils.html index 0edaa63..6eec9ed 100644 --- a/docs/plot_utils.html +++ b/docs/plot_utils.html @@ -2,18 +2,21 @@ - - + + mimir.plot_utils API documentation - - - - - - + + + + + + - - + +
                                                  @@ -23,139 +26,6 @@

                                                  Module mimir.plot_utils

                                                  Utilities related to plotting.

                                                  -
                                                  """
                                                  -    Utilities related to plotting.
                                                  -"""
                                                  -
                                                  -import matplotlib.pyplot as plt
                                                  -# Set high DPI
                                                  -plt.rcParams['figure.dpi'] = 300
                                                  -
                                                  -
                                                  -# 15 colorblind-friendly colors
                                                  -COLORS = ["#0072B2", "#009E73", "#D55E00", "#CC79A7", "#F0E442",
                                                  -            "#56B4E9", "#E69F00", "#000000", "#0072B2", "#009E73",
                                                  -            "#D55E00", "#CC79A7", "#F0E442", "#56B4E9", "#E69F00"]
                                                  -
                                                  -
                                                  -def save_roc_curves(experiments, save_folder, model_name, neighbor_model_name: str = None):
                                                  -    """
                                                  -        Save the ROC curve for each experiment, given a list of output dictionaries, one for each experiment, using colorblind-friendly colors.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment, color in zip(experiments, COLORS):
                                                  -        metrics = experiment["metrics"]
                                                  -        plt.plot(metrics["fpr"], metrics["tpr"], label=f"{experiment['name']}, roc_auc={metrics['roc_auc']:.3f}", color=color)
                                                  -        # print roc_auc for this experiment
                                                  -        print(f"{experiment['name']} roc_auc: {metrics['roc_auc']:.3f}")
                                                  -    plt.plot([0, 1], [0, 1], color='black', lw=2, linestyle='--')
                                                  -    plt.xlim([0.0, 1.0])
                                                  -    plt.ylim([0.0, 1.05])
                                                  -    plt.xlabel('False Positive Rate')
                                                  -    plt.ylabel('True Positive Rate')
                                                  -    if neighbor_model_name:
                                                  -        plt.title(f'ROC Curves ({model_name} - {neighbor_model_name})')
                                                  -    else:
                                                  -        plt.title(f'ROC Curves ({model_name})')
                                                  -    plt.legend(loc="lower right", fontsize=6)
                                                  -    plt.savefig(f"{save_folder}/roc_curves.png")
                                                  -
                                                  -    # Also plot ROC curves for low TPR-FPR region
                                                  -    plt.clf()
                                                  -    for experiment, color in zip(experiments, COLORS):
                                                  -        metrics = experiment["metrics"]
                                                  -        plt.plot(metrics["fpr"], metrics["tpr"], label=f"{experiment['name']}, roc_auc={metrics['roc_auc']:.3f}", color=color)
                                                  -    plt.xscale('log')
                                                  -    plt.yscale('log')
                                                  -    plt.xlim(1e-5, 1)
                                                  -    plt.ylim(1e-5, 1)
                                                  -    plt.plot([1e-5, 1], [1e-5, 1], color='black', lw=2, linestyle='--')
                                                  -    plt.xlabel('False Positive Rate')
                                                  -    plt.ylabel('True Positive Rate')
                                                  -    if neighbor_model_name:
                                                  -        plt.title(f'ROC Curves ({model_name} - {neighbor_model_name}) : low FPR region')
                                                  -    else:
-        plt.title(f'ROC Curves ({model_name}) : low FPR region')
                                                  -    plt.legend(loc="lower right", fontsize=6)
                                                  -    plt.savefig(f"{save_folder}/roc_curves_low_fpr.png")
                                                  -
                                                  -
                                                  -def save_f1_histogram(f1_scores, save_folder):
                                                  -    """
                                                  -        Function for saving F1-score histograms.
                                                  -    """
                                                  -    plt.hist(f1_scores, bins=20, edgecolor='black', alpha=0.7)
                                                  -    plt.xlabel('F1 Score')
                                                  -    plt.ylabel('Frequency')
                                                  -    plt.title('Histogram of F1 Scores')
                                                  -    plt.savefig(f"{save_folder}/f1_hist.png")
                                                  -    plt.close()
                                                  -
                                                  -
                                                  -def save_ll_histograms(experiments, save_folder):
                                                  -    """
                                                  -        Save the histogram of log likelihoods in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment in experiments:
                                                  -        try:
                                                  -            results = experiment["raw_results"]
                                                  -            # plot histogram of sampled/perturbed sampled on left, original/perturbed original on right
                                                  -            plt.figure(figsize=(20, 6))
                                                  -            plt.subplot(1, 2, 1)
                                                  -            plt.hist([r["sampled_ll"] for r in results], alpha=0.5, bins='auto', label='member')
                                                  -            plt.hist([r["perturbed_sampled_ll"] for r in results], alpha=0.5, bins='auto', label='perturbed sampled')
                                                  -            plt.xlabel("log likelihood")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.subplot(1, 2, 2)
                                                  -            plt.hist([r["original_ll"] for r in results], alpha=0.5, bins='auto', label='nonmember')
                                                  -            plt.hist([r["perturbed_original_ll"] for r in results], alpha=0.5, bins='auto', label='perturbed original')
                                                  -            plt.xlabel("log likelihood")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.savefig(
                                                  -                f"{save_folder}/ll_histograms_{experiment['name']}.png")
                                                  -        except:
                                                  -            pass
                                                  -
                                                  -
                                                  -def save_llr_histograms(experiments, save_folder):
                                                  -    """
                                                  -        Save the histograms of log likelihood ratios in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment in experiments:
                                                  -        try:
                                                  -            results = experiment["raw_results"]
                                                  -            # plot histogram of sampled/perturbed sampled on left, original/perturbed original on right
                                                  -            plt.figure(figsize=(20, 6))
                                                  -            plt.subplot(1, 2, 1)
                                                  -
                                                  -            # compute the log likelihood ratio for each result
                                                  -            for r in results:
                                                  -                r["sampled_llr"] = r["sampled_ll"] - r["perturbed_sampled_ll"]
                                                  -                r["original_llr"] = r["original_ll"] - r["perturbed_original_ll"]
                                                  -            
                                                  -            plt.hist([r["sampled_llr"] for r in results], alpha=0.5, bins='auto', label='member')
                                                  -            plt.hist([r["original_llr"] for r in results], alpha=0.5, bins='auto', label='nonmember')
                                                  -            plt.xlabel("log likelihood ratio")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.savefig(f"{save_folder}/llr_histograms_{experiment['name']}.png")
                                                  -        except:
                                                  -            pass
                                                  -
                                                  @@ -169,151 +39,24 @@

                                                  Functions

                                                  Function for saving F1-score histograms.

                                                  -
                                                  def save_f1_histogram(f1_scores, save_folder):
                                                  -    """
                                                  -        Function for saving F1-score histograms.
                                                  -    """
                                                  -    plt.hist(f1_scores, bins=20, edgecolor='black', alpha=0.7)
                                                  -    plt.xlabel('F1 Score')
                                                  -    plt.ylabel('Frequency')
                                                  -    plt.title('Histogram of F1 Scores')
                                                  -    plt.savefig(f"{save_folder}/f1_hist.png")
                                                  -    plt.close()
                                                  -
                                                  def save_ll_histograms(experiments, save_folder)

                                                  Save the histogram of log likelihoods in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.

                                                  -
                                                  def save_ll_histograms(experiments, save_folder):
                                                  -    """
                                                  -        Save the histogram of log likelihoods in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment in experiments:
                                                  -        try:
                                                  -            results = experiment["raw_results"]
                                                  -            # plot histogram of sampled/perturbed sampled on left, original/perturbed original on right
                                                  -            plt.figure(figsize=(20, 6))
                                                  -            plt.subplot(1, 2, 1)
                                                  -            plt.hist([r["sampled_ll"] for r in results], alpha=0.5, bins='auto', label='member')
                                                  -            plt.hist([r["perturbed_sampled_ll"] for r in results], alpha=0.5, bins='auto', label='perturbed sampled')
                                                  -            plt.xlabel("log likelihood")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.subplot(1, 2, 2)
                                                  -            plt.hist([r["original_ll"] for r in results], alpha=0.5, bins='auto', label='nonmember')
                                                  -            plt.hist([r["perturbed_original_ll"] for r in results], alpha=0.5, bins='auto', label='perturbed original')
                                                  -            plt.xlabel("log likelihood")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.savefig(
                                                  -                f"{save_folder}/ll_histograms_{experiment['name']}.png")
                                                  -        except:
                                                  -            pass
                                                  -
                                                  def save_llr_histograms(experiments, save_folder)

                                                  Save the histograms of log likelihood ratios in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.

                                                  -
                                                  def save_llr_histograms(experiments, save_folder):
                                                  -    """
                                                  -        Save the histograms of log likelihood ratios in two side-by-side plots, one for real and real perturbed, and one for sampled and sampled perturbed.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment in experiments:
                                                  -        try:
                                                  -            results = experiment["raw_results"]
                                                  -            # plot histogram of sampled/perturbed sampled on left, original/perturbed original on right
                                                  -            plt.figure(figsize=(20, 6))
                                                  -            plt.subplot(1, 2, 1)
                                                  -
                                                  -            # compute the log likelihood ratio for each result
                                                  -            for r in results:
                                                  -                r["sampled_llr"] = r["sampled_ll"] - r["perturbed_sampled_ll"]
                                                  -                r["original_llr"] = r["original_ll"] - r["perturbed_original_ll"]
                                                  -            
                                                  -            plt.hist([r["sampled_llr"] for r in results], alpha=0.5, bins='auto', label='member')
                                                  -            plt.hist([r["original_llr"] for r in results], alpha=0.5, bins='auto', label='nonmember')
                                                  -            plt.xlabel("log likelihood ratio")
                                                  -            plt.ylabel('count')
                                                  -            plt.legend(loc='upper right')
                                                  -            plt.savefig(f"{save_folder}/llr_histograms_{experiment['name']}.png")
                                                  -        except:
                                                  -            pass
                                                  -
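Both histogram helpers above read the same keys from each experiment's raw_results. A hand-constructed example input (values are made up; in practice they come from attack outputs) might look like this:

# Example input shape for save_ll_histograms / save_llr_histograms (illustrative values only).
experiments = [{
    "name": "demo",
    "raw_results": [
        {"sampled_ll": -2.1, "perturbed_sampled_ll": -2.6,
         "original_ll": -3.0, "perturbed_original_ll": -3.1},
        {"sampled_ll": -1.8, "perturbed_sampled_ll": -2.4,
         "original_ll": -2.9, "perturbed_original_ll": -3.3},
    ],
}]
# save_ll_histograms(experiments, "/tmp/plots")    # hypothetical output folder
# save_llr_histograms(experiments, "/tmp/plots")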
                                                  def save_roc_curves(experiments, save_folder, model_name, neighbor_model_name: str = None)

                                                  Save the ROC curve for each experiment, given a list of output dictionaries, one for each experiment, using colorblind-friendly colors.

                                                  -
                                                  def save_roc_curves(experiments, save_folder, model_name, neighbor_model_name: str = None):
                                                  -    """
                                                  -        Save the ROC curve for each experiment, given a list of output dictionaries, one for each experiment, using colorblind-friendly colors.
                                                  -    """
                                                  -    # first, clear plt
                                                  -    plt.clf()
                                                  -
                                                  -    for experiment, color in zip(experiments, COLORS):
                                                  -        metrics = experiment["metrics"]
                                                  -        plt.plot(metrics["fpr"], metrics["tpr"], label=f"{experiment['name']}, roc_auc={metrics['roc_auc']:.3f}", color=color)
                                                  -        # print roc_auc for this experiment
                                                  -        print(f"{experiment['name']} roc_auc: {metrics['roc_auc']:.3f}")
                                                  -    plt.plot([0, 1], [0, 1], color='black', lw=2, linestyle='--')
                                                  -    plt.xlim([0.0, 1.0])
                                                  -    plt.ylim([0.0, 1.05])
                                                  -    plt.xlabel('False Positive Rate')
                                                  -    plt.ylabel('True Positive Rate')
                                                  -    if neighbor_model_name:
                                                  -        plt.title(f'ROC Curves ({model_name} - {neighbor_model_name})')
                                                  -    else:
                                                  -        plt.title(f'ROC Curves ({model_name})')
                                                  -    plt.legend(loc="lower right", fontsize=6)
                                                  -    plt.savefig(f"{save_folder}/roc_curves.png")
                                                  -
                                                  -    # Also plot ROC curves for low TPR-FPR region
                                                  -    plt.clf()
                                                  -    for experiment, color in zip(experiments, COLORS):
                                                  -        metrics = experiment["metrics"]
                                                  -        plt.plot(metrics["fpr"], metrics["tpr"], label=f"{experiment['name']}, roc_auc={metrics['roc_auc']:.3f}", color=color)
                                                  -    plt.xscale('log')
                                                  -    plt.yscale('log')
                                                  -    plt.xlim(1e-5, 1)
                                                  -    plt.ylim(1e-5, 1)
                                                  -    plt.plot([1e-5, 1], [1e-5, 1], color='black', lw=2, linestyle='--')
                                                  -    plt.xlabel('False Positive Rate')
                                                  -    plt.ylabel('True Positive Rate')
                                                  -    if neighbor_model_name:
                                                  -        plt.title(f'ROC Curves ({model_name} - {neighbor_model_name}) : low FPR region')
                                                  -    else:
-        plt.title(f'ROC Curves ({model_name}) : low FPR region')
                                                  -    plt.legend(loc="lower right", fontsize=6)
                                                  -    plt.savefig(f"{save_folder}/roc_curves_low_fpr.png")
                                                  -
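save_roc_curves expects one dictionary per experiment with precomputed ROC metrics (typically obtained from something like sklearn.metrics.roc_curve and roc_auc_score on attack scores). A hand-constructed example (values are made up; folder and model name are placeholders):

# Example input shape for save_roc_curves (illustrative values only).
experiments = [{
    "name": "loss-attack",
    "metrics": {
        "fpr": [0.0, 0.1, 0.5, 1.0],
        "tpr": [0.0, 0.4, 0.8, 1.0],
        "roc_auc": 0.72,
    },
}]
# save_roc_curves(experiments, save_folder="/tmp/plots", model_name="gpt2")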
                                                  @@ -326,7 +69,6 @@

                                                  Functions

                                                  MIMIR -

                                                  Index

                                                    @@ -348,7 +90,7 @@

                                                    Index

                                                    - \ No newline at end of file + diff --git a/docs/utils.html b/docs/utils.html index ed5bb72..fe6876c 100644 --- a/docs/utils.html +++ b/docs/utils.html @@ -2,19 +2,22 @@ - - + + mimir.utils API documentation - - - - - +This module provides utility functions …"> + + + + + - - + +
                                                    @@ -28,68 +31,6 @@

                                                    Module mimir.utils

Environment variables: MIMIR_CACHE_PATH (the path to the cache directory) and MIMIR_DATA_SOURCE (the data source for the MIMIR project); both should be set in the environment.

                                                    -
                                                    """
                                                    -utils.py
                                                    -This module provides utility functions.
                                                    -
                                                    -Environment Variables:
                                                    -    MIMIR_CACHE_PATH: The path to the cache directory. This should be set in the environment.
                                                    -    MIMIR_DATA_SOURCE: The data source for the MIMIR project. This should be set in the environment.
                                                    -"""
                                                    -
                                                    -import os
                                                    -import random
                                                    -import torch as ch
                                                    -import numpy as np
                                                    -
                                                    -# Read environment variables
                                                    -CACHE_PATH = os.environ.get('MIMIR_CACHE_PATH', None)
                                                    -DATA_SOURCE = os.environ.get('MIMIR_DATA_SOURCE', None)
                                                    -
                                                    -
                                                    -def fix_seed(seed: int = 0):
                                                    -    """
                                                    -    Fix seed for reproducibility.
                                                    -
                                                    -    Parameters:
                                                    -        seed (int): The seed to set. Default is 0.
                                                    -    """
                                                    -    ch.manual_seed(seed)
                                                    -    np.random.seed(seed)
                                                    -    random.seed(seed)
                                                    -
                                                    -
                                                    -def get_cache_path():
                                                    -    """
                                                    -    Get path to cache directory.
                                                    -    Returns:
                                                    -        str: path to cache directory
                                                    -
                                                    -    Raises:
                                                    -        ValueError: If the MIMIR_CACHE_PATH environment variable is not set.
                                                    -    """
                                                    -    if CACHE_PATH is None:
                                                    -        raise ValueError('MIMIR_CACHE_PATH environment variable not set')
                                                    -    return CACHE_PATH
                                                    -
                                                    -
                                                    -def get_data_source():
                                                    -    """
                                                    -    Get path to data source directory.
                                                    -    Returns:
                                                    -        str: path to data source directory
                                                    -
                                                    -    Raises:
                                                    -        ValueError: If the MIMIR_DATA_SOURCE environment variable is not set.
                                                    -    """
                                                    -    if DATA_SOURCE is None:
                                                    -        raise ValueError('MIMIR_DATA_SOURCE environment variable not set')
                                                    -    return DATA_SOURCE
                                                    -
                                                    @@ -105,21 +46,6 @@

                                                    Functions

                                                    Fix seed for reproducibility.

                                                    Parameters

                                                    seed (int): The seed to set. Default is 0.

                                                    -
                                                    def fix_seed(seed: int = 0):
                                                    -    """
                                                    -    Fix seed for reproducibility.
                                                    -
                                                    -    Parameters:
                                                    -        seed (int): The seed to set. Default is 0.
                                                    -    """
                                                    -    ch.manual_seed(seed)
                                                    -    np.random.seed(seed)
                                                    -    random.seed(seed)
                                                    -
                                                    def get_cache_path() @@ -136,23 +62,6 @@

                                                    Raises

                                                    ValueError
                                                    If the MIMIR_CACHE_PATH environment variable is not set.
                                                    -
                                                    def get_cache_path():
                                                    -    """
                                                    -    Get path to cache directory.
                                                    -    Returns:
                                                    -        str: path to cache directory
                                                    -
                                                    -    Raises:
                                                    -        ValueError: If the MIMIR_CACHE_PATH environment variable is not set.
                                                    -    """
                                                    -    if CACHE_PATH is None:
                                                    -        raise ValueError('MIMIR_CACHE_PATH environment variable not set')
                                                    -    return CACHE_PATH
                                                    -
                                                    def get_data_source() @@ -169,23 +78,6 @@

                                                    Raises

                                                    ValueError
                                                    If the MIMIR_DATA_SOURCE environment variable is not set.
                                                    -
                                                    def get_data_source():
                                                    -    """
                                                    -    Get path to data source directory.
                                                    -    Returns:
                                                    -        str: path to data source directory
                                                    -
                                                    -    Raises:
                                                    -        ValueError: If the MIMIR_DATA_SOURCE environment variable is not set.
                                                    -    """
                                                    -    if DATA_SOURCE is None:
                                                    -        raise ValueError('MIMIR_DATA_SOURCE environment variable not set')
                                                    -    return DATA_SOURCE
                                                    -
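Because CACHE_PATH and DATA_SOURCE are read at import time, the environment variables must be set before mimir.utils is imported. A short usage sketch (paths are placeholders):

# Set the environment variables before importing mimir.utils.
import os
os.environ["MIMIR_CACHE_PATH"] = "/tmp/mimir_cache"   # placeholder path
os.environ["MIMIR_DATA_SOURCE"] = "/tmp/mimir_data"   # placeholder path

from mimir.utils import get_cache_path, get_data_source

print(get_cache_path())    # /tmp/mimir_cache
print(get_data_source())   # /tmp/mimir_data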
                                                    @@ -198,7 +90,6 @@

                                                    Raises

                                                    MIMIR -

                                                    Index

                                                      @@ -219,7 +110,7 @@

                                                      Index

                                                      - \ No newline at end of file +