diff --git a/docs/topic_guides/comparisons/choosing_comparators.ipynb b/docs/topic_guides/comparisons/choosing_comparators.ipynb
index 28c8b2f73f..32172e4e5b 100644
--- a/docs/topic_guides/comparisons/choosing_comparators.ipynb
+++ b/docs/topic_guides/comparisons/choosing_comparators.ipynb
@@ -51,70 +51,12 @@
    "cell_type": "code",
    "execution_count": 1,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>string1</th>\n",
-       "      <th>string2</th>\n",
-       "      <th>levenshtein_distance</th>\n",
-       "      <th>damerau_levenshtein_distance</th>\n",
-       "      <th>jaro_similarity</th>\n",
-       "      <th>jaro_winkler_similarity</th>\n",
-       "      <th>jaccard_similarity</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>iRchard</td>\n",
-       "      <td>2</td>\n",
-       "      <td>1</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>1.0</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "   string1  string2  levenshtein_distance  damerau_levenshtein_distance  \\\n",
-       "0  Richard  iRchard                     2                             1   \n",
-       "\n",
-       "   jaro_similarity  jaro_winkler_similarity  jaccard_similarity  \n",
-       "0             0.95                     0.95                 1.0  "
-      ]
-     },
-     "execution_count": 1,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "import splink.comparison_helpers as ch\n",
     "\n",
     "ch.comparator_score(\"Richard\", \"iRchard\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -128,131 +70,6 @@
    "cell_type": "code",
    "execution_count": 2,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>string1</th>\n",
-       "      <th>string2</th>\n",
-       "      <th>error_type</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richard</td>\n",
-       "      <td>None</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>ichard</td>\n",
-       "      <td>Deletion</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richar</td>\n",
-       "      <td>Deletion</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>iRchard</td>\n",
-       "      <td>Transposition</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richadr</td>\n",
-       "      <td>Transposition</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rich</td>\n",
-       "      <td>Shortening</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rick</td>\n",
-       "      <td>Nickname/Alias</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Ricky</td>\n",
-       "      <td>Nickname/Alias</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Dick</td>\n",
-       "      <td>Nickname/Alias</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rico</td>\n",
-       "      <td>Nickname/Alias</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rachael</td>\n",
-       "      <td>Different Name</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Different Name</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "    string1  string2      error_type\n",
-       "0   Richard  Richard            None\n",
-       "1   Richard   ichard        Deletion\n",
-       "2   Richard   Richar        Deletion\n",
-       "3   Richard  iRchard   Transposition\n",
-       "4   Richard  Richadr   Transposition\n",
-       "5   Richard     Rich      Shortening\n",
-       "6   Richard     Rick  Nickname/Alias\n",
-       "7   Richard    Ricky  Nickname/Alias\n",
-       "8   Richard     Dick  Nickname/Alias\n",
-       "9   Richard     Rico  Nickname/Alias\n",
-       "10  Richard  Rachael  Different Name\n",
-       "11  Richard  Stephen  Different Name"
-      ]
-     },
-     "execution_count": 2,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "import pandas as pd\n",
     "\n",
@@ -302,7 +119,8 @@
     "}\n",
     "df = pd.DataFrame(data)\n",
     "df"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -316,107 +134,10 @@
    "cell_type": "code",
    "execution_count": 3,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "/Users/rosskennedy/splink/splink/comparison_helpers.py:121: SettingWithCopyWarning: \n",
-      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
-      "Try using .loc[row_indexer,col_indexer] = value instead\n",
-      "\n",
-      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
-      "  similarity_df[\"comparator\"] = similarity_df[\"comparator\"].str.replace(\n",
-      "/Users/rosskennedy/splink/splink/comparison_helpers.py:126: SettingWithCopyWarning: \n",
-      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
-      "Try using .loc[row_indexer,col_indexer] = value instead\n",
-      "\n",
-      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
-      "  distance_df[\"comparator\"] = distance_df[\"comparator\"].str.replace(\"_distance\", \"\")\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<style>\n",
-       "  #altair-viz-c4cb5c9ac0704c58be721985f863269f.vega-embed {\n",
-       "    width: 100%;\n",
-       "    display: flex;\n",
-       "  }\n",
-       "\n",
-       "  #altair-viz-c4cb5c9ac0704c58be721985f863269f.vega-embed details,\n",
-       "  #altair-viz-c4cb5c9ac0704c58be721985f863269f.vega-embed details summary {\n",
-       "    position: relative;\n",
-       "  }\n",
-       "</style>\n",
-       "<div id=\"altair-viz-c4cb5c9ac0704c58be721985f863269f\"></div>\n",
-       "<script type=\"text/javascript\">\n",
-       "  var VEGA_DEBUG = (typeof VEGA_DEBUG == \"undefined\") ? {} : VEGA_DEBUG;\n",
-       "  (function(spec, embedOpt){\n",
-       "    let outputDiv = document.currentScript.previousElementSibling;\n",
-       "    if (outputDiv.id !== \"altair-viz-c4cb5c9ac0704c58be721985f863269f\") {\n",
-       "      outputDiv = document.getElementById(\"altair-viz-c4cb5c9ac0704c58be721985f863269f\");\n",
-       "    }\n",
-       "    const paths = {\n",
-       "      \"vega\": \"https://cdn.jsdelivr.net/npm/vega@5?noext\",\n",
-       "      \"vega-lib\": \"https://cdn.jsdelivr.net/npm/vega-lib?noext\",\n",
-       "      \"vega-lite\": \"https://cdn.jsdelivr.net/npm/vega-lite@5.8.0?noext\",\n",
-       "      \"vega-embed\": \"https://cdn.jsdelivr.net/npm/vega-embed@6?noext\",\n",
-       "    };\n",
-       "\n",
-       "    function maybeLoadScript(lib, version) {\n",
-       "      var key = `${lib.replace(\"-\", \"\")}_version`;\n",
-       "      return (VEGA_DEBUG[key] == version) ?\n",
-       "        Promise.resolve(paths[lib]) :\n",
-       "        new Promise(function(resolve, reject) {\n",
-       "          var s = document.createElement('script');\n",
-       "          document.getElementsByTagName(\"head\")[0].appendChild(s);\n",
-       "          s.async = true;\n",
-       "          s.onload = () => {\n",
-       "            VEGA_DEBUG[key] = version;\n",
-       "            return resolve(paths[lib]);\n",
-       "          };\n",
-       "          s.onerror = () => reject(`Error loading script: ${paths[lib]}`);\n",
-       "          s.src = paths[lib];\n",
-       "        });\n",
-       "    }\n",
-       "\n",
-       "    function showError(err) {\n",
-       "      outputDiv.innerHTML = `<div class=\"error\" style=\"color:red;\">${err}</div>`;\n",
-       "      throw err;\n",
-       "    }\n",
-       "\n",
-       "    function displayChart(vegaEmbed) {\n",
-       "      vegaEmbed(outputDiv, spec, embedOpt)\n",
-       "        .catch(err => showError(`Javascript Error: ${err.message}<br>This usually means there's a typo in your chart specification. See the javascript console for the full traceback.`));\n",
-       "    }\n",
-       "\n",
-       "    if(typeof define === \"function\" && define.amd) {\n",
-       "      requirejs.config({paths});\n",
-       "      require([\"vega-embed\"], displayChart, err => showError(`Error loading script: ${err.message}`));\n",
-       "    } else {\n",
-       "      maybeLoadScript(\"vega\", \"5\")\n",
-       "        .then(() => maybeLoadScript(\"vega-lite\", \"5.8.0\"))\n",
-       "        .then(() => maybeLoadScript(\"vega-embed\", \"6\"))\n",
-       "        .catch(showError)\n",
-       "        .then(() => displayChart(vegaEmbed));\n",
-       "    }\n",
-       "  })({\"config\": {\"view\": {\"continuousWidth\": 300, \"continuousHeight\": 300, \"discreteHeight\": {\"step\": 30}, \"discreteWidth\": {\"step\": 40}}}, \"hconcat\": [{\"layer\": [{\"mark\": {\"type\": \"rect\"}, \"encoding\": {\"color\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"domain\": [0, 1], \"scheme\": \"greenblue\"}, \"type\": \"quantitative\"}, \"x\": {\"field\": \"comparator\", \"title\": null, \"type\": \"ordinal\"}, \"y\": {\"axis\": {\"titleFontSize\": 14}, \"field\": \"strings_to_compare\", \"title\": \"String comparison\", \"type\": \"ordinal\"}}, \"title\": \"Similarity\"}, {\"mark\": {\"type\": \"text\", \"baseline\": \"middle\"}, \"encoding\": {\"size\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"range\": [8, 14]}}, \"text\": {\"field\": \"score\", \"format\": \".2f\", \"type\": \"quantitative\"}, \"x\": {\"axis\": {\"labelFontSize\": 12}, \"field\": \"comparator\", \"type\": \"ordinal\"}, \"y\": {\"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}}], \"data\": {\"name\": \"data-similarity\"}}, {\"layer\": [{\"mark\": {\"type\": \"rect\"}, \"encoding\": {\"color\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"reverse\": true, \"scheme\": \"yelloworangered\"}, \"type\": \"quantitative\"}, \"x\": {\"axis\": {\"labelFontSize\": 12}, \"field\": \"comparator\", \"title\": null, \"type\": \"ordinal\"}, \"y\": {\"axis\": null, \"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}, \"title\": \"Distance\"}, {\"mark\": {\"type\": \"text\", \"baseline\": \"middle\"}, \"encoding\": {\"size\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"range\": [8, 14], \"reverse\": true}}, \"text\": {\"field\": \"score\", \"type\": \"quantitative\"}, \"x\": {\"field\": \"comparator\", \"type\": \"ordinal\"}, \"y\": {\"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}}], \"data\": {\"name\": \"data-distance\"}}], \"datasets\": {\"data-similarity\": \"[{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.73},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.68},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.6},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.73},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.71},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.43},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.97},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.97},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.91},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.81},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.68},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.6},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.81},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.74},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.43},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.57},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.38},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.33},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.22},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.38},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.44},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.08}]\", \"data-distance\": \"[{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":0.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":2.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":2.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":5.0},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":7.0},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":0.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":5.0},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":7.0}]\"}, \"resolve\": {\"scale\": {\"color\": \"independent\", \"size\": \"independent\", \"y\": \"shared\"}}, \"title\": {\"text\": \"Heatmaps of string comparison metrics\", \"anchor\": \"middle\", \"fontSize\": 16}, \"$schema\": \"https://vega.github.io/schema/vega-lite/v5.9.3.json\"}, {\"mode\": \"vega-lite\"});\n",
-       "</script>"
-      ],
-      "text/plain": [
-       "alt.HConcatChart(...)"
-      ]
-     },
-     "execution_count": 3,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.comparator_score_chart(data, \"string1\", \"string2\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -438,200 +159,10 @@
    "cell_type": "code",
    "execution_count": 4,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>string1</th>\n",
-       "      <th>string2</th>\n",
-       "      <th>levenshtein_distance</th>\n",
-       "      <th>damerau_levenshtein_distance</th>\n",
-       "      <th>jaro_similarity</th>\n",
-       "      <th>jaro_winkler_similarity</th>\n",
-       "      <th>jaccard_similarity</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richard</td>\n",
-       "      <td>0</td>\n",
-       "      <td>0</td>\n",
-       "      <td>1.00</td>\n",
-       "      <td>1.00</td>\n",
-       "      <td>1.00</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>ichard</td>\n",
-       "      <td>1</td>\n",
-       "      <td>1</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.86</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richar</td>\n",
-       "      <td>1</td>\n",
-       "      <td>1</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.97</td>\n",
-       "      <td>0.86</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>iRchard</td>\n",
-       "      <td>2</td>\n",
-       "      <td>1</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>1.00</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Richadr</td>\n",
-       "      <td>2</td>\n",
-       "      <td>1</td>\n",
-       "      <td>0.95</td>\n",
-       "      <td>0.97</td>\n",
-       "      <td>1.00</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rich</td>\n",
-       "      <td>3</td>\n",
-       "      <td>3</td>\n",
-       "      <td>0.86</td>\n",
-       "      <td>0.91</td>\n",
-       "      <td>0.57</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rick</td>\n",
-       "      <td>4</td>\n",
-       "      <td>4</td>\n",
-       "      <td>0.73</td>\n",
-       "      <td>0.81</td>\n",
-       "      <td>0.38</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Ricky</td>\n",
-       "      <td>4</td>\n",
-       "      <td>4</td>\n",
-       "      <td>0.68</td>\n",
-       "      <td>0.68</td>\n",
-       "      <td>0.33</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Dick</td>\n",
-       "      <td>5</td>\n",
-       "      <td>5</td>\n",
-       "      <td>0.60</td>\n",
-       "      <td>0.60</td>\n",
-       "      <td>0.22</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rico</td>\n",
-       "      <td>4</td>\n",
-       "      <td>4</td>\n",
-       "      <td>0.73</td>\n",
-       "      <td>0.81</td>\n",
-       "      <td>0.38</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Rachael</td>\n",
-       "      <td>3</td>\n",
-       "      <td>3</td>\n",
-       "      <td>0.71</td>\n",
-       "      <td>0.74</td>\n",
-       "      <td>0.44</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>7</td>\n",
-       "      <td>7</td>\n",
-       "      <td>0.43</td>\n",
-       "      <td>0.43</td>\n",
-       "      <td>0.08</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "    string1  string2  levenshtein_distance  damerau_levenshtein_distance  \\\n",
-       "0   Richard  Richard                     0                             0   \n",
-       "1   Richard   ichard                     1                             1   \n",
-       "2   Richard   Richar                     1                             1   \n",
-       "3   Richard  iRchard                     2                             1   \n",
-       "4   Richard  Richadr                     2                             1   \n",
-       "5   Richard     Rich                     3                             3   \n",
-       "6   Richard     Rick                     4                             4   \n",
-       "7   Richard    Ricky                     4                             4   \n",
-       "8   Richard     Dick                     5                             5   \n",
-       "9   Richard     Rico                     4                             4   \n",
-       "10  Richard  Rachael                     3                             3   \n",
-       "11  Richard  Stephen                     7                             7   \n",
-       "\n",
-       "    jaro_similarity  jaro_winkler_similarity  jaccard_similarity  \n",
-       "0              1.00                     1.00                1.00  \n",
-       "1              0.95                     0.95                0.86  \n",
-       "2              0.95                     0.97                0.86  \n",
-       "3              0.95                     0.95                1.00  \n",
-       "4              0.95                     0.97                1.00  \n",
-       "5              0.86                     0.91                0.57  \n",
-       "6              0.73                     0.81                0.38  \n",
-       "7              0.68                     0.68                0.33  \n",
-       "8              0.60                     0.60                0.22  \n",
-       "9              0.73                     0.81                0.38  \n",
-       "10             0.71                     0.74                0.44  \n",
-       "11             0.43                     0.43                0.08  "
-      ]
-     },
-     "execution_count": 4,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.comparator_score_df(data, \"string1\", \"string2\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -647,109 +178,12 @@
    "cell_type": "code",
    "execution_count": 5,
    "metadata": {},
-   "outputs": [
-    {
-     "name": "stderr",
-     "output_type": "stream",
-     "text": [
-      "/Users/rosskennedy/splink/splink/comparison_helpers.py:172: SettingWithCopyWarning: \n",
-      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
-      "Try using .loc[row_indexer,col_indexer] = value instead\n",
-      "\n",
-      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
-      "  similarity_df[\"comparator\"] = similarity_df[\"comparator\"].str.replace(\n",
-      "/Users/rosskennedy/splink/splink/comparison_helpers.py:177: SettingWithCopyWarning: \n",
-      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
-      "Try using .loc[row_indexer,col_indexer] = value instead\n",
-      "\n",
-      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
-      "  distance_df[\"comparator\"] = distance_df[\"comparator\"].str.replace(\"_distance\", \"\")\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<style>\n",
-       "  #altair-viz-0006dfe03b4947c5a741996fbc84161b.vega-embed {\n",
-       "    width: 100%;\n",
-       "    display: flex;\n",
-       "  }\n",
-       "\n",
-       "  #altair-viz-0006dfe03b4947c5a741996fbc84161b.vega-embed details,\n",
-       "  #altair-viz-0006dfe03b4947c5a741996fbc84161b.vega-embed details summary {\n",
-       "    position: relative;\n",
-       "  }\n",
-       "</style>\n",
-       "<div id=\"altair-viz-0006dfe03b4947c5a741996fbc84161b\"></div>\n",
-       "<script type=\"text/javascript\">\n",
-       "  var VEGA_DEBUG = (typeof VEGA_DEBUG == \"undefined\") ? {} : VEGA_DEBUG;\n",
-       "  (function(spec, embedOpt){\n",
-       "    let outputDiv = document.currentScript.previousElementSibling;\n",
-       "    if (outputDiv.id !== \"altair-viz-0006dfe03b4947c5a741996fbc84161b\") {\n",
-       "      outputDiv = document.getElementById(\"altair-viz-0006dfe03b4947c5a741996fbc84161b\");\n",
-       "    }\n",
-       "    const paths = {\n",
-       "      \"vega\": \"https://cdn.jsdelivr.net/npm/vega@5?noext\",\n",
-       "      \"vega-lib\": \"https://cdn.jsdelivr.net/npm/vega-lib?noext\",\n",
-       "      \"vega-lite\": \"https://cdn.jsdelivr.net/npm/vega-lite@5.8.0?noext\",\n",
-       "      \"vega-embed\": \"https://cdn.jsdelivr.net/npm/vega-embed@6?noext\",\n",
-       "    };\n",
-       "\n",
-       "    function maybeLoadScript(lib, version) {\n",
-       "      var key = `${lib.replace(\"-\", \"\")}_version`;\n",
-       "      return (VEGA_DEBUG[key] == version) ?\n",
-       "        Promise.resolve(paths[lib]) :\n",
-       "        new Promise(function(resolve, reject) {\n",
-       "          var s = document.createElement('script');\n",
-       "          document.getElementsByTagName(\"head\")[0].appendChild(s);\n",
-       "          s.async = true;\n",
-       "          s.onload = () => {\n",
-       "            VEGA_DEBUG[key] = version;\n",
-       "            return resolve(paths[lib]);\n",
-       "          };\n",
-       "          s.onerror = () => reject(`Error loading script: ${paths[lib]}`);\n",
-       "          s.src = paths[lib];\n",
-       "        });\n",
-       "    }\n",
-       "\n",
-       "    function showError(err) {\n",
-       "      outputDiv.innerHTML = `<div class=\"error\" style=\"color:red;\">${err}</div>`;\n",
-       "      throw err;\n",
-       "    }\n",
-       "\n",
-       "    function displayChart(vegaEmbed) {\n",
-       "      vegaEmbed(outputDiv, spec, embedOpt)\n",
-       "        .catch(err => showError(`Javascript Error: ${err.message}<br>This usually means there's a typo in your chart specification. See the javascript console for the full traceback.`));\n",
-       "    }\n",
-       "\n",
-       "    if(typeof define === \"function\" && define.amd) {\n",
-       "      requirejs.config({paths});\n",
-       "      require([\"vega-embed\"], displayChart, err => showError(`Error loading script: ${err.message}`));\n",
-       "    } else {\n",
-       "      maybeLoadScript(\"vega\", \"5\")\n",
-       "        .then(() => maybeLoadScript(\"vega-lite\", \"5.8.0\"))\n",
-       "        .then(() => maybeLoadScript(\"vega-embed\", \"6\"))\n",
-       "        .catch(showError)\n",
-       "        .then(() => displayChart(vegaEmbed));\n",
-       "    }\n",
-       "  })({\"config\": {\"view\": {\"continuousWidth\": 300, \"continuousHeight\": 300, \"discreteHeight\": {\"step\": 30}, \"discreteWidth\": {\"step\": 40}}}, \"hconcat\": [{\"layer\": [{\"mark\": {\"type\": \"rect\"}, \"encoding\": {\"color\": {\"condition\": {\"test\": \"datum.score > similarity_threshold\", \"value\": \"lightgreen\"}, \"value\": \"lightgrey\"}, \"x\": {\"field\": \"comparator\", \"title\": null, \"type\": \"ordinal\"}, \"y\": {\"axis\": {\"titleFontSize\": 14}, \"field\": \"strings_to_compare\", \"title\": \"String comparison\", \"type\": \"ordinal\"}}, \"title\": {\"text\": \"Similarity\", \"subtitle\": \">= 0.8\"}}, {\"mark\": {\"type\": \"text\", \"baseline\": \"middle\"}, \"encoding\": {\"opacity\": {\"condition\": {\"test\": \"datum.score > 0.9\", \"value\": 1}, \"value\": 0.5}, \"size\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"range\": [8, 14]}}, \"text\": {\"field\": \"score\", \"format\": \".2f\", \"type\": \"quantitative\"}, \"x\": {\"axis\": {\"labelFontSize\": 12}, \"field\": \"comparator\", \"type\": \"ordinal\"}, \"y\": {\"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}}], \"data\": {\"name\": \"data-similarity\"}}, {\"layer\": [{\"mark\": {\"type\": \"rect\"}, \"encoding\": {\"color\": {\"condition\": {\"test\": \"datum.score <= distance_threshold\", \"value\": \"lightgreen\"}, \"value\": \"lightgrey\"}, \"x\": {\"axis\": {\"labelFontSize\": 12}, \"field\": \"comparator\", \"title\": null, \"type\": \"ordinal\"}, \"y\": {\"axis\": null, \"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}, \"title\": {\"text\": \"Distance\", \"subtitle\": \"<= 2\"}}, {\"mark\": {\"type\": \"text\", \"baseline\": \"middle\"}, \"encoding\": {\"opacity\": {\"condition\": {\"test\": \"datum.score <= 2\", \"value\": 1}, \"value\": 0.5}, \"size\": {\"field\": \"score\", \"legend\": null, \"scale\": {\"range\": [8, 14], \"reverse\": true}}, \"text\": {\"field\": \"score\", \"type\": \"quantitative\"}, \"x\": {\"field\": \"comparator\", \"type\": \"ordinal\"}, \"y\": {\"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}}], \"data\": {\"name\": \"data-distance\"}}], \"datasets\": {\"data-similarity\": \"[{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.73},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.68},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.6},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.73},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.71},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaro\\\",\\\"score\\\":0.43},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.97},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.95},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.97},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.91},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.81},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.68},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.6},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.81},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.74},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaro_winkler\\\",\\\"score\\\":0.43},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.86},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.57},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.38},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.33},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.22},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.38},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.44},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"jaccard\\\",\\\"score\\\":0.08}]\", \"data-distance\": \"[{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":0.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":2.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":2.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":5.0},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"levenshtein\\\",\\\"score\\\":7.0},{\\\"strings_to_compare\\\":\\\"Richard, Richard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":0.0},{\\\"strings_to_compare\\\":\\\"Richard, ichard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richar\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, iRchard\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Richadr\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":1.0},{\\\"strings_to_compare\\\":\\\"Richard, Rich\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Rick\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Ricky\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Dick\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":5.0},{\\\"strings_to_compare\\\":\\\"Richard, Rico\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":4.0},{\\\"strings_to_compare\\\":\\\"Richard, Rachael\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":3.0},{\\\"strings_to_compare\\\":\\\"Richard, Stephen\\\",\\\"comparator\\\":\\\"damerau_levenshtein\\\",\\\"score\\\":7.0}]\"}, \"params\": [{\"name\": \"similarity_threshold\", \"value\": 0.8}, {\"name\": \"distance_threshold\", \"value\": 2}], \"resolve\": {\"scale\": {\"color\": \"independent\", \"size\": \"independent\", \"y\": \"shared\"}}, \"title\": {\"text\": \"Heatmaps of string comparison metrics\", \"anchor\": \"middle\", \"fontSize\": 16}, \"$schema\": \"https://vega.github.io/schema/vega-lite/v5.9.3.json\"}, {\"mode\": \"vega-lite\"});\n",
-       "</script>"
-      ],
-      "text/plain": [
-       "alt.HConcatChart(...)"
-      ]
-     },
-     "execution_count": 5,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.comparator_score_threshold_chart(\n",
     "    data, \"string1\", \"string2\", distance_threshold=2, similarity_threshold=0.8\n",
     ")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -767,12 +201,12 @@
    "cell_type": "code",
    "execution_count": 6,
    "metadata": {},
-   "outputs": [],
    "source": [
     "import splink.duckdb.comparison_library as cl\n",
     "\n",
     "first_name_comparison = cl.jaro_winkler_at_thresholds(\"first_name\", [0.9, 0.8, 0.7])"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -786,34 +220,10 @@
    "cell_type": "code",
    "execution_count": 7,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "{'output_column_name': 'first_name',\n",
-       " 'comparison_levels': [{'sql_condition': '\"first_name_l\" IS NULL OR \"first_name_r\" IS NULL',\n",
-       "   'label_for_charts': 'Null',\n",
-       "   'is_null_level': True},\n",
-       "  {'sql_condition': '\"first_name_l\" = \"first_name_r\"',\n",
-       "   'label_for_charts': 'Exact match'},\n",
-       "  {'sql_condition': 'jaro_winkler_similarity(\"first_name_l\", \"first_name_r\") >= 0.9',\n",
-       "   'label_for_charts': 'Jaro_winkler_similarity >= 0.9'},\n",
-       "  {'sql_condition': 'jaro_winkler_similarity(\"first_name_l\", \"first_name_r\") >= 0.8',\n",
-       "   'label_for_charts': 'Jaro_winkler_similarity >= 0.8'},\n",
-       "  {'sql_condition': 'jaro_winkler_similarity(\"first_name_l\", \"first_name_r\") >= 0.7',\n",
-       "   'label_for_charts': 'Jaro_winkler_similarity >= 0.7'},\n",
-       "  {'sql_condition': 'ELSE', 'label_for_charts': 'All other comparisons'}],\n",
-       " 'comparison_description': 'Exact match vs. First_Name within jaro_winkler_similarity thresholds 0.9, 0.8, 0.7 vs. anything else'}"
-      ]
-     },
-     "execution_count": 7,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "first_name_comparison.as_dict()"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -845,43 +255,21 @@
    "cell_type": "code",
    "execution_count": 8,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "{'soundex': 'R02063', 'metaphone': 'RXRT', 'dmetaphone': ('RXRT', 'RKRT')}"
-      ]
-     },
-     "execution_count": 8,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "import splink.comparison_helpers\n",
     "\n",
     "ch.phonetic_transform(\"Richard\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "cell_type": "code",
    "execution_count": 9,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "{'soundex': 'S30105', 'metaphone': 'STFN', 'dmetaphone': ('STFN', '')}"
-      ]
-     },
-     "execution_count": 9,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.phonetic_transform(\"Steven\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -895,124 +283,6 @@
    "cell_type": "code",
    "execution_count": 10,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>string1</th>\n",
-       "      <th>string2</th>\n",
-       "      <th>error_type</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>None</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Steven</td>\n",
-       "      <td>Spelling Variation</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephan</td>\n",
-       "      <td>Spelling Variation/Similar Name</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Steve</td>\n",
-       "      <td>Nickname/Alias</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stehpen</td>\n",
-       "      <td>Transposition</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>tSephen</td>\n",
-       "      <td>Transposition</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephne</td>\n",
-       "      <td>Transposition</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stphen</td>\n",
-       "      <td>Deletion</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stepheb</td>\n",
-       "      <td>Replacement</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephanie</td>\n",
-       "      <td>Different Name</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Richard</td>\n",
-       "      <td>Different Name</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "    string1    string2                       error_type\n",
-       "0   Stephen    Stephen                             None\n",
-       "1   Stephen     Steven               Spelling Variation\n",
-       "2   Stephen    Stephan  Spelling Variation/Similar Name\n",
-       "3   Stephen      Steve                   Nickname/Alias\n",
-       "4   Stephen    Stehpen                    Transposition\n",
-       "5   Stephen    tSephen                    Transposition\n",
-       "6   Stephen    Stephne                    Transposition\n",
-       "7   Stephen     Stphen                         Deletion\n",
-       "8   Stephen    Stepheb                      Replacement\n",
-       "9   Stephen  Stephanie                   Different Name\n",
-       "10  Stephen    Richard                   Different Name"
-      ]
-     },
-     "execution_count": 10,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "data = {\n",
     "    \"string1\": [\n",
@@ -1058,7 +328,8 @@
     "\n",
     "df = pd.DataFrame(data)\n",
     "df"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -1072,89 +343,10 @@
    "cell_type": "code",
    "execution_count": 11,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "\n",
-       "<style>\n",
-       "  #altair-viz-293552f8371c48efa5c2e4c92344fe33.vega-embed {\n",
-       "    width: 100%;\n",
-       "    display: flex;\n",
-       "  }\n",
-       "\n",
-       "  #altair-viz-293552f8371c48efa5c2e4c92344fe33.vega-embed details,\n",
-       "  #altair-viz-293552f8371c48efa5c2e4c92344fe33.vega-embed details summary {\n",
-       "    position: relative;\n",
-       "  }\n",
-       "</style>\n",
-       "<div id=\"altair-viz-293552f8371c48efa5c2e4c92344fe33\"></div>\n",
-       "<script type=\"text/javascript\">\n",
-       "  var VEGA_DEBUG = (typeof VEGA_DEBUG == \"undefined\") ? {} : VEGA_DEBUG;\n",
-       "  (function(spec, embedOpt){\n",
-       "    let outputDiv = document.currentScript.previousElementSibling;\n",
-       "    if (outputDiv.id !== \"altair-viz-293552f8371c48efa5c2e4c92344fe33\") {\n",
-       "      outputDiv = document.getElementById(\"altair-viz-293552f8371c48efa5c2e4c92344fe33\");\n",
-       "    }\n",
-       "    const paths = {\n",
-       "      \"vega\": \"https://cdn.jsdelivr.net/npm/vega@5?noext\",\n",
-       "      \"vega-lib\": \"https://cdn.jsdelivr.net/npm/vega-lib?noext\",\n",
-       "      \"vega-lite\": \"https://cdn.jsdelivr.net/npm/vega-lite@5.8.0?noext\",\n",
-       "      \"vega-embed\": \"https://cdn.jsdelivr.net/npm/vega-embed@6?noext\",\n",
-       "    };\n",
-       "\n",
-       "    function maybeLoadScript(lib, version) {\n",
-       "      var key = `${lib.replace(\"-\", \"\")}_version`;\n",
-       "      return (VEGA_DEBUG[key] == version) ?\n",
-       "        Promise.resolve(paths[lib]) :\n",
-       "        new Promise(function(resolve, reject) {\n",
-       "          var s = document.createElement('script');\n",
-       "          document.getElementsByTagName(\"head\")[0].appendChild(s);\n",
-       "          s.async = true;\n",
-       "          s.onload = () => {\n",
-       "            VEGA_DEBUG[key] = version;\n",
-       "            return resolve(paths[lib]);\n",
-       "          };\n",
-       "          s.onerror = () => reject(`Error loading script: ${paths[lib]}`);\n",
-       "          s.src = paths[lib];\n",
-       "        });\n",
-       "    }\n",
-       "\n",
-       "    function showError(err) {\n",
-       "      outputDiv.innerHTML = `<div class=\"error\" style=\"color:red;\">${err}</div>`;\n",
-       "      throw err;\n",
-       "    }\n",
-       "\n",
-       "    function displayChart(vegaEmbed) {\n",
-       "      vegaEmbed(outputDiv, spec, embedOpt)\n",
-       "        .catch(err => showError(`Javascript Error: ${err.message}<br>This usually means there's a typo in your chart specification. See the javascript console for the full traceback.`));\n",
-       "    }\n",
-       "\n",
-       "    if(typeof define === \"function\" && define.amd) {\n",
-       "      requirejs.config({paths});\n",
-       "      require([\"vega-embed\"], displayChart, err => showError(`Error loading script: ${err.message}`));\n",
-       "    } else {\n",
-       "      maybeLoadScript(\"vega\", \"5\")\n",
-       "        .then(() => maybeLoadScript(\"vega-lite\", \"5.8.0\"))\n",
-       "        .then(() => maybeLoadScript(\"vega-embed\", \"6\"))\n",
-       "        .catch(showError)\n",
-       "        .then(() => displayChart(vegaEmbed));\n",
-       "    }\n",
-       "  })({\"config\": {\"view\": {\"continuousWidth\": 300, \"continuousHeight\": 300}}, \"layer\": [{\"mark\": {\"type\": \"rect\"}, \"encoding\": {\"color\": {\"field\": \"match\", \"legend\": {\"labelExpr\": \"{'true': 'Match', 'false': 'Non-match'}[datum.label]\", \"labelFontWeight\": \"bold\", \"symbolSize\": 1000, \"title\": null}, \"scale\": {\"range\": [\"lightgray\", \"lightgreen\"]}, \"type\": \"nominal\"}, \"x\": {\"axis\": {\"labelAlign\": \"center\", \"labelAngle\": -10, \"labelFontWeight\": \"bold\", \"orient\": \"top\"}, \"field\": \"phonetic\", \"title\": null, \"type\": \"nominal\"}, \"y\": {\"axis\": {\"titleFontSize\": 14}, \"field\": \"strings_to_compare\", \"title\": \"String comparison\", \"type\": \"ordinal\"}}}, {\"mark\": {\"type\": \"text\", \"baseline\": \"bottom\"}, \"encoding\": {\"opacity\": {\"condition\": {\"test\": \"datum.match\", \"value\": 1}, \"value\": 0.5}, \"text\": {\"field\": \"transform\", \"type\": \"nominal\"}, \"x\": {\"axis\": {\"labelFontSize\": 12}, \"field\": \"phonetic\", \"type\": \"ordinal\"}, \"y\": {\"field\": \"strings_to_compare\", \"type\": \"ordinal\"}}}], \"data\": {\"name\": \"data-phonetic\"}, \"datasets\": {\"data-phonetic\": \"[{\\\"strings_to_compare\\\":\\\"Stephen, Stephen\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steven\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stephan\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steve\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STF\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stehpen\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STPN\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, tSephen\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"TSFN\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephne\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stphen\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stepheb\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFP\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephanie\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"STFN\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Richard\\\",\\\"phonetic\\\":\\\"metaphone\\\",\\\"transform\\\":[\\\"STFN\\\",\\\"RXRT\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephen\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steven\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stephan\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steve\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STF\\\",\\\"\\\"]],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stehpen\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STPN\\\",\\\"\\\"]],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, tSephen\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"TSFN\\\",\\\"\\\"]],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephne\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stphen\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stepheb\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFP\\\",\\\"\\\"]],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephanie\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"STFN\\\",\\\"\\\"]],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Richard\\\",\\\"phonetic\\\":\\\"dmetaphone\\\",\\\"transform\\\":[[\\\"STFN\\\",\\\"\\\"],[\\\"RXRT\\\",\\\"RKRT\\\"]],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephen\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S30105\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steven\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S30105\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Stephan\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S30105\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, Steve\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S3010\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stehpen\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S30105\\\"],\\\"match\\\":true},{\\\"strings_to_compare\\\":\\\"Stephen, tSephen\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"t50105\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephne\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S301050\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stphen\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S3105\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stepheb\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S30101\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Stephanie\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"S301050\\\"],\\\"match\\\":false},{\\\"strings_to_compare\\\":\\\"Stephen, Richard\\\",\\\"phonetic\\\":\\\"soundex\\\",\\\"transform\\\":[\\\"S30105\\\",\\\"R02063\\\"],\\\"match\\\":false}]\"}, \"height\": {\"step\": 40}, \"title\": {\"text\": \"Heatmap of Phonetic Matches\", \"anchor\": \"middle\", \"fontSize\": 16}, \"width\": {\"step\": 70}, \"$schema\": \"https://vega.github.io/schema/vega-lite/v5.9.3.json\"}, {\"mode\": \"vega-lite\"});\n",
-       "</script>"
-      ],
-      "text/plain": [
-       "alt.LayerChart(...)"
-      ]
-     },
-     "execution_count": 11,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.phonetic_match_chart(data, \"string1\", \"string2\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -1178,164 +370,10 @@
    "cell_type": "code",
    "execution_count": 12,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>string1</th>\n",
-       "      <th>string2</th>\n",
-       "      <th>soundex</th>\n",
-       "      <th>metaphone</th>\n",
-       "      <th>dmetaphone</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>[S30105, S30105]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Steven</td>\n",
-       "      <td>[S30105, S30105]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephan</td>\n",
-       "      <td>[S30105, S30105]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Steve</td>\n",
-       "      <td>[S30105, S3010]</td>\n",
-       "      <td>[STFN, STF]</td>\n",
-       "      <td>[(STFN, ), (STF, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stehpen</td>\n",
-       "      <td>[S30105, S30105]</td>\n",
-       "      <td>[STFN, STPN]</td>\n",
-       "      <td>[(STFN, ), (STPN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>tSephen</td>\n",
-       "      <td>[S30105, t50105]</td>\n",
-       "      <td>[STFN, TSFN]</td>\n",
-       "      <td>[(STFN, ), (TSFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephne</td>\n",
-       "      <td>[S30105, S301050]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stphen</td>\n",
-       "      <td>[S30105, S3105]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stepheb</td>\n",
-       "      <td>[S30105, S30101]</td>\n",
-       "      <td>[STFN, STFP]</td>\n",
-       "      <td>[(STFN, ), (STFP, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Stephanie</td>\n",
-       "      <td>[S30105, S301050]</td>\n",
-       "      <td>[STFN, STFN]</td>\n",
-       "      <td>[(STFN, ), (STFN, )]</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>Stephen</td>\n",
-       "      <td>Richard</td>\n",
-       "      <td>[S30105, R02063]</td>\n",
-       "      <td>[STFN, RXRT]</td>\n",
-       "      <td>[(STFN, ), (RXRT, RKRT)]</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "    string1    string2            soundex     metaphone  \\\n",
-       "0   Stephen    Stephen   [S30105, S30105]  [STFN, STFN]   \n",
-       "1   Stephen     Steven   [S30105, S30105]  [STFN, STFN]   \n",
-       "2   Stephen    Stephan   [S30105, S30105]  [STFN, STFN]   \n",
-       "3   Stephen      Steve    [S30105, S3010]   [STFN, STF]   \n",
-       "4   Stephen    Stehpen   [S30105, S30105]  [STFN, STPN]   \n",
-       "5   Stephen    tSephen   [S30105, t50105]  [STFN, TSFN]   \n",
-       "6   Stephen    Stephne  [S30105, S301050]  [STFN, STFN]   \n",
-       "7   Stephen     Stphen    [S30105, S3105]  [STFN, STFN]   \n",
-       "8   Stephen    Stepheb   [S30105, S30101]  [STFN, STFP]   \n",
-       "9   Stephen  Stephanie  [S30105, S301050]  [STFN, STFN]   \n",
-       "10  Stephen    Richard   [S30105, R02063]  [STFN, RXRT]   \n",
-       "\n",
-       "                  dmetaphone  \n",
-       "0       [(STFN, ), (STFN, )]  \n",
-       "1       [(STFN, ), (STFN, )]  \n",
-       "2       [(STFN, ), (STFN, )]  \n",
-       "3        [(STFN, ), (STF, )]  \n",
-       "4       [(STFN, ), (STPN, )]  \n",
-       "5       [(STFN, ), (TSFN, )]  \n",
-       "6       [(STFN, ), (STFN, )]  \n",
-       "7       [(STFN, ), (STFN, )]  \n",
-       "8       [(STFN, ), (STFP, )]  \n",
-       "9       [(STFN, ), (STFN, )]  \n",
-       "10  [(STFN, ), (RXRT, RKRT)]  "
-      ]
-     },
-     "execution_count": 12,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "ch.phonetic_transform_df(data, \"string1\", \"string2\")"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
@@ -1359,31 +397,6 @@
    "cell_type": "code",
    "execution_count": 13,
    "metadata": {},
-   "outputs": [
-    {
-     "data": {
-      "text/plain": [
-       "{'output_column_name': 'custom_first_name_first_name_dm',\n",
-       " 'comparison_levels': [{'sql_condition': '\"first_name_l\" IS NULL OR \"first_name_r\" IS NULL',\n",
-       "   'label_for_charts': 'Null',\n",
-       "   'is_null_level': True},\n",
-       "  {'sql_condition': '\"first_name_l\" = \"first_name_r\"',\n",
-       "   'label_for_charts': 'Exact match first_name'},\n",
-       "  {'sql_condition': '\"first_name_dm_l\" = \"first_name_dm_r\"',\n",
-       "   'label_for_charts': 'Exact match first_name_dm'},\n",
-       "  {'sql_condition': 'levenshtein(\"first_name_l\", \"first_name_r\") <= 2',\n",
-       "   'label_for_charts': 'Levenshtein <= 2'},\n",
-       "  {'sql_condition': 'jaro_winkler_similarity(\"first_name_l\", \"first_name_r\") >= 0.8',\n",
-       "   'label_for_charts': 'Jaro_winkler_similarity >= 0.8'},\n",
-       "  {'sql_condition': 'ELSE', 'label_for_charts': 'All other comparisons'}],\n",
-       " 'comparison_description': 'Exact match vs. Names with phonetic exact match vs. First_Name within levenshtein threshold 2 vs. First_Name within jaro_winkler threshold 0.8 vs. anything else'}"
-      ]
-     },
-     "execution_count": 13,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
    "source": [
     "import splink.duckdb.comparison_template_library as ctl\n",
     "\n",
@@ -1396,7 +409,8 @@
     ")\n",
     "\n",
     "first_name_comparison.as_dict()"
-   ]
+   ],
+   "outputs": []
   },
   {
    "attachments": {},
diff --git a/scripts/generate_dialect_comparison_docs.py b/scripts/generate_dialect_comparison_docs.py
index ebd9f8d616..fd485cbd56 100644
--- a/scripts/generate_dialect_comparison_docs.py
+++ b/scripts/generate_dialect_comparison_docs.py
@@ -4,8 +4,8 @@
 import inspect
 from pathlib import Path
 
-from splink.comparison import Comparison
-from splink.comparison_level import ComparisonLevel
+from splink.internals.comparison import Comparison
+from splink.internals.comparison_level import ComparisonLevel
 from splink.dialect_base import DialectBase
 
 # could always pick this up dynamically,
diff --git a/splink/comparison_library.py b/splink/comparison_library.py
index 28c7b17940..8be9600e12 100644
--- a/splink/comparison_library.py
+++ b/splink/comparison_library.py
@@ -2,10 +2,10 @@
 
 from typing import Any, Iterable, List, Optional, Union
 
-from . import comparison_level_library as cll
-from .comparison_creator import ComparisonCreator
-from .comparison_level_creator import ComparisonLevelCreator
-from .comparison_level_library import CustomLevel, DateMetricType
+from .internals import comparison_level_library as cll
+from splink.internals.comparison_creator import ComparisonCreator
+from splink.internals.comparison_level_creator import ComparisonLevelCreator
+from splink.internals.comparison_level_library import CustomLevel, DateMetricType
 from .misc import ensure_is_iterable
 
 
diff --git a/splink/comparison_template_library.py b/splink/comparison_template_library.py
index f7664f1214..ba7d74dd00 100644
--- a/splink/comparison_template_library.py
+++ b/splink/comparison_template_library.py
@@ -2,11 +2,11 @@
 
 from typing import List, Type, Union
 
-from . import comparison_level_library as cll
+from .internals import comparison_level_library as cll
 from splink.internals.column_expression import ColumnExpression
-from .comparison_creator import ComparisonCreator
-from .comparison_level_creator import ComparisonLevelCreator
-from .comparison_level_library import DateMetricType
+from splink.internals.comparison_creator import ComparisonCreator
+from splink.internals.comparison_level_creator import ComparisonLevelCreator
+from splink.internals.comparison_level_library import DateMetricType
 from .misc import ensure_is_iterable
 
 # alternatively we could stick an inheritance layer in these, just for typing:
diff --git a/splink/dialects.py b/splink/dialects.py
index 3167150943..0941657d16 100644
--- a/splink/dialects.py
+++ b/splink/dialects.py
@@ -4,7 +4,7 @@
 from typing import TYPE_CHECKING, Type, TypeVar, final
 
 if TYPE_CHECKING:
-    from .comparison_level_library import (
+    from splink.internals.comparison_level_library import (
         AbsoluteTimeDifferenceLevel,
         ArrayIntersectLevel,
     )
diff --git a/splink/em_training_session.py b/splink/em_training_session.py
index e3e58df69a..3edc8b03dd 100644
--- a/splink/em_training_session.py
+++ b/splink/em_training_session.py
@@ -10,8 +10,8 @@
     probability_two_random_records_match_iteration_chart,
 )
 
-from .comparison import Comparison
-from .comparison_level import ComparisonLevel
+from splink.internals.comparison import Comparison
+from splink.internals.comparison_level import ComparisonLevel
 from .comparison_vector_values import compute_comparison_vector_values_sql
 from .constants import LEVEL_NOT_OBSERVED_TEXT
 from .database_api import DatabaseAPISubClass
diff --git a/splink/expectation_maximisation.py b/splink/expectation_maximisation.py
index 22eef53447..a5d1b678f9 100644
--- a/splink/expectation_maximisation.py
+++ b/splink/expectation_maximisation.py
@@ -6,8 +6,8 @@
 
 import pandas as pd
 
-from .comparison import Comparison
-from .comparison_level import ComparisonLevel
+from splink.internals.comparison import Comparison
+from splink.internals.comparison_level import ComparisonLevel
 from .constants import LEVEL_NOT_OBSERVED_TEXT
 from .database_api import DatabaseAPISubClass
 from .input_column import InputColumn
diff --git a/splink/comparison.py b/splink/internals/comparison.py
similarity index 99%
rename from splink/comparison.py
rename to splink/internals/comparison.py
index 46a9d46b77..a6f5500cf5 100644
--- a/splink/comparison.py
+++ b/splink/internals/comparison.py
@@ -3,11 +3,11 @@
 from typing import TYPE_CHECKING, Any, List, Optional
 
 from .comparison_level import ComparisonLevel, _default_m_values, _default_u_values
-from .misc import dedupe_preserving_order, join_list_with_commas_final_and
+from splink.misc import dedupe_preserving_order, join_list_with_commas_final_and
 
 # https://stackoverflow.com/questions/39740632/python-type-hinting-without-cyclic-imports
 if TYPE_CHECKING:
-    from .settings import ColumnInfoSettings
+    from splink.settings import ColumnInfoSettings
 
 
 class Comparison:
diff --git a/splink/comparison_creator.py b/splink/internals/comparison_creator.py
similarity index 99%
rename from splink/comparison_creator.py
rename to splink/internals/comparison_creator.py
index 8930657332..2f8343248c 100644
--- a/splink/comparison_creator.py
+++ b/splink/internals/comparison_creator.py
@@ -6,7 +6,7 @@
 from splink.internals.column_expression import ColumnExpression
 from .comparison import Comparison
 from .comparison_level_creator import ComparisonLevelCreator
-from .exceptions import SplinkException
+from splink.exceptions import SplinkException
 
 
 class ComparisonCreator(ABC):
diff --git a/splink/comparison_helpers.py b/splink/internals/comparison_helpers.py
similarity index 100%
rename from splink/comparison_helpers.py
rename to splink/internals/comparison_helpers.py
diff --git a/splink/comparison_level.py b/splink/internals/comparison_level.py
similarity index 99%
rename from splink/comparison_level.py
rename to splink/internals/comparison_level.py
index c177731e6a..63cbd1890f 100644
--- a/splink/comparison_level.py
+++ b/splink/internals/comparison_level.py
@@ -13,16 +13,16 @@
 from sqlglot.optimizer.normalize import normalize
 from sqlglot.optimizer.simplify import simplify
 
-from .constants import LEVEL_NOT_OBSERVED_TEXT
-from .input_column import InputColumn
-from .misc import (
+from splink.constants import LEVEL_NOT_OBSERVED_TEXT
+from splink.input_column import InputColumn
+from splink.misc import (
     dedupe_preserving_order,
     interpolate,
     join_list_with_commas_final_and,
     match_weight_to_bayes_factor,
 )
-from .parse_sql import get_columns_used_from_sql
-from .sql_transform import sqlglot_tree_signature
+from splink.parse_sql import get_columns_used_from_sql
+from splink.sql_transform import sqlglot_tree_signature
 
 logger = logging.getLogger(__name__)
 
diff --git a/splink/comparison_level_composition.py b/splink/internals/comparison_level_composition.py
similarity index 98%
rename from splink/comparison_level_composition.py
rename to splink/internals/comparison_level_composition.py
index 54f5fbdeb8..e64088aef0 100644
--- a/splink/comparison_level_composition.py
+++ b/splink/internals/comparison_level_composition.py
@@ -6,7 +6,7 @@
 
 from .comparison_creator import ComparisonLevelCreator
 from .comparison_level import ComparisonLevel
-from .dialects import SplinkDialect
+from splink.dialects import SplinkDialect
 
 
 def _ensure_is_comparison_level_creator(
diff --git a/splink/comparison_level_creator.py b/splink/internals/comparison_level_creator.py
similarity index 99%
rename from splink/comparison_level_creator.py
rename to splink/internals/comparison_level_creator.py
index 5f6eee7302..6434c36e8e 100644
--- a/splink/comparison_level_creator.py
+++ b/splink/internals/comparison_level_creator.py
@@ -6,7 +6,7 @@
 
 from splink.internals.column_expression import ColumnExpression
 from .comparison_level import ComparisonLevel
-from .dialects import SplinkDialect
+from splink.dialects import SplinkDialect
 
 
 class ComparisonLevelCreator(ABC):
diff --git a/splink/comparison_level_library.py b/splink/internals/comparison_level_library.py
similarity index 99%
rename from splink/comparison_level_library.py
rename to splink/internals/comparison_level_library.py
index 72b0036111..ad0aa2a2b7 100644
--- a/splink/comparison_level_library.py
+++ b/splink/internals/comparison_level_library.py
@@ -11,8 +11,8 @@
 # import composition functions for export
 from .comparison_level_composition import And, Not, Or  # NOQA: F401
 from .comparison_level_creator import ComparisonLevelCreator
-from .comparison_level_sql import great_circle_distance_km_sql
-from .dialects import SplinkDialect
+from splink.comparison_level_sql import great_circle_distance_km_sql
+from splink.dialects import SplinkDialect
 
 # type aliases:
 T = TypeVar("T", bound=ComparisonLevelCreator)
diff --git a/splink/linker.py b/splink/linker.py
index 3f52f736ed..54713758ac 100644
--- a/splink/linker.py
+++ b/splink/linker.py
@@ -40,8 +40,8 @@
     render_splink_cluster_studio_html,
 )
 
-from .comparison import Comparison
-from .comparison_level import ComparisonLevel
+from splink.internals.comparison import Comparison
+from splink.internals.comparison_level import ComparisonLevel
 from .comparison_vector_distribution import (
     comparison_vector_distribution_sql,
 )
diff --git a/splink/m_u_records_to_parameters.py b/splink/m_u_records_to_parameters.py
index 8c7b6f42de..91376ebc2d 100644
--- a/splink/m_u_records_to_parameters.py
+++ b/splink/m_u_records_to_parameters.py
@@ -3,7 +3,7 @@
 import logging
 from typing import Any, Dict, List
 
-from .comparison_level import ComparisonLevel
+from splink.internals.comparison_level import ComparisonLevel
 from .constants import LEVEL_NOT_OBSERVED_TEXT
 
 logger = logging.getLogger(__name__)
diff --git a/splink/predict.py b/splink/predict.py
index cb65c2ee27..93150e0569 100644
--- a/splink/predict.py
+++ b/splink/predict.py
@@ -4,7 +4,7 @@
 import logging
 from typing import List
 
-from .comparison import Comparison
+from splink.internals.comparison import Comparison
 from .input_column import InputColumn
 from .misc import prob_to_bayes_factor, prob_to_match_weight
 from .settings import CoreModelSettings, Settings
diff --git a/splink/settings.py b/splink/settings.py
index 7c83b7a16a..f40114aa87 100644
--- a/splink/settings.py
+++ b/splink/settings.py
@@ -12,8 +12,8 @@
 )
 from splink.internals.charts import m_u_parameters_chart, match_weights_chart
 
-from .comparison import Comparison
-from .comparison_level import ComparisonLevel
+from splink.internals.comparison import Comparison
+from splink.internals.comparison_level import ComparisonLevel
 from .input_column import InputColumn
 from .misc import dedupe_preserving_order, prob_to_bayes_factor, prob_to_match_weight
 from .parse_sql import get_columns_used_from_sql
diff --git a/splink/settings_creator.py b/splink/settings_creator.py
index 407a793799..1c9c9559d1 100644
--- a/splink/settings_creator.py
+++ b/splink/settings_creator.py
@@ -9,7 +9,7 @@
 from splink.internals.blocking_rule_creator import BlockingRuleCreator
 from splink.internals.blocking_rule_creator_utils import to_blocking_rule_creator
 
-from .comparison_creator import ComparisonCreator
+from splink.internals.comparison_creator import ComparisonCreator
 from .comparison_library import CustomComparison
 from .settings import Settings
 
diff --git a/splink/settings_validation/log_invalid_columns.py b/splink/settings_validation/log_invalid_columns.py
index 4a8abe5aa8..b0d21ff3c4 100644
--- a/splink/settings_validation/log_invalid_columns.py
+++ b/splink/settings_validation/log_invalid_columns.py
@@ -7,7 +7,7 @@
 import sqlglot
 import sqlglot.expressions
 
-from ..comparison import Comparison
+from splink.internals.comparison import Comparison
 from ..parse_sql import parse_columns_in_sql
 from .settings_column_cleaner import (
     SettingsColumnCleaner,
diff --git a/splink/waterfall_chart.py b/splink/waterfall_chart.py
index 8747bf2f95..900c813bdb 100644
--- a/splink/waterfall_chart.py
+++ b/splink/waterfall_chart.py
@@ -4,7 +4,7 @@
 from copy import deepcopy
 from typing import Any, Dict
 
-from .comparison import Comparison
+from splink.internals.comparison import Comparison
 from .misc import prob_to_bayes_factor
 
 
diff --git a/tests/literal_utils.py b/tests/literal_utils.py
index f7095088ee..8c63b8c016 100644
--- a/tests/literal_utils.py
+++ b/tests/literal_utils.py
@@ -3,8 +3,8 @@
 
 import pytest
 
-from splink.comparison_creator import ComparisonCreator
-from splink.comparison_level_creator import ComparisonLevelCreator
+from splink.internals.comparison_creator import ComparisonCreator
+from splink.internals.comparison_level_creator import ComparisonLevelCreator
 
 
 class ComparisonLevelTestSpec:
diff --git a/tests/test_columns_selected.py b/tests/test_columns_selected.py
index 19bd2f111f..fe0efe7fa8 100644
--- a/tests/test_columns_selected.py
+++ b/tests/test_columns_selected.py
@@ -4,7 +4,7 @@
 
 import pandas as pd
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 from splink.duckdb.database_api import DuckDBAPI
 from splink.linker import Linker
 
diff --git a/tests/test_comparison_level.py b/tests/test_comparison_level.py
index 968f13d982..dd25797422 100644
--- a/tests/test_comparison_level.py
+++ b/tests/test_comparison_level.py
@@ -1,6 +1,6 @@
 from pytest import mark, raises
 
-from splink.comparison_level import ComparisonLevel
+from splink.internals.comparison_level import ComparisonLevel
 
 from .decorator import mark_with_dialects_excluding
 
diff --git a/tests/test_comparison_level_composition.py b/tests/test_comparison_level_composition.py
index 9cb694113f..9967d05341 100644
--- a/tests/test_comparison_level_composition.py
+++ b/tests/test_comparison_level_composition.py
@@ -1,7 +1,7 @@
 import pandas as pd
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 from splink.input_column import _get_dialect_quotes
 
 from .decorator import mark_with_dialects_excluding
diff --git a/tests/test_comparison_level_lib.py b/tests/test_comparison_level_lib.py
index 4ae459cb45..60c2a4c09e 100644
--- a/tests/test_comparison_level_lib.py
+++ b/tests/test_comparison_level_lib.py
@@ -1,6 +1,6 @@
 import pandas as pd
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 
 from .decorator import mark_with_dialects_excluding
 
diff --git a/tests/test_compound_comparison_levels.py b/tests/test_compound_comparison_levels.py
index 107a9b8a60..ee802575e4 100644
--- a/tests/test_compound_comparison_levels.py
+++ b/tests/test_compound_comparison_levels.py
@@ -1,6 +1,6 @@
 import pandas as pd
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 from splink.duckdb.database_api import DuckDBAPI
 from splink.linker import Linker
diff --git a/tests/test_date_levels_and_comparisons.py b/tests/test_date_levels_and_comparisons.py
index 6d6291219b..199bd2b1c0 100644
--- a/tests/test_date_levels_and_comparisons.py
+++ b/tests/test_date_levels_and_comparisons.py
@@ -2,7 +2,7 @@
 
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 import splink.comparison_template_library as ctl
 from splink.internals.column_expression import ColumnExpression
diff --git a/tests/test_disable_tf_exact_match_detection.py b/tests/test_disable_tf_exact_match_detection.py
index ddf7257f5f..5b4ab37f9c 100644
--- a/tests/test_disable_tf_exact_match_detection.py
+++ b/tests/test_disable_tf_exact_match_detection.py
@@ -1,7 +1,7 @@
 import pandas as pd
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 from splink import DuckDBAPI, Linker, SettingsCreator
 
 
diff --git a/tests/test_full_example_duckdb.py b/tests/test_full_example_duckdb.py
index 8eb6268951..afe2175a58 100644
--- a/tests/test_full_example_duckdb.py
+++ b/tests/test_full_example_duckdb.py
@@ -6,7 +6,7 @@
 import pyarrow.parquet as pq
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 from splink.blocking_analysis import count_comparisons_from_blocking_rule
 from splink.duckdb.database_api import DuckDBAPI
diff --git a/tests/test_full_example_spark.py b/tests/test_full_example_spark.py
index 08246a6516..9f52b481c7 100644
--- a/tests/test_full_example_spark.py
+++ b/tests/test_full_example_spark.py
@@ -5,7 +5,7 @@
 import pytest
 from pyspark.sql.types import StringType, StructField, StructType
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 from splink.exploratory import completeness_chart, profile_columns
 from splink.linker import Linker
diff --git a/tests/test_km_distance_level.py b/tests/test_km_distance_level.py
index 771f484a8f..862b70b234 100644
--- a/tests/test_km_distance_level.py
+++ b/tests/test_km_distance_level.py
@@ -1,6 +1,6 @@
 import pandas as pd
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 from splink.duckdb.database_api import DuckDBAPI
 from splink.linker import Linker
diff --git a/tests/test_new_comparison_levels.py b/tests/test_new_comparison_levels.py
index 2db086dc8e..4153256733 100644
--- a/tests/test_new_comparison_levels.py
+++ b/tests/test_new_comparison_levels.py
@@ -3,7 +3,7 @@
 import pandas as pd
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 import splink.comparison_template_library as ctl
 from splink.internals.column_expression import ColumnExpression
diff --git a/tests/test_new_db_api.py b/tests/test_new_db_api.py
index 5019b44a92..9c15eddb54 100644
--- a/tests/test_new_db_api.py
+++ b/tests/test_new_db_api.py
@@ -1,6 +1,6 @@
 import os
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 import splink.comparison_library as cl
 from splink import block_on
 from splink.blocking_analysis import (
diff --git a/tests/test_regex_param.py b/tests/test_regex_param.py
index 5d1594d28d..a9d02642b4 100644
--- a/tests/test_regex_param.py
+++ b/tests/test_regex_param.py
@@ -1,7 +1,7 @@
 import pandas as pd
 import pytest
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 from splink.internals.column_expression import ColumnExpression
 
 from .decorator import mark_with_dialects_excluding
diff --git a/tests/test_spark_udfs.py b/tests/test_spark_udfs.py
index 73b28a6964..06599c169d 100644
--- a/tests/test_spark_udfs.py
+++ b/tests/test_spark_udfs.py
@@ -1,6 +1,6 @@
 import pandas as pd
 
-import splink.comparison_level_library as cll
+import splink.internals.comparison_level_library as cll
 from splink.linker import Linker
 from tests.decorator import mark_with_dialects_including
 

	string1	string2	error_type
0	Richard	Richard	None
1	Richard	ichard	Deletion
2	Richard	Richar	Deletion
3	Richard	iRchard	Transposition
4	Richard	Richadr	Transposition
5	Richard	Rich	Shortening
6	Richard	Rick	Nickname/Alias
7	Richard	Ricky	Nickname/Alias
8	Richard	Dick	Nickname/Alias
9	Richard	Rico	Nickname/Alias
10	Richard	Rachael	Different Name
11	Richard	Stephen	Different Name
	string1	string2	levenshtein_distance	damerau_levenshtein_distance	jaro_similarity	jaro_winkler_similarity	jaccard_similarity
0	Richard	Richard	0	0	1.00	1.00	1.00
1	Richard	ichard	1	1	0.95	0.95	0.86
2	Richard	Richar	1	1	0.95	0.97	0.86
3	Richard	iRchard	2	1	0.95	0.95	1.00
4	Richard	Richadr	2	1	0.95	0.97	1.00
5	Richard	Rich	3	3	0.86	0.91	0.57
6	Richard	Rick	4	4	0.73	0.81	0.38
7	Richard	Ricky	4	4	0.68	0.68	0.33
8	Richard	Dick	5	5	0.60	0.60	0.22
9	Richard	Rico	4	4	0.73	0.81	0.38
10	Richard	Rachael	3	3	0.71	0.74	0.44
11	Richard	Stephen	7	7	0.43	0.43	0.08
	string1	string2	soundex	metaphone	dmetaphone
0	Stephen	Stephen	[S30105, S30105]	[STFN, STFN]	[(STFN, ), (STFN, )]
1	Stephen	Steven	[S30105, S30105]	[STFN, STFN]	[(STFN, ), (STFN, )]
2	Stephen	Stephan	[S30105, S30105]	[STFN, STFN]	[(STFN, ), (STFN, )]
3	Stephen	Steve	[S30105, S3010]	[STFN, STF]	[(STFN, ), (STF, )]
4	Stephen	Stehpen	[S30105, S30105]	[STFN, STPN]	[(STFN, ), (STPN, )]
5	Stephen	tSephen	[S30105, t50105]	[STFN, TSFN]	[(STFN, ), (TSFN, )]
6	Stephen	Stephne	[S30105, S301050]	[STFN, STFN]	[(STFN, ), (STFN, )]
7	Stephen	Stphen	[S30105, S3105]	[STFN, STFN]	[(STFN, ), (STFN, )]
8	Stephen	Stepheb	[S30105, S30101]	[STFN, STFP]	[(STFN, ), (STFP, )]
9	Stephen	Stephanie	[S30105, S301050]	[STFN, STFN]	[(STFN, ), (STFN, )]
10	Stephen	Richard	[S30105, R02063]	[STFN, RXRT]	[(STFN, ), (RXRT, RKRT)]