diff --git a/bdikit/visualization/scope_reducing.py b/bdikit/visualization/scope_reducing.py
index 64ba9765..0256d240 100644
--- a/bdikit/visualization/scope_reducing.py
+++ b/bdikit/visualization/scope_reducing.py
@@ -1,4 +1,5 @@
 import json
+import logging
 
 import altair as alt
 import numpy as np
@@ -11,6 +12,8 @@
 pn.extension("mathjax")
 pn.extension("vega")
 
+logger = logging.getLogger(__name__)
+
 
 class SRHeatMapManager:
     def __init__(self) -> None:
@@ -23,6 +26,9 @@ def __init__(self) -> None:
         self.rec_cols_gdc = None
         self.clusters = None
 
+        # Heatmap row(s) currently selected in the chart; None until a selection is made
+        self.selected_row = None
+
     def _load_json(self):
         with open(self.json_path) as f:
             data = json.load(f)
@@ -32,7 +38,8 @@ def _write_json(self, data):
         with open(self.json_path, "w") as f:
             json.dump(data, f)
 
-    def get_heatmap(self, recommendations):
+    def get_heatmap(self):
+        recommendations = self._load_json()
         rec_cols = set()
         rec_table = []
         rec_list = []
@@ -124,6 +131,48 @@ def _get_column_values(self, properties):
         else:
             return None
 
+    def _accept_match(self, col_name=None, match_name=None):
+        if self.selected_row is None:
+            return
+        col_name = self.selected_row["Column"].values[0]
+        match_name = self.selected_row["Recommendation"].values[0]
+        recommendations = self._load_json()
+        for idx, d in enumerate(recommendations):
+            candidate_name = d["Candidate column"]
+            if candidate_name != col_name:
+                continue
+            for top_k_name, top_k_score in d["Top k columns"]:
+                if top_k_name == match_name:
+                    recommendations[idx] = {
+                        "Candidate column": candidate_name,
+                        "Top k columns": [[top_k_name, top_k_score]],
+                    }
+                    self._write_json(recommendations)
+                    self.get_heatmap()
+                    return
+
+    def _reject_match(self):
+        if self.selected_row is None:
+            return
+        col_name = self.selected_row["Column"].values[0]
+        match_name = self.selected_row["Recommendation"].values[0]
+        recommendations = self._load_json()
+        for idx, d in enumerate(recommendations):
+            candidate_name = d["Candidate column"]
+            if candidate_name != col_name:
+                continue
+            new_top_k = []
+            for top_k_name, top_k_score in d["Top k columns"]:
+                if top_k_name != match_name:
+                    new_top_k.append([top_k_name, top_k_score])
+            recommendations[idx] = {
+                "Candidate column": candidate_name,
+                "Top k columns": new_top_k,
+            }
+            self._write_json(recommendations)
+            self.get_heatmap()
+            return
+
     def get_clusters(self):
         words = self.rec_table_df["Column"].to_numpy()
         lev_similarity = -1 * np.array(
@@ -136,19 +185,52 @@ def get_clusters(self):
         )
         affprop.fit(lev_similarity)
 
-        print(f"Number of clusters: {np.unique(affprop.labels_).shape[0]}\n")
+        logger.debug(f"Number of clusters: {np.unique(affprop.labels_).shape[0]}\n")
         cluster_names = []
         clusters = {}
         for cluster_id in np.unique(affprop.labels_):
             exemplar = words[affprop.cluster_centers_indices_[cluster_id]]
             cluster = np.unique(words[np.nonzero(affprop.labels_ == cluster_id)])
             cluster_str = ", ".join(cluster)
-            print(" - *%s:* %s" % (exemplar, cluster_str))
+            logger.debug(" - *%s:* %s" % (exemplar, cluster_str))
             cluster_names.append(exemplar)
             clusters[exemplar] = cluster
         self.clusters = clusters
 
-    def _plot_heatmap(self, clusters=[], subschemas=[], threshold=0.5):
+    def _plot_heatmap_base(self, heatmap_rec_list):
+        single = alt.selection_point(name="single")
+        base = (
+            alt.Chart(heatmap_rec_list)
+            .mark_rect(size=100)
+            .encode(
+                y=alt.X("Column:O", sort=None),
+                x=alt.X(f"Recommendation:O", sort=None),
+                color=alt.condition(single, "Value:Q", alt.value("lightgray")),
+                # color="Value:Q",
+                tooltip=[
+                    alt.Tooltip("Column", title="Column"),
+                    alt.Tooltip("Recommendation", title="Recommendation"),
+                    alt.Tooltip("Value", title="Value"),
+                ],
+            )
+            .add_params(single)
+        )
+        return pn.pane.Vega(base)
+
+    def _plot_selected_row(self, heatmap_rec_list, selection):
+        if not selection:
+            return "## No selection"
+        selected_row = heatmap_rec_list.iloc[selection]
+        column = selected_row["Column"].values[0]
+        rec = selected_row["Recommendation"].values[0]
+        # value = selected_row["Value"]
+        # self._accept_match(column, rec)
+        self.selected_row = selected_row
+        return pn.widgets.DataFrame(selected_row)
+
+    def _plot_pane(
+        self, clusters=[], subschemas=[], threshold=0.5, acc_click=0, rej_click=0
+    ):
         heatmap_rec_list = self.rec_list_df[self.rec_list_df["Value"] >= threshold]
         if clusters:
             clustered_cols = []
@@ -165,21 +247,15 @@ def _plot_heatmap(self, clusters=[], subschemas=[], threshold=0.5):
                 heatmap_rec_list["Recommendation"].isin(subschema_rec_cols)
             ]
 
-        base = (
-            alt.Chart(heatmap_rec_list)
-            .mark_rect()
-            .encode(
-                y=alt.X("Column:O", sort=None),
-                x=alt.X(f"Recommendation:O", sort=None),
-                color="Value:Q",
-                tooltip=[
-                    alt.Tooltip("Column", title="Column"),
-                    alt.Tooltip("Recommendation", title="Recommendation"),
-                    alt.Tooltip("Value", title="Value"),
-                ],
-            )
+        heatmap_pane = self._plot_heatmap_base(heatmap_rec_list)
+        return pn.Column(
+            heatmap_pane,
+            pn.bind(
+                self._plot_selected_row,
+                heatmap_rec_list,
+                heatmap_pane.selection.param.single,
+            ),
         )
-        return pn.pane.Vega(base)
 
     def plot_heatmap(self):
         select_cluster = pn.widgets.MultiChoice(
@@ -192,8 +268,26 @@ def plot_heatmap(self):
             name="Threshold", start=0, end=1.0, step=0.01, value=0.5, width=220
         )
 
+        acc_button = pn.widgets.Button(name="Accept Match", button_type="success")
+
+        rej_button = pn.widgets.Button(name="Decline Match", button_type="danger")
+
+        def on_click_accept_match(event):
+            self._accept_match()
+
+        def on_click_reject_match(event):
+            self._reject_match()
+
+        acc_button.on_click(on_click_accept_match)
+        rej_button.on_click(on_click_reject_match)
+
         heatmap_bind = pn.bind(
-            self._plot_heatmap, select_cluster, select_rec_groups, thresh_slider
+            self._plot_pane,
+            select_cluster,
+            select_rec_groups,
+            thresh_slider,
+            acc_button.param.clicks,
+            rej_button.param.clicks,
         )
 
         column_left = pn.Column(
@@ -201,6 +295,8 @@ def plot_heatmap(self):
             select_cluster,
             select_rec_groups,
             thresh_slider,
+            acc_button,
+            rej_button,
             styles=dict(background="WhiteSmoke"),
         )
 
diff --git a/examples/scope_reducing_heatmap.ipynb b/examples/scope_reducing_heatmap.ipynb
index 21e32e48..1a101b53 100644
--- a/examples/scope_reducing_heatmap.ipynb
+++ b/examples/scope_reducing_heatmap.ipynb
@@ -9,7 +9,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 1,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -23,7 +23,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 1,
+   "execution_count": 2,
    "metadata": {},
    "outputs": [
     {
@@ -70,12 +70,12 @@
      "data": {
       "application/vnd.holoviews_exec.v0+json": "",
       "text/html": [
-       "<div id='dc2cde33-9369-4db4-8408-847bf4c65ffc'>\n",
-       "  <div id=\"a793e9c8-e442-466e-aea8-1b0e6fb985a1\" data-root-id=\"dc2cde33-9369-4db4-8408-847bf4c65ffc\" style=\"display: contents;\"></div>\n",
+       "<div id='7de196b5-2c93-443a-a44b-281f976f845f'>\n",
+       "  <div id=\"a20ce3e3-5de6-4d64-aeac-21871f55dc02\" data-root-id=\"7de196b5-2c93-443a-a44b-281f976f845f\" style=\"display: contents;\"></div>\n",
        "</div>\n",
        "<script type=\"application/javascript\">(function(root) {\n",
-       "  var docs_json = {\"1c8a85bc-1a5f-4975-a57f-a684300f34ab\":{\"version\":\"3.4.1\",\"title\":\"Bokeh Application\",\"roots\":[{\"type\":\"object\",\"name\":\"panel.models.browser.BrowserInfo\",\"id\":\"dc2cde33-9369-4db4-8408-847bf4c65ffc\"},{\"type\":\"object\",\"name\":\"panel.models.comm_manager.CommManager\",\"id\":\"bc54cb9f-6ddb-48f4-a20b-e2578c219f81\",\"attributes\":{\"plot_id\":\"dc2cde33-9369-4db4-8408-847bf4c65ffc\",\"comm_id\":\"2e5b001ec7954f37b20ffe8e1669f853\",\"client_comm_id\":\"01588b68ba47480181e527c16a4fd717\"}}],\"defs\":[{\"type\":\"model\",\"name\":\"ReactiveHTML1\"},{\"type\":\"model\",\"name\":\"FlexBox1\",\"properties\":[{\"name\":\"align_content\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"align_items\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"flex_direction\",\"kind\":\"Any\",\"default\":\"row\"},{\"name\":\"flex_wrap\",\"kind\":\"Any\",\"default\":\"wrap\"},{\"name\":\"gap\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"justify_content\",\"kind\":\"Any\",\"default\":\"flex-start\"}]},{\"type\":\"model\",\"name\":\"FloatPanel1\",\"properties\":[{\"name\":\"config\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"contained\",\"kind\":\"Any\",\"default\":true},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"right-top\"},{\"name\":\"offsetx\",\"kind\":\"Any\",\"default\":null},{\"name\":\"offsety\",\"kind\":\"Any\",\"default\":null},{\"name\":\"theme\",\"kind\":\"Any\",\"default\":\"primary\"},{\"name\":\"status\",\"kind\":\"Any\",\"default\":\"normalized\"}]},{\"type\":\"model\",\"name\":\"GridStack1\",\"properties\":[{\"name\":\"mode\",\"kind\":\"Any\",\"default\":\"warn\"},{\"name\":\"ncols\",\"kind\":\"Any\",\"default\":null},{\"name\":\"nrows\",\"kind\":\"Any\",\"default\":null},{\"name\":\"allow_resize\",\"kind\":\"Any\",\"default\":true},{\"name\":\"allow_drag\",\"kind\":\"Any\",\"default\":true},{\"name\":\"state\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name
\":\"drag1\",\"properties\":[{\"name\":\"slider_width\",\"kind\":\"Any\",\"default\":5},{\"name\":\"slider_color\",\"kind\":\"Any\",\"default\":\"black\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":50}]},{\"type\":\"model\",\"name\":\"click1\",\"properties\":[{\"name\":\"terminal_output\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"debug_name\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"clears\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"FastWrapper1\",\"properties\":[{\"name\":\"object\",\"kind\":\"Any\",\"default\":null},{\"name\":\"style\",\"kind\":\"Any\",\"default\":null}]},{\"type\":\"model\",\"name\":\"NotificationAreaBase1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"NotificationArea1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"notifications\",\"kind\":\"Any\",\"default\":[]},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0},{\"name\":\"types\",\"kind\":\"Any\",\"default\":[{\"type\":\"map\",\"entries\":[[\"type\",\"warning\"],[\"background\",\"#ffc107\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas fa-exclamation-triangle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]},{\"type\":\"map\",\"entries\":[[\"type\",\"info\"],[\"background\",\"#007bff\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas 
fa-info-circle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]}]}]},{\"type\":\"model\",\"name\":\"Notification\",\"properties\":[{\"name\":\"background\",\"kind\":\"Any\",\"default\":null},{\"name\":\"duration\",\"kind\":\"Any\",\"default\":3000},{\"name\":\"icon\",\"kind\":\"Any\",\"default\":null},{\"name\":\"message\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"notification_type\",\"kind\":\"Any\",\"default\":null},{\"name\":\"_destroyed\",\"kind\":\"Any\",\"default\":false}]},{\"type\":\"model\",\"name\":\"TemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"BootstrapTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"TemplateEditor1\",\"properties\":[{\"name\":\"layout\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name\":\"MaterialTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"copy_to_clipboard1\",\"properties\":[{\"name\":\"fill\",\"kind\":\"Any\",\"default\":\"none\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":null}]}]}};\n",
-       "  var render_items = [{\"docid\":\"1c8a85bc-1a5f-4975-a57f-a684300f34ab\",\"roots\":{\"dc2cde33-9369-4db4-8408-847bf4c65ffc\":\"a793e9c8-e442-466e-aea8-1b0e6fb985a1\"},\"root_ids\":[\"dc2cde33-9369-4db4-8408-847bf4c65ffc\"]}];\n",
+       "  var docs_json = {\"101349fd-941c-4911-93ba-2e4a16018c96\":{\"version\":\"3.4.1\",\"title\":\"Bokeh Application\",\"roots\":[{\"type\":\"object\",\"name\":\"panel.models.browser.BrowserInfo\",\"id\":\"7de196b5-2c93-443a-a44b-281f976f845f\"},{\"type\":\"object\",\"name\":\"panel.models.comm_manager.CommManager\",\"id\":\"54c068ae-edf4-4534-b29e-a705a4b91d23\",\"attributes\":{\"plot_id\":\"7de196b5-2c93-443a-a44b-281f976f845f\",\"comm_id\":\"4c8a5367b12748279374ac61ae3d2f69\",\"client_comm_id\":\"0b05983903454cec8dcf8f0785b29cf3\"}}],\"defs\":[{\"type\":\"model\",\"name\":\"ReactiveHTML1\"},{\"type\":\"model\",\"name\":\"FlexBox1\",\"properties\":[{\"name\":\"align_content\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"align_items\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"flex_direction\",\"kind\":\"Any\",\"default\":\"row\"},{\"name\":\"flex_wrap\",\"kind\":\"Any\",\"default\":\"wrap\"},{\"name\":\"gap\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"justify_content\",\"kind\":\"Any\",\"default\":\"flex-start\"}]},{\"type\":\"model\",\"name\":\"FloatPanel1\",\"properties\":[{\"name\":\"config\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"contained\",\"kind\":\"Any\",\"default\":true},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"right-top\"},{\"name\":\"offsetx\",\"kind\":\"Any\",\"default\":null},{\"name\":\"offsety\",\"kind\":\"Any\",\"default\":null},{\"name\":\"theme\",\"kind\":\"Any\",\"default\":\"primary\"},{\"name\":\"status\",\"kind\":\"Any\",\"default\":\"normalized\"}]},{\"type\":\"model\",\"name\":\"GridStack1\",\"properties\":[{\"name\":\"mode\",\"kind\":\"Any\",\"default\":\"warn\"},{\"name\":\"ncols\",\"kind\":\"Any\",\"default\":null},{\"name\":\"nrows\",\"kind\":\"Any\",\"default\":null},{\"name\":\"allow_resize\",\"kind\":\"Any\",\"default\":true},{\"name\":\"allow_drag\",\"kind\":\"Any\",\"default\":true},{\"name\":\"state\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name
\":\"drag1\",\"properties\":[{\"name\":\"slider_width\",\"kind\":\"Any\",\"default\":5},{\"name\":\"slider_color\",\"kind\":\"Any\",\"default\":\"black\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":50}]},{\"type\":\"model\",\"name\":\"click1\",\"properties\":[{\"name\":\"terminal_output\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"debug_name\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"clears\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"FastWrapper1\",\"properties\":[{\"name\":\"object\",\"kind\":\"Any\",\"default\":null},{\"name\":\"style\",\"kind\":\"Any\",\"default\":null}]},{\"type\":\"model\",\"name\":\"NotificationAreaBase1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"NotificationArea1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"notifications\",\"kind\":\"Any\",\"default\":[]},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0},{\"name\":\"types\",\"kind\":\"Any\",\"default\":[{\"type\":\"map\",\"entries\":[[\"type\",\"warning\"],[\"background\",\"#ffc107\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas fa-exclamation-triangle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]},{\"type\":\"map\",\"entries\":[[\"type\",\"info\"],[\"background\",\"#007bff\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas 
fa-info-circle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]}]}]},{\"type\":\"model\",\"name\":\"Notification\",\"properties\":[{\"name\":\"background\",\"kind\":\"Any\",\"default\":null},{\"name\":\"duration\",\"kind\":\"Any\",\"default\":3000},{\"name\":\"icon\",\"kind\":\"Any\",\"default\":null},{\"name\":\"message\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"notification_type\",\"kind\":\"Any\",\"default\":null},{\"name\":\"_destroyed\",\"kind\":\"Any\",\"default\":false}]},{\"type\":\"model\",\"name\":\"TemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"BootstrapTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"TemplateEditor1\",\"properties\":[{\"name\":\"layout\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name\":\"MaterialTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"copy_to_clipboard1\",\"properties\":[{\"name\":\"fill\",\"kind\":\"Any\",\"default\":\"none\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":null}]}]}};\n",
+       "  var render_items = [{\"docid\":\"101349fd-941c-4911-93ba-2e4a16018c96\",\"roots\":{\"7de196b5-2c93-443a-a44b-281f976f845f\":\"a20ce3e3-5de6-4d64-aeac-21871f55dc02\"},\"root_ids\":[\"7de196b5-2c93-443a-a44b-281f976f845f\"]}];\n",
        "  var docs = Object.values(docs_json)\n",
        "  if (!docs) {\n",
        "    return\n",
@@ -139,7 +139,7 @@
      },
      "metadata": {
       "application/vnd.holoviews_exec.v0+json": {
-       "id": "dc2cde33-9369-4db4-8408-847bf4c65ffc"
+       "id": "7de196b5-2c93-443a-a44b-281f976f845f"
       }
      },
      "output_type": "display_data"
@@ -191,7 +191,7 @@
     "import json\n",
     "\n",
     "import panel as pn\n",
-    "from bdi import APIManager\n",
+    "from bdikit import APIManager\n",
     "\n",
     "pn.extension('mathjax')\n",
     "pn.extension('vega')"
@@ -199,7 +199,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 2,
+   "execution_count": 3,
    "metadata": {},
    "outputs": [
     {
@@ -209,7 +209,7 @@
       "Some weights of RobertaModel were not initialized from the model checkpoint at roberta-base and are newly initialized: ['roberta.pooler.dense.bias', 'roberta.pooler.dense.weight']\n",
       "You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.\n",
       "  0%|          | 0/17 [00:00<?, ?it/s]We strongly recommend passing in an `attention_mask` since your input_ids may be padded. See https://huggingface.co/docs/transformers/troubleshooting#incorrect-output-when-padding-tokens-arent-masked.\n",
-      "100%|██████████| 17/17 [00:00<00:00, 36.25it/s]\n"
+      "100%|██████████| 17/17 [00:00<00:00, 37.58it/s]\n"
      ]
     },
     {
@@ -223,7 +223,7 @@
      "name": "stderr",
      "output_type": "stream",
      "text": [
-      "100%|██████████| 734/734 [00:32<00:00, 22.92it/s]"
+      "100%|██████████| 734/734 [00:29<00:00, 24.67it/s]"
      ]
     },
     {
@@ -305,181 +305,31 @@
        "      <td>The yes/no/unknown indicator used to describe whether the tumor is confined to the organ where it originated and did not spread to a proximal or dista...</td>\n",
        "      <td>Yes, No, Unknown, Not Reported</td>\n",
        "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>race</td>\n",
-       "      <td>0.2936</td>\n",
-       "      <td>An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...</td>\n",
-       "      <td>american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>vascular_invasion_present</td>\n",
-       "      <td>0.291</td>\n",
-       "      <td>The yes/no indicator to ask if large vessel or venous invasion was detected by surgery or presence in a tumor specimen.</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>lymphatic_invasion_present</td>\n",
-       "      <td>0.287</td>\n",
-       "      <td>A yes/no indicator to ask if small or thin-walled vessel invasion is present, indicating lymphatic involvement</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>ethnicity</td>\n",
-       "      <td>0.2618</td>\n",
-       "      <td>An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...</td>\n",
-       "      <td>hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>perineural_invasion_present</td>\n",
-       "      <td>0.2578</td>\n",
-       "      <td>a yes/no indicator to ask if perineural invasion or infiltration of tumor or cancer is present.</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>lymph_node_involvement</td>\n",
-       "      <td>0.2574</td>\n",
-       "      <td>Indicator noting whether lymph nodes were involved.</td>\n",
-       "      <td>Indeterminant, Negative, Positive, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>ovarian_surface_involvement</td>\n",
-       "      <td>0.2449</td>\n",
-       "      <td>The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.</td>\n",
-       "      <td>Absent, Indeterminate, Present, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>is_legacy</td>\n",
-       "      <td>0.2389</td>\n",
-       "      <td>Indicates whether a project will appear in the Legacy Archive.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>satellite_nodule_present</td>\n",
-       "      <td>0.2356</td>\n",
-       "      <td>Indicator noting whether a nodule or tumor is located within a small distance (e.g. 2cm) of the primary tumor.</td>\n",
-       "      <td>Absent, Indeterminate, Present, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>releasable</td>\n",
-       "      <td>0.2233</td>\n",
-       "      <td>A project can only be released by the user when `releasable` is true.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>consent_type</td>\n",
-       "      <td>0.2182</td>\n",
-       "      <td>The text term used to describe the type of consent obtain from the subject for participation in the study.</td>\n",
-       "      <td>Consent by Death, Consent Exemption, Consent Waiver, Informed Consent</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>oct_embedded</td>\n",
-       "      <td>0.2094</td>\n",
-       "      <td>Indicator of whether or not the sample was embedded in Optimal Cutting Temperature (OCT) compound.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>id</td>\n",
-       "      <td>0.201</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>gender</td>\n",
-       "      <td>0.1994</td>\n",
-       "      <td>Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...</td>\n",
-       "      <td>female, male, unspecified, unknown, not reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>necrosis_present</td>\n",
-       "      <td>0.1991</td>\n",
-       "      <td>Indicator describing whether the presence of necrosis was confirmed.</td>\n",
-       "      <td>Yes, No, Not Reported</td>\n",
-       "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                             Candidate Similarity  \\\n",
-       "0                     country_of_birth     0.5726   \n",
-       "1   country_of_residence_at_enrollment     0.5151   \n",
-       "2                       variant_origin     0.3803   \n",
-       "3              zone_of_origin_prostate     0.3563   \n",
-       "4    tumor_confined_to_organ_of_origin     0.3322   \n",
-       "5                                 race     0.2936   \n",
-       "6            vascular_invasion_present      0.291   \n",
-       "7           lymphatic_invasion_present      0.287   \n",
-       "8                            ethnicity     0.2618   \n",
-       "9          perineural_invasion_present     0.2578   \n",
-       "10              lymph_node_involvement     0.2574   \n",
-       "11         ovarian_surface_involvement     0.2449   \n",
-       "12                           is_legacy     0.2389   \n",
-       "13            satellite_nodule_present     0.2356   \n",
-       "14                          releasable     0.2233   \n",
-       "15                        consent_type     0.2182   \n",
-       "16                        oct_embedded     0.2094   \n",
-       "17                                  id      0.201   \n",
-       "18                              gender     0.1994   \n",
-       "19                    necrosis_present     0.1991   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                                                                                       The name of the country in which the patient is born.   \n",
-       "1                                              The text term used to describe the patient's country of residence at the time they were enrolled in the study.   \n",
-       "2                                                                         The text term used to describe the biological origin of a specific genetic variant.   \n",
-       "3                                                                                              The location or position of the tumor by zone of the prostate.   \n",
-       "4   The yes/no/unknown indicator used to describe whether the tumor is confined to the organ where it originated and did not spread to a proximal or dista...   \n",
-       "5   An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...   \n",
-       "6                                     The yes/no indicator to ask if large vessel or venous invasion was detected by surgery or presence in a tumor specimen.   \n",
-       "7                                              A yes/no indicator to ask if small or thin-walled vessel invasion is present, indicating lymphatic involvement   \n",
-       "8   An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...   \n",
-       "9                                                             a yes/no indicator to ask if perineural invasion or infiltration of tumor or cancer is present.   \n",
-       "10                                                                                                        Indicator noting whether lymph nodes were involved.   \n",
-       "11                 The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.   \n",
-       "12                                                                                             Indicates whether a project will appear in the Legacy Archive.   \n",
-       "13                                             Indicator noting whether a nodule or tumor is located within a small distance (e.g. 2cm) of the primary tumor.   \n",
-       "14                                                                                      A project can only be released by the user when `releasable` is true.   \n",
-       "15                                                 The text term used to describe the type of consent obtain from the subject for participation in the study.   \n",
-       "16                                                         Indicator of whether or not the sample was embedded in Optimal Cutting Temperature (OCT) compound.   \n",
-       "17                                                                                                                                                              \n",
-       "18  Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...   \n",
-       "19                                                                                       Indicator describing whether the presence of necrosis was confirmed.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0   Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "1   Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "2                                                                                                                                  Germline, Somatic, Unknown  \n",
-       "3                                                                    Central zone, Overlapping/multiple zones, Peripheral zone, Transition zone, Unknown zone  \n",
-       "4                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "5   american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...  \n",
-       "6                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "7                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "8                                                          hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect  \n",
-       "9                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "10                                                                                                   Indeterminant, Negative, Positive, Unknown, Not Reported  \n",
-       "11                                                                                                      Absent, Indeterminate, Present, Unknown, Not Reported  \n",
-       "12                                                                                                                                                             \n",
-       "13                                                                                                      Absent, Indeterminate, Present, Unknown, Not Reported  \n",
-       "14                                                                                                                                                             \n",
-       "15                                                                                      Consent by Death, Consent Exemption, Consent Waiver, Informed Consent  \n",
-       "16                                                                                                                                                             \n",
-       "17                                                                                                                                                             \n",
-       "18                                                                                                           female, male, unspecified, unknown, not reported  \n",
-       "19                                                                                                                                      Yes, No, Not Reported  "
+       "                            Candidate Similarity  \\\n",
+       "0                    country_of_birth     0.5726   \n",
+       "1  country_of_residence_at_enrollment     0.5151   \n",
+       "2                      variant_origin     0.3803   \n",
+       "3             zone_of_origin_prostate     0.3563   \n",
+       "4   tumor_confined_to_organ_of_origin     0.3322   \n",
+       "\n",
+       "                                                                                                                                                 Description  \\\n",
+       "0                                                                                                      The name of the country in which the patient is born.   \n",
+       "1                                             The text term used to describe the patient's country of residence at the time they were enrolled in the study.   \n",
+       "2                                                                        The text term used to describe the biological origin of a specific genetic variant.   \n",
+       "3                                                                                             The location or position of the tumor by zone of the prostate.   \n",
+       "4  The yes/no/unknown indicator used to describe whether the tumor is confined to the organ where it originated and did not spread to a proximal or dista...   \n",
+       "\n",
+       "                                                                                                                                             Values (sample)  \n",
+       "0  Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
+       "1  Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
+       "2                                                                                                                                 Germline, Somatic, Unknown  \n",
+       "3                                                                   Central zone, Overlapping/multiple zones, Peripheral zone, Transition zone, Unknown zone  \n",
+       "4                                                                                                                             Yes, No, Unknown, Not Reported  "
       ]
      },
      "metadata": {},
@@ -556,181 +406,31 @@
        "      <td>Text term used to describe the classification of neuroblastic differentiation within neuroblastoma tumors, as defined by the International Neuroblasto...</td>\n",
        "      <td>Differentiating, Poorly Differentiated, Undifferentiated, Undifferentiated or Poorly Differentiated, Unknown, Not Reported</td>\n",
        "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>igcccg_stage</td>\n",
-       "      <td>0.4971</td>\n",
-       "      <td>The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...</td>\n",
-       "      <td>Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>who_cns_grade</td>\n",
-       "      <td>0.495</td>\n",
-       "      <td>The WHO (World Health Organization) grading classification of CNS tumors, which is based on histological characteristics such as cellularity, mitotic ...</td>\n",
-       "      <td>Grade I, Grade II, Grade III, Grade IV, Grade Not Assigned, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>risk_factor_method_of_diagnosis</td>\n",
-       "      <td>0.4742</td>\n",
-       "      <td>The clinical or laboratory procedure(s) used in the determination of a diagnosis described in this context as a risk factor.</td>\n",
-       "      <td>Biochemical Assessment, Both Clinical and Biochemical Assessments, Clinical Assessment, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>enneking_msts_grade</td>\n",
-       "      <td>0.4695</td>\n",
-       "      <td>The text term used to describe the surgical grade of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...</td>\n",
-       "      <td>High Grade (G2), Low Grade (G1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>adverse_event_grade</td>\n",
-       "      <td>0.4679</td>\n",
-       "      <td>Numeric representation of the intensity/severity of an unfavorable and unintended sign (including an abnormal laboratory finding), symptom, syndrome, ...</td>\n",
-       "      <td>Grade 1, Grade 2, Grade 3, Grade 4, Grade 5</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.4639</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>tumor_regression_grade</td>\n",
-       "      <td>0.4593</td>\n",
-       "      <td>A numeric value used to measure therapeutic response of the primary tumor and predict patient outcomes based on a three-point tumor regression grading...</td>\n",
-       "      <td>0, 1, 2, 3, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>extrathyroid_extension</td>\n",
-       "      <td>0.4561</td>\n",
-       "      <td>Text term to describe the degree to which the primary tumor has extra thyroid extension.</td>\n",
-       "      <td>None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>secondary_gleason_grade</td>\n",
-       "      <td>0.4304</td>\n",
-       "      <td>The text term used to describe the secondary Gleason score, which describes the pattern of cells making up the second largest area of the tumor. The p...</td>\n",
-       "      <td>Pattern 1, Pattern 2, Pattern 3, Pattern 4, Pattern 5</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>education_level</td>\n",
-       "      <td>0.4262</td>\n",
-       "      <td>The years of schooling completed in graded public, private, or parochial schools, and in colleges, universities, or professional schools.</td>\n",
-       "      <td>College Degree, High School Graduate or GED, Professional or Graduate Degree, Some High School or Less, Vocational College or Some College, Not Report...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>gleason_grade_tertiary</td>\n",
-       "      <td>0.422</td>\n",
-       "      <td>The text term used to describe the tertiary pattern as described by the Gleason Grading System.</td>\n",
-       "      <td>Pattern 4, Pattern 5</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>uicc_clinical_stage</td>\n",
-       "      <td>0.4165</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.4122</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>data_type</td>\n",
-       "      <td>0.4086</td>\n",
-       "      <td>Specific content type of the data file.</td>\n",
-       "      <td>Biospecimen Supplement</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>ensat_pathologic_stage</td>\n",
-       "      <td>0.401</td>\n",
-       "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
-       "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                          Candidate Similarity  \\\n",
-       "0       histologic_progression_type     0.6556   \n",
-       "1                     who_nte_grade     0.5967   \n",
-       "2                       tumor_grade     0.5817   \n",
-       "3              tumor_grade_category     0.5759   \n",
-       "4                        inpc_grade     0.5104   \n",
-       "5                      igcccg_stage     0.4971   \n",
-       "6                     who_cns_grade      0.495   \n",
-       "7   risk_factor_method_of_diagnosis     0.4742   \n",
-       "8               enneking_msts_grade     0.4695   \n",
-       "9               adverse_event_grade     0.4679   \n",
-       "10                       inss_stage     0.4639   \n",
-       "11           tumor_regression_grade     0.4593   \n",
-       "12           extrathyroid_extension     0.4561   \n",
-       "13          secondary_gleason_grade     0.4304   \n",
-       "14                  education_level     0.4262   \n",
-       "15           gleason_grade_tertiary      0.422   \n",
-       "16              uicc_clinical_stage     0.4165   \n",
-       "17              ajcc_clinical_stage     0.4122   \n",
-       "18                        data_type     0.4086   \n",
-       "19           ensat_pathologic_stage      0.401   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0      Text term to describe the disease progression as determined by microscopic review of cells and their surrounding extracellular environment in tissues.   \n",
-       "1                                                                        The WHO (World Health Organization) grading classification of Neuroendocrine Tumors.   \n",
-       "2                                        Numeric value to express the degree of abnormality of cancer cells, a measure of differentiation and aggressiveness.   \n",
-       "3                                              Describes the number of levels or 'tiers' in the system used to determine the degree of tumor differentiation.   \n",
-       "4   Text term used to describe the classification of neuroblastic differentiation within neuroblastoma tumors, as defined by the International Neuroblasto...   \n",
-       "5   The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...   \n",
-       "6   The WHO (World Health Organization) grading classification of CNS tumors, which is based on histological characteristics such as cellularity, mitotic ...   \n",
-       "7                                The clinical or laboratory procedure(s) used in the determination of a diagnosis described in this context as a risk factor.   \n",
-       "8   The text term used to describe the surgical grade of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...   \n",
-       "9   Numeric representation of the intensity/severity of an unfavorable and unintended sign (including an abnormal laboratory finding), symptom, syndrome, ...   \n",
-       "10         Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "11  A numeric value used to measure therapeutic response of the primary tumor and predict patient outcomes based on a three-point tumor regression grading...   \n",
-       "12                                                                   Text term to describe the degree to which the primary tumor has extra thyroid extension.   \n",
-       "13  The text term used to describe the secondary Gleason score, which describes the pattern of cells making up the second largest area of the tumor. The p...   \n",
-       "14                  The years of schooling completed in graded public, private, or parochial schools, and in colleges, universities, or professional schools.   \n",
-       "15                                                            The text term used to describe the tertiary pattern as described by the Gleason Grading System.   \n",
-       "16  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "17  Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "18                                                                                                                    Specific content type of the data file.   \n",
-       "19                                        An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                    Anaplastic, Poorly differentiated, Unknown, Not Reported  \n",
-       "1                                                                                                                       G1, G2, G3, GX, Unknown, Not Reported  \n",
-       "2                                                                    G1, G2, G3, G4, GB, GX, High Grade, Intermediate Grade, Low Grade, Unknown, Not Reported  \n",
-       "3                                                                                                                         Four Tier, Three Tier, Not Reported  \n",
-       "4                                  Differentiating, Poorly Differentiated, Undifferentiated, Undifferentiated or Poorly Differentiated, Unknown, Not Reported  \n",
-       "5                                                                               Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported  \n",
-       "6                                                                           Grade I, Grade II, Grade III, Grade IV, Grade Not Assigned, Unknown, Not Reported  \n",
-       "7                                                        Biochemical Assessment, Both Clinical and Biochemical Assessments, Clinical Assessment, Not Reported  \n",
-       "8                                                                                                      High Grade (G2), Low Grade (G1), Unknown, Not Reported  \n",
-       "9                                                                                                                 Grade 1, Grade 2, Grade 3, Grade 4, Grade 5  \n",
-       "10                                                                             Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "11                                                                                                                          0, 1, 2, 3, Unknown, Not Reported  \n",
-       "12                                                                                  None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown  \n",
-       "13                                                                                                      Pattern 1, Pattern 2, Pattern 3, Pattern 4, Pattern 5  \n",
-       "14  College Degree, High School Graduate or GED, Professional or Graduate Degree, Some High School or Less, Vocational College or Some College, Not Report...  \n",
-       "15                                                                                                                                       Pattern 4, Pattern 5  \n",
-       "16  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "17  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "18                                                                                                                                     Biospecimen Supplement  \n",
-       "19                                                                                                                     Stage I, Stage II, Stage III, Stage IV  "
+       "                     Candidate Similarity  \\\n",
+       "0  histologic_progression_type     0.6556   \n",
+       "1                who_nte_grade     0.5967   \n",
+       "2                  tumor_grade     0.5817   \n",
+       "3         tumor_grade_category     0.5759   \n",
+       "4                   inpc_grade     0.5104   \n",
+       "\n",
+       "                                                                                                                                                 Description  \\\n",
+       "0     Text term to describe the disease progression as determined by microscopic review of cells and their surrounding extracellular environment in tissues.   \n",
+       "1                                                                       The WHO (World Health Organization) grading classification of Neuroendocrine Tumors.   \n",
+       "2                                       Numeric value to express the degree of abnormality of cancer cells, a measure of differentiation and aggressiveness.   \n",
+       "3                                             Describes the number of levels or 'tiers' in the system used to determine the degree of tumor differentiation.   \n",
+       "4  Text term used to describe the classification of neuroblastic differentiation within neuroblastoma tumors, as defined by the International Neuroblasto...   \n",
+       "\n",
+       "                                                                                                              Values (sample)  \n",
+       "0                                                                    Anaplastic, Poorly differentiated, Unknown, Not Reported  \n",
+       "1                                                                                       G1, G2, G3, GX, Unknown, Not Reported  \n",
+       "2                                    G1, G2, G3, G4, GB, GX, High Grade, Intermediate Grade, Low Grade, Unknown, Not Reported  \n",
+       "3                                                                                         Four Tier, Three Tier, Not Reported  \n",
+       "4  Differentiating, Poorly Differentiated, Undifferentiated, Undifferentiated or Poorly Differentiated, Unknown, Not Reported  "
       ]
      },
      "metadata": {},
@@ -775,213 +475,63 @@
        "    <tr>\n",
        "      <th>0</th>\n",
        "      <td>history_of_tumor_type</td>\n",
-       "      <td>0.6765</td>\n",
+       "      <td>0.6757</td>\n",
        "      <td>Describes the type of the patient's prior diagnosed tumor.</td>\n",
        "      <td>Colorectal Cancer, Lower Grade Glioma, Phenochromocytoma or Paraganglioma</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>1</th>\n",
        "      <td>roots</td>\n",
-       "      <td>0.6562</td>\n",
+       "      <td>0.6592</td>\n",
        "      <td></td>\n",
        "      <td></td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>2</th>\n",
        "      <td>percent_sarcomatoid_features</td>\n",
-       "      <td>0.5852</td>\n",
+       "      <td>0.5766</td>\n",
        "      <td>Numeric value that represents the percentage of sarcomatoid features found in a specific tissue sample.</td>\n",
        "      <td></td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>3</th>\n",
        "      <td>additional_pathology_findings</td>\n",
-       "      <td>0.5574</td>\n",
+       "      <td>0.5398</td>\n",
        "      <td>A section header that includes additional pathologic findings.</td>\n",
        "      <td>Adenomyosis, Asbestos bodies, Atrophic endometrium, Atypical hyperplasia/Endometrial intraepithelial neoplasia (EIN), Autoimmune atrophic chronic gast...</td>\n",
        "    </tr>\n",
        "    <tr>\n",
        "      <th>4</th>\n",
        "      <td>relationship_primary_diagnosis</td>\n",
-       "      <td>0.5291</td>\n",
+       "      <td>0.5278</td>\n",
        "      <td>The text term used to describe the malignant diagnosis of the patient's relative with a history of cancer.</td>\n",
        "      <td>Adrenal Gland Cancer, Basal Cell Cancer, Bile Duct Cancer, Bladder Cancer, Blood Cancer, Bone Cancer, Brain Cancer, Breast Cancer, Cancer, Cervical Ca...</td>\n",
        "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>primary_diagnosis</td>\n",
-       "      <td>0.525</td>\n",
-       "      <td>Text term used to describe the patient's histologic diagnosis, as described by the World Health Organization's (WHO) International Classification of D...</td>\n",
-       "      <td>Abdominal desmoid, Abdominal fibromatosis, Achromic nevus, Acidophil adenocarcinoma, Acidophil adenoma, Acidophil carcinoma, Acinar adenocarcinoma, Ac...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>described_cases</td>\n",
-       "      <td>0.5208</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>supratentorial_localization</td>\n",
-       "      <td>0.5184</td>\n",
-       "      <td>Text term to specify the location of the supratentorial tumor.</td>\n",
-       "      <td>Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>dysplasia_type</td>\n",
-       "      <td>0.5049</td>\n",
-       "      <td>The type of dysplasia involved.</td>\n",
-       "      <td>Epithelial, Esophageal Columnar Dysplasia, Esophageal Mucosa Columnar Dysplasia, Keratinizing, Nonkeratinizing, Other, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>disease_type</td>\n",
-       "      <td>0.4981</td>\n",
-       "      <td>The text term used to describe the type of malignant disease, as categorized by the World Health Organization's (WHO) International Classification of ...</td>\n",
-       "      <td>Acinar Cell Neoplasms, Adenomas and Adenocarcinomas, Adnexal and Skin Appendage Neoplasms, Basal Cell Neoplasms, Blood Vessel Tumors, Chronic Myelopro...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>pathology_details</td>\n",
-       "      <td>0.4979</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>pathology_reports</td>\n",
-       "      <td>0.4894</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>ploidy</td>\n",
-       "      <td>0.4757</td>\n",
-       "      <td>Text term used to describe the number of sets of homologous chromosomes.</td>\n",
-       "      <td>Aneuploid, Diploid, Hyperdiploid, Hypodiploid, Near Diploid, Tetraploid, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>sample_type</td>\n",
-       "      <td>0.4659</td>\n",
-       "      <td>Text term to describe the source of a biospecimen used for a laboratory test.</td>\n",
-       "      <td>Additional - New Primary, Additional Metastatic, Benign Neoplasms, Blood Derived Cancer - Bone Marrow, Blood Derived Cancer - Bone Marrow, Post-treatm...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>sarcomatoid_percent</td>\n",
-       "      <td>0.4646</td>\n",
-       "      <td>Numeric value that represents the percentage of sarcomatoid features found in a specific tissue sample.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>aneuploidy</td>\n",
-       "      <td>0.4598</td>\n",
-       "      <td>A chromosomal abnormality in which there is an addition or loss of chromosomes within a set (e.g., 23 + 22 or 23 + 24).</td>\n",
-       "      <td>Monosomy, Trisomy</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>morphologic_architectural_pattern</td>\n",
-       "      <td>0.4553</td>\n",
-       "      <td>A specific morphologic or pathologic architectural pattern was discovered within the sample studied.</td>\n",
-       "      <td>Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>tumor_code</td>\n",
-       "      <td>0.4504</td>\n",
-       "      <td>Diagnostic tumor code of the tissue sample source.</td>\n",
-       "      <td>Acute Leukemia of Ambiguous Lineage (ALAL), Acute lymphoblastic leukemia (ALL), Acute myeloid leukemia (AML), Anal Cancer (all types), Cervical Cancer...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>tumor_ploidy</td>\n",
-       "      <td>0.4503</td>\n",
-       "      <td>Numeric value used to describe the number of sets of chromosomes in a cell or an organism. For example, haploid means one set and diploid means two se...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>imaging_findings</td>\n",
-       "      <td>0.4482</td>\n",
-       "      <td>Recorded findings noted during the review of a specific medical image.</td>\n",
-       "      <td>Carcinomatosis, Kidney Involvement, Liver Involvement, Lung Involvement, Normal, Retroperitoneal Lymph Node Involvement, Vena Cava Involvement/Thrombu...</td>\n",
-       "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                            Candidate Similarity  \\\n",
-       "0               history_of_tumor_type     0.6765   \n",
-       "1                               roots     0.6562   \n",
-       "2        percent_sarcomatoid_features     0.5852   \n",
-       "3       additional_pathology_findings     0.5574   \n",
-       "4      relationship_primary_diagnosis     0.5291   \n",
-       "5                   primary_diagnosis      0.525   \n",
-       "6                     described_cases     0.5208   \n",
-       "7         supratentorial_localization     0.5184   \n",
-       "8                      dysplasia_type     0.5049   \n",
-       "9                        disease_type     0.4981   \n",
-       "10                  pathology_details     0.4979   \n",
-       "11                  pathology_reports     0.4894   \n",
-       "12                             ploidy     0.4757   \n",
-       "13                        sample_type     0.4659   \n",
-       "14                sarcomatoid_percent     0.4646   \n",
-       "15                         aneuploidy     0.4598   \n",
-       "16  morphologic_architectural_pattern     0.4553   \n",
-       "17                         tumor_code     0.4504   \n",
-       "18                       tumor_ploidy     0.4503   \n",
-       "19                   imaging_findings     0.4482   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                                                                                  Describes the type of the patient's prior diagnosed tumor.   \n",
-       "1                                                                                                                                                               \n",
-       "2                                                     Numeric value that represents the percentage of sarcomatoid features found in a specific tissue sample.   \n",
-       "3                                                                                              A section header that includes additional pathologic findings.   \n",
-       "4                                                  The text term used to describe the malignant diagnosis of the patient's relative with a history of cancer.   \n",
-       "5   Text term used to describe the patient's histologic diagnosis, as described by the World Health Organization's (WHO) International Classification of D...   \n",
-       "6                                                                                                                                                               \n",
-       "7                                                                                              Text term to specify the location of the supratentorial tumor.   \n",
-       "8                                                                                                                             The type of dysplasia involved.   \n",
-       "9   The text term used to describe the type of malignant disease, as categorized by the World Health Organization's (WHO) International Classification of ...   \n",
-       "10                                                                                                                                                              \n",
-       "11                                                                                                                                                              \n",
-       "12                                                                                   Text term used to describe the number of sets of homologous chromosomes.   \n",
-       "13                                                                              Text term to describe the source of a biospecimen used for a laboratory test.   \n",
-       "14                                                    Numeric value that represents the percentage of sarcomatoid features found in a specific tissue sample.   \n",
-       "15                                    A chromosomal abnormality in which there is an addition or loss of chromosomes within a set (e.g., 23 + 22 or 23 + 24).   \n",
-       "16                                                       A specific morphologic or pathologic architectural pattern was discovered within the sample studied.   \n",
-       "17                                                                                                         Diagnostic tumor code of the tissue sample source.   \n",
-       "18  Numeric value used to describe the number of sets of chromosomes in a cell or an organism. For example, haploid means one set and diploid means two se...   \n",
-       "19                                                                                     Recorded findings noted during the review of a specific medical image.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                   Colorectal Cancer, Lower Grade Glioma, Phenochromocytoma or Paraganglioma  \n",
-       "1                                                                                                                                                              \n",
-       "2                                                                                                                                                              \n",
-       "3   Adenomyosis, Asbestos bodies, Atrophic endometrium, Atypical hyperplasia/Endometrial intraepithelial neoplasia (EIN), Autoimmune atrophic chronic gast...  \n",
-       "4   Adrenal Gland Cancer, Basal Cell Cancer, Bile Duct Cancer, Bladder Cancer, Blood Cancer, Bone Cancer, Brain Cancer, Breast Cancer, Cancer, Cervical Ca...  \n",
-       "5   Abdominal desmoid, Abdominal fibromatosis, Achromic nevus, Acidophil adenocarcinoma, Acidophil adenoma, Acidophil carcinoma, Acinar adenocarcinoma, Ac...  \n",
-       "6                                                                                                                                                              \n",
-       "7   Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...  \n",
-       "8                Epithelial, Esophageal Columnar Dysplasia, Esophageal Mucosa Columnar Dysplasia, Keratinizing, Nonkeratinizing, Other, Unknown, Not Reported  \n",
-       "9   Acinar Cell Neoplasms, Adenomas and Adenocarcinomas, Adnexal and Skin Appendage Neoplasms, Basal Cell Neoplasms, Blood Vessel Tumors, Chronic Myelopro...  \n",
-       "10                                                                                                                                                             \n",
-       "11                                                                                                                                                             \n",
-       "12                                                             Aneuploid, Diploid, Hyperdiploid, Hypodiploid, Near Diploid, Tetraploid, Unknown, Not Reported  \n",
-       "13  Additional - New Primary, Additional Metastatic, Benign Neoplasms, Blood Derived Cancer - Bone Marrow, Blood Derived Cancer - Bone Marrow, Post-treatm...  \n",
-       "14                                                                                                                                                             \n",
-       "15                                                                                                                                          Monosomy, Trisomy  \n",
-       "16                                                    Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular  \n",
-       "17  Acute Leukemia of Ambiguous Lineage (ALAL), Acute lymphoblastic leukemia (ALL), Acute myeloid leukemia (AML), Anal Cancer (all types), Cervical Cancer...  \n",
-       "18                                                                                                                                                             \n",
-       "19  Carcinomatosis, Kidney Involvement, Liver Involvement, Lung Involvement, Normal, Retroperitoneal Lymph Node Involvement, Vena Cava Involvement/Thrombu...  "
+       "                        Candidate Similarity  \\\n",
+       "0           history_of_tumor_type     0.6757   \n",
+       "1                           roots     0.6592   \n",
+       "2    percent_sarcomatoid_features     0.5766   \n",
+       "3   additional_pathology_findings     0.5398   \n",
+       "4  relationship_primary_diagnosis     0.5278   \n",
+       "\n",
+       "                                                                                                  Description  \\\n",
+       "0                                                  Describes the type of the patient's prior diagnosed tumor.   \n",
+       "1                                                                                                               \n",
+       "2     Numeric value that represents the percentage of sarcomatoid features found in a specific tissue sample.   \n",
+       "3                                              A section header that includes additional pathologic findings.   \n",
+       "4  The text term used to describe the malignant diagnosis of the patient's relative with a history of cancer.   \n",
+       "\n",
+       "                                                                                                                                             Values (sample)  \n",
+       "0                                                                                  Colorectal Cancer, Lower Grade Glioma, Phenochromocytoma or Paraganglioma  \n",
+       "1                                                                                                                                                             \n",
+       "2                                                                                                                                                             \n",
+       "3  Adenomyosis, Asbestos bodies, Atrophic endometrium, Atypical hyperplasia/Endometrial intraepithelial neoplasia (EIN), Autoimmune atrophic chronic gast...  \n",
+       "4  Adrenal Gland Cancer, Basal Cell Cancer, Bile Duct Cancer, Bladder Cancer, Blood Cancer, Bone Cancer, Brain Cancer, Breast Cancer, Cancer, Cervical Ca...  "
       ]
      },
      "metadata": {},
@@ -1058,181 +608,31 @@
        "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
        "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
        "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.6422</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>ensat_pathologic_stage</td>\n",
-       "      <td>0.598</td>\n",
-       "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.5898</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>iss_stage</td>\n",
-       "      <td>0.5569</td>\n",
-       "      <td>The multiple myeloma disease stage at diagnosis.</td>\n",
-       "      <td>I, II, III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>ann_arbor_clinical_stage</td>\n",
-       "      <td>0.5407</td>\n",
-       "      <td>The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>cog_liver_stage</td>\n",
-       "      <td>0.5137</td>\n",
-       "      <td>The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>submitted_aligned_reads_files</td>\n",
-       "      <td>0.484</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>uicc_clinical_t</td>\n",
-       "      <td>0.4762</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>T0, T1, T1a, T1a1, T1a2, T1b, T1b1, T1b2, T1c, T1mi, T2, T2a, T2a1, T2a2, T2b, T2c, T2d, T3, T3a, T3b, T3c, T3d, T4, T4a, T4b, T4c, T4d, T4e, Ta, Tis,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>extrathyroid_extension</td>\n",
-       "      <td>0.4724</td>\n",
-       "      <td>Text term to describe the degree to which the primary tumor has extra thyroid extension.</td>\n",
-       "      <td>None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>uicc_clinical_m</td>\n",
-       "      <td>0.4668</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>uicc_pathologic_t</td>\n",
-       "      <td>0.4645</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>T0, T1, T1a, T1a1, T1a2, T1b, T1b1, T1b2, T1c, T1c2, T1mi, T2, T2a, T2a1, T2a2, T2b, T2c, T2d, T3, T3a, T3b, T3c, T3d, T4, T4a, T4b, T4c, T4d, T4e, Ta...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>ann_arbor_pathologic_stage</td>\n",
-       "      <td>0.4581</td>\n",
-       "      <td>The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>cog_renal_stage</td>\n",
-       "      <td>0.4567</td>\n",
-       "      <td>The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>ajcc_clinical_m</td>\n",
-       "      <td>0.4522</td>\n",
-       "      <td>Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>best_overall_response</td>\n",
-       "      <td>0.4407</td>\n",
-       "      <td>The best improvement achieved throughout the entire course of protocol treatment.</td>\n",
-       "      <td>AJ-Adjuvant Therapy, CPD-Clinical Progression, CR-Complete Response, CRU-Complete Response Unconfirmed, DU-Disease Unchanged, IMR-Immunoresponse, IPD-...</td>\n",
-       "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                        Candidate Similarity  \\\n",
-       "0             uicc_clinical_stage     0.7404   \n",
-       "1             ajcc_clinical_stage     0.6784   \n",
-       "2           uicc_pathologic_stage     0.6754   \n",
-       "3                      figo_stage      0.673   \n",
-       "4           ajcc_pathologic_stage     0.6702   \n",
-       "5                      inss_stage     0.6422   \n",
-       "6          ensat_pathologic_stage      0.598   \n",
-       "7                   masaoka_stage     0.5898   \n",
-       "8                       iss_stage     0.5569   \n",
-       "9        ann_arbor_clinical_stage     0.5407   \n",
-       "10                cog_liver_stage     0.5137   \n",
-       "11  submitted_aligned_reads_files      0.484   \n",
-       "12                uicc_clinical_t     0.4762   \n",
-       "13         extrathyroid_extension     0.4724   \n",
-       "14                uicc_clinical_m     0.4668   \n",
-       "15              uicc_pathologic_t     0.4645   \n",
-       "16     ann_arbor_pathologic_stage     0.4581   \n",
-       "17                cog_renal_stage     0.4567   \n",
-       "18                ajcc_clinical_m     0.4522   \n",
-       "19          best_overall_response     0.4407   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "1   Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "2   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "3   The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
-       "4         The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "5          Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "6                                         An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "7   The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "8                                                                                                            The multiple myeloma disease stage at diagnosis.   \n",
-       "9                                The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "10  The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...   \n",
-       "11                                                                                                                                                              \n",
-       "12  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "13                                                                   Text term to describe the degree to which the primary tumor has extra thyroid extension.   \n",
-       "14  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "15  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "16                             The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "17                              The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).   \n",
-       "18              Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.   \n",
-       "19                                                                          The best improvement achieved throughout the entire course of protocol treatment.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "1   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "2   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "3   Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
-       "4   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "5                                                                              Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "6                                                                                                                      Stage I, Stage II, Stage III, Stage IV  \n",
-       "7                                                                                              Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "8                                                                                                                           I, II, III, Unknown, Not Reported  \n",
-       "9                                                                                               Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "10                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "11                                                                                                                                                             \n",
-       "12  T0, T1, T1a, T1a1, T1a2, T1b, T1b1, T1b2, T1c, T1mi, T2, T2a, T2a1, T2a2, T2b, T2c, T2d, T3, T3a, T3b, T3c, T3d, T4, T4a, T4b, T4c, T4d, T4e, Ta, Tis,...  \n",
-       "13                                                                                  None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown  \n",
-       "14                                                                                                 cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported  \n",
-       "15  T0, T1, T1a, T1a1, T1a2, T1b, T1b1, T1b2, T1c, T1c2, T1mi, T2, T2a, T2a1, T2a2, T2b, T2c, T2d, T3, T3a, T3b, T3c, T3d, T4, T4a, T4b, T4c, T4d, T4e, Ta...  \n",
-       "16                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "17                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "18                                                                         cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "19  AJ-Adjuvant Therapy, CPD-Clinical Progression, CR-Complete Response, CRU-Complete Response Unconfirmed, DU-Disease Unchanged, IMR-Immunoresponse, IPD-...  "
+       "               Candidate Similarity  \\\n",
+       "0    uicc_clinical_stage     0.7404   \n",
+       "1    ajcc_clinical_stage     0.6784   \n",
+       "2  uicc_pathologic_stage     0.6754   \n",
+       "3             figo_stage      0.673   \n",
+       "4  ajcc_pathologic_stage     0.6702   \n",
+       "\n",
+       "                                                                                                                                                 Description  \\\n",
+       "0  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
+       "1  Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
+       "2  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
+       "3  The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
+       "4        The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
+       "\n",
+       "                                                                                                                                             Values (sample)  \n",
+       "0  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
+       "1  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
+       "2  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
+       "3  Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
+       "4  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  "
       ]
      },
      "metadata": {},
@@ -1309,3216 +709,229 @@
        "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
        "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
        "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>ajcc_pathologic_stage</td>\n",
-       "      <td>0.539</td>\n",
-       "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.5372</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>uicc_pathologic_n</td>\n",
-       "      <td>0.5264</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N2mi, N3, N3a, N3b, N3c, N4, NX, U...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>enneking_msts_stage</td>\n",
-       "      <td>0.514</td>\n",
-       "      <td>Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...</td>\n",
-       "      <td>Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>uicc_clinical_n</td>\n",
-       "      <td>0.5137</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N3, N3a, N3b, N3c, N4, NX, Unknown...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>cog_liver_stage</td>\n",
-       "      <td>0.5106</td>\n",
-       "      <td>The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>iss_stage</td>\n",
-       "      <td>0.5046</td>\n",
-       "      <td>The multiple myeloma disease stage at diagnosis.</td>\n",
-       "      <td>I, II, III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>cog_renal_stage</td>\n",
-       "      <td>0.4964</td>\n",
-       "      <td>The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>inrg_stage</td>\n",
-       "      <td>0.4857</td>\n",
-       "      <td>The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).</td>\n",
-       "      <td>L1, L2, M, Ms, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.4721</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>ann_arbor_clinical_stage</td>\n",
-       "      <td>0.4645</td>\n",
-       "      <td>The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>ann_arbor_pathologic_stage</td>\n",
-       "      <td>0.4562</td>\n",
-       "      <td>The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>ajcc_clinical_n</td>\n",
-       "      <td>0.4517</td>\n",
-       "      <td>Extent of the regional lymph node involvement for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatm...</td>\n",
-       "      <td>N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N3, N3a, N3b, N3c, N4, NX, Unknown...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>ajcc_pathologic_n</td>\n",
-       "      <td>0.4483</td>\n",
-       "      <td>The codes that represent the stage of cancer based on the nodes present (N stage) according to criteria based on multiple editions of the AJCC's Cance...</td>\n",
-       "      <td>N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N2mi, N3, N3a, N3b, N3c, N4, NX, U...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>ishak_fibrosis_score</td>\n",
-       "      <td>0.3844</td>\n",
-       "      <td>The text term used to describe the classification of the histopathologic degree of liver damage.</td>\n",
-       "      <td>0 - No Fibrosis, 1,2 - Portal Fibrosis, 3,4 - Fibrous Septa, 5 - Nodular Formation and Incomplete Cirrhosis, 6 - Established Cirrhosis, Unknown, Not R...</td>\n",
-       "    </tr>\n",
        "  </tbody>\n",
        "</table>\n",
        "</div>"
       ],
       "text/plain": [
-       "                     Candidate Similarity  \\\n",
-       "0                   figo_stage     0.6017   \n",
-       "1          uicc_clinical_stage     0.5684   \n",
-       "2                   inss_stage     0.5541   \n",
-       "3        uicc_pathologic_stage     0.5505   \n",
-       "4       ensat_pathologic_stage     0.5397   \n",
-       "5        ajcc_pathologic_stage      0.539   \n",
-       "6          ajcc_clinical_stage     0.5372   \n",
-       "7            uicc_pathologic_n     0.5264   \n",
-       "8          enneking_msts_stage      0.514   \n",
-       "9              uicc_clinical_n     0.5137   \n",
-       "10             cog_liver_stage     0.5106   \n",
-       "11                   iss_stage     0.5046   \n",
-       "12             cog_renal_stage     0.4964   \n",
-       "13                  inrg_stage     0.4857   \n",
-       "14               masaoka_stage     0.4721   \n",
-       "15    ann_arbor_clinical_stage     0.4645   \n",
-       "16  ann_arbor_pathologic_stage     0.4562   \n",
-       "17             ajcc_clinical_n     0.4517   \n",
-       "18           ajcc_pathologic_n     0.4483   \n",
-       "19        ishak_fibrosis_score     0.3844   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
-       "1   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "2          Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "3   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "4                                         An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "5         The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "6   Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "7   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "8   Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...   \n",
-       "9   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "10  The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...   \n",
-       "11                                                                                                           The multiple myeloma disease stage at diagnosis.   \n",
-       "12                              The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).   \n",
-       "13         The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).   \n",
-       "14  The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "15                               The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "16                             The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "17  Extent of the regional lymph node involvement for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatm...   \n",
-       "18  The codes that represent the stage of cancer based on the nodes present (N stage) according to criteria based on multiple editions of the AJCC's Cance...   \n",
-       "19                                                           The text term used to describe the classification of the histopathologic degree of liver damage.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0   Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
-       "1   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "2                                                                              Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "3   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "4                                                                                                                      Stage I, Stage II, Stage III, Stage IV  \n",
-       "5   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "6   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "7   N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N2mi, N3, N3a, N3b, N3c, N4, NX, U...  \n",
-       "8                                                                                  Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported  \n",
-       "9   N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N3, N3a, N3b, N3c, N4, NX, Unknown...  \n",
-       "10                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "11                                                                                                                          I, II, III, Unknown, Not Reported  \n",
-       "12                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "13                                                                                                                       L1, L2, M, Ms, Unknown, Not Reported  \n",
-       "14                                                                                             Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "15                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "16                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "17  N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N3, N3a, N3b, N3c, N4, NX, Unknown...  \n",
-       "18  N0, N0 (i+), N0 (i-), N0 (mol+), N0 (mol-), N1, N1a, N1b, N1bI, N1bII, N1bIII, N1bIV, N1c, N1mi, N2, N2a, N2b, N2c, N2mi, N3, N3a, N3b, N3c, N4, NX, U...  \n",
-       "19  0 - No Fibrosis, 1,2 - Portal Fibrosis, 3,4 - Fibrous Septa, 5 - Nodular Formation and Incomplete Cirrhosis, 6 - Established Cirrhosis, Unknown, Not R...  "
+       "                Candidate Similarity  \\\n",
+       "0              figo_stage     0.6017   \n",
+       "1     uicc_clinical_stage     0.5684   \n",
+       "2              inss_stage     0.5541   \n",
+       "3   uicc_pathologic_stage     0.5505   \n",
+       "4  ensat_pathologic_stage     0.5397   \n",
+       "\n",
+       "                                                                                                                                                 Description  \\\n",
+       "0  The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
+       "1  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
+       "2         Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
+       "3  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
+       "4                                        An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
+       "\n",
+       "                                                                                                                                             Values (sample)  \n",
+       "0  Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
+       "1  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
+       "2                                                                             Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
+       "3  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
+       "4                                                                                                                     Stage I, Stage II, Stage III, Stage IV  "
       ]
      },
      "metadata": {},
      "output_type": "display_data"
+    }
+   ],
+   "source": [
+    "\n",
+    "manager = APIManager()\n",
+    "manager.load_dataset('./datasets/dou.csv')\n",
+    "reduced_scope = manager.reduce_scope()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "application/javascript": "(function(root) {\n  function now() {\n    return new Date();\n  }\n\n  var force = true;\n  var py_version = '3.4.1'.replace('rc', '-rc.').replace('.dev', '-dev.');\n  var reloading = false;\n  var Bokeh = root.Bokeh;\n\n  if (typeof (root._bokeh_timeout) === \"undefined\" || force) {\n    root._bokeh_timeout = Date.now() + 5000;\n    root._bokeh_failed_load = false;\n  }\n\n  function run_callbacks() {\n    try {\n      root._bokeh_onload_callbacks.forEach(function(callback) {\n        if (callback != null)\n          callback();\n      });\n    } finally {\n      delete root._bokeh_onload_callbacks;\n    }\n    console.debug(\"Bokeh: all callbacks have finished\");\n  }\n\n  function load_libs(css_urls, js_urls, js_modules, js_exports, callback) {\n    if (css_urls == null) css_urls = [];\n    if (js_urls == null) js_urls = [];\n    if (js_modules == null) js_modules = [];\n    if (js_exports == null) js_exports = {};\n\n    root._bokeh_onload_callbacks.push(callback);\n\n    if (root._bokeh_is_loading > 0) {\n      console.debug(\"Bokeh: BokehJS is being loaded, scheduling callback at\", now());\n      return null;\n    }\n    if (js_urls.length === 0 && js_modules.length === 0 && Object.keys(js_exports).length === 0) {\n      run_callbacks();\n      return null;\n    }\n    if (!reloading) {\n      console.debug(\"Bokeh: BokehJS not loaded, scheduling load and callback at\", now());\n    }\n\n    function on_load() {\n      root._bokeh_is_loading--;\n      if (root._bokeh_is_loading === 0) {\n        console.debug(\"Bokeh: all BokehJS libraries/stylesheets loaded\");\n        run_callbacks()\n      }\n    }\n    window._bokeh_on_load = on_load\n\n    function on_error() {\n      console.error(\"failed to load \" + url);\n    }\n\n    var skip = [];\n    if (window.requirejs) {\n      window.requirejs.config({'packages': {}, 'paths': {'mathjax': '//cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-AMS_HTML', 
'vega-embed': 'https://cdn.jsdelivr.net/npm/vega-embed@6/build/vega-embed.min', 'vega-lite': 'https://cdn.jsdelivr.net/npm/vega-lite@5/build/vega-lite.min', 'vega': 'https://cdn.jsdelivr.net/npm/vega@5/build/vega.min'}, 'shim': {'mathjax': {'exports': 'MathJax'}}});\n      require([\"mathjax\"], function() {\n\ton_load()\n      })\n      require([\"vega-embed\"], function(vegaEmbed) {\n\twindow.vegaEmbed = vegaEmbed\n\ton_load()\n      })\n      require([\"vega-lite\"], function(vl) {\n\twindow.vl = vl\n\ton_load()\n      })\n      require([\"vega\"], function(vega) {\n\twindow.vega = vega\n\ton_load()\n      })\n      root._bokeh_is_loading = css_urls.length + 4;\n    } else {\n      root._bokeh_is_loading = css_urls.length + js_urls.length + js_modules.length + Object.keys(js_exports).length;\n    }\n\n    var existing_stylesheets = []\n    var links = document.getElementsByTagName('link')\n    for (var i = 0; i < links.length; i++) {\n      var link = links[i]\n      if (link.href != null) {\n\texisting_stylesheets.push(link.href)\n      }\n    }\n    for (var i = 0; i < css_urls.length; i++) {\n      var url = css_urls[i];\n      if (existing_stylesheets.indexOf(url) !== -1) {\n\ton_load()\n\tcontinue;\n      }\n      const element = document.createElement(\"link\");\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.rel = \"stylesheet\";\n      element.type = \"text/css\";\n      element.href = url;\n      console.debug(\"Bokeh: injecting link tag for BokehJS stylesheet: \", url);\n      document.body.appendChild(element);\n    }    if (((window.MathJax !== undefined) && (!(window.MathJax instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-MML-AM_CHTML'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vega !== undefined) && (!(window.vega instanceof HTMLElement))) || 
window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega@5'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vegaLite !== undefined) && (!(window.vegaLite instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-lite@5'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vegaEmbed !== undefined) && (!(window.vegaEmbed instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-embed@6'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    var existing_scripts = []\n    var scripts = document.getElementsByTagName('script')\n    for (var i = 0; i < scripts.length; i++) {\n      var script = scripts[i]\n      if (script.src != null) {\n\texisting_scripts.push(script.src)\n      }\n    }\n    for (var i = 0; i < js_urls.length; i++) {\n      var url = js_urls[i];\n      if (skip.indexOf(url) !== -1 || existing_scripts.indexOf(url) !== -1) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.async = false;\n      element.src = url;\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      document.head.appendChild(element);\n    }\n    for (var i = 0; i < js_modules.length; i++) {\n      var url = js_modules[i];\n      if (skip.indexOf(url) !== -1 || existing_scripts.indexOf(url) !== -1) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.async = false;\n      element.src = url;\n    
  element.type = \"module\";\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      document.head.appendChild(element);\n    }\n    for (const name in js_exports) {\n      var url = js_exports[name];\n      if (skip.indexOf(url) >= 0 || root[name] != null) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onerror = on_error;\n      element.async = false;\n      element.type = \"module\";\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      element.textContent = `\n      import ${name} from \"${url}\"\n      window.${name} = ${name}\n      window._bokeh_on_load()\n      `\n      document.head.appendChild(element);\n    }\n    if (!js_urls.length && !js_modules.length) {\n      on_load()\n    }\n  };\n\n  function inject_raw_css(css) {\n    const element = document.createElement(\"style\");\n    element.appendChild(document.createTextNode(css));\n    document.body.appendChild(element);\n  }\n\n  var js_urls = [\"https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-MML-AM_CHTML\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega@5\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-lite@5\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-embed@6\", \"https://cdn.bokeh.org/bokeh/release/bokeh-3.4.1.min.js\", \"https://cdn.bokeh.org/bokeh/release/bokeh-gl-3.4.1.min.js\", \"https://cdn.bokeh.org/bokeh/release/bokeh-widgets-3.4.1.min.js\", \"https://cdn.bokeh.org/bokeh/release/bokeh-tables-3.4.1.min.js\", \"https://cdn.bokeh.org/bokeh/release/bokeh-mathjax-3.4.1.min.js\", \"https://cdn.holoviz.org/panel/1.4.2/dist/panel.min.js\"];\n  var js_modules = [];\n  var js_exports = {};\n  var css_urls = [];\n  var inline_js = [    function(Bokeh) {\n      Bokeh.set_log_level(\"info\");\n    },\nfunction(Bokeh) {} // ensure no trailing comma for IE\n 
 ];\n\n  function run_inline_js() {\n    if ((root.Bokeh !== undefined) || (force === true)) {\n      for (var i = 0; i < inline_js.length; i++) {\n\ttry {\n          inline_js[i].call(root, root.Bokeh);\n\t} catch(e) {\n\t  if (!reloading) {\n\t    throw e;\n\t  }\n\t}\n      }\n      // Cache old bokeh versions\n      if (Bokeh != undefined && !reloading) {\n\tvar NewBokeh = root.Bokeh;\n\tif (Bokeh.versions === undefined) {\n\t  Bokeh.versions = new Map();\n\t}\n\tif (NewBokeh.version !== Bokeh.version) {\n\t  Bokeh.versions.set(NewBokeh.version, NewBokeh)\n\t}\n\troot.Bokeh = Bokeh;\n      }} else if (Date.now() < root._bokeh_timeout) {\n      setTimeout(run_inline_js, 100);\n    } else if (!root._bokeh_failed_load) {\n      console.log(\"Bokeh: BokehJS failed to load within specified timeout.\");\n      root._bokeh_failed_load = true;\n    }\n    root._bokeh_is_initializing = false\n  }\n\n  function load_or_wait() {\n    // Implement a backoff loop that tries to ensure we do not load multiple\n    // versions of Bokeh and its dependencies at the same time.\n    // In recent versions we use the root._bokeh_is_initializing flag\n    // to determine whether there is an ongoing attempt to initialize\n    // bokeh, however for backward compatibility we also try to ensure\n    // that we do not start loading a newer (Panel>=1.0 and Bokeh>3) version\n    // before older versions are fully initialized.\n    if (root._bokeh_is_initializing && Date.now() > root._bokeh_timeout) {\n      root._bokeh_is_initializing = false;\n      root._bokeh_onload_callbacks = undefined;\n      console.log(\"Bokeh: BokehJS was loaded multiple times but one version failed to initialize.\");\n      load_or_wait();\n    } else if (root._bokeh_is_initializing || (typeof root._bokeh_is_initializing === \"undefined\" && root._bokeh_onload_callbacks !== undefined)) {\n      setTimeout(load_or_wait, 100);\n    } else {\n      root._bokeh_is_initializing = true\n      
root._bokeh_onload_callbacks = []\n      var bokeh_loaded = Bokeh != null && (Bokeh.version === py_version || (Bokeh.versions !== undefined && Bokeh.versions.has(py_version)));\n      if (!reloading && !bokeh_loaded) {\n\troot.Bokeh = undefined;\n      }\n      load_libs(css_urls, js_urls, js_modules, js_exports, function() {\n\tconsole.debug(\"Bokeh: BokehJS plotting callback run at\", now());\n\trun_inline_js();\n      });\n    }\n  }\n  // Give older versions of the autoload script a head-start to ensure\n  // they initialize before we start loading newer version.\n  setTimeout(load_or_wait, 100)\n}(window));",
+      "application/vnd.holoviews_load.v0+json": ""
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Clin_Stage_Dist_Mets-cM:\n"
-     ]
+     "data": {
+      "application/javascript": "\nif ((window.PyViz === undefined) || (window.PyViz instanceof HTMLElement)) {\n  window.PyViz = {comms: {}, comm_status:{}, kernels:{}, receivers: {}, plot_index: []}\n}\n\n\n    function JupyterCommManager() {\n    }\n\n    JupyterCommManager.prototype.register_target = function(plot_id, comm_id, msg_handler) {\n      if (window.comm_manager || ((window.Jupyter !== undefined) && (Jupyter.notebook.kernel != null))) {\n        var comm_manager = window.comm_manager || Jupyter.notebook.kernel.comm_manager;\n        comm_manager.register_target(comm_id, function(comm) {\n          comm.on_msg(msg_handler);\n        });\n      } else if ((plot_id in window.PyViz.kernels) && (window.PyViz.kernels[plot_id])) {\n        window.PyViz.kernels[plot_id].registerCommTarget(comm_id, function(comm) {\n          comm.onMsg = msg_handler;\n        });\n      } else if (typeof google != 'undefined' && google.colab.kernel != null) {\n        google.colab.kernel.comms.registerTarget(comm_id, (comm) => {\n          var messages = comm.messages[Symbol.asyncIterator]();\n          function processIteratorResult(result) {\n            var message = result.value;\n            console.log(message)\n            var content = {data: message.data, comm_id};\n            var buffers = []\n            for (var buffer of message.buffers || []) {\n              buffers.push(new DataView(buffer))\n            }\n            var metadata = message.metadata || {};\n            var msg = {content, buffers, metadata}\n            msg_handler(msg);\n            return messages.next().then(processIteratorResult);\n          }\n          return messages.next().then(processIteratorResult);\n        })\n      }\n    }\n\n    JupyterCommManager.prototype.get_client_comm = function(plot_id, comm_id, msg_handler) {\n      if (comm_id in window.PyViz.comms) {\n        return window.PyViz.comms[comm_id];\n      } else if (window.comm_manager || ((window.Jupyter !== undefined) 
&& (Jupyter.notebook.kernel != null))) {\n        var comm_manager = window.comm_manager || Jupyter.notebook.kernel.comm_manager;\n        var comm = comm_manager.new_comm(comm_id, {}, {}, {}, comm_id);\n        if (msg_handler) {\n          comm.on_msg(msg_handler);\n        }\n      } else if ((plot_id in window.PyViz.kernels) && (window.PyViz.kernels[plot_id])) {\n        var comm = window.PyViz.kernels[plot_id].connectToComm(comm_id);\n        comm.open();\n        if (msg_handler) {\n          comm.onMsg = msg_handler;\n        }\n      } else if (typeof google != 'undefined' && google.colab.kernel != null) {\n        var comm_promise = google.colab.kernel.comms.open(comm_id)\n        comm_promise.then((comm) => {\n          window.PyViz.comms[comm_id] = comm;\n          if (msg_handler) {\n            var messages = comm.messages[Symbol.asyncIterator]();\n            function processIteratorResult(result) {\n              var message = result.value;\n              var content = {data: message.data};\n              var metadata = message.metadata || {comm_id};\n              var msg = {content, metadata}\n              msg_handler(msg);\n              return messages.next().then(processIteratorResult);\n            }\n            return messages.next().then(processIteratorResult);\n          }\n        }) \n        var sendClosure = (data, metadata, buffers, disposeOnDone) => {\n          return comm_promise.then((comm) => {\n            comm.send(data, metadata, buffers, disposeOnDone);\n          });\n        };\n        var comm = {\n          send: sendClosure\n        };\n      }\n      window.PyViz.comms[comm_id] = comm;\n      return comm;\n    }\n    window.PyViz.comm_manager = new JupyterCommManager();\n    \n\n\nvar JS_MIME_TYPE = 'application/javascript';\nvar HTML_MIME_TYPE = 'text/html';\nvar EXEC_MIME_TYPE = 'application/vnd.holoviews_exec.v0+json';\nvar CLASS_NAME = 'output';\n\n/**\n * Render data to the DOM node\n */\nfunction render(props, 
node) {\n  var div = document.createElement(\"div\");\n  var script = document.createElement(\"script\");\n  node.appendChild(div);\n  node.appendChild(script);\n}\n\n/**\n * Handle when a new output is added\n */\nfunction handle_add_output(event, handle) {\n  var output_area = handle.output_area;\n  var output = handle.output;\n  if ((output.data == undefined) || (!output.data.hasOwnProperty(EXEC_MIME_TYPE))) {\n    return\n  }\n  var id = output.metadata[EXEC_MIME_TYPE][\"id\"];\n  var toinsert = output_area.element.find(\".\" + CLASS_NAME.split(' ')[0]);\n  if (id !== undefined) {\n    var nchildren = toinsert.length;\n    var html_node = toinsert[nchildren-1].children[0];\n    html_node.innerHTML = output.data[HTML_MIME_TYPE];\n    var scripts = [];\n    var nodelist = html_node.querySelectorAll(\"script\");\n    for (var i in nodelist) {\n      if (nodelist.hasOwnProperty(i)) {\n        scripts.push(nodelist[i])\n      }\n    }\n\n    scripts.forEach( function (oldScript) {\n      var newScript = document.createElement(\"script\");\n      var attrs = [];\n      var nodemap = oldScript.attributes;\n      for (var j in nodemap) {\n        if (nodemap.hasOwnProperty(j)) {\n          attrs.push(nodemap[j])\n        }\n      }\n      attrs.forEach(function(attr) { newScript.setAttribute(attr.name, attr.value) });\n      newScript.appendChild(document.createTextNode(oldScript.innerHTML));\n      oldScript.parentNode.replaceChild(newScript, oldScript);\n    });\n    if (JS_MIME_TYPE in output.data) {\n      toinsert[nchildren-1].children[1].textContent = output.data[JS_MIME_TYPE];\n    }\n    output_area._hv_plot_id = id;\n    if ((window.Bokeh !== undefined) && (id in Bokeh.index)) {\n      window.PyViz.plot_index[id] = Bokeh.index[id];\n    } else {\n      window.PyViz.plot_index[id] = null;\n    }\n  } else if (output.metadata[EXEC_MIME_TYPE][\"server_id\"] !== undefined) {\n    var bk_div = document.createElement(\"div\");\n    bk_div.innerHTML = 
output.data[HTML_MIME_TYPE];\n    var script_attrs = bk_div.children[0].attributes;\n    for (var i = 0; i < script_attrs.length; i++) {\n      toinsert[toinsert.length - 1].childNodes[1].setAttribute(script_attrs[i].name, script_attrs[i].value);\n    }\n    // store reference to server id on output_area\n    output_area._bokeh_server_id = output.metadata[EXEC_MIME_TYPE][\"server_id\"];\n  }\n}\n\n/**\n * Handle when an output is cleared or removed\n */\nfunction handle_clear_output(event, handle) {\n  var id = handle.cell.output_area._hv_plot_id;\n  var server_id = handle.cell.output_area._bokeh_server_id;\n  if (((id === undefined) || !(id in PyViz.plot_index)) && (server_id !== undefined)) { return; }\n  var comm = window.PyViz.comm_manager.get_client_comm(\"hv-extension-comm\", \"hv-extension-comm\", function () {});\n  if (server_id !== null) {\n    comm.send({event_type: 'server_delete', 'id': server_id});\n    return;\n  } else if (comm !== null) {\n    comm.send({event_type: 'delete', 'id': id});\n  }\n  delete PyViz.plot_index[id];\n  if ((window.Bokeh !== undefined) & (id in window.Bokeh.index)) {\n    var doc = window.Bokeh.index[id].model.document\n    doc.clear();\n    const i = window.Bokeh.documents.indexOf(doc);\n    if (i > -1) {\n      window.Bokeh.documents.splice(i, 1);\n    }\n  }\n}\n\n/**\n * Handle kernel restart event\n */\nfunction handle_kernel_cleanup(event, handle) {\n  delete PyViz.comms[\"hv-extension-comm\"];\n  window.PyViz.plot_index = {}\n}\n\n/**\n * Handle update_display_data messages\n */\nfunction handle_update_output(event, handle) {\n  handle_clear_output(event, {cell: {output_area: handle.output_area}})\n  handle_add_output(event, handle)\n}\n\nfunction register_renderer(events, OutputArea) {\n  function append_mime(data, metadata, element) {\n    // create a DOM node to render to\n    var toinsert = this.create_output_subarea(\n    metadata,\n    CLASS_NAME,\n    EXEC_MIME_TYPE\n    );\n    
this.keyboard_manager.register_events(toinsert);\n    // Render to node\n    var props = {data: data, metadata: metadata[EXEC_MIME_TYPE]};\n    render(props, toinsert[0]);\n    element.append(toinsert);\n    return toinsert\n  }\n\n  events.on('output_added.OutputArea', handle_add_output);\n  events.on('output_updated.OutputArea', handle_update_output);\n  events.on('clear_output.CodeCell', handle_clear_output);\n  events.on('delete.Cell', handle_clear_output);\n  events.on('kernel_ready.Kernel', handle_kernel_cleanup);\n\n  OutputArea.prototype.register_mime_type(EXEC_MIME_TYPE, append_mime, {\n    safe: true,\n    index: 0\n  });\n}\n\nif (window.Jupyter !== undefined) {\n  try {\n    var events = require('base/js/events');\n    var OutputArea = require('notebook/js/outputarea').OutputArea;\n    if (OutputArea.prototype.mime_types().indexOf(EXEC_MIME_TYPE) == -1) {\n      register_renderer(events, OutputArea);\n    }\n  } catch(err) {\n  }\n}\n",
+      "application/vnd.holoviews_load.v0+json": ""
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
      "data": {
       "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>uicc_clinical_m</td>\n",
-       "      <td>0.7455</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>ajcc_clinical_m</td>\n",
-       "      <td>0.7344</td>\n",
-       "      <td>Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>uicc_pathologic_m</td>\n",
-       "      <td>0.6992</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>ajcc_pathologic_m</td>\n",
-       "      <td>0.6908</td>\n",
-       "      <td>Code to represent the defined absence or presence of distant spread or metastases (M) to locations via vascular channels or lymphatics beyond the regi...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>ensat_clinical_m</td>\n",
-       "      <td>0.6473</td>\n",
-       "      <td>A clinical finding about one or more characteristics of adrenal cancer, following the rules of the ENSAT staging v7 classification system as they pert...</td>\n",
-       "      <td>M0, M1</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>inrg_stage</td>\n",
-       "      <td>0.6316</td>\n",
-       "      <td>The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).</td>\n",
-       "      <td>L1, L2, M, Ms, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>enneking_msts_metastasis</td>\n",
-       "      <td>0.6272</td>\n",
-       "      <td>Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...</td>\n",
-       "      <td>No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>uicc_clinical_stage</td>\n",
-       "      <td>0.6271</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.6038</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>ajcc_pathologic_stage</td>\n",
-       "      <td>0.6011</td>\n",
-       "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>fab_morphology_code</td>\n",
-       "      <td>0.5923</td>\n",
-       "      <td>A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...</td>\n",
-       "      <td>M0, M1, M2, M3, M4, M5, M6, M7, Not Classified</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>enneking_msts_stage</td>\n",
-       "      <td>0.5675</td>\n",
-       "      <td>Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...</td>\n",
-       "      <td>Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>igcccg_stage</td>\n",
-       "      <td>0.5585</td>\n",
-       "      <td>The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...</td>\n",
-       "      <td>Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.5399</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>data_type</td>\n",
-       "      <td>0.5275</td>\n",
-       "      <td>Specific content type of the data file.</td>\n",
-       "      <td>Biospecimen Supplement</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>figo_stage</td>\n",
-       "      <td>0.5225</td>\n",
-       "      <td>The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...</td>\n",
-       "      <td>Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.5117</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>metastasis_at_diagnosis</td>\n",
-       "      <td>0.5014</td>\n",
-       "      <td>The text term used to describe the extent of metastatic disease present at diagnosis.</td>\n",
-       "      <td>Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>uicc_pathologic_stage</td>\n",
-       "      <td>0.501</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>category</td>\n",
-       "      <td>0.4961</td>\n",
-       "      <td>Top level characterization of the annotation.</td>\n",
-       "      <td>Acceptable treatment for TCGA tumor, Administrative Compliance, Alternate sample pipeline, BCR Notification, Barcode incorrect, Biospecimen identity u...</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                   Candidate Similarity  \\\n",
-       "0            uicc_clinical_m     0.7455   \n",
-       "1            ajcc_clinical_m     0.7344   \n",
-       "2          uicc_pathologic_m     0.6992   \n",
-       "3          ajcc_pathologic_m     0.6908   \n",
-       "4           ensat_clinical_m     0.6473   \n",
-       "5                 inrg_stage     0.6316   \n",
-       "6   enneking_msts_metastasis     0.6272   \n",
-       "7        uicc_clinical_stage     0.6271   \n",
-       "8              masaoka_stage     0.6038   \n",
-       "9      ajcc_pathologic_stage     0.6011   \n",
-       "10       fab_morphology_code     0.5923   \n",
-       "11       enneking_msts_stage     0.5675   \n",
-       "12              igcccg_stage     0.5585   \n",
-       "13       ajcc_clinical_stage     0.5399   \n",
-       "14                 data_type     0.5275   \n",
-       "15                figo_stage     0.5225   \n",
-       "16                inss_stage     0.5117   \n",
-       "17   metastasis_at_diagnosis     0.5014   \n",
-       "18     uicc_pathologic_stage      0.501   \n",
-       "19                  category     0.4961   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "1               Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.   \n",
-       "2   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "3   Code to represent the defined absence or presence of distant spread or metastases (M) to locations via vascular channels or lymphatics beyond the regi...   \n",
-       "4   A clinical finding about one or more characteristics of adrenal cancer, following the rules of the ENSAT staging v7 classification system as they pert...   \n",
-       "5          The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).   \n",
-       "6   Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...   \n",
-       "7   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "8   The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "9         The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "10  A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...   \n",
-       "11  Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...   \n",
-       "12  The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...   \n",
-       "13  Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "14                                                                                                                    Specific content type of the data file.   \n",
-       "15  The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
-       "16         Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "17                                                                      The text term used to describe the extent of metastatic disease present at diagnosis.   \n",
-       "18  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "19                                                                                                              Top level characterization of the annotation.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                  cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported  \n",
-       "1                                                                          cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "2                                                                                         cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported  \n",
-       "3                                                                 cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "4                                                                                                                                                      M0, M1  \n",
-       "5                                                                                                                        L1, L2, M, Ms, Unknown, Not Reported  \n",
-       "6                                                                              No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported  \n",
-       "7   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "8                                                                                              Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "9   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "10                                                                                                             M0, M1, M2, M3, M4, M5, M6, M7, Not Classified  \n",
-       "11                                                                                 Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported  \n",
-       "12                                                                              Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported  \n",
-       "13  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "14                                                                                                                                     Biospecimen Supplement  \n",
-       "15  Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
-       "16                                                                             Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "17                                                             Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported  \n",
-       "18  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "19  Acceptable treatment for TCGA tumor, Administrative Compliance, Alternate sample pipeline, BCR Notification, Barcode incorrect, Biospecimen identity u...  "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Path_Stage_Dist_Mets-pM:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>uicc_clinical_m</td>\n",
-       "      <td>0.7371</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>ajcc_clinical_m</td>\n",
-       "      <td>0.7076</td>\n",
-       "      <td>Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>uicc_pathologic_m</td>\n",
-       "      <td>0.7069</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>ajcc_pathologic_m</td>\n",
-       "      <td>0.6833</td>\n",
-       "      <td>Code to represent the defined absence or presence of distant spread or metastases (M) to locations via vascular channels or lymphatics beyond the regi...</td>\n",
-       "      <td>cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>ensat_clinical_m</td>\n",
-       "      <td>0.6273</td>\n",
-       "      <td>A clinical finding about one or more characteristics of adrenal cancer, following the rules of the ENSAT staging v7 classification system as they pert...</td>\n",
-       "      <td>M0, M1</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>enneking_msts_metastasis</td>\n",
-       "      <td>0.6068</td>\n",
-       "      <td>Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...</td>\n",
-       "      <td>No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>metastasis_at_diagnosis</td>\n",
-       "      <td>0.5874</td>\n",
-       "      <td>The text term used to describe the extent of metastatic disease present at diagnosis.</td>\n",
-       "      <td>Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>classification_of_tumor</td>\n",
-       "      <td>0.5729</td>\n",
-       "      <td>Text that describes the kind of disease present in the tumor specimen as related to a specific timepoint.</td>\n",
-       "      <td>metastasis, Premalignant, primary, Prior primary, Progression, recurrence, Synchronous primary, other, Unknown, not reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.5534</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>uicc_clinical_stage</td>\n",
-       "      <td>0.551</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>ajcc_pathologic_stage</td>\n",
-       "      <td>0.5248</td>\n",
-       "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>inrg_stage</td>\n",
-       "      <td>0.5095</td>\n",
-       "      <td>The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).</td>\n",
-       "      <td>L1, L2, M, Ms, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>last_known_disease_status</td>\n",
-       "      <td>0.5005</td>\n",
-       "      <td>Text term that describes the last known state or condition of an individual's neoplasm.</td>\n",
-       "      <td>Biochemical evidence of disease without structural correlate, Distant met recurrence/progression, Loco-regional recurrence/progression, Tumor free, Un...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>notes</td>\n",
-       "      <td>0.4932</td>\n",
-       "      <td>Open entry for any further description or characterization of the data.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>treatment_outcome</td>\n",
-       "      <td>0.4907</td>\n",
-       "      <td>Text term that describes the patient's final outcome after the treatment was administered.</td>\n",
-       "      <td>Complete Response, Mixed Response, No Measurable Disease, No Response, Normalization of Tumor Markers, Partial Response, Persistent Disease, Progressi...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>fab_morphology_code</td>\n",
-       "      <td>0.4898</td>\n",
-       "      <td>A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...</td>\n",
-       "      <td>M0, M1, M2, M3, M4, M5, M6, M7, Not Classified</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>follow_ups</td>\n",
-       "      <td>0.4737</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.4692</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>ensat_pathologic_stage</td>\n",
-       "      <td>0.4533</td>\n",
-       "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.4528</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                    Candidate Similarity  \\\n",
-       "0             uicc_clinical_m     0.7371   \n",
-       "1             ajcc_clinical_m     0.7076   \n",
-       "2           uicc_pathologic_m     0.7069   \n",
-       "3           ajcc_pathologic_m     0.6833   \n",
-       "4            ensat_clinical_m     0.6273   \n",
-       "5    enneking_msts_metastasis     0.6068   \n",
-       "6     metastasis_at_diagnosis     0.5874   \n",
-       "7     classification_of_tumor     0.5729   \n",
-       "8               masaoka_stage     0.5534   \n",
-       "9         uicc_clinical_stage      0.551   \n",
-       "10      ajcc_pathologic_stage     0.5248   \n",
-       "11                 inrg_stage     0.5095   \n",
-       "12  last_known_disease_status     0.5005   \n",
-       "13                      notes     0.4932   \n",
-       "14          treatment_outcome     0.4907   \n",
-       "15        fab_morphology_code     0.4898   \n",
-       "16                 follow_ups     0.4737   \n",
-       "17                 inss_stage     0.4692   \n",
-       "18     ensat_pathologic_stage     0.4533   \n",
-       "19        ajcc_clinical_stage     0.4528   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "1               Extent of the distant metastasis for the cancer based on evidence obtained from clinical assessment parameters determined prior to treatment.   \n",
-       "2   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "3   Code to represent the defined absence or presence of distant spread or metastases (M) to locations via vascular channels or lymphatics beyond the regi...   \n",
-       "4   A clinical finding about one or more characteristics of adrenal cancer, following the rules of the ENSAT staging v7 classification system as they pert...   \n",
-       "5   Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...   \n",
-       "6                                                                       The text term used to describe the extent of metastatic disease present at diagnosis.   \n",
-       "7                                                   Text that describes the kind of disease present in the tumor specimen as related to a specific timepoint.   \n",
-       "8   The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "9   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "10        The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "11         The text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Risk Group (INRG).   \n",
-       "12                                                                    Text term that describes the last known state or condition of an individual's neoplasm.   \n",
-       "13                                                                                    Open entry for any further description or characterization of the data.   \n",
-       "14                                                                 Text term that describes the patient's final outcome after the treatment was administered.   \n",
-       "15  A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...   \n",
-       "16                                                                                                                                                              \n",
-       "17         Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "18                                        An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "19  Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                  cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported  \n",
-       "1                                                                          cM0 (i+), M0, M1, M1a, M1b, M1c, MX, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "2                                                                                         cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported  \n",
-       "3                                                                 cM0 (i+), M0, M1, M1a, M1b, M1c, M1d, M2, MX, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "4                                                                                                                                                      M0, M1  \n",
-       "5                                                                              No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported  \n",
-       "6                                                              Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported  \n",
-       "7        metastasis, Premalignant, primary, Prior primary, Progression, recurrence, Synchronous primary, other, Unknown, not reported, Not Allowed To Collect  \n",
-       "8                                                                                              Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "9   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "10  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "11                                                                                                                       L1, L2, M, Ms, Unknown, Not Reported  \n",
-       "12  Biochemical evidence of disease without structural correlate, Distant met recurrence/progression, Loco-regional recurrence/progression, Tumor free, Un...  \n",
-       "13                                                                                                                                                             \n",
-       "14  Complete Response, Mixed Response, No Measurable Disease, No Response, Normalization of Tumor Markers, Partial Response, Persistent Disease, Progressi...  \n",
-       "15                                                                                                             M0, M1, M2, M3, M4, M5, M6, M7, Not Classified  \n",
-       "16                                                                                                                                                             \n",
-       "17                                                                             Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "18                                                                                                                     Stage I, Stage II, Stage III, Stage IV  \n",
-       "19  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "tumor_Stage-Pathological:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>ensat_pathologic_stage</td>\n",
-       "      <td>0.8143</td>\n",
-       "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>ann_arbor_clinical_stage</td>\n",
-       "      <td>0.7086</td>\n",
-       "      <td>The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>cog_liver_stage</td>\n",
-       "      <td>0.7066</td>\n",
-       "      <td>The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.7037</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>iss_stage</td>\n",
-       "      <td>0.6993</td>\n",
-       "      <td>The multiple myeloma disease stage at diagnosis.</td>\n",
-       "      <td>I, II, III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>cog_renal_stage</td>\n",
-       "      <td>0.6944</td>\n",
-       "      <td>The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>ann_arbor_pathologic_stage</td>\n",
-       "      <td>0.6674</td>\n",
-       "      <td>The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.6129</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>uicc_clinical_stage</td>\n",
-       "      <td>0.5948</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.5887</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>figo_stage</td>\n",
-       "      <td>0.5563</td>\n",
-       "      <td>The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...</td>\n",
-       "      <td>Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>follow_ups</td>\n",
-       "      <td>0.532</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>ajcc_pathologic_stage</td>\n",
-       "      <td>0.5195</td>\n",
-       "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>extrathyroid_extension</td>\n",
-       "      <td>0.5184</td>\n",
-       "      <td>Text term to describe the degree to which the primary tumor has extra thyroid extension.</td>\n",
-       "      <td>None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>tumor_grade_category</td>\n",
-       "      <td>0.5121</td>\n",
-       "      <td>Describes the number of levels or 'tiers' in the system used to determine the degree of tumor differentiation.</td>\n",
-       "      <td>Four Tier, Three Tier, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>index_date</td>\n",
-       "      <td>0.4998</td>\n",
-       "      <td>The text term used to describe the reference or anchor date used when for date obfuscation, where a single date is obscurred by creating one or more d...</td>\n",
-       "      <td>Diagnosis, First Patient Visit, First Treatment, Initial Genomic Sequencing, Recurrence, Sample Procurement, Study Enrollment</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>uicc_pathologic_stage</td>\n",
-       "      <td>0.4993</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>timepoint_category</td>\n",
-       "      <td>0.4631</td>\n",
-       "      <td>Category describing a specific point in the time continuum, including those established relative to an event.</td>\n",
-       "      <td>Adjuvant Therapy, Adolescence, Adulthood, Childhood, Follow-up, Initial Diagnosis, Last Contact, Post Adjuvant Therapy, Post Hormone Therapy, Post Sec...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>notes</td>\n",
-       "      <td>0.4609</td>\n",
-       "      <td>Open entry for any further description or characterization of the data.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>programs</td>\n",
-       "      <td>0.4519</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                     Candidate Similarity  \\\n",
-       "0       ensat_pathologic_stage     0.8143   \n",
-       "1     ann_arbor_clinical_stage     0.7086   \n",
-       "2              cog_liver_stage     0.7066   \n",
-       "3                   inss_stage     0.7037   \n",
-       "4                    iss_stage     0.6993   \n",
-       "5              cog_renal_stage     0.6944   \n",
-       "6   ann_arbor_pathologic_stage     0.6674   \n",
-       "7                masaoka_stage     0.6129   \n",
-       "8          uicc_clinical_stage     0.5948   \n",
-       "9          ajcc_clinical_stage     0.5887   \n",
-       "10                  figo_stage     0.5563   \n",
-       "11                  follow_ups      0.532   \n",
-       "12       ajcc_pathologic_stage     0.5195   \n",
-       "13      extrathyroid_extension     0.5184   \n",
-       "14        tumor_grade_category     0.5121   \n",
-       "15                  index_date     0.4998   \n",
-       "16       uicc_pathologic_stage     0.4993   \n",
-       "17          timepoint_category     0.4631   \n",
-       "18                       notes     0.4609   \n",
-       "19                    programs     0.4519   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                         An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "1                                The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "2   The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...   \n",
-       "3          Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "4                                                                                                            The multiple myeloma disease stage at diagnosis.   \n",
-       "5                               The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).   \n",
-       "6                              The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "7   The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "8   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "9   Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "10  The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
-       "11                                                                                                                                                              \n",
-       "12        The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "13                                                                   Text term to describe the degree to which the primary tumor has extra thyroid extension.   \n",
-       "14                                             Describes the number of levels or 'tiers' in the system used to determine the degree of tumor differentiation.   \n",
-       "15  The text term used to describe the reference or anchor date used when for date obfuscation, where a single date is obscurred by creating one or more d...   \n",
-       "16  The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "17                                              Category describing a specific point in the time continuum, including those established relative to an event.   \n",
-       "18                                                                                    Open entry for any further description or characterization of the data.   \n",
-       "19                                                                                                                                                              \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                                      Stage I, Stage II, Stage III, Stage IV  \n",
-       "1                                                                                               Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "2                                                                                               Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "3                                                                              Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "4                                                                                                                           I, II, III, Unknown, Not Reported  \n",
-       "5                                                                                               Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "6                                                                                               Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "7                                                                                              Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "8   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "9   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "10  Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
-       "11                                                                                                                                                             \n",
-       "12  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "13                                                                                  None, Minimal (T3), Moderate/Advanced (T4a), Very Advanced (T4b), Unknown  \n",
-       "14                                                                                                                        Four Tier, Three Tier, Not Reported  \n",
-       "15                              Diagnosis, First Patient Visit, First Treatment, Initial Genomic Sequencing, Recurrence, Sample Procurement, Study Enrollment  \n",
-       "16  Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "17  Adjuvant Therapy, Adolescence, Adulthood, Childhood, Follow-up, Initial Diagnosis, Last Contact, Post Adjuvant Therapy, Post Hormone Therapy, Post Sec...  \n",
-       "18                                                                                                                                                             \n",
-       "19                                                                                                                                                             "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "FIGO_stage:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>figo_stage</td>\n",
-       "      <td>0.8703</td>\n",
-       "      <td>The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...</td>\n",
-       "      <td>Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>uicc_pathologic_stage</td>\n",
-       "      <td>0.7944</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>uicc_clinical_stage</td>\n",
-       "      <td>0.7682</td>\n",
-       "      <td>The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>ajcc_clinical_stage</td>\n",
-       "      <td>0.7659</td>\n",
-       "      <td>Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>ajcc_pathologic_stage</td>\n",
-       "      <td>0.7346</td>\n",
-       "      <td>The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.</td>\n",
-       "      <td>Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>enneking_msts_stage</td>\n",
-       "      <td>0.6924</td>\n",
-       "      <td>Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...</td>\n",
-       "      <td>Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>inss_stage</td>\n",
-       "      <td>0.6616</td>\n",
-       "      <td>Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).</td>\n",
-       "      <td>Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>irs_group</td>\n",
-       "      <td>0.6093</td>\n",
-       "      <td>Text term used to describe the classification of rhabdomyosarcoma tumors, as defined by the Intergroup Rhabdomyosarcoma Study (IRS).</td>\n",
-       "      <td>Group I, Group Ia, Group Ib, Group II, Group IIa, Group IIb, Group IIc, Group III, Group IIIa, Group IIIb, Group IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>igcccg_stage</td>\n",
-       "      <td>0.6079</td>\n",
-       "      <td>The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...</td>\n",
-       "      <td>Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>masaoka_stage</td>\n",
-       "      <td>0.586</td>\n",
-       "      <td>The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...</td>\n",
-       "      <td>Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>ensat_pathologic_stage</td>\n",
-       "      <td>0.5699</td>\n",
-       "      <td>An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>iss_stage</td>\n",
-       "      <td>0.556</td>\n",
-       "      <td>The multiple myeloma disease stage at diagnosis.</td>\n",
-       "      <td>I, II, III, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>cog_liver_stage</td>\n",
-       "      <td>0.5184</td>\n",
-       "      <td>The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>cog_renal_stage</td>\n",
-       "      <td>0.5126</td>\n",
-       "      <td>The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>ann_arbor_clinical_stage</td>\n",
-       "      <td>0.5084</td>\n",
-       "      <td>The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>enneking_msts_grade</td>\n",
-       "      <td>0.5004</td>\n",
-       "      <td>The text term used to describe the surgical grade of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...</td>\n",
-       "      <td>High Grade (G2), Low Grade (G1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>ann_arbor_pathologic_stage</td>\n",
-       "      <td>0.4989</td>\n",
-       "      <td>The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.</td>\n",
-       "      <td>Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>who_nte_grade</td>\n",
-       "      <td>0.4964</td>\n",
-       "      <td>The WHO (World Health Organization) grading classification of Neuroendocrine Tumors.</td>\n",
-       "      <td>G1, G2, G3, GX, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>who_cns_grade</td>\n",
-       "      <td>0.4911</td>\n",
-       "      <td>The WHO (World Health Organization) grading classification of CNS tumors, which is based on histological characteristics such as cellularity, mitotic ...</td>\n",
-       "      <td>Grade I, Grade II, Grade III, Grade IV, Grade Not Assigned, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>tumor_grade</td>\n",
-       "      <td>0.4821</td>\n",
-       "      <td>Numeric value to express the degree of abnormality of cancer cells, a measure of differentiation and aggressiveness.</td>\n",
-       "      <td>G1, G2, G3, G4, GB, GX, High Grade, Intermediate Grade, Low Grade, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                     Candidate Similarity  \\\n",
-       "0                   figo_stage     0.8703   \n",
-       "1        uicc_pathologic_stage     0.7944   \n",
-       "2          uicc_clinical_stage     0.7682   \n",
-       "3          ajcc_clinical_stage     0.7659   \n",
-       "4        ajcc_pathologic_stage     0.7346   \n",
-       "5          enneking_msts_stage     0.6924   \n",
-       "6                   inss_stage     0.6616   \n",
-       "7                    irs_group     0.6093   \n",
-       "8                 igcccg_stage     0.6079   \n",
-       "9                masaoka_stage      0.586   \n",
-       "10      ensat_pathologic_stage     0.5699   \n",
-       "11                   iss_stage      0.556   \n",
-       "12             cog_liver_stage     0.5184   \n",
-       "13             cog_renal_stage     0.5126   \n",
-       "14    ann_arbor_clinical_stage     0.5084   \n",
-       "15         enneking_msts_grade     0.5004   \n",
-       "16  ann_arbor_pathologic_stage     0.4989   \n",
-       "17               who_nte_grade     0.4964   \n",
-       "18               who_cns_grade     0.4911   \n",
-       "19                 tumor_grade     0.4821   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   The extent of a cervical or endometrial cancer within the body, especially whether the disease has spread from the original site to other parts of the...   \n",
-       "1   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "2   The UICC TNM Classification is an anatomically based system that records the primary and regional nodal extent of the tumor and the absence or presenc...   \n",
-       "3   Stage group determined from clinical information on the tumor (T), regional node (N) and metastases (M) and by grouping cases with similar prognosis f...   \n",
-       "4         The extent of a cancer, especially whether the disease has spread from the original site to other parts of the body based on AJCC staging criteria.   \n",
-       "5   Text term used to describe the stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tumor Society (...   \n",
-       "6          Text term used to describe the staging classification of neuroblastic tumors, as defined by the International Neuroblastoma Staging System (INSS).   \n",
-       "7                        Text term used to describe the classification of rhabdomyosarcoma tumors, as defined by the Intergroup Rhabdomyosarcoma Study (IRS).   \n",
-       "8   The text term used to describe the International Germ Cell Cancer Collaborative Group (IGCCCG), a grouping used to further classify metastatic testicu...   \n",
-       "9   The text term used to describe the Masaoka staging system, a classification that defines prognostic indicators for thymic malignancies and predicts tu...   \n",
-       "10                                        An adrenal cancer stage defined according to the European Network for the Study of Adrenal Tumors (ENSAT) criteria.   \n",
-       "11                                                                                                           The multiple myeloma disease stage at diagnosis.   \n",
-       "12  The text term used to describe the staging classification of liver tumors, as defined by the Children's Oncology Group (COG). This staging system spec...   \n",
-       "13                              The text term used to describe the staging classification of renal tumors, as defined by the Children's Oncology Group (COG).   \n",
-       "14                               The text term used to describe the clinical classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "15  The text term used to describe the surgical grade of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...   \n",
-       "16                             The text term used to describe the pathologic classification of lymphoma, as defined by the Ann Arbor Lymphoma Staging System.   \n",
-       "17                                                                       The WHO (World Health Organization) grading classification of Neuroendocrine Tumors.   \n",
-       "18  The WHO (World Health Organization) grading classification of CNS tumors, which is based on histological characteristics such as cellularity, mitotic ...   \n",
-       "19                                       Numeric value to express the degree of abnormality of cancer cells, a measure of differentiation and aggressiveness.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0   Stage 0, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage IC1, Stage IC2, Stage IC3, Stage II, Stage IIA, Stag...  \n",
-       "1   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "2   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "3   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IB Cervix, Stage IC, Stage II,...  \n",
-       "4   Stage 0, Stage 0a, Stage 0is, Stage I, Stage IA, Stage IA1, Stage IA2, Stage IA3, Stage IB, Stage IB1, Stage IB2, Stage IC, Stage II, Stage IIA, Stage...  \n",
-       "5                                                                                  Stage IA, Stage IB, Stage IIA, Stage IIB, Stage III, Unknown, Not Reported  \n",
-       "6                                                                              Stage 1, Stage 2A, Stage 2B, Stage 3, Stage 4, Stage 4S, Unknown, Not Reported  \n",
-       "7                  Group I, Group Ia, Group Ib, Group II, Group IIa, Group IIb, Group IIc, Group III, Group IIIa, Group IIIb, Group IV, Unknown, Not Reported  \n",
-       "8                                                                               Good Prognosis, Intermediate Prognosis, Poor Prognosis, Unknown, Not Reported  \n",
-       "9                                                                                              Stage I, Stage IIa, Stage IIb, Stage III, Stage IVa, Stage IVb  \n",
-       "10                                                                                                                     Stage I, Stage II, Stage III, Stage IV  \n",
-       "11                                                                                                                          I, II, III, Unknown, Not Reported  \n",
-       "12                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "13                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "14                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "15                                                                                                     High Grade (G2), Low Grade (G1), Unknown, Not Reported  \n",
-       "16                                                                                              Stage I, Stage II, Stage III, Stage IV, Unknown, Not Reported  \n",
-       "17                                                                                                                      G1, G2, G3, GX, Unknown, Not Reported  \n",
-       "18                                                                          Grade I, Grade II, Grade III, Grade IV, Grade Not Assigned, Unknown, Not Reported  \n",
-       "19                                                                   G1, G2, G3, G4, GB, GX, High Grade, Intermediate Grade, Low Grade, Unknown, Not Reported  "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "BMI:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>percent_stromal_cells</td>\n",
-       "      <td>0.818</td>\n",
-       "      <td>Numeric value to represent the percentage of reactive cells that are present in a malignant tumor sample or specimen but are not malignant such as fib...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>necrosis_percent</td>\n",
-       "      <td>0.8076</td>\n",
-       "      <td>A quantitative measurement of the percent of cells undergoing necrosis compared to the number of total cells present in a sample.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>spindle_cell_percent</td>\n",
-       "      <td>0.7874</td>\n",
-       "      <td>The percent of uveal melanoma arising from the choroid, ciliary body, or the iris and characterized by the presence of spindle-shaped melanocytes.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>recist_targeted_regions_sum</td>\n",
-       "      <td>0.7801</td>\n",
-       "      <td>Numeric value that represents the sum of baseline target lesions, as described by the Response Evaluation Criteria in Solid Tumours (RECIST) criteria.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>bmi</td>\n",
-       "      <td>0.7546</td>\n",
-       "      <td>A calculated numerical quantity that represents an individual's weight to height ratio.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>intermediate_dimension</td>\n",
-       "      <td>0.7513</td>\n",
-       "      <td>Intermediate dimension of the sample, in millimeters.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>longest_dimension</td>\n",
-       "      <td>0.721</td>\n",
-       "      <td>Numeric value that represents the longest dimension of the sample, measured in millimeters.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>average_base_quality</td>\n",
-       "      <td>0.6933</td>\n",
-       "      <td>Average base quality collected from samtools.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>percent_neutrophil_infiltration</td>\n",
-       "      <td>0.6483</td>\n",
-       "      <td>Numeric value to represent the percentage of infiltration by neutrophils in a tumor sample or specimen.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>fragment_standard_deviation_length</td>\n",
-       "      <td>0.612</td>\n",
-       "      <td>Standard deviation of the sequenced fragments length (e.g., as predicted by Agilent Bioanalyzer).</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>percent_lymphocyte_infiltration</td>\n",
-       "      <td>0.6003</td>\n",
-       "      <td>Numeric value to represent the percentage of infiltration by lymphocytes in a solid tissue sample or specimen.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>size_selection_range</td>\n",
-       "      <td>0.5116</td>\n",
-       "      <td>Range of size selection.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>percent_inflam_infiltration</td>\n",
-       "      <td>0.4583</td>\n",
-       "      <td>Numeric value to represent local response to cellular injury, marked by capillary dilatation, edema and leukocyte infiltration; clinically, inflammati...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>gross_tumor_weight</td>\n",
-       "      <td>0.458</td>\n",
-       "      <td>Numeric value used to describe the gross pathologic tumor weight, measured in grams.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>weight</td>\n",
-       "      <td>0.4574</td>\n",
-       "      <td>The weight of the patient measured in kilograms.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>imaging_suv_max</td>\n",
-       "      <td>0.456</td>\n",
-       "      <td>The standardized update value (SUV) is the effectively dimensionless measure of regional tracer uptake calculated as the activity concentration within...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>epithelioid_cell_percent</td>\n",
-       "      <td>0.4406</td>\n",
-       "      <td>The percent of uveal melanoma characterized by the presence of malignant large epithelioid melanocytes.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>initial_weight</td>\n",
-       "      <td>0.4184</td>\n",
-       "      <td>Numeric value that represents the initial weight of the sample, measured in milligrams.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>hpv_positive_type</td>\n",
-       "      <td>0.4162</td>\n",
-       "      <td>Text classification to represent the strain or type of human papillomavirus identified in an individual.</td>\n",
-       "      <td>16, 18, 26, 31, 33, 35, 39, 45, 51, 52, 53, 56, 58, 59, 63, 66, 68, 70, 73, 82, Other, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>age_at_index</td>\n",
-       "      <td>0.4117</td>\n",
-       "      <td>The patient's age (in years) on the reference or anchor date used during date obfuscation.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                             Candidate Similarity  \\\n",
-       "0                percent_stromal_cells      0.818   \n",
-       "1                     necrosis_percent     0.8076   \n",
-       "2                 spindle_cell_percent     0.7874   \n",
-       "3          recist_targeted_regions_sum     0.7801   \n",
-       "4                                  bmi     0.7546   \n",
-       "5               intermediate_dimension     0.7513   \n",
-       "6                    longest_dimension      0.721   \n",
-       "7                 average_base_quality     0.6933   \n",
-       "8      percent_neutrophil_infiltration     0.6483   \n",
-       "9   fragment_standard_deviation_length      0.612   \n",
-       "10     percent_lymphocyte_infiltration     0.6003   \n",
-       "11                size_selection_range     0.5116   \n",
-       "12         percent_inflam_infiltration     0.4583   \n",
-       "13                  gross_tumor_weight      0.458   \n",
-       "14                              weight     0.4574   \n",
-       "15                     imaging_suv_max      0.456   \n",
-       "16            epithelioid_cell_percent     0.4406   \n",
-       "17                      initial_weight     0.4184   \n",
-       "18                   hpv_positive_type     0.4162   \n",
-       "19                        age_at_index     0.4117   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   Numeric value to represent the percentage of reactive cells that are present in a malignant tumor sample or specimen but are not malignant such as fib...   \n",
-       "1                           A quantitative measurement of the percent of cells undergoing necrosis compared to the number of total cells present in a sample.   \n",
-       "2          The percent of uveal melanoma arising from the choroid, ciliary body, or the iris and characterized by the presence of spindle-shaped melanocytes.   \n",
-       "3      Numeric value that represents the sum of baseline target lesions, as described by the Response Evaluation Criteria in Solid Tumours (RECIST) criteria.   \n",
-       "4                                                                     A calculated numerical quantity that represents an individual's weight to height ratio.   \n",
-       "5                                                                                                       Intermediate dimension of the sample, in millimeters.   \n",
-       "6                                                                 Numeric value that represents the longest dimension of the sample, measured in millimeters.   \n",
-       "7                                                                                                               Average base quality collected from samtools.   \n",
-       "8                                                     Numeric value to represent the percentage of infiltration by neutrophils in a tumor sample or specimen.   \n",
-       "9                                                           Standard deviation of the sequenced fragments length (e.g., as predicted by Agilent Bioanalyzer).   \n",
-       "10                                             Numeric value to represent the percentage of infiltration by lymphocytes in a solid tissue sample or specimen.   \n",
-       "11                                                                                                                                   Range of size selection.   \n",
-       "12  Numeric value to represent local response to cellular injury, marked by capillary dilatation, edema and leukocyte infiltration; clinically, inflammati...   \n",
-       "13                                                                       Numeric value used to describe the gross pathologic tumor weight, measured in grams.   \n",
-       "14                                                                                                           The weight of the patient measured in kilograms.   \n",
-       "15  The standardized update value (SUV) is the effectively dimensionless measure of regional tracer uptake calculated as the activity concentration within...   \n",
-       "16                                                    The percent of uveal melanoma characterized by the presence of malignant large epithelioid melanocytes.   \n",
-       "17                                                                    Numeric value that represents the initial weight of the sample, measured in milligrams.   \n",
-       "18                                                   Text classification to represent the strain or type of human papillomavirus identified in an individual.   \n",
-       "19                                                                 The patient's age (in years) on the reference or anchor date used during date obfuscation.   \n",
-       "\n",
-       "                                                                                                 Values (sample)  \n",
-       "0                                                                                                                 \n",
-       "1                                                                                                                 \n",
-       "2                                                                                                                 \n",
-       "3                                                                                                                 \n",
-       "4                                                                                                                 \n",
-       "5                                                                                                                 \n",
-       "6                                                                                                                 \n",
-       "7                                                                                                                 \n",
-       "8                                                                                                                 \n",
-       "9                                                                                                                 \n",
-       "10                                                                                                                \n",
-       "11                                                                                                                \n",
-       "12                                                                                                                \n",
-       "13                                                                                                                \n",
-       "14                                                                                                                \n",
-       "15                                                                                                                \n",
-       "16                                                                                                                \n",
-       "17                                                                                                                \n",
-       "18  16, 18, 26, 31, 33, 35, 39, 45, 51, 52, 53, 56, 58, 59, 63, 66, 68, 70, 73, 82, Other, Unknown, Not Reported  \n",
-       "19                                                                                                                "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Age:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>age_at_onset</td>\n",
-       "      <td>0.8855</td>\n",
-       "      <td>Numeric value used to represent the age of the patient when exposure to a specific environmental factor began.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>age_at_last_exposure</td>\n",
-       "      <td>0.8768</td>\n",
-       "      <td>The study participant's age at the time they were last exposed.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>age_at_index</td>\n",
-       "      <td>0.8745</td>\n",
-       "      <td>The patient's age (in years) on the reference or anchor date used during date obfuscation.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>age_at_diagnosis</td>\n",
-       "      <td>0.8623</td>\n",
-       "      <td>Age at the time of diagnosis expressed in number of days since birth.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>relationship_age_at_diagnosis</td>\n",
-       "      <td>0.8441</td>\n",
-       "      <td>The age (in years) when the patient's relative was first diagnosed.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>undescended_testis_corrected_age</td>\n",
-       "      <td>0.7382</td>\n",
-       "      <td>The patient's age when their undescended testis was corrected.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>age_is_obfuscated</td>\n",
-       "      <td>0.644</td>\n",
-       "      <td>The age or other properties related to the patient's age have been modified for compliance reasons. The actual age may differ from what was reported i...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>pack_years_smoked</td>\n",
-       "      <td>0.6387</td>\n",
-       "      <td>Numeric computed value to represent lifetime tobacco exposure defined as number of cigarettes smoked per day x number of years smoked divided by 20.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>menopause_status</td>\n",
-       "      <td>0.6157</td>\n",
-       "      <td>Text term used to describe the patient's menopause status.</td>\n",
-       "      <td>Perimenopausal, Postmenopausal, Premenopausal, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>days_to_birth</td>\n",
-       "      <td>0.596</td>\n",
-       "      <td>Number of days between the date used for index and the date from a person's date of birth represented as a calculated negative number of days.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>epithelioid_cell_percent</td>\n",
-       "      <td>0.5842</td>\n",
-       "      <td>The percent of uveal melanoma characterized by the presence of malignant large epithelioid melanocytes.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>tobacco_smoking_onset_year</td>\n",
-       "      <td>0.5802</td>\n",
-       "      <td>The year in which the participant began smoking.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>demographics</td>\n",
-       "      <td>0.569</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>year_of_death</td>\n",
-       "      <td>0.5676</td>\n",
-       "      <td>Numeric value to represent the year of the death of an individual.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>tobacco_smoking_quit_year</td>\n",
-       "      <td>0.5491</td>\n",
-       "      <td>The year in which the participant quit smoking.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>fev1_fvc_pre_bronch_percent</td>\n",
-       "      <td>0.5471</td>\n",
-       "      <td>Percentage value to represent result of Forced Expiratory Volume in 1 second (FEV1) divided by the Forced Vital Capacity (FVC) pre-bronchodilator.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>weight</td>\n",
-       "      <td>0.5348</td>\n",
-       "      <td>The weight of the patient measured in kilograms.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>fev1_fvc_post_bronch_percent</td>\n",
-       "      <td>0.514</td>\n",
-       "      <td>Percentage value to represent result of Forced Expiratory Volume in 1 second (FEV1) divided by the Forced Vital Capacity (FVC) post-bronchodilator.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>years_smoked</td>\n",
-       "      <td>0.5107</td>\n",
-       "      <td>Numeric value (or unknown) to represent the number of years a person has been smoking.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>percent_necrosis</td>\n",
-       "      <td>0.5102</td>\n",
-       "      <td>Numeric value to represent the percentage of cell death in a malignant tumor sample or specimen.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                           Candidate Similarity  \\\n",
-       "0                       age_at_onset     0.8855   \n",
-       "1               age_at_last_exposure     0.8768   \n",
-       "2                       age_at_index     0.8745   \n",
-       "3                   age_at_diagnosis     0.8623   \n",
-       "4      relationship_age_at_diagnosis     0.8441   \n",
-       "5   undescended_testis_corrected_age     0.7382   \n",
-       "6                  age_is_obfuscated      0.644   \n",
-       "7                  pack_years_smoked     0.6387   \n",
-       "8                   menopause_status     0.6157   \n",
-       "9                      days_to_birth      0.596   \n",
-       "10          epithelioid_cell_percent     0.5842   \n",
-       "11        tobacco_smoking_onset_year     0.5802   \n",
-       "12                      demographics      0.569   \n",
-       "13                     year_of_death     0.5676   \n",
-       "14         tobacco_smoking_quit_year     0.5491   \n",
-       "15       fev1_fvc_pre_bronch_percent     0.5471   \n",
-       "16                            weight     0.5348   \n",
-       "17      fev1_fvc_post_bronch_percent      0.514   \n",
-       "18                      years_smoked     0.5107   \n",
-       "19                  percent_necrosis     0.5102   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                              Numeric value used to represent the age of the patient when exposure to a specific environmental factor began.   \n",
-       "1                                                                                             The study participant's age at the time they were last exposed.   \n",
-       "2                                                                  The patient's age (in years) on the reference or anchor date used during date obfuscation.   \n",
-       "3                                                                                       Age at the time of diagnosis expressed in number of days since birth.   \n",
-       "4                                                                                         The age (in years) when the patient's relative was first diagnosed.   \n",
-       "5                                                                                              The patient's age when their undescended testis was corrected.   \n",
-       "6   The age or other properties related to the patient's age have been modified for compliance reasons. The actual age may differ from what was reported i...   \n",
-       "7        Numeric computed value to represent lifetime tobacco exposure defined as number of cigarettes smoked per day x number of years smoked divided by 20.   \n",
-       "8                                                                                                  Text term used to describe the patient's menopause status.   \n",
-       "9              Number of days between the date used for index and the date from a person's date of birth represented as a calculated negative number of days.   \n",
-       "10                                                    The percent of uveal melanoma characterized by the presence of malignant large epithelioid melanocytes.   \n",
-       "11                                                                                                           The year in which the participant began smoking.   \n",
-       "12                                                                                                                                                              \n",
-       "13                                                                                         Numeric value to represent the year of the death of an individual.   \n",
-       "14                                                                                                            The year in which the participant quit smoking.   \n",
-       "15         Percentage value to represent result of Forced Expiratory Volume in 1 second (FEV1) divided by the Forced Vital Capacity (FVC) pre-bronchodilator.   \n",
-       "16                                                                                                           The weight of the patient measured in kilograms.   \n",
-       "17        Percentage value to represent result of Forced Expiratory Volume in 1 second (FEV1) divided by the Forced Vital Capacity (FVC) post-bronchodilator.   \n",
-       "18                                                                     Numeric value (or unknown) to represent the number of years a person has been smoking.   \n",
-       "19                                                           Numeric value to represent the percentage of cell death in a malignant tumor sample or specimen.   \n",
-       "\n",
-       "                                                         Values (sample)  \n",
-       "0                                                                         \n",
-       "1                                                                         \n",
-       "2                                                                         \n",
-       "3                                                                         \n",
-       "4                                                                         \n",
-       "5                                                                         \n",
-       "6                                                                         \n",
-       "7                                                                         \n",
-       "8   Perimenopausal, Postmenopausal, Premenopausal, Unknown, Not Reported  \n",
-       "9                                                                         \n",
-       "10                                                                        \n",
-       "11                                                                        \n",
-       "12                                                                        \n",
-       "13                                                                        \n",
-       "14                                                                        \n",
-       "15                                                                        \n",
-       "16                                                                        \n",
-       "17                                                                        \n",
-       "18                                                                        \n",
-       "19                                                                        "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Race:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>ethnicity</td>\n",
-       "      <td>0.7531</td>\n",
-       "      <td>An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...</td>\n",
-       "      <td>hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>race</td>\n",
-       "      <td>0.7397</td>\n",
-       "      <td>An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...</td>\n",
-       "      <td>american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>eye_color</td>\n",
-       "      <td>0.4766</td>\n",
-       "      <td>The color of the iris of the eye</td>\n",
-       "      <td>Amber, Blue, Brown, Gray, Green, Hazel, Red &amp; Violet, Other, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>channel</td>\n",
-       "      <td>0.425</td>\n",
-       "      <td>The corresponding color channel used to generate this data file.</td>\n",
-       "      <td>Green, Red</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>variant_origin</td>\n",
-       "      <td>0.4006</td>\n",
-       "      <td>The text term used to describe the biological origin of a specific genetic variant.</td>\n",
-       "      <td>Germline, Somatic, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>demographics</td>\n",
-       "      <td>0.3645</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>supratentorial_localization</td>\n",
-       "      <td>0.3533</td>\n",
-       "      <td>Text term to specify the location of the supratentorial tumor.</td>\n",
-       "      <td>Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>somatic_annotation_workflows</td>\n",
-       "      <td>0.348</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>stain_type</td>\n",
-       "      <td>0.3314</td>\n",
-       "      <td>The text term used to describe the type of stain used on a slide.</td>\n",
-       "      <td>Haemotoxylin and Eosin (H&amp;E), Immunohistochemistry (IHC)</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>fab_morphology_code</td>\n",
-       "      <td>0.329</td>\n",
-       "      <td>A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...</td>\n",
-       "      <td>M0, M1, M2, M3, M4, M5, M6, M7, Not Classified</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>melanoma_known_primary</td>\n",
-       "      <td>0.3175</td>\n",
-       "      <td>A melanoma which has metastasized from a known primary anatomic site.</td>\n",
-       "      <td>Yes, No, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>histone_variant</td>\n",
-       "      <td>0.3156</td>\n",
-       "      <td>The text term used to describe a specific histone variants, which are proteins that substitute for the core canonical histones.</td>\n",
-       "      <td>CENP-A, H2A-Bbd, H2A.X, H2A.Z, H2A.Z.1, H2A.Z.2, H2A.Z.2.2, H3.1, H3.2, H3.3, H3.5, H3.X, H3.Y, H3t (H3.4), mH2A, mH2A.1, mH2A.2, Unknown, Not Reporte...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>radon_exposure</td>\n",
-       "      <td>0.3118</td>\n",
-       "      <td>The yes/no/unknown indicator used to describe whether the patient was exposed to radon.</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>measurement_type</td>\n",
-       "      <td>0.307</td>\n",
-       "      <td>The method used to measure tumor size.</td>\n",
-       "      <td>Echographic, Pathologic, Radiologic</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>histone_family</td>\n",
-       "      <td>0.2993</td>\n",
-       "      <td>The text term used to describe the family, or classification of a group of basic proteins found in chromatin, called histones.</td>\n",
-       "      <td>H1, H2A, H2B, H3, H4, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>country_of_birth</td>\n",
-       "      <td>0.2875</td>\n",
-       "      <td>The name of the country in which the patient is born.</td>\n",
-       "      <td>Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>country_of_residence_at_enrollment</td>\n",
-       "      <td>0.2843</td>\n",
-       "      <td>The text term used to describe the patient's country of residence at the time they were enrolled in the study.</td>\n",
-       "      <td>Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>somatic_aggregation_workflows</td>\n",
-       "      <td>0.2837</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>somatic_mutation_calling_workflows</td>\n",
-       "      <td>0.2808</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>exposure_source</td>\n",
-       "      <td>0.278</td>\n",
-       "      <td>The source or location where the patient was exposed.</td>\n",
-       "      <td>Home, Occupational, Secondary, Social, Work, Unknown</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                             Candidate Similarity  \\\n",
-       "0                            ethnicity     0.7531   \n",
-       "1                                 race     0.7397   \n",
-       "2                            eye_color     0.4766   \n",
-       "3                              channel      0.425   \n",
-       "4                       variant_origin     0.4006   \n",
-       "5                         demographics     0.3645   \n",
-       "6          supratentorial_localization     0.3533   \n",
-       "7         somatic_annotation_workflows      0.348   \n",
-       "8                           stain_type     0.3314   \n",
-       "9                  fab_morphology_code      0.329   \n",
-       "10              melanoma_known_primary     0.3175   \n",
-       "11                     histone_variant     0.3156   \n",
-       "12                      radon_exposure     0.3118   \n",
-       "13                    measurement_type      0.307   \n",
-       "14                      histone_family     0.2993   \n",
-       "15                    country_of_birth     0.2875   \n",
-       "16  country_of_residence_at_enrollment     0.2843   \n",
-       "17       somatic_aggregation_workflows     0.2837   \n",
-       "18  somatic_mutation_calling_workflows     0.2808   \n",
-       "19                     exposure_source      0.278   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...   \n",
-       "1   An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...   \n",
-       "2                                                                                                                            The color of the iris of the eye   \n",
-       "3                                                                                            The corresponding color channel used to generate this data file.   \n",
-       "4                                                                         The text term used to describe the biological origin of a specific genetic variant.   \n",
-       "5                                                                                                                                                               \n",
-       "6                                                                                              Text term to specify the location of the supratentorial tumor.   \n",
-       "7                                                                                                                                                               \n",
-       "8                                                                                           The text term used to describe the type of stain used on a slide.   \n",
-       "9   A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...   \n",
-       "10                                                                                      A melanoma which has metastasized from a known primary anatomic site.   \n",
-       "11                            The text term used to describe a specific histone variants, which are proteins that substitute for the core canonical histones.   \n",
-       "12                                                                    The yes/no/unknown indicator used to describe whether the patient was exposed to radon.   \n",
-       "13                                                                                                                     The method used to measure tumor size.   \n",
-       "14                             The text term used to describe the family, or classification of a group of basic proteins found in chromatin, called histones.   \n",
-       "15                                                                                                      The name of the country in which the patient is born.   \n",
-       "16                                             The text term used to describe the patient's country of residence at the time they were enrolled in the study.   \n",
-       "17                                                                                                                                                              \n",
-       "18                                                                                                                                                              \n",
-       "19                                                                                                      The source or location where the patient was exposed.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                          hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect  \n",
-       "1   american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...  \n",
-       "2                                                                                   Amber, Blue, Brown, Gray, Green, Hazel, Red & Violet, Other, Not Reported  \n",
-       "3                                                                                                                                                  Green, Red  \n",
-       "4                                                                                                                                  Germline, Somatic, Unknown  \n",
-       "5                                                                                                                                                              \n",
-       "6   Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...  \n",
-       "7                                                                                                                                                              \n",
-       "8                                                                                                    Haemotoxylin and Eosin (H&E), Immunohistochemistry (IHC)  \n",
-       "9                                                                                                              M0, M1, M2, M3, M4, M5, M6, M7, Not Classified  \n",
-       "10                                                                                                                                      Yes, No, Not Reported  \n",
-       "11  CENP-A, H2A-Bbd, H2A.X, H2A.Z, H2A.Z.1, H2A.Z.2, H2A.Z.2.2, H3.1, H3.2, H3.3, H3.5, H3.X, H3.Y, H3t (H3.4), mH2A, mH2A.1, mH2A.2, Unknown, Not Reporte...  \n",
-       "12                                                                                                                             Yes, No, Unknown, Not Reported  \n",
-       "13                                                                                                                        Echographic, Pathologic, Radiologic  \n",
-       "14                                                                                                                H1, H2A, H2B, H3, H4, Unknown, Not Reported  \n",
-       "15  Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "16  Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "17                                                                                                                                                             \n",
-       "18                                                                                                                                                             \n",
-       "19                                                                                                       Home, Occupational, Secondary, Social, Work, Unknown  "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Ethnicity:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>ethnicity</td>\n",
-       "      <td>0.8505</td>\n",
-       "      <td>An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...</td>\n",
-       "      <td>hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>race</td>\n",
-       "      <td>0.6468</td>\n",
-       "      <td>An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...</td>\n",
-       "      <td>american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>variant_origin</td>\n",
-       "      <td>0.4661</td>\n",
-       "      <td>The text term used to describe the biological origin of a specific genetic variant.</td>\n",
-       "      <td>Germline, Somatic, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>demographics</td>\n",
-       "      <td>0.3661</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>eye_color</td>\n",
-       "      <td>0.3564</td>\n",
-       "      <td>The color of the iris of the eye</td>\n",
-       "      <td>Amber, Blue, Brown, Gray, Green, Hazel, Red &amp; Violet, Other, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>measurement_type</td>\n",
-       "      <td>0.3227</td>\n",
-       "      <td>The method used to measure tumor size.</td>\n",
-       "      <td>Echographic, Pathologic, Radiologic</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>channel</td>\n",
-       "      <td>0.3153</td>\n",
-       "      <td>The corresponding color channel used to generate this data file.</td>\n",
-       "      <td>Green, Red</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>country_of_birth</td>\n",
-       "      <td>0.3073</td>\n",
-       "      <td>The name of the country in which the patient is born.</td>\n",
-       "      <td>Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>methylation_array_harmonization_workflows</td>\n",
-       "      <td>0.2998</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>country_of_residence_at_enrollment</td>\n",
-       "      <td>0.2993</td>\n",
-       "      <td>The text term used to describe the patient's country of residence at the time they were enrolled in the study.</td>\n",
-       "      <td>Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>fab_morphology_code</td>\n",
-       "      <td>0.2927</td>\n",
-       "      <td>A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...</td>\n",
-       "      <td>M0, M1, M2, M3, M4, M5, M6, M7, Not Classified</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>stain_type</td>\n",
-       "      <td>0.2794</td>\n",
-       "      <td>The text term used to describe the type of stain used on a slide.</td>\n",
-       "      <td>Haemotoxylin and Eosin (H&amp;E), Immunohistochemistry (IHC)</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>education_level</td>\n",
-       "      <td>0.2781</td>\n",
-       "      <td>The years of schooling completed in graded public, private, or parochial schools, and in colleges, universities, or professional schools.</td>\n",
-       "      <td>College Degree, High School Graduate or GED, Professional or Graduate Degree, Some High School or Less, Vocational College or Some College, Not Report...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>mean_coverage</td>\n",
-       "      <td>0.2714</td>\n",
-       "      <td>Mean coverage for whole genome sequencing, or mean target coverage for whole exome and targeted sequencing, collected from Picard Tools.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>alcohol_type</td>\n",
-       "      <td>0.2648</td>\n",
-       "      <td>A specific type of alcohol.</td>\n",
-       "      <td>Beer, Liquor, Wine, Other, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>exposure_source</td>\n",
-       "      <td>0.2624</td>\n",
-       "      <td>The source or location where the patient was exposed.</td>\n",
-       "      <td>Home, Occupational, Secondary, Social, Work, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>somatic_annotation_workflows</td>\n",
-       "      <td>0.2578</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>analyte_type</td>\n",
-       "      <td>0.2569</td>\n",
-       "      <td>Text term that represents the kind of molecular specimen analyte.</td>\n",
-       "      <td>cfDNA, DNA, EBV Immortalized Normal, FFPE DNA, FFPE RNA, GenomePlex (Rubicon) Amplified DNA, m6A Enriched RNA, Nuclei RNA, Repli-G (Qiagen) DNA, Repli...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>gender</td>\n",
-       "      <td>0.2544</td>\n",
-       "      <td>Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...</td>\n",
-       "      <td>female, male, unspecified, unknown, not reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>wgs_coverage</td>\n",
-       "      <td>0.2528</td>\n",
-       "      <td>Range of coverage values for WGS aligned reads. Each range is non-inclusive to the lower bound.</td>\n",
-       "      <td>0x-10x, 10x-25x, 25x-150x, 150x+, Unknown, Not Applicable</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                                    Candidate Similarity  \\\n",
-       "0                                   ethnicity     0.8505   \n",
-       "1                                        race     0.6468   \n",
-       "2                              variant_origin     0.4661   \n",
-       "3                                demographics     0.3661   \n",
-       "4                                   eye_color     0.3564   \n",
-       "5                            measurement_type     0.3227   \n",
-       "6                                     channel     0.3153   \n",
-       "7                            country_of_birth     0.3073   \n",
-       "8   methylation_array_harmonization_workflows     0.2998   \n",
-       "9          country_of_residence_at_enrollment     0.2993   \n",
-       "10                        fab_morphology_code     0.2927   \n",
-       "11                                 stain_type     0.2794   \n",
-       "12                            education_level     0.2781   \n",
-       "13                              mean_coverage     0.2714   \n",
-       "14                               alcohol_type     0.2648   \n",
-       "15                            exposure_source     0.2624   \n",
-       "16               somatic_annotation_workflows     0.2578   \n",
-       "17                               analyte_type     0.2569   \n",
-       "18                                     gender     0.2544   \n",
-       "19                               wgs_coverage     0.2528   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   An individual's self-described social and cultural grouping, specifically whether an individual describes themselves as Hispanic or Latino. The provid...   \n",
-       "1   An arbitrary classification of a taxonomic group that is a division of a species. It usually arises as a consequence of geographical isolation within ...   \n",
-       "2                                                                         The text term used to describe the biological origin of a specific genetic variant.   \n",
-       "3                                                                                                                                                               \n",
-       "4                                                                                                                            The color of the iris of the eye   \n",
-       "5                                                                                                                      The method used to measure tumor size.   \n",
-       "6                                                                                            The corresponding color channel used to generate this data file.   \n",
-       "7                                                                                                       The name of the country in which the patient is born.   \n",
-       "8                                                                                                                                                               \n",
-       "9                                              The text term used to describe the patient's country of residence at the time they were enrolled in the study.   \n",
-       "10  A classification system for acute myeloid leukemias, acute lymphoblastic leukemias, and myelodysplastic syndromes. It is based on the morphologic and ...   \n",
-       "11                                                                                          The text term used to describe the type of stain used on a slide.   \n",
-       "12                  The years of schooling completed in graded public, private, or parochial schools, and in colleges, universities, or professional schools.   \n",
-       "13                   Mean coverage for whole genome sequencing, or mean target coverage for whole exome and targeted sequencing, collected from Picard Tools.   \n",
-       "14                                                                                                                                A specific type of alcohol.   \n",
-       "15                                                                                                      The source or location where the patient was exposed.   \n",
-       "16                                                                                                                                                              \n",
-       "17                                                                                          Text term that represents the kind of molecular specimen analyte.   \n",
-       "18  Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...   \n",
-       "19                                                            Range of coverage values for WGS aligned reads. Each range is non-inclusive to the lower bound.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                          hispanic or latino, not hispanic or latino, Unknown, unknown, not reported, not allowed to collect  \n",
-       "1   american indian or alaska native, asian, black or african american, native hawaiian or other pacific islander, white, other, Unknown, unknown, not rep...  \n",
-       "2                                                                                                                                  Germline, Somatic, Unknown  \n",
-       "3                                                                                                                                                              \n",
-       "4                                                                                   Amber, Blue, Brown, Gray, Green, Hazel, Red & Violet, Other, Not Reported  \n",
-       "5                                                                                                                         Echographic, Pathologic, Radiologic  \n",
-       "6                                                                                                                                                  Green, Red  \n",
-       "7   Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "8                                                                                                                                                              \n",
-       "9   Afghanistan, Albania, Algeria, Andorra, Angola, Anguilla, Antigua and Barbuda, Argentina, Armenia, Aruba, Australia, Austria, Azerbaijan, Bahamas, Bah...  \n",
-       "10                                                                                                             M0, M1, M2, M3, M4, M5, M6, M7, Not Classified  \n",
-       "11                                                                                                   Haemotoxylin and Eosin (H&E), Immunohistochemistry (IHC)  \n",
-       "12  College Degree, High School Graduate or GED, Professional or Graduate Degree, Some High School or Less, Vocational College or Some College, Not Report...  \n",
-       "13                                                                                                                                                             \n",
-       "14                                                                                                           Beer, Liquor, Wine, Other, Unknown, Not Reported  \n",
-       "15                                                                                                       Home, Occupational, Secondary, Social, Work, Unknown  \n",
-       "16                                                                                                                                                             \n",
-       "17  cfDNA, DNA, EBV Immortalized Normal, FFPE DNA, FFPE RNA, GenomePlex (Rubicon) Amplified DNA, m6A Enriched RNA, Nuclei RNA, Repli-G (Qiagen) DNA, Repli...  \n",
-       "18                                                                                                           female, male, unspecified, unknown, not reported  \n",
-       "19                                                                                                  0x-10x, 10x-25x, 25x-150x, 150x+, Unknown, Not Applicable  "
-      ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Gender:\n"
-     ]
-    },
-    {
-     "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>gender</td>\n",
-       "      <td>0.908</td>\n",
-       "      <td>Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...</td>\n",
-       "      <td>female, male, unspecified, unknown, not reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>relationship_gender</td>\n",
-       "      <td>0.8735</td>\n",
-       "      <td>The text term used to describe the gender of the patient's relative with a history of cancer.</td>\n",
-       "      <td>female, male, unspecified, unknown, not reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>pregnant_at_diagnosis</td>\n",
-       "      <td>0.5085</td>\n",
-       "      <td>The text term used to indicate whether the patient was pregnant at the time they were diagnosed.</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>menopause_status</td>\n",
-       "      <td>0.5046</td>\n",
-       "      <td>Text term used to describe the patient's menopause status.</td>\n",
-       "      <td>Perimenopausal, Postmenopausal, Premenopausal, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>hormonal_contraceptive_type</td>\n",
-       "      <td>0.4781</td>\n",
-       "      <td>The specific type of hormonal contraceptives used by the subject.</td>\n",
-       "      <td>Progestin, Progestin and Estrogen, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>pregnancy_outcome</td>\n",
-       "      <td>0.4511</td>\n",
-       "      <td>The text term used to describe the type of pregnancy the patient had.</td>\n",
-       "      <td>Ectopic Pregnancy, Induced Abortion, Live Birth, Miscarriage, Spontaneous Abortion, Stillbirth, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>tumor_shape</td>\n",
-       "      <td>0.439</td>\n",
-       "      <td>Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.</td>\n",
-       "      <td>Diffuse, Dome, Mushroom, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>marital_status</td>\n",
-       "      <td>0.4323</td>\n",
-       "      <td>A demographic parameter indicating a person's current conjugal status.</td>\n",
-       "      <td>Divorced, Domestic Partnership, Married, Never Married, Separated, Widowed</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>variant_origin</td>\n",
-       "      <td>0.4315</td>\n",
-       "      <td>The text term used to describe the biological origin of a specific genetic variant.</td>\n",
-       "      <td>Germline, Somatic, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>demographics</td>\n",
-       "      <td>0.4067</td>\n",
-       "      <td></td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>tumor_confined_to_organ_of_origin</td>\n",
-       "      <td>0.389</td>\n",
-       "      <td>The yes/no/unknown indicator used to describe whether the tumor is confined to the organ where it originated and did not spread to a proximal or dista...</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>analyte_type</td>\n",
-       "      <td>0.3619</td>\n",
-       "      <td>Text term that represents the kind of molecular specimen analyte.</td>\n",
-       "      <td>cfDNA, DNA, EBV Immortalized Normal, FFPE DNA, FFPE RNA, GenomePlex (Rubicon) Amplified DNA, m6A Enriched RNA, Nuclei RNA, Repli-G (Qiagen) DNA, Repli...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>undescended_testis_corrected</td>\n",
-       "      <td>0.3616</td>\n",
-       "      <td>Indicates whether the patient's undescended testis was corrected.</td>\n",
-       "      <td>Yes, No, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>relationship_age_at_diagnosis</td>\n",
-       "      <td>0.3613</td>\n",
-       "      <td>The age (in years) when the patient's relative was first diagnosed.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>weeks_gestation_at_birth</td>\n",
-       "      <td>0.3573</td>\n",
-       "      <td>Numeric value used to describe the number of weeks starting from the approximate date of the biological mother's last menstrual period and ending with...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>relationship_type</td>\n",
-       "      <td>0.3565</td>\n",
-       "      <td>The subgroup that describes the state of connectedness between members of the unit of society organized around kinship ties.</td>\n",
-       "      <td>Adopted Brother, Adopted Daughter, Adopted Sister, Adopted Son, Adoptive Father, Adoptive Mother, Aunt, Brother, Brother-in-law, Child, Cousin, Daught...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>tumor_focality</td>\n",
-       "      <td>0.3563</td>\n",
-       "      <td>The text term used to describe whether the patient's disease originated in a single location or multiple locations.</td>\n",
-       "      <td>Multifocal, Unifocal, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>undescended_testis_history_laterality</td>\n",
-       "      <td>0.3474</td>\n",
-       "      <td>Describes the lateral location of the patient's undescended testis.</td>\n",
-       "      <td>Bilateral, Left, Right, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>undescended_testis_corrected_age</td>\n",
-       "      <td>0.344</td>\n",
-       "      <td>The patient's age when their undescended testis was corrected.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>ovarian_surface_involvement</td>\n",
-       "      <td>0.3385</td>\n",
-       "      <td>The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.</td>\n",
-       "      <td>Absent, Indeterminate, Present, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                                Candidate Similarity  \\\n",
-       "0                                  gender      0.908   \n",
-       "1                     relationship_gender     0.8735   \n",
-       "2                   pregnant_at_diagnosis     0.5085   \n",
-       "3                        menopause_status     0.5046   \n",
-       "4             hormonal_contraceptive_type     0.4781   \n",
-       "5                       pregnancy_outcome     0.4511   \n",
-       "6                             tumor_shape      0.439   \n",
-       "7                          marital_status     0.4323   \n",
-       "8                          variant_origin     0.4315   \n",
-       "9                            demographics     0.4067   \n",
-       "10      tumor_confined_to_organ_of_origin      0.389   \n",
-       "11                           analyte_type     0.3619   \n",
-       "12           undescended_testis_corrected     0.3616   \n",
-       "13          relationship_age_at_diagnosis     0.3613   \n",
-       "14               weeks_gestation_at_birth     0.3573   \n",
-       "15                      relationship_type     0.3565   \n",
-       "16                         tumor_focality     0.3563   \n",
-       "17  undescended_testis_history_laterality     0.3474   \n",
-       "18       undescended_testis_corrected_age      0.344   \n",
-       "19            ovarian_surface_involvement     0.3385   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0   Text designations that identify gender. Gender is described as the assemblage of properties that distinguish people on the basis of their societal rol...   \n",
-       "1                                                               The text term used to describe the gender of the patient's relative with a history of cancer.   \n",
-       "2                                                            The text term used to indicate whether the patient was pregnant at the time they were diagnosed.   \n",
-       "3                                                                                                  Text term used to describe the patient's menopause status.   \n",
-       "4                                                                                           The specific type of hormonal contraceptives used by the subject.   \n",
-       "5                                                                                       The text term used to describe the type of pregnancy the patient had.   \n",
-       "6                                           Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.   \n",
-       "7                                                                                      A demographic parameter indicating a person's current conjugal status.   \n",
-       "8                                                                         The text term used to describe the biological origin of a specific genetic variant.   \n",
-       "9                                                                                                                                                               \n",
-       "10  The yes/no/unknown indicator used to describe whether the tumor is confined to the organ where it originated and did not spread to a proximal or dista...   \n",
-       "11                                                                                          Text term that represents the kind of molecular specimen analyte.   \n",
-       "12                                                                                          Indicates whether the patient's undescended testis was corrected.   \n",
-       "13                                                                                        The age (in years) when the patient's relative was first diagnosed.   \n",
-       "14  Numeric value used to describe the number of weeks starting from the approximate date of the biological mother's last menstrual period and ending with...   \n",
-       "15                               The subgroup that describes the state of connectedness between members of the unit of society organized around kinship ties.   \n",
-       "16                                        The text term used to describe whether the patient's disease originated in a single location or multiple locations.   \n",
-       "17                                                                                        Describes the lateral location of the patient's undescended testis.   \n",
-       "18                                                                                             The patient's age when their undescended testis was corrected.   \n",
-       "19                 The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.   \n",
+       "<style>*[data-root-id],\n",
+       "*[data-root-id] > * {\n",
+       "  box-sizing: border-box;\n",
+       "  font-family: var(--jp-ui-font-family);\n",
+       "  font-size: var(--jp-ui-font-size1);\n",
+       "  color: var(--vscode-editor-foreground, var(--jp-ui-font-color1));\n",
+       "}\n",
        "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                            female, male, unspecified, unknown, not reported  \n",
-       "1                                                                                                            female, male, unspecified, unknown, not reported  \n",
-       "2                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "3                                                                                        Perimenopausal, Postmenopausal, Premenopausal, Unknown, Not Reported  \n",
-       "4                                                                                                    Progestin, Progestin and Estrogen, Unknown, Not Reported  \n",
-       "5                                       Ectopic Pregnancy, Induced Abortion, Live Birth, Miscarriage, Spontaneous Abortion, Stillbirth, Unknown, Not Reported  \n",
-       "6                                                                                                                            Diffuse, Dome, Mushroom, Unknown  \n",
-       "7                                                                                  Divorced, Domestic Partnership, Married, Never Married, Separated, Widowed  \n",
-       "8                                                                                                                                  Germline, Somatic, Unknown  \n",
-       "9                                                                                                                                                              \n",
-       "10                                                                                                                             Yes, No, Unknown, Not Reported  \n",
-       "11  cfDNA, DNA, EBV Immortalized Normal, FFPE DNA, FFPE RNA, GenomePlex (Rubicon) Amplified DNA, m6A Enriched RNA, Nuclei RNA, Repli-G (Qiagen) DNA, Repli...  \n",
-       "12                                                                                                                                      Yes, No, Not Reported  \n",
-       "13                                                                                                                                                             \n",
-       "14                                                                                                                                                             \n",
-       "15  Adopted Brother, Adopted Daughter, Adopted Sister, Adopted Son, Adoptive Father, Adoptive Mother, Aunt, Brother, Brother-in-law, Child, Cousin, Daught...  \n",
-       "16                                                                                                                Multifocal, Unifocal, Unknown, Not Reported  \n",
-       "17                                                                                                                       Bilateral, Left, Right, Not Reported  \n",
-       "18                                                                                                                                                             \n",
-       "19                                                                                                      Absent, Indeterminate, Present, Unknown, Not Reported  "
+       "/* Override VSCode background color */\n",
+       ".cell-output-ipywidget-background:has(\n",
+       "    > .cell-output-ipywidget-background > .lm-Widget > *[data-root-id]\n",
+       "  ),\n",
+       ".cell-output-ipywidget-background:has(> .lm-Widget > *[data-root-id]) {\n",
+       "  background-color: transparent !important;\n",
+       "}\n",
+       "</style>"
       ]
      },
      "metadata": {},
      "output_type": "display_data"
     },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Tumor_Site:\n"
-     ]
-    },
     {
      "data": {
+      "application/vnd.holoviews_exec.v0+json": "",
       "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
+       "<div id='aa16b927-ebd1-45d1-a966-2d079e223c93'>\n",
+       "  <div id=\"bc74cfc7-b314-4e84-8321-06f49f25ebd8\" data-root-id=\"aa16b927-ebd1-45d1-a966-2d079e223c93\" style=\"display: contents;\"></div>\n",
+       "</div>\n",
+       "<script type=\"application/javascript\">(function(root) {\n",
+       "  var docs_json = {\"970fe6af-6ffd-4f1d-9fac-6b104962d03a\":{\"version\":\"3.4.1\",\"title\":\"Bokeh Application\",\"roots\":[{\"type\":\"object\",\"name\":\"panel.models.browser.BrowserInfo\",\"id\":\"aa16b927-ebd1-45d1-a966-2d079e223c93\"},{\"type\":\"object\",\"name\":\"panel.models.comm_manager.CommManager\",\"id\":\"ffec20fa-eb9e-4732-8da4-dac9e81b570b\",\"attributes\":{\"plot_id\":\"aa16b927-ebd1-45d1-a966-2d079e223c93\",\"comm_id\":\"6d482684d1aa43c2a79f9a5ed089af4f\",\"client_comm_id\":\"30314b76108649208a194811b6108b48\"}}],\"defs\":[{\"type\":\"model\",\"name\":\"ReactiveHTML1\"},{\"type\":\"model\",\"name\":\"FlexBox1\",\"properties\":[{\"name\":\"align_content\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"align_items\",\"kind\":\"Any\",\"default\":\"flex-start\"},{\"name\":\"flex_direction\",\"kind\":\"Any\",\"default\":\"row\"},{\"name\":\"flex_wrap\",\"kind\":\"Any\",\"default\":\"wrap\"},{\"name\":\"gap\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"justify_content\",\"kind\":\"Any\",\"default\":\"flex-start\"}]},{\"type\":\"model\",\"name\":\"FloatPanel1\",\"properties\":[{\"name\":\"config\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"contained\",\"kind\":\"Any\",\"default\":true},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"right-top\"},{\"name\":\"offsetx\",\"kind\":\"Any\",\"default\":null},{\"name\":\"offsety\",\"kind\":\"Any\",\"default\":null},{\"name\":\"theme\",\"kind\":\"Any\",\"default\":\"primary\"},{\"name\":\"status\",\"kind\":\"Any\",\"default\":\"normalized\"}]},{\"type\":\"model\",\"name\":\"GridStack1\",\"properties\":[{\"name\":\"mode\",\"kind\":\"Any\",\"default\":\"warn\"},{\"name\":\"ncols\",\"kind\":\"Any\",\"default\":null},{\"name\":\"nrows\",\"kind\":\"Any\",\"default\":null},{\"name\":\"allow_resize\",\"kind\":\"Any\",\"default\":true},{\"name\":\"allow_drag\",\"kind\":\"Any\",\"default\":true},{\"name\":\"state\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name
\":\"drag1\",\"properties\":[{\"name\":\"slider_width\",\"kind\":\"Any\",\"default\":5},{\"name\":\"slider_color\",\"kind\":\"Any\",\"default\":\"black\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":50}]},{\"type\":\"model\",\"name\":\"click1\",\"properties\":[{\"name\":\"terminal_output\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"debug_name\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"clears\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"FastWrapper1\",\"properties\":[{\"name\":\"object\",\"kind\":\"Any\",\"default\":null},{\"name\":\"style\",\"kind\":\"Any\",\"default\":null}]},{\"type\":\"model\",\"name\":\"NotificationAreaBase1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"NotificationArea1\",\"properties\":[{\"name\":\"js_events\",\"kind\":\"Any\",\"default\":{\"type\":\"map\"}},{\"name\":\"notifications\",\"kind\":\"Any\",\"default\":[]},{\"name\":\"position\",\"kind\":\"Any\",\"default\":\"bottom-right\"},{\"name\":\"_clear\",\"kind\":\"Any\",\"default\":0},{\"name\":\"types\",\"kind\":\"Any\",\"default\":[{\"type\":\"map\",\"entries\":[[\"type\",\"warning\"],[\"background\",\"#ffc107\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas fa-exclamation-triangle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]},{\"type\":\"map\",\"entries\":[[\"type\",\"info\"],[\"background\",\"#007bff\"],[\"icon\",{\"type\":\"map\",\"entries\":[[\"className\",\"fas 
fa-info-circle\"],[\"tagName\",\"i\"],[\"color\",\"white\"]]}]]}]}]},{\"type\":\"model\",\"name\":\"Notification\",\"properties\":[{\"name\":\"background\",\"kind\":\"Any\",\"default\":null},{\"name\":\"duration\",\"kind\":\"Any\",\"default\":3000},{\"name\":\"icon\",\"kind\":\"Any\",\"default\":null},{\"name\":\"message\",\"kind\":\"Any\",\"default\":\"\"},{\"name\":\"notification_type\",\"kind\":\"Any\",\"default\":null},{\"name\":\"_destroyed\",\"kind\":\"Any\",\"default\":false}]},{\"type\":\"model\",\"name\":\"TemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"BootstrapTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"TemplateEditor1\",\"properties\":[{\"name\":\"layout\",\"kind\":\"Any\",\"default\":[]}]},{\"type\":\"model\",\"name\":\"MaterialTemplateActions1\",\"properties\":[{\"name\":\"open_modal\",\"kind\":\"Any\",\"default\":0},{\"name\":\"close_modal\",\"kind\":\"Any\",\"default\":0}]},{\"type\":\"model\",\"name\":\"copy_to_clipboard1\",\"properties\":[{\"name\":\"fill\",\"kind\":\"Any\",\"default\":\"none\"},{\"name\":\"value\",\"kind\":\"Any\",\"default\":null}]}]}};\n",
+       "  var render_items = [{\"docid\":\"970fe6af-6ffd-4f1d-9fac-6b104962d03a\",\"roots\":{\"aa16b927-ebd1-45d1-a966-2d079e223c93\":\"bc74cfc7-b314-4e84-8321-06f49f25ebd8\"},\"root_ids\":[\"aa16b927-ebd1-45d1-a966-2d079e223c93\"]}];\n",
+       "  var docs = Object.values(docs_json)\n",
+       "  if (!docs) {\n",
+       "    return\n",
+       "  }\n",
+       "  const py_version = docs[0].version.replace('rc', '-rc.').replace('.dev', '-dev.')\n",
+       "  function embed_document(root) {\n",
+       "    var Bokeh = get_bokeh(root)\n",
+       "    Bokeh.embed.embed_items_notebook(docs_json, render_items);\n",
+       "    for (const render_item of render_items) {\n",
+       "      for (const root_id of render_item.root_ids) {\n",
+       "\tconst id_el = document.getElementById(root_id)\n",
+       "\tif (id_el.children.length && (id_el.children[0].className === 'bk-root')) {\n",
+       "\t  const root_el = id_el.children[0]\n",
+       "\t  root_el.id = root_el.id + '-rendered'\n",
+       "\t}\n",
+       "      }\n",
        "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
+       "  }\n",
+       "  function get_bokeh(root) {\n",
+       "    if (root.Bokeh === undefined) {\n",
+       "      return null\n",
+       "    } else if (root.Bokeh.version !== py_version) {\n",
+       "      if (root.Bokeh.versions === undefined || !root.Bokeh.versions.has(py_version)) {\n",
+       "\treturn null\n",
+       "      }\n",
+       "      return root.Bokeh.versions.get(py_version);\n",
+       "    } else if (root.Bokeh.version === py_version) {\n",
+       "      return root.Bokeh\n",
        "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>margins_involved_site</td>\n",
-       "      <td>0.6137</td>\n",
-       "      <td>The text term used to describe the anatomic sites that were involved in the survival margins.</td>\n",
-       "      <td>Gerota Fascia, Parenchyma, Perinephric Fat, Renal, Renal Capsule, Renal Sinus, Renal Vein, Ureter</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>tumor_depth_descriptor</td>\n",
-       "      <td>0.5781</td>\n",
-       "      <td>Text term for the degree to which a tumor has penetrated into organ or tissue.</td>\n",
-       "      <td>Deep, Superficial, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>max_tumor_bulk_site</td>\n",
-       "      <td>0.5583</td>\n",
-       "      <td>The site of the tumor where the dimension or diameter is larger than any other part of the tumor.</td>\n",
-       "      <td>Adrenal, Appendix, Ascites/peritoneum, Axillary lymph nodes, Bone marrow, Brain, Breast, Cervical lymph nodes, Colon, Iliac, Iliac-external, Inguinal,...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>supratentorial_localization</td>\n",
-       "      <td>0.5446</td>\n",
-       "      <td>Text term to specify the location of the supratentorial tumor.</td>\n",
-       "      <td>Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>enneking_msts_tumor_site</td>\n",
-       "      <td>0.5399</td>\n",
-       "      <td>Text term and code that represents the tumor site of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...</td>\n",
-       "      <td>Extracompartmental (T2), Intracompartmental (T1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>tumor_level_prostate</td>\n",
-       "      <td>0.5308</td>\n",
-       "      <td>The level(s) of the prostate from which the tumor originated.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>primary_site</td>\n",
-       "      <td>0.5265</td>\n",
-       "      <td>The text term used to describe the primary site of disease, as categorized by the World Health Organization's (WHO) International Classification of Di...</td>\n",
-       "      <td>Accessory sinuses, Adrenal gland, Anus and anal canal, Base of tongue, Bladder, Bones, joints and articular cartilage of limbs, Bones, joints and arti...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>morphologic_architectural_pattern</td>\n",
-       "      <td>0.52</td>\n",
-       "      <td>A specific morphologic or pathologic architectural pattern was discovered within the sample studied.</td>\n",
-       "      <td>Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>tumor_shape</td>\n",
-       "      <td>0.4893</td>\n",
-       "      <td>Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.</td>\n",
-       "      <td>Diffuse, Dome, Mushroom, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>biospecimen_type</td>\n",
-       "      <td>0.4642</td>\n",
-       "      <td>The text term used to describe the biological material used for testing, diagnostic, treatment or research purposes.</td>\n",
-       "      <td>Blood, Bone Marrow, Buccal Mucosa, Buffy Coat, Cerebrospinal Fluid, Connective Tissue, Embryonic Fluid, Embryonic Tissue, Feces, Granulocyte, Involved...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>tissue_or_organ_of_origin</td>\n",
-       "      <td>0.4573</td>\n",
-       "      <td>The text term used to describe the anatomic site of origin, of the patient's malignant disease, as described by the World Health Organization's (WHO) ...</td>\n",
-       "      <td>Abdomen, NOS, Abdominal esophagus, Accessory sinus, NOS, Acoustic nerve, Adrenal gland, NOS, Ampulla of Vater, Anal canal, Anterior 2/3 of tongue, NOS...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>tumor_focality</td>\n",
-       "      <td>0.4343</td>\n",
-       "      <td>The text term used to describe whether the patient's disease originated in a single location or multiple locations.</td>\n",
-       "      <td>Multifocal, Unifocal, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>site_of_resection_or_biopsy</td>\n",
-       "      <td>0.434</td>\n",
-       "      <td>The text term used to describe the anatomic site of origin, of the patient's malignant disease, as described by the World Health Organization's (WHO) ...</td>\n",
-       "      <td>Abdomen, NOS, Abdominal esophagus, Accessory sinus, NOS, Acoustic nerve, Adrenal gland, NOS, Ampulla of Vater, Anal canal, Anterior 2/3 of tongue, NOS...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>treatment_anatomic_site</td>\n",
-       "      <td>0.4275</td>\n",
-       "      <td>The anatomic site or field targeted by a treatment regimen or single agent therapy.</td>\n",
-       "      <td>Abdomen, total, Abdominal Wall, Acetabulum, Adenoid, Adipose, Adrenal, Alveolar Ridge, Amniotic Fluid, Ampulla of Vater, Anal Sphincter, Ankle, Anorec...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>ovarian_surface_involvement</td>\n",
-       "      <td>0.3998</td>\n",
-       "      <td>The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.</td>\n",
-       "      <td>Absent, Indeterminate, Present, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>lymph_node_involved_site</td>\n",
-       "      <td>0.3911</td>\n",
-       "      <td>The text term used to describe the anatomic site of lymph node involvement.</td>\n",
-       "      <td>Aortic, Axillary, Cervical, Cervical, Central, Cervical, Lateral, Cervical, NOS, Epitrochlear, Femoral, Hilar, Iliac, NOS, Iliac-common, Iliac-externa...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>history_of_tumor</td>\n",
-       "      <td>0.39</td>\n",
-       "      <td>Indicates whether patient has a history of tumors.</td>\n",
-       "      <td>Yes, No, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>imaging_type</td>\n",
-       "      <td>0.3897</td>\n",
-       "      <td>The text term used to describe the type of imaging or scan performed on the patient.</td>\n",
-       "      <td>99mTc Bone Scintigraphy, CT Scan, MRI, PET, Ultrasound</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>metastasis_at_diagnosis</td>\n",
-       "      <td>0.3885</td>\n",
-       "      <td>The text term used to describe the extent of metastatic disease present at diagnosis.</td>\n",
-       "      <td>Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>sites_of_involvement</td>\n",
-       "      <td>0.3876</td>\n",
-       "      <td>The anatomic sites of disease involvement in addition to the primary anatomic site.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                            Candidate Similarity  \\\n",
-       "0               margins_involved_site     0.6137   \n",
-       "1              tumor_depth_descriptor     0.5781   \n",
-       "2                 max_tumor_bulk_site     0.5583   \n",
-       "3         supratentorial_localization     0.5446   \n",
-       "4            enneking_msts_tumor_site     0.5399   \n",
-       "5                tumor_level_prostate     0.5308   \n",
-       "6                        primary_site     0.5265   \n",
-       "7   morphologic_architectural_pattern       0.52   \n",
-       "8                         tumor_shape     0.4893   \n",
-       "9                    biospecimen_type     0.4642   \n",
-       "10          tissue_or_organ_of_origin     0.4573   \n",
-       "11                     tumor_focality     0.4343   \n",
-       "12        site_of_resection_or_biopsy      0.434   \n",
-       "13            treatment_anatomic_site     0.4275   \n",
-       "14        ovarian_surface_involvement     0.3998   \n",
-       "15           lymph_node_involved_site     0.3911   \n",
-       "16                   history_of_tumor       0.39   \n",
-       "17                       imaging_type     0.3897   \n",
-       "18            metastasis_at_diagnosis     0.3885   \n",
-       "19               sites_of_involvement     0.3876   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                                               The text term used to describe the anatomic sites that were involved in the survival margins.   \n",
-       "1                                                                              Text term for the degree to which a tumor has penetrated into organ or tissue.   \n",
-       "2                                                           The site of the tumor where the dimension or diameter is larger than any other part of the tumor.   \n",
-       "3                                                                                              Text term to specify the location of the supratentorial tumor.   \n",
-       "4   Text term and code that represents the tumor site of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...   \n",
-       "5                                                                                               The level(s) of the prostate from which the tumor originated.   \n",
-       "6   The text term used to describe the primary site of disease, as categorized by the World Health Organization's (WHO) International Classification of Di...   \n",
-       "7                                                        A specific morphologic or pathologic architectural pattern was discovered within the sample studied.   \n",
-       "8                                           Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.   \n",
-       "9                                        The text term used to describe the biological material used for testing, diagnostic, treatment or research purposes.   \n",
-       "10  The text term used to describe the anatomic site of origin, of the patient's malignant disease, as described by the World Health Organization's (WHO) ...   \n",
-       "11                                        The text term used to describe whether the patient's disease originated in a single location or multiple locations.   \n",
-       "12  The text term used to describe the anatomic site of origin, of the patient's malignant disease, as described by the World Health Organization's (WHO) ...   \n",
-       "13                                                                        The anatomic site or field targeted by a treatment regimen or single agent therapy.   \n",
-       "14                 The text term that describes whether the surface tissue (outer boundary) of the ovary shows evidence of involvement or presence of cancer.   \n",
-       "15                                                                                The text term used to describe the anatomic site of lymph node involvement.   \n",
-       "16                                                                                                         Indicates whether patient has a history of tumors.   \n",
-       "17                                                                       The text term used to describe the type of imaging or scan performed on the patient.   \n",
-       "18                                                                      The text term used to describe the extent of metastatic disease present at diagnosis.   \n",
-       "19                                                                        The anatomic sites of disease involvement in addition to the primary anatomic site.   \n",
-       "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                           Gerota Fascia, Parenchyma, Perinephric Fat, Renal, Renal Capsule, Renal Sinus, Renal Vein, Ureter  \n",
-       "1                                                                                                                             Deep, Superficial, Not Reported  \n",
-       "2   Adrenal, Appendix, Ascites/peritoneum, Axillary lymph nodes, Bone marrow, Brain, Breast, Cervical lymph nodes, Colon, Iliac, Iliac-external, Inguinal,...  \n",
-       "3   Cerebral Cortex, Deep Gray (e.g. Basal Ganglia, Thalamus), Frontal lobe, Occipital lobe, Parietal lobe, Spinal Cord, Temporal lobe, White Matter, Unkn...  \n",
-       "4                                                                                     Extracompartmental (T2), Intracompartmental (T1), Unknown, Not Reported  \n",
-       "5                                                                                                                                                              \n",
-       "6   Accessory sinuses, Adrenal gland, Anus and anal canal, Base of tongue, Bladder, Bones, joints and articular cartilage of limbs, Bones, joints and arti...  \n",
-       "7                                                     Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular  \n",
-       "8                                                                                                                            Diffuse, Dome, Mushroom, Unknown  \n",
-       "9   Blood, Bone Marrow, Buccal Mucosa, Buffy Coat, Cerebrospinal Fluid, Connective Tissue, Embryonic Fluid, Embryonic Tissue, Feces, Granulocyte, Involved...  \n",
-       "10  Abdomen, NOS, Abdominal esophagus, Accessory sinus, NOS, Acoustic nerve, Adrenal gland, NOS, Ampulla of Vater, Anal canal, Anterior 2/3 of tongue, NOS...  \n",
-       "11                                                                                                                Multifocal, Unifocal, Unknown, Not Reported  \n",
-       "12  Abdomen, NOS, Abdominal esophagus, Accessory sinus, NOS, Acoustic nerve, Adrenal gland, NOS, Ampulla of Vater, Anal canal, Anterior 2/3 of tongue, NOS...  \n",
-       "13  Abdomen, total, Abdominal Wall, Acetabulum, Adenoid, Adipose, Adrenal, Alveolar Ridge, Amniotic Fluid, Ampulla of Vater, Anal Sphincter, Ankle, Anorec...  \n",
-       "14                                                                                                      Absent, Indeterminate, Present, Unknown, Not Reported  \n",
-       "15  Aortic, Axillary, Cervical, Cervical, Central, Cervical, Lateral, Cervical, NOS, Epitrochlear, Femoral, Hilar, Iliac, NOS, Iliac-common, Iliac-externa...  \n",
-       "16                                                                                                                                      Yes, No, Not Reported  \n",
-       "17                                                                                                     99mTc Bone Scintigraphy, CT Scan, MRI, PET, Ultrasound  \n",
-       "18                                                             Distant Metastasis, Metastasis, NOS, No Metastasis, Regional Metastasis, Unknown, Not Reported  \n",
-       "19                                                                                                                                                             "
+       "    return null\n",
+       "  }\n",
+       "  function is_loaded(root) {\n",
+       "    var Bokeh = get_bokeh(root)\n",
+       "    return (Bokeh != null && Bokeh.Panel !== undefined && ( root.MathJax !== undefined) && ( root.MathJax !== undefined) && ( root.vega !== undefined) && ( root.vega !== undefined) && ( root.MathJax !== undefined))\n",
+       "  }\n",
+       "  if (is_loaded(root)) {\n",
+       "    embed_document(root);\n",
+       "  } else {\n",
+       "    var attempts = 0;\n",
+       "    var timer = setInterval(function(root) {\n",
+       "      if (is_loaded(root)) {\n",
+       "        clearInterval(timer);\n",
+       "        embed_document(root);\n",
+       "      } else if (document.readyState == \"complete\") {\n",
+       "        attempts++;\n",
+       "        if (attempts > 200) {\n",
+       "          clearInterval(timer);\n",
+       "\t  var Bokeh = get_bokeh(root)\n",
+       "\t  if (Bokeh == null || Bokeh.Panel == null) {\n",
+       "            console.warn(\"Panel: ERROR: Unable to run Panel code because Bokeh or Panel library is missing\");\n",
+       "\t  } else {\n",
+       "\t    console.warn(\"Panel: WARNING: Attempting to render but not all required libraries could be resolved.\")\n",
+       "\t    embed_document(root)\n",
+       "\t  }\n",
+       "        }\n",
+       "      }\n",
+       "    }, 25, root)\n",
+       "  }\n",
+       "})(window);</script>"
       ]
      },
+     "metadata": {
+      "application/vnd.holoviews_exec.v0+json": {
+       "id": "aa16b927-ebd1-45d1-a966-2d079e223c93"
+      }
+     },
+     "output_type": "display_data"
+    },
+    {
+     "data": {
+      "application/javascript": "(function(root) {\n  function now() {\n    return new Date();\n  }\n\n  var force = true;\n  var py_version = '3.4.1'.replace('rc', '-rc.').replace('.dev', '-dev.');\n  var reloading = true;\n  var Bokeh = root.Bokeh;\n\n  if (typeof (root._bokeh_timeout) === \"undefined\" || force) {\n    root._bokeh_timeout = Date.now() + 5000;\n    root._bokeh_failed_load = false;\n  }\n\n  function run_callbacks() {\n    try {\n      root._bokeh_onload_callbacks.forEach(function(callback) {\n        if (callback != null)\n          callback();\n      });\n    } finally {\n      delete root._bokeh_onload_callbacks;\n    }\n    console.debug(\"Bokeh: all callbacks have finished\");\n  }\n\n  function load_libs(css_urls, js_urls, js_modules, js_exports, callback) {\n    if (css_urls == null) css_urls = [];\n    if (js_urls == null) js_urls = [];\n    if (js_modules == null) js_modules = [];\n    if (js_exports == null) js_exports = {};\n\n    root._bokeh_onload_callbacks.push(callback);\n\n    if (root._bokeh_is_loading > 0) {\n      console.debug(\"Bokeh: BokehJS is being loaded, scheduling callback at\", now());\n      return null;\n    }\n    if (js_urls.length === 0 && js_modules.length === 0 && Object.keys(js_exports).length === 0) {\n      run_callbacks();\n      return null;\n    }\n    if (!reloading) {\n      console.debug(\"Bokeh: BokehJS not loaded, scheduling load and callback at\", now());\n    }\n\n    function on_load() {\n      root._bokeh_is_loading--;\n      if (root._bokeh_is_loading === 0) {\n        console.debug(\"Bokeh: all BokehJS libraries/stylesheets loaded\");\n        run_callbacks()\n      }\n    }\n    window._bokeh_on_load = on_load\n\n    function on_error() {\n      console.error(\"failed to load \" + url);\n    }\n\n    var skip = [];\n    if (window.requirejs) {\n      window.requirejs.config({'packages': {}, 'paths': {'mathjax': '//cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-AMS_HTML', 
'vega-embed': 'https://cdn.jsdelivr.net/npm/vega-embed@6/build/vega-embed.min', 'vega-lite': 'https://cdn.jsdelivr.net/npm/vega-lite@5/build/vega-lite.min', 'vega': 'https://cdn.jsdelivr.net/npm/vega@5/build/vega.min'}, 'shim': {'mathjax': {'exports': 'MathJax'}}});\n      require([\"mathjax\"], function() {\n\ton_load()\n      })\n      require([\"vega-embed\"], function(vegaEmbed) {\n\twindow.vegaEmbed = vegaEmbed\n\ton_load()\n      })\n      require([\"vega-lite\"], function(vl) {\n\twindow.vl = vl\n\ton_load()\n      })\n      require([\"vega\"], function(vega) {\n\twindow.vega = vega\n\ton_load()\n      })\n      root._bokeh_is_loading = css_urls.length + 4;\n    } else {\n      root._bokeh_is_loading = css_urls.length + js_urls.length + js_modules.length + Object.keys(js_exports).length;\n    }\n\n    var existing_stylesheets = []\n    var links = document.getElementsByTagName('link')\n    for (var i = 0; i < links.length; i++) {\n      var link = links[i]\n      if (link.href != null) {\n\texisting_stylesheets.push(link.href)\n      }\n    }\n    for (var i = 0; i < css_urls.length; i++) {\n      var url = css_urls[i];\n      if (existing_stylesheets.indexOf(url) !== -1) {\n\ton_load()\n\tcontinue;\n      }\n      const element = document.createElement(\"link\");\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.rel = \"stylesheet\";\n      element.type = \"text/css\";\n      element.href = url;\n      console.debug(\"Bokeh: injecting link tag for BokehJS stylesheet: \", url);\n      document.body.appendChild(element);\n    }    if (((window.MathJax !== undefined) && (!(window.MathJax instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-MML-AM_CHTML'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vega !== undefined) && (!(window.vega instanceof HTMLElement))) || 
window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega@5'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vegaLite !== undefined) && (!(window.vegaLite instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-lite@5'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    if (((window.vegaEmbed !== undefined) && (!(window.vegaEmbed instanceof HTMLElement))) || window.requirejs) {\n      var urls = ['https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-embed@6'];\n      for (var i = 0; i < urls.length; i++) {\n        skip.push(urls[i])\n      }\n    }    var existing_scripts = []\n    var scripts = document.getElementsByTagName('script')\n    for (var i = 0; i < scripts.length; i++) {\n      var script = scripts[i]\n      if (script.src != null) {\n\texisting_scripts.push(script.src)\n      }\n    }\n    for (var i = 0; i < js_urls.length; i++) {\n      var url = js_urls[i];\n      if (skip.indexOf(url) !== -1 || existing_scripts.indexOf(url) !== -1) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.async = false;\n      element.src = url;\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      document.head.appendChild(element);\n    }\n    for (var i = 0; i < js_modules.length; i++) {\n      var url = js_modules[i];\n      if (skip.indexOf(url) !== -1 || existing_scripts.indexOf(url) !== -1) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onload = on_load;\n      element.onerror = on_error;\n      element.async = false;\n      element.src = url;\n    
  element.type = \"module\";\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      document.head.appendChild(element);\n    }\n    for (const name in js_exports) {\n      var url = js_exports[name];\n      if (skip.indexOf(url) >= 0 || root[name] != null) {\n\tif (!window.requirejs) {\n\t  on_load();\n\t}\n\tcontinue;\n      }\n      var element = document.createElement('script');\n      element.onerror = on_error;\n      element.async = false;\n      element.type = \"module\";\n      console.debug(\"Bokeh: injecting script tag for BokehJS library: \", url);\n      element.textContent = `\n      import ${name} from \"${url}\"\n      window.${name} = ${name}\n      window._bokeh_on_load()\n      `\n      document.head.appendChild(element);\n    }\n    if (!js_urls.length && !js_modules.length) {\n      on_load()\n    }\n  };\n\n  function inject_raw_css(css) {\n    const element = document.createElement(\"style\");\n    element.appendChild(document.createTextNode(css));\n    document.body.appendChild(element);\n  }\n\n  var js_urls = [\"https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js?config=TeX-MML-AM_CHTML\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega@5\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-lite@5\", \"https://cdn.holoviz.org/panel/1.4.2/dist/bundled/vegaplot/vega-embed@6\"];\n  var js_modules = [];\n  var js_exports = {};\n  var css_urls = [];\n  var inline_js = [    function(Bokeh) {\n      Bokeh.set_log_level(\"info\");\n    },\nfunction(Bokeh) {} // ensure no trailing comma for IE\n  ];\n\n  function run_inline_js() {\n    if ((root.Bokeh !== undefined) || (force === true)) {\n      for (var i = 0; i < inline_js.length; i++) {\n\ttry {\n          inline_js[i].call(root, root.Bokeh);\n\t} catch(e) {\n\t  if (!reloading) {\n\t    throw e;\n\t  }\n\t}\n      }\n      // Cache old bokeh versions\n      if (Bokeh != undefined && !reloading) {\n\tvar NewBokeh = 
root.Bokeh;\n\tif (Bokeh.versions === undefined) {\n\t  Bokeh.versions = new Map();\n\t}\n\tif (NewBokeh.version !== Bokeh.version) {\n\t  Bokeh.versions.set(NewBokeh.version, NewBokeh)\n\t}\n\troot.Bokeh = Bokeh;\n      }} else if (Date.now() < root._bokeh_timeout) {\n      setTimeout(run_inline_js, 100);\n    } else if (!root._bokeh_failed_load) {\n      console.log(\"Bokeh: BokehJS failed to load within specified timeout.\");\n      root._bokeh_failed_load = true;\n    }\n    root._bokeh_is_initializing = false\n  }\n\n  function load_or_wait() {\n    // Implement a backoff loop that tries to ensure we do not load multiple\n    // versions of Bokeh and its dependencies at the same time.\n    // In recent versions we use the root._bokeh_is_initializing flag\n    // to determine whether there is an ongoing attempt to initialize\n    // bokeh, however for backward compatibility we also try to ensure\n    // that we do not start loading a newer (Panel>=1.0 and Bokeh>3) version\n    // before older versions are fully initialized.\n    if (root._bokeh_is_initializing && Date.now() > root._bokeh_timeout) {\n      root._bokeh_is_initializing = false;\n      root._bokeh_onload_callbacks = undefined;\n      console.log(\"Bokeh: BokehJS was loaded multiple times but one version failed to initialize.\");\n      load_or_wait();\n    } else if (root._bokeh_is_initializing || (typeof root._bokeh_is_initializing === \"undefined\" && root._bokeh_onload_callbacks !== undefined)) {\n      setTimeout(load_or_wait, 100);\n    } else {\n      root._bokeh_is_initializing = true\n      root._bokeh_onload_callbacks = []\n      var bokeh_loaded = Bokeh != null && (Bokeh.version === py_version || (Bokeh.versions !== undefined && Bokeh.versions.has(py_version)));\n      if (!reloading && !bokeh_loaded) {\n\troot.Bokeh = undefined;\n      }\n      load_libs(css_urls, js_urls, js_modules, js_exports, function() {\n\tconsole.debug(\"Bokeh: BokehJS plotting callback run at\", 
now());\n\trun_inline_js();\n      });\n    }\n  }\n  // Give older versions of the autoload script a head-start to ensure\n  // they initialize before we start loading newer version.\n  setTimeout(load_or_wait, 100)\n}(window));",
+      "application/vnd.holoviews_load.v0+json": ""
+     },
      "metadata": {},
      "output_type": "display_data"
     },
     {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Tumor_Focality:\n"
-     ]
+     "data": {
+      "application/javascript": "\nif ((window.PyViz === undefined) || (window.PyViz instanceof HTMLElement)) {\n  window.PyViz = {comms: {}, comm_status:{}, kernels:{}, receivers: {}, plot_index: []}\n}\n\n\n    function JupyterCommManager() {\n    }\n\n    JupyterCommManager.prototype.register_target = function(plot_id, comm_id, msg_handler) {\n      if (window.comm_manager || ((window.Jupyter !== undefined) && (Jupyter.notebook.kernel != null))) {\n        var comm_manager = window.comm_manager || Jupyter.notebook.kernel.comm_manager;\n        comm_manager.register_target(comm_id, function(comm) {\n          comm.on_msg(msg_handler);\n        });\n      } else if ((plot_id in window.PyViz.kernels) && (window.PyViz.kernels[plot_id])) {\n        window.PyViz.kernels[plot_id].registerCommTarget(comm_id, function(comm) {\n          comm.onMsg = msg_handler;\n        });\n      } else if (typeof google != 'undefined' && google.colab.kernel != null) {\n        google.colab.kernel.comms.registerTarget(comm_id, (comm) => {\n          var messages = comm.messages[Symbol.asyncIterator]();\n          function processIteratorResult(result) {\n            var message = result.value;\n            console.log(message)\n            var content = {data: message.data, comm_id};\n            var buffers = []\n            for (var buffer of message.buffers || []) {\n              buffers.push(new DataView(buffer))\n            }\n            var metadata = message.metadata || {};\n            var msg = {content, buffers, metadata}\n            msg_handler(msg);\n            return messages.next().then(processIteratorResult);\n          }\n          return messages.next().then(processIteratorResult);\n        })\n      }\n    }\n\n    JupyterCommManager.prototype.get_client_comm = function(plot_id, comm_id, msg_handler) {\n      if (comm_id in window.PyViz.comms) {\n        return window.PyViz.comms[comm_id];\n      } else if (window.comm_manager || ((window.Jupyter !== undefined) 
&& (Jupyter.notebook.kernel != null))) {\n        var comm_manager = window.comm_manager || Jupyter.notebook.kernel.comm_manager;\n        var comm = comm_manager.new_comm(comm_id, {}, {}, {}, comm_id);\n        if (msg_handler) {\n          comm.on_msg(msg_handler);\n        }\n      } else if ((plot_id in window.PyViz.kernels) && (window.PyViz.kernels[plot_id])) {\n        var comm = window.PyViz.kernels[plot_id].connectToComm(comm_id);\n        comm.open();\n        if (msg_handler) {\n          comm.onMsg = msg_handler;\n        }\n      } else if (typeof google != 'undefined' && google.colab.kernel != null) {\n        var comm_promise = google.colab.kernel.comms.open(comm_id)\n        comm_promise.then((comm) => {\n          window.PyViz.comms[comm_id] = comm;\n          if (msg_handler) {\n            var messages = comm.messages[Symbol.asyncIterator]();\n            function processIteratorResult(result) {\n              var message = result.value;\n              var content = {data: message.data};\n              var metadata = message.metadata || {comm_id};\n              var msg = {content, metadata}\n              msg_handler(msg);\n              return messages.next().then(processIteratorResult);\n            }\n            return messages.next().then(processIteratorResult);\n          }\n        }) \n        var sendClosure = (data, metadata, buffers, disposeOnDone) => {\n          return comm_promise.then((comm) => {\n            comm.send(data, metadata, buffers, disposeOnDone);\n          });\n        };\n        var comm = {\n          send: sendClosure\n        };\n      }\n      window.PyViz.comms[comm_id] = comm;\n      return comm;\n    }\n    window.PyViz.comm_manager = new JupyterCommManager();\n    \n\n\nvar JS_MIME_TYPE = 'application/javascript';\nvar HTML_MIME_TYPE = 'text/html';\nvar EXEC_MIME_TYPE = 'application/vnd.holoviews_exec.v0+json';\nvar CLASS_NAME = 'output';\n\n/**\n * Render data to the DOM node\n */\nfunction render(props, 
node) {\n  var div = document.createElement(\"div\");\n  var script = document.createElement(\"script\");\n  node.appendChild(div);\n  node.appendChild(script);\n}\n\n/**\n * Handle when a new output is added\n */\nfunction handle_add_output(event, handle) {\n  var output_area = handle.output_area;\n  var output = handle.output;\n  if ((output.data == undefined) || (!output.data.hasOwnProperty(EXEC_MIME_TYPE))) {\n    return\n  }\n  var id = output.metadata[EXEC_MIME_TYPE][\"id\"];\n  var toinsert = output_area.element.find(\".\" + CLASS_NAME.split(' ')[0]);\n  if (id !== undefined) {\n    var nchildren = toinsert.length;\n    var html_node = toinsert[nchildren-1].children[0];\n    html_node.innerHTML = output.data[HTML_MIME_TYPE];\n    var scripts = [];\n    var nodelist = html_node.querySelectorAll(\"script\");\n    for (var i in nodelist) {\n      if (nodelist.hasOwnProperty(i)) {\n        scripts.push(nodelist[i])\n      }\n    }\n\n    scripts.forEach( function (oldScript) {\n      var newScript = document.createElement(\"script\");\n      var attrs = [];\n      var nodemap = oldScript.attributes;\n      for (var j in nodemap) {\n        if (nodemap.hasOwnProperty(j)) {\n          attrs.push(nodemap[j])\n        }\n      }\n      attrs.forEach(function(attr) { newScript.setAttribute(attr.name, attr.value) });\n      newScript.appendChild(document.createTextNode(oldScript.innerHTML));\n      oldScript.parentNode.replaceChild(newScript, oldScript);\n    });\n    if (JS_MIME_TYPE in output.data) {\n      toinsert[nchildren-1].children[1].textContent = output.data[JS_MIME_TYPE];\n    }\n    output_area._hv_plot_id = id;\n    if ((window.Bokeh !== undefined) && (id in Bokeh.index)) {\n      window.PyViz.plot_index[id] = Bokeh.index[id];\n    } else {\n      window.PyViz.plot_index[id] = null;\n    }\n  } else if (output.metadata[EXEC_MIME_TYPE][\"server_id\"] !== undefined) {\n    var bk_div = document.createElement(\"div\");\n    bk_div.innerHTML = 
output.data[HTML_MIME_TYPE];\n    var script_attrs = bk_div.children[0].attributes;\n    for (var i = 0; i < script_attrs.length; i++) {\n      toinsert[toinsert.length - 1].childNodes[1].setAttribute(script_attrs[i].name, script_attrs[i].value);\n    }\n    // store reference to server id on output_area\n    output_area._bokeh_server_id = output.metadata[EXEC_MIME_TYPE][\"server_id\"];\n  }\n}\n\n/**\n * Handle when an output is cleared or removed\n */\nfunction handle_clear_output(event, handle) {\n  var id = handle.cell.output_area._hv_plot_id;\n  var server_id = handle.cell.output_area._bokeh_server_id;\n  if (((id === undefined) || !(id in PyViz.plot_index)) && (server_id !== undefined)) { return; }\n  var comm = window.PyViz.comm_manager.get_client_comm(\"hv-extension-comm\", \"hv-extension-comm\", function () {});\n  if (server_id !== null) {\n    comm.send({event_type: 'server_delete', 'id': server_id});\n    return;\n  } else if (comm !== null) {\n    comm.send({event_type: 'delete', 'id': id});\n  }\n  delete PyViz.plot_index[id];\n  if ((window.Bokeh !== undefined) & (id in window.Bokeh.index)) {\n    var doc = window.Bokeh.index[id].model.document\n    doc.clear();\n    const i = window.Bokeh.documents.indexOf(doc);\n    if (i > -1) {\n      window.Bokeh.documents.splice(i, 1);\n    }\n  }\n}\n\n/**\n * Handle kernel restart event\n */\nfunction handle_kernel_cleanup(event, handle) {\n  delete PyViz.comms[\"hv-extension-comm\"];\n  window.PyViz.plot_index = {}\n}\n\n/**\n * Handle update_display_data messages\n */\nfunction handle_update_output(event, handle) {\n  handle_clear_output(event, {cell: {output_area: handle.output_area}})\n  handle_add_output(event, handle)\n}\n\nfunction register_renderer(events, OutputArea) {\n  function append_mime(data, metadata, element) {\n    // create a DOM node to render to\n    var toinsert = this.create_output_subarea(\n    metadata,\n    CLASS_NAME,\n    EXEC_MIME_TYPE\n    );\n    
this.keyboard_manager.register_events(toinsert);\n    // Render to node\n    var props = {data: data, metadata: metadata[EXEC_MIME_TYPE]};\n    render(props, toinsert[0]);\n    element.append(toinsert);\n    return toinsert\n  }\n\n  events.on('output_added.OutputArea', handle_add_output);\n  events.on('output_updated.OutputArea', handle_update_output);\n  events.on('clear_output.CodeCell', handle_clear_output);\n  events.on('delete.Cell', handle_clear_output);\n  events.on('kernel_ready.Kernel', handle_kernel_cleanup);\n\n  OutputArea.prototype.register_mime_type(EXEC_MIME_TYPE, append_mime, {\n    safe: true,\n    index: 0\n  });\n}\n\nif (window.Jupyter !== undefined) {\n  try {\n    var events = require('base/js/events');\n    var OutputArea = require('notebook/js/outputarea').OutputArea;\n    if (OutputArea.prototype.mime_types().indexOf(EXEC_MIME_TYPE) == -1) {\n      register_renderer(events, OutputArea);\n    }\n  } catch(err) {\n  }\n}\n",
+      "application/vnd.holoviews_load.v0+json": ""
+     },
+     "metadata": {},
+     "output_type": "display_data"
     },
     {
      "data": {
       "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>tumor_focality</td>\n",
-       "      <td>0.808</td>\n",
-       "      <td>The text term used to describe whether the patient's disease originated in a single location or multiple locations.</td>\n",
-       "      <td>Multifocal, Unifocal, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>tumor_shape</td>\n",
-       "      <td>0.5626</td>\n",
-       "      <td>Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.</td>\n",
-       "      <td>Diffuse, Dome, Mushroom, Unknown</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>tumor_depth_descriptor</td>\n",
-       "      <td>0.5311</td>\n",
-       "      <td>Text term for the degree to which a tumor has penetrated into organ or tissue.</td>\n",
-       "      <td>Deep, Superficial, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>enneking_msts_tumor_site</td>\n",
-       "      <td>0.4829</td>\n",
-       "      <td>Text term and code that represents the tumor site of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...</td>\n",
-       "      <td>Extracompartmental (T2), Intracompartmental (T1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>biospecimen_type</td>\n",
-       "      <td>0.4809</td>\n",
-       "      <td>The text term used to describe the biological material used for testing, diagnostic, treatment or research purposes.</td>\n",
-       "      <td>Blood, Bone Marrow, Buccal Mucosa, Buffy Coat, Cerebrospinal Fluid, Connective Tissue, Embryonic Fluid, Embryonic Tissue, Feces, Granulocyte, Involved...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>tissue_type</td>\n",
-       "      <td>0.4783</td>\n",
-       "      <td>Text term that represents a description of the kind of tissue collected with respect to disease status or proximity to tumor tissue.</td>\n",
-       "      <td>Abnormal, Normal, Peritumoral, Tumor, Unknown, Not Reported, Not Allowed To Collect</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>wilms_tumor_histologic_subtype</td>\n",
-       "      <td>0.4597</td>\n",
-       "      <td>The text term used to describe the classification of Wilms tumors distinguishing between favorable and unfavorable histologic groups.</td>\n",
-       "      <td>Favorable, Unfavorable, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>residual_tumor_measurement</td>\n",
-       "      <td>0.4544</td>\n",
-       "      <td>A measurement of the tumor cells that remain in the body following cancer treatment.</td>\n",
-       "      <td>1-10 mm, 11-20 mm, &gt;20 mm, No macroscopic disease</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>non_nodal_tumor_deposits</td>\n",
-       "      <td>0.451</td>\n",
-       "      <td>The yes/no/unknown indicator used to describe the presence of tumor deposits in the pericolic or perirectal fat or in adjacent mesentery away from the...</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>tumor_infiltrating_macrophages</td>\n",
-       "      <td>0.4464</td>\n",
-       "      <td>Non-neoplastic macrophages that infiltrate a tumor.</td>\n",
-       "      <td>Few, Many, Moderate</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>specimen_type</td>\n",
-       "      <td>0.443</td>\n",
-       "      <td>The type of a material sample taken from a biological entity for testing, diagnostic, propagation, treatment or research purposes. This includes parti...</td>\n",
-       "      <td>2D Classical Conditionally Reprogrammed Cells, 2D Modified Conditionally Reprogrammed Cells, 3D Air-Liquid Interface Organoid, 3D Neurosphere, 3D Orga...</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>extranodal_extension</td>\n",
-       "      <td>0.4366</td>\n",
-       "      <td>Extension of a malignant neoplasm beyond the lymph node capsule.</td>\n",
-       "      <td>Gross Extension, Microscopic Extension, No Extranodal Extension</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>measurement_unit</td>\n",
-       "      <td>0.4319</td>\n",
-       "      <td>The type of unit of measure being used to express a length or distance.</td>\n",
-       "      <td>Centimeters, Millimeters</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>columnar_mucosa_present</td>\n",
-       "      <td>0.4153</td>\n",
-       "      <td>Indicator noting whether columnar mucosa was present within the tissue.</td>\n",
-       "      <td>Yes, No, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>distance_normal_to_tumor</td>\n",
-       "      <td>0.4077</td>\n",
-       "      <td>Text term to signify the distance between the tumor tissue and the normal control tissue that was procured for matching normal DNA.</td>\n",
-       "      <td>Adjacent (&lt; or = 2cm), Distal (&gt;2cm), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>morphologic_architectural_pattern</td>\n",
-       "      <td>0.3949</td>\n",
-       "      <td>A specific morphologic or pathologic architectural pattern was discovered within the sample studied.</td>\n",
-       "      <td>Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>vascular_invasion_type</td>\n",
-       "      <td>0.3896</td>\n",
-       "      <td>Text term that represents the type of vascular tumor invasion.</td>\n",
-       "      <td>Extramural, Intramural, Macro, Micro, No Vascular Invasion, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>residual_tumor</td>\n",
-       "      <td>0.3751</td>\n",
-       "      <td>Tumor cells that remain in the body following cancer treatment.</td>\n",
-       "      <td>R0, R1, R2, RX</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>enneking_msts_metastasis</td>\n",
-       "      <td>0.3703</td>\n",
-       "      <td>Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...</td>\n",
-       "      <td>No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>ovarian_specimen_status</td>\n",
-       "      <td>0.3582</td>\n",
-       "      <td>The text term used to describe the physical condition of the involved ovary.</td>\n",
-       "      <td>Ovarian Capsule Fragmented, Ovarian Capsule Intact, Ovarian Capsule Ruptured, Unknown, Not Reported</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
-      "text/plain": [
-       "                            Candidate Similarity  \\\n",
-       "0                      tumor_focality      0.808   \n",
-       "1                         tumor_shape     0.5626   \n",
-       "2              tumor_depth_descriptor     0.5311   \n",
-       "3            enneking_msts_tumor_site     0.4829   \n",
-       "4                    biospecimen_type     0.4809   \n",
-       "5                         tissue_type     0.4783   \n",
-       "6      wilms_tumor_histologic_subtype     0.4597   \n",
-       "7          residual_tumor_measurement     0.4544   \n",
-       "8            non_nodal_tumor_deposits      0.451   \n",
-       "9      tumor_infiltrating_macrophages     0.4464   \n",
-       "10                      specimen_type      0.443   \n",
-       "11               extranodal_extension     0.4366   \n",
-       "12                   measurement_unit     0.4319   \n",
-       "13            columnar_mucosa_present     0.4153   \n",
-       "14           distance_normal_to_tumor     0.4077   \n",
-       "15  morphologic_architectural_pattern     0.3949   \n",
-       "16             vascular_invasion_type     0.3896   \n",
-       "17                     residual_tumor     0.3751   \n",
-       "18           enneking_msts_metastasis     0.3703   \n",
-       "19            ovarian_specimen_status     0.3582   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                         The text term used to describe whether the patient's disease originated in a single location or multiple locations.   \n",
-       "1                                           Text term to represent the description of the shape of a tumor determined by clinical or pathological techniques.   \n",
-       "2                                                                              Text term for the degree to which a tumor has penetrated into organ or tissue.   \n",
-       "3   Text term and code that represents the tumor site of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskeletal Tu...   \n",
-       "4                                        The text term used to describe the biological material used for testing, diagnostic, treatment or research purposes.   \n",
-       "5                        Text term that represents a description of the kind of tissue collected with respect to disease status or proximity to tumor tissue.   \n",
-       "6                       The text term used to describe the classification of Wilms tumors distinguishing between favorable and unfavorable histologic groups.   \n",
-       "7                                                                        A measurement of the tumor cells that remain in the body following cancer treatment.   \n",
-       "8   The yes/no/unknown indicator used to describe the presence of tumor deposits in the pericolic or perirectal fat or in adjacent mesentery away from the...   \n",
-       "9                                                                                                         Non-neoplastic macrophages that infiltrate a tumor.   \n",
-       "10  The type of a material sample taken from a biological entity for testing, diagnostic, propagation, treatment or research purposes. This includes parti...   \n",
-       "11                                                                                           Extension of a malignant neoplasm beyond the lymph node capsule.   \n",
-       "12                                                                                    The type of unit of measure being used to express a length or distance.   \n",
-       "13                                                                                    Indicator noting whether columnar mucosa was present within the tissue.   \n",
-       "14                        Text term to signify the distance between the tumor tissue and the normal control tissue that was procured for matching normal DNA.   \n",
-       "15                                                       A specific morphologic or pathologic architectural pattern was discovered within the sample studied.   \n",
-       "16                                                                                             Text term that represents the type of vascular tumor invasion.   \n",
-       "17                                                                                            Tumor cells that remain in the body following cancer treatment.   \n",
-       "18  Text term and code that represents the metastatic stage of the musculoskeletal sarcoma, using the Enneking staging system approved by the Musculoskele...   \n",
-       "19                                                                               The text term used to describe the physical condition of the involved ovary.   \n",
+       "<style>*[data-root-id],\n",
+       "*[data-root-id] > * {\n",
+       "  box-sizing: border-box;\n",
+       "  font-family: var(--jp-ui-font-family);\n",
+       "  font-size: var(--jp-ui-font-size1);\n",
+       "  color: var(--vscode-editor-foreground, var(--jp-ui-font-color1));\n",
+       "}\n",
        "\n",
-       "                                                                                                                                              Values (sample)  \n",
-       "0                                                                                                                 Multifocal, Unifocal, Unknown, Not Reported  \n",
-       "1                                                                                                                            Diffuse, Dome, Mushroom, Unknown  \n",
-       "2                                                                                                                             Deep, Superficial, Not Reported  \n",
-       "3                                                                                     Extracompartmental (T2), Intracompartmental (T1), Unknown, Not Reported  \n",
-       "4   Blood, Bone Marrow, Buccal Mucosa, Buffy Coat, Cerebrospinal Fluid, Connective Tissue, Embryonic Fluid, Embryonic Tissue, Feces, Granulocyte, Involved...  \n",
-       "5                                                                         Abnormal, Normal, Peritumoral, Tumor, Unknown, Not Reported, Not Allowed To Collect  \n",
-       "6                                                                                                               Favorable, Unfavorable, Unknown, Not Reported  \n",
-       "7                                                                                                           1-10 mm, 11-20 mm, >20 mm, No macroscopic disease  \n",
-       "8                                                                                                                              Yes, No, Unknown, Not Reported  \n",
-       "9                                                                                                                                         Few, Many, Moderate  \n",
-       "10  2D Classical Conditionally Reprogrammed Cells, 2D Modified Conditionally Reprogrammed Cells, 3D Air-Liquid Interface Organoid, 3D Neurosphere, 3D Orga...  \n",
-       "11                                                                                            Gross Extension, Microscopic Extension, No Extranodal Extension  \n",
-       "12                                                                                                                                   Centimeters, Millimeters  \n",
-       "13                                                                                                                             Yes, No, Unknown, Not Reported  \n",
-       "14                                                                                                Adjacent (< or = 2cm), Distal (>2cm), Unknown, Not Reported  \n",
-       "15                                                    Cohesive, Cribiform, Micropapillary, Non-cohesive, Papillary Renal Cell, Papillary, NOS, Solid, Tubular  \n",
-       "16                                                                          Extramural, Intramural, Macro, Micro, No Vascular Invasion, Unknown, Not Reported  \n",
-       "17                                                                                                                                             R0, R1, R2, RX  \n",
-       "18                                                                             No Metastasis (M0), Regional or Distant Metastasis (M1), Unknown, Not Reported  \n",
-       "19                                                        Ovarian Capsule Fragmented, Ovarian Capsule Intact, Ovarian Capsule Ruptured, Unknown, Not Reported  "
+       "/* Override VSCode background color */\n",
+       ".cell-output-ipywidget-background:has(\n",
+       "    > .cell-output-ipywidget-background > .lm-Widget > *[data-root-id]\n",
+       "  ),\n",
+       ".cell-output-ipywidget-background:has(> .lm-Widget > *[data-root-id]) {\n",
+       "  background-color: transparent !important;\n",
+       "}\n",
+       "</style>"
       ]
      },
      "metadata": {},
      "output_type": "display_data"
     },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "\n",
-      "Tumor_Size_cm:\n"
-     ]
-    },
     {
      "data": {
-      "text/html": [
-       "<div>\n",
-       "<style scoped>\n",
-       "    .dataframe tbody tr th:only-of-type {\n",
-       "        vertical-align: middle;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe tbody tr th {\n",
-       "        vertical-align: top;\n",
-       "    }\n",
-       "\n",
-       "    .dataframe thead th {\n",
-       "        text-align: right;\n",
-       "    }\n",
-       "</style>\n",
-       "<table border=\"1\" class=\"dataframe\">\n",
-       "  <thead>\n",
-       "    <tr style=\"text-align: right;\">\n",
-       "      <th></th>\n",
-       "      <th>Candidate</th>\n",
-       "      <th>Similarity</th>\n",
-       "      <th>Description</th>\n",
-       "      <th>Values (sample)</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <th>0</th>\n",
-       "      <td>shortest_dimension</td>\n",
-       "      <td>0.7575</td>\n",
-       "      <td>Numeric value that represents the shortest dimension of the sample, measured in millimeters.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>1</th>\n",
-       "      <td>size_extraocular_nodule</td>\n",
-       "      <td>0.7416</td>\n",
-       "      <td>The size of the nodule that is outside the eye.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>2</th>\n",
-       "      <td>tumor_width_measurement</td>\n",
-       "      <td>0.7034</td>\n",
-       "      <td>The numerical measurement of tumor width.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>3</th>\n",
-       "      <td>tumor_depth_measurement</td>\n",
-       "      <td>0.6989</td>\n",
-       "      <td>The numerical measurement of tumor depth.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>4</th>\n",
-       "      <td>tumor_thickness</td>\n",
-       "      <td>0.6506</td>\n",
-       "      <td>A measurement of the thickness of a sectioned slice (of tissue or mineral or other substance) in millimeters (mm).</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>5</th>\n",
-       "      <td>analyte_quantity</td>\n",
-       "      <td>0.6418</td>\n",
-       "      <td>The quantity in micrograms (ug) of the analyte(s) derived from the analyte(s) shipped for sequencing and characterization.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>6</th>\n",
-       "      <td>average_insert_size</td>\n",
-       "      <td>0.6362</td>\n",
-       "      <td>Average insert size collected from samtools.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>7</th>\n",
-       "      <td>tumor_largest_dimension_diameter</td>\n",
-       "      <td>0.5736</td>\n",
-       "      <td>Numeric value used to describe the maximum diameter or dimension of the primary tumor, measured in centimeters.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>8</th>\n",
-       "      <td>mitotic_total_area</td>\n",
-       "      <td>0.5635</td>\n",
-       "      <td>The total area reviewed when calculating the mitotic index ratio.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>9</th>\n",
-       "      <td>rin</td>\n",
-       "      <td>0.5578</td>\n",
-       "      <td>A numerical assessment of the integrity of RNA based on the entire electrophoretic trace of the RNA sample including the presence or absence of degrad...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>10</th>\n",
-       "      <td>size_selection_range</td>\n",
-       "      <td>0.5574</td>\n",
-       "      <td>Range of size selection.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>11</th>\n",
-       "      <td>imaging_suv</td>\n",
-       "      <td>0.5519</td>\n",
-       "      <td>The standardized update value (SUV) is the effectively dimensionless measure of regional tracer uptake calculated as the activity concentration within...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>12</th>\n",
-       "      <td>tumor_infiltrating_macrophages</td>\n",
-       "      <td>0.5417</td>\n",
-       "      <td>Non-neoplastic macrophages that infiltrate a tumor.</td>\n",
-       "      <td>Few, Many, Moderate</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>13</th>\n",
-       "      <td>breslow_thickness</td>\n",
-       "      <td>0.5358</td>\n",
-       "      <td>The number that describes the distance, in millimeters, between the upper layer of the epidermis and the deepest point of tumor penetration.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>14</th>\n",
-       "      <td>circumferential_resection_margin</td>\n",
-       "      <td>0.5312</td>\n",
-       "      <td>Numeric value used to describe the non-peritonealised bare area of rectum, comprising anterior and posterior segments, when submitted as a surgical sp...</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>15</th>\n",
-       "      <td>body_surface_area</td>\n",
-       "      <td>0.5154</td>\n",
-       "      <td>Numeric value used to represent the 2-dimensional extent of the body surface relating height to weight.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>16</th>\n",
-       "      <td>workflow_version</td>\n",
-       "      <td>0.5089</td>\n",
-       "      <td>Major version for a GDC workflow.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>17</th>\n",
-       "      <td>mean_coverage</td>\n",
-       "      <td>0.5042</td>\n",
-       "      <td>Mean coverage for whole genome sequencing, or mean target coverage for whole exome and targeted sequencing, collected from Picard Tools.</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>18</th>\n",
-       "      <td>tumor_depth</td>\n",
-       "      <td>0.4949</td>\n",
-       "      <td>Numeric value that represents the depth of tumor invasion, measured in millimeters (mm).</td>\n",
-       "      <td></td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <th>19</th>\n",
-       "      <td>tumor_depth_descriptor</td>\n",
-       "      <td>0.4846</td>\n",
-       "      <td>Text term for the degree to which a tumor has penetrated into organ or tissue.</td>\n",
-       "      <td>Deep, Superficial, Not Reported</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n",
-       "</div>"
-      ],
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "5a1f31b2ebc24a6ab8953e084f9f00ab",
+       "version_major": 2,
+       "version_minor": 0
+      },
       "text/plain": [
-       "                           Candidate Similarity  \\\n",
-       "0                 shortest_dimension     0.7575   \n",
-       "1            size_extraocular_nodule     0.7416   \n",
-       "2            tumor_width_measurement     0.7034   \n",
-       "3            tumor_depth_measurement     0.6989   \n",
-       "4                    tumor_thickness     0.6506   \n",
-       "5                   analyte_quantity     0.6418   \n",
-       "6                average_insert_size     0.6362   \n",
-       "7   tumor_largest_dimension_diameter     0.5736   \n",
-       "8                 mitotic_total_area     0.5635   \n",
-       "9                                rin     0.5578   \n",
-       "10              size_selection_range     0.5574   \n",
-       "11                       imaging_suv     0.5519   \n",
-       "12    tumor_infiltrating_macrophages     0.5417   \n",
-       "13                 breslow_thickness     0.5358   \n",
-       "14  circumferential_resection_margin     0.5312   \n",
-       "15                 body_surface_area     0.5154   \n",
-       "16                  workflow_version     0.5089   \n",
-       "17                     mean_coverage     0.5042   \n",
-       "18                       tumor_depth     0.4949   \n",
-       "19            tumor_depth_descriptor     0.4846   \n",
-       "\n",
-       "                                                                                                                                                  Description  \\\n",
-       "0                                                                Numeric value that represents the shortest dimension of the sample, measured in millimeters.   \n",
-       "1                                                                                                             The size of the nodule that is outside the eye.   \n",
-       "2                                                                                                                   The numerical measurement of tumor width.   \n",
-       "3                                                                                                                   The numerical measurement of tumor depth.   \n",
-       "4                                          A measurement of the thickness of a sectioned slice (of tissue or mineral or other substance) in millimeters (mm).   \n",
-       "5                                  The quantity in micrograms (ug) of the analyte(s) derived from the analyte(s) shipped for sequencing and characterization.   \n",
-       "6                                                                                                                Average insert size collected from samtools.   \n",
-       "7                                             Numeric value used to describe the maximum diameter or dimension of the primary tumor, measured in centimeters.   \n",
-       "8                                                                                           The total area reviewed when calculating the mitotic index ratio.   \n",
-       "9   A numerical assessment of the integrity of RNA based on the entire electrophoretic trace of the RNA sample including the presence or absence of degrad...   \n",
-       "10                                                                                                                                   Range of size selection.   \n",
-       "11  The standardized update value (SUV) is the effectively dimensionless measure of regional tracer uptake calculated as the activity concentration within...   \n",
-       "12                                                                                                        Non-neoplastic macrophages that infiltrate a tumor.   \n",
-       "13               The number that describes the distance, in millimeters, between the upper layer of the epidermis and the deepest point of tumor penetration.   \n",
-       "14  Numeric value used to describe the non-peritonealised bare area of rectum, comprising anterior and posterior segments, when submitted as a surgical sp...   \n",
-       "15                                                    Numeric value used to represent the 2-dimensional extent of the body surface relating height to weight.   \n",
-       "16                                                                                                                          Major version for a GDC workflow.   \n",
-       "17                   Mean coverage for whole genome sequencing, or mean target coverage for whole exome and targeted sequencing, collected from Picard Tools.   \n",
-       "18                                                                   Numeric value that represents the depth of tumor invasion, measured in millimeters (mm).   \n",
-       "19                                                                             Text term for the degree to which a tumor has penetrated into organ or tissue.   \n",
-       "\n",
-       "                    Values (sample)  \n",
-       "0                                    \n",
-       "1                                    \n",
-       "2                                    \n",
-       "3                                    \n",
-       "4                                    \n",
-       "5                                    \n",
-       "6                                    \n",
-       "7                                    \n",
-       "8                                    \n",
-       "9                                    \n",
-       "10                                   \n",
-       "11                                   \n",
-       "12              Few, Many, Moderate  \n",
-       "13                                   \n",
-       "14                                   \n",
-       "15                                   \n",
-       "16                                   \n",
-       "17                                   \n",
-       "18                                   \n",
-       "19  Deep, Superficial, Not Reported  "
+       "BokehModel(combine_events=True, render_bundle={'docs_json': {'0bf58594-a7b6-4b36-9048-2264a754d6d6': {'version…"
       ]
      },
+     "execution_count": 4,
      "metadata": {},
-     "output_type": "display_data"
+     "output_type": "execute_result"
     }
    ],
    "source": [
-    "\n",
-    "manager = APIManager()\n",
-    "manager.load_dataset('./datasets/dou.csv')\n",
-    "reduced_scope = manager.reduce_scope()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 3,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from bdi.visualization.scope_reducing import SRHeatMapManager\n",
+    "from bdikit.visualization.scope_reducing import SRHeatMapManager\n",
     "\n",
     "heatmap_manager = SRHeatMapManager()\n",
-    "heatmap_manager.get_heatmap(reduced_scope)\n",
+    "heatmap_manager._write_json(reduced_scope)\n",
+    "heatmap_manager.get_heatmap()\n",
     "heatmap_manager.plot_heatmap()"
    ]
   }