{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Parsing rare list\n",
    "\n",
    "https://globalgenes.org/rarelist\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.6/site-packages/urllib3/connectionpool.py:858: InsecureRequestWarning: Unverified HTTPS request is being made. Adding certificate verification is strongly advised. See: https://urllib3.readthedocs.io/en/latest/advanced-usage.html#ssl-warnings\n",
      "  InsecureRequestWarning)\n"
     ]
    }
   ],
   "source": [
    "# Fetch HTML using requests lib and feed to bs4\n",
    "import requests\n",
    "\n",
    "# note their SSL certificate is not verified. Be careful!\n",
    "result = requests.get(\"https://globalgenes.org/rarelist\", verify=False)\n",
    "\n",
    "from bs4 import BeautifulSoup\n",
    "from bs4 import NavigableString\n",
    "soup = BeautifulSoup(result.content, 'html.parser')\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "<title>Rare Disease List</title>"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# check\n",
    "soup.title"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "# write formatted html to file\n",
    "# (not used: this is just a useful side effect for exploration)\n",
    "f=open('rarelist.html','w')\n",
    "f.write(soup.prettify())\n",
    "f.close()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['Aagenaes syndrome',\n",
       " 'Aarskog syndrome',\n",
       " 'Aase Smith syndrome',\n",
       " 'ABCD syndrome',\n",
       " 'Abderhalden Kaufmann Lignac syndrome',\n",
       " 'Abdominal aortic aneurysm',\n",
       " 'Abdominal chemodectomas with cutaneous angiolipomas',\n",
       " 'Abdominal cystic lymphangioma',\n",
       " 'Abdominal obesity metabolic syndrome',\n",
       " 'Aberrant subclavian artery',\n",
       " 'Abetalipoproteinemia',\n",
       " 'Abidi X-linked mental retardation syndrome',\n",
       " 'Ablepharon macrostomia syndrome',\n",
       " \"Abrikosov's tumor\",\n",
       " 'Abruzzo Erickson syndrome',\n",
       " 'Absence of fingerprints congenital milia',\n",
       " 'Absence of gluteal muscle',\n",
       " 'Absence of septum pellucidum',\n",
       " 'Absence of Tibia',\n",
       " 'Absence of tibia with polydactyly']"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# use bs4 to extract names from HTML\n",
    "\n",
    "names = []  ## all disease names found\n",
    "name2url = {}  ## mapping of names to URLs\n",
    "\n",
    "h5s = soup.find_all(\"h5\")\n",
    "for h5 in h5s:\n",
    "    ul = h5.find_next_sibling('ul')\n",
    "    for li in ul.findAll('li'):\n",
    "        if len(li.contents) == 0:\n",
    "            continue\n",
    "        n = li.contents[0]\n",
    "        if n is None:\n",
    "            print('BAD: {}'.format(li))\n",
    "            continue\n",
    "        if not isinstance(n, NavigableString):\n",
    "            n = n.contents[0]\n",
    "            if li.select('a'):\n",
    "                url = li.a['href']\n",
    "            \n",
    "                name2url[n] = url\n",
    "        names.append(n)\n",
    "        \n",
    "# show the first 20 for sanity checking\n",
    "names[0:20]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[('Acute disseminated encephalomyelitis', 'http://ulf.org/'),\n",
       " ('Acute hemorrhagic leukoencephalitis', 'http://ulf.org/'),\n",
       " ('Adrenoleukodystrophy X-linked', 'http://ulf.org/'),\n",
       " ('Adrenomyeloneuropathy', 'http://ulf.org/'),\n",
       " ('Aicardi-Goutieres syndrome', 'http://ulf.org/'),\n",
       " ('Alexander disease', 'http://ulf.org/'),\n",
       " ('Alkaptonuria', 'http://www.alkaptonuria.info/'),\n",
       " ('Alpers syndrome',\n",
       "  'http://www.umdf.org/site/c.8qKOJ0MvF7LUG/b.7929671/k.BDF0/Home.htm'),\n",
       " ('Alzheimer disease familial', 'http://www.mitoaction.org/'),\n",
       " ('Alzheimer disease type 1', 'http://www.mitoaction.org/')]"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "## sanity check URL mapping\n",
    "list(name2url.items())[0:10]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "import csv\n",
    "with open('rare-list.tsv', 'w', newline='') as csvfile:\n",
    "    spamwriter = csv.writer(csvfile, delimiter='\\t')\n",
    "    for n in names:\n",
    "        spamwriter.writerow([n, name2url.get(n)])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/usr/local/lib/python3.6/site-packages/cachier/mongo_core.py:24: UserWarning: Cachier warning: pymongo was not found. MongoDB cores will not work.\n",
      "  \"Cachier warning: pymongo was not found. MongoDB cores will not work.\")\n"
     ]
    }
   ],
   "source": [
    "## use ontobio lib for fetching ontologies and lexical mapping\n",
    "from ontobio import OntologyFactory"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "ofa = OntologyFactory()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "hp = ofa.create('obo:hp')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "mondo = ofa.create('obo:mondo')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "from ontobio.lexmap import LexicalMapEngine\n",
    "lexmap = LexicalMapEngine()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "rare handle: None meta: None"
      ]
     },
     "execution_count": 14,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Quick hack to make a degenerate 'ontology' from the list of names\n",
    "from ontobio import Ontology\n",
    "\n",
    "def ont_from_names(names):\n",
    "    ont = Ontology(id='rare')\n",
    "    for n in names:\n",
    "        ## use name as ID\n",
    "        ont.add_node(n, n)\n",
    "    return ont\n",
    "        \n",
    "rare = ont_from_names(names)\n",
    "rare"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['Aagenaes syndrome',\n",
       " 'Aarskog syndrome',\n",
       " 'Aase Smith syndrome',\n",
       " 'ABCD syndrome',\n",
       " 'Abderhalden Kaufmann Lignac syndrome',\n",
       " 'Abdominal aortic aneurysm',\n",
       " 'Abdominal chemodectomas with cutaneous angiolipomas',\n",
       " 'Abdominal cystic lymphangioma',\n",
       " 'Abdominal obesity metabolic syndrome',\n",
       " 'Aberrant subclavian artery']"
      ]
     },
     "execution_count": 15,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "## quick inspection\n",
    "rare.nodes()[0:10]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "WARNING:root:Incomplete syn: HP:0000991 \"\" hasRelatedSynonym None [] 1.0\n",
      "WARNING:root:Incomplete syn: HP:0012377 \"\" hasRelatedSynonym None [] 1.0\n",
      "WARNING:root:Incomplete syn: HP:0000510 \"\" hasRelatedSynonym None [] 1.0\n",
      "WARNING:root:Ignoring suspicous synonym: UBERON:0002722 \"4\" hasBroadSynonym None ['http://uri.neuinfo.org/nif/nifstd/birnlex_1488', 'NIFSTD:NeuroNames_abbrevSource'] 1.0\n",
      "WARNING:root:Ignoring suspicous synonym: UBERON:0001715 \"3\" hasBroadSynonym None ['http://uri.neuinfo.org/nif/nifstd/birnlex_1240', 'NIFSTD:NeuroNames_abbrevSource'] 1.0\n"
     ]
    }
   ],
   "source": [
    "## index the 3 ontologies\n",
    "lexmap.index_ontology(hp)\n",
    "lexmap.index_ontology(mondo)\n",
    "lexmap.index_ontology(rare)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "## CONFIGURE\n",
    "## we will map R to mondo and hp separately\n",
    "lexmap.ontology_pairs = [(rare.id, mondo.id), (rare.id, hp.id)]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [],
   "source": [
    "# align\n",
    "g = lexmap.get_xref_graph()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style>\n",
       "    .dataframe thead tr:only-child th {\n",
       "        text-align: right;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>left</th>\n",
       "      <th>left_label</th>\n",
       "      <th>right</th>\n",
       "      <th>right_label</th>\n",
       "      <th>left_match_type</th>\n",
       "      <th>right_match_type</th>\n",
       "      <th>left_match_val</th>\n",
       "      <th>right_match_val</th>\n",
       "      <th>score</th>\n",
       "      <th>left_simscore</th>\n",
       "      <th>...</th>\n",
       "      <th>conditional_pr_equiv</th>\n",
       "      <th>pr_subClassOf</th>\n",
       "      <th>pr_superClassOf</th>\n",
       "      <th>pr_equivalentTo</th>\n",
       "      <th>pr_other</th>\n",
       "      <th>left_novel</th>\n",
       "      <th>right_novel</th>\n",
       "      <th>left_consistent</th>\n",
       "      <th>right_consistent</th>\n",
       "      <th>equiv_clique_size</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3287</th>\n",
       "      <td>11-beta-hydroxylase deficiency</td>\n",
       "      <td>11-beta-hydroxylase deficiency</td>\n",
       "      <td>MONDO:0008729</td>\n",
       "      <td>congenital adrenal hyperplasia due to 11-beta-...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>11-beta-hydroxylase deficiency</td>\n",
       "      <td>11-Beta-Hydroxylase Deficiency</td>\n",
       "      <td>50.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.799654</td>\n",
       "      <td>0.077184</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2199</th>\n",
       "      <td>15q13.3 microdeletion syndrome</td>\n",
       "      <td>15q13.3 microdeletion syndrome</td>\n",
       "      <td>MONDO:0012774</td>\n",
       "      <td>chromosome 15q13.3 microdeletion syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>15q13.3 microdeletion syndrome</td>\n",
       "      <td>15q13.3 microdeletion syndrome</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.918763</td>\n",
       "      <td>0.021299</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3339</th>\n",
       "      <td>17-alpha-hydroxylase deficiency</td>\n",
       "      <td>17-alpha-hydroxylase deficiency</td>\n",
       "      <td>MONDO:0008730</td>\n",
       "      <td>congenital adrenal hyperplasia due to 17-alpha...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>17-alpha-hydroxylase deficiency</td>\n",
       "      <td>17-Alpha-Hydroxylase Deficiency</td>\n",
       "      <td>50.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.799654</td>\n",
       "      <td>0.077184</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3481</th>\n",
       "      <td>17-beta hydroxysteroid dehydrogenase 3 deficiency</td>\n",
       "      <td>17-beta hydroxysteroid dehydrogenase 3 deficiency</td>\n",
       "      <td>MONDO:0009916</td>\n",
       "      <td>46,XY disorder of sex development due to 17-be...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>17-beta hydroxysteroid dehydrogenase 3 deficiency</td>\n",
       "      <td>17-beta-hydroxysteroid dehydrogenase 3 deficiency</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2592</th>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>MONDO:0012496</td>\n",
       "      <td>Koolen de Vries syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.168017</td>\n",
       "      <td>0.055554</td>\n",
       "      <td>0.749591</td>\n",
       "      <td>0.026839</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2593</th>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>MONDO:0018216</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>17q21.31 microdeletion syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.526316</td>\n",
       "      <td>0.051671</td>\n",
       "      <td>0.108232</td>\n",
       "      <td>0.824734</td>\n",
       "      <td>0.015363</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2987</th>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>MONDO:0008751</td>\n",
       "      <td>Corticosterone methyloxidase type 1 deficiency</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>18-Hydroxylase Deficiency</td>\n",
       "      <td>32.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.355556</td>\n",
       "      <td>0.232996</td>\n",
       "      <td>0.289482</td>\n",
       "      <td>0.283582</td>\n",
       "      <td>0.193941</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2986</th>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>MONDO:0020489</td>\n",
       "      <td>familial hyperreninemic hypoaldosteronism type 1</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>18 Hydroxylase deficiency</td>\n",
       "      <td>18-hydroxylase deficiency</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.644444</td>\n",
       "      <td>0.292046</td>\n",
       "      <td>0.210145</td>\n",
       "      <td>0.309167</td>\n",
       "      <td>0.188643</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1960</th>\n",
       "      <td>1q21.1 microdeletion syndrome</td>\n",
       "      <td>1q21.1 microdeletion syndrome</td>\n",
       "      <td>MONDO:0012914</td>\n",
       "      <td>chromosome 1q21.1 deletion syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>1q21.1 microdeletion syndrome</td>\n",
       "      <td>1q21.1 microdeletion syndrome</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.923042</td>\n",
       "      <td>0.016740</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1428</th>\n",
       "      <td>2 4-Dienoyl-CoA reductase deficiency</td>\n",
       "      <td>2 4-Dienoyl-CoA reductase deficiency</td>\n",
       "      <td>MONDO:0014464</td>\n",
       "      <td>progressive encephalopathy with leukodystrophy...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>2 4-Dienoyl-CoA reductase deficiency</td>\n",
       "      <td>2,4-dienoyl-CoA reductase deficiency</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.382559</td>\n",
       "      <td>0.215835</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4514</th>\n",
       "      <td>2-Hydroxyglutaric aciduria</td>\n",
       "      <td>2-Hydroxyglutaric aciduria</td>\n",
       "      <td>MONDO:0016001</td>\n",
       "      <td>2-hydroxyglutaric aciduria</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>2-Hydroxyglutaric aciduria</td>\n",
       "      <td>2-hydroxyglutaric aciduria</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1888</th>\n",
       "      <td>2-methyl-3-hydroxybutyric aciduria</td>\n",
       "      <td>2-methyl-3-hydroxybutyric aciduria</td>\n",
       "      <td>MONDO:0010327</td>\n",
       "      <td>HSD10 disease</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>2-methyl-3-hydroxybutyric aciduria</td>\n",
       "      <td>2-methyl-3-hydroxybutyric aciduria</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.918763</td>\n",
       "      <td>0.021299</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1202</th>\n",
       "      <td>2-methylbutyryl-CoA dehydrogenase deficiency</td>\n",
       "      <td>2-methylbutyryl-CoA dehydrogenase deficiency</td>\n",
       "      <td>MONDO:0012392</td>\n",
       "      <td>2-methylbutyryl-CoA dehydrogenase deficiency</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>2-methylbutyryl-CoA dehydrogenase deficiency</td>\n",
       "      <td>2-methylbutyryl-CoA dehydrogenase deficiency</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.927169</td>\n",
       "      <td>0.015241</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3288</th>\n",
       "      <td>21-hydroxylase deficiency</td>\n",
       "      <td>21-hydroxylase deficiency</td>\n",
       "      <td>MONDO:0008728</td>\n",
       "      <td>classic congenital adrenal hyperplasia due to ...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>21-hydroxylase deficiency</td>\n",
       "      <td>21-Hydroxylase Deficiency</td>\n",
       "      <td>50.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.799654</td>\n",
       "      <td>0.077184</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3507</th>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>MONDO:0008644</td>\n",
       "      <td>velocardiofacial syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>deletion 22q11.2 syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.134754</td>\n",
       "      <td>0.179472</td>\n",
       "      <td>0.287938</td>\n",
       "      <td>0.282070</td>\n",
       "      <td>0.250520</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>41</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2964</th>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>MONDO:0018923</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>22q11.2 deletion syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>0.166667</td>\n",
       "      <td>...</td>\n",
       "      <td>0.115075</td>\n",
       "      <td>0.092223</td>\n",
       "      <td>0.035954</td>\n",
       "      <td>0.841716</td>\n",
       "      <td>0.030107</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>41</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1721</th>\n",
       "      <td>3 methylglutaconic aciduria type I</td>\n",
       "      <td>3 methylglutaconic aciduria type I</td>\n",
       "      <td>MONDO:0009610</td>\n",
       "      <td>3-methylglutaconic aciduria type 1</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>3 methylglutaconic aciduria type I</td>\n",
       "      <td>3-methylglutaconic aciduria type 1</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.382559</td>\n",
       "      <td>0.215835</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1720</th>\n",
       "      <td>3 methylglutaconic aciduria type IV</td>\n",
       "      <td>3 methylglutaconic aciduria type IV</td>\n",
       "      <td>MONDO:0009611</td>\n",
       "      <td>3-methylglutaconic aciduria type 4</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>3 methylglutaconic aciduria type IV</td>\n",
       "      <td>3-methylglutaconic aciduria type 4</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.382559</td>\n",
       "      <td>0.215835</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2580</th>\n",
       "      <td>3 methylglutaconic aciduria type V</td>\n",
       "      <td>3 methylglutaconic aciduria type V</td>\n",
       "      <td>MONDO:0012435</td>\n",
       "      <td>3-methylglutaconic aciduria type 5</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>3 methylglutaconic aciduria type V</td>\n",
       "      <td>3-methylglutaconic aciduria type 5</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.198342</td>\n",
       "      <td>0.198342</td>\n",
       "      <td>0.377872</td>\n",
       "      <td>0.225444</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1877</th>\n",
       "      <td>3-Hydroxyisobutyric aciduria</td>\n",
       "      <td>3-Hydroxyisobutyric aciduria</td>\n",
       "      <td>MONDO:0009371</td>\n",
       "      <td>3-hydroxyisobutyric aciduria</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>3-Hydroxyisobutyric aciduria</td>\n",
       "      <td>3-hydroxyisobutyric aciduria</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.927169</td>\n",
       "      <td>0.015241</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3289</th>\n",
       "      <td>3-beta-hydroxysteroid dehydrogenase deficiency</td>\n",
       "      <td>3-beta-hydroxysteroid dehydrogenase deficiency</td>\n",
       "      <td>MONDO:0008727</td>\n",
       "      <td>congenital adrenal hyperplasia due to 3-beta-h...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>3-beta-hydroxysteroid dehydrogenase deficiency</td>\n",
       "      <td>3-Beta-Hydroxysteroid Dehydrogenase Deficiency</td>\n",
       "      <td>50.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.061581</td>\n",
       "      <td>0.799654</td>\n",
       "      <td>0.077184</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3670</th>\n",
       "      <td>3-methylglutaconic aciduria type III</td>\n",
       "      <td>3-methylglutaconic aciduria type III</td>\n",
       "      <td>MONDO:0009787</td>\n",
       "      <td>3-methylglutaconic aciduria type 3</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>3-methylglutaconic aciduria type III</td>\n",
       "      <td>3-methylglutaconic aciduria type III</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.918763</td>\n",
       "      <td>0.021299</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>755</th>\n",
       "      <td>4-hydroxyphenylacetic aciduria</td>\n",
       "      <td>4-hydroxyphenylacetic aciduria</td>\n",
       "      <td>HP:0003607</td>\n",
       "      <td>4-Hydroxyphenylacetic aciduria</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>4-hydroxyphenylacetic aciduria</td>\n",
       "      <td>4-Hydroxyphenylacetic aciduria</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3680</th>\n",
       "      <td>46 XX testicular disorder of sex development</td>\n",
       "      <td>46 XX testicular disorder of sex development</td>\n",
       "      <td>MONDO:0010766</td>\n",
       "      <td>46,XX testicular disorder of sex development</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>46 XX testicular disorder of sex development</td>\n",
       "      <td>46,XX testicular disorder of sex development</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.198342</td>\n",
       "      <td>0.198342</td>\n",
       "      <td>0.377872</td>\n",
       "      <td>0.225444</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3136</th>\n",
       "      <td>47 XXX syndrome</td>\n",
       "      <td>47 XXX syndrome</td>\n",
       "      <td>MONDO:0018066</td>\n",
       "      <td>trisomy X</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>47 XXX syndrome</td>\n",
       "      <td>47,XXX syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.226493</td>\n",
       "      <td>0.185437</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3166</th>\n",
       "      <td>47 XYY syndrome</td>\n",
       "      <td>47 XYY syndrome</td>\n",
       "      <td>MONDO:0019339</td>\n",
       "      <td>47,XYY syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>47 XYY syndrome</td>\n",
       "      <td>47,XYY syndrome</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.226493</td>\n",
       "      <td>0.185437</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4164</th>\n",
       "      <td>49 XXXXX syndrome</td>\n",
       "      <td>49 XXXXX syndrome</td>\n",
       "      <td>MONDO:0015228</td>\n",
       "      <td>pentasomy X</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>49 XXXXX syndrome</td>\n",
       "      <td>49,XXXXX syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4531</th>\n",
       "      <td>49 XXXXY syndrome</td>\n",
       "      <td>49 XXXXY syndrome</td>\n",
       "      <td>MONDO:0019929</td>\n",
       "      <td>49,XXXXY syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>49 XXXXY syndrome</td>\n",
       "      <td>49,XXXXY syndrome</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.219001</td>\n",
       "      <td>0.179303</td>\n",
       "      <td>0.379414</td>\n",
       "      <td>0.222282</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>710</th>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>MONDO:0009825</td>\n",
       "      <td>5-oxoprolinase deficiency (disease)</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.923042</td>\n",
       "      <td>0.016740</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>709</th>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>HP:0040142</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>5-oxoprolinase deficiency</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2067</th>\n",
       "      <td>Wrinkly skin syndrome</td>\n",
       "      <td>Wrinkly skin syndrome</td>\n",
       "      <td>MONDO:0010208</td>\n",
       "      <td>Wrinkly skin syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Wrinkly skin syndrome</td>\n",
       "      <td>Wrinkly skin syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2105</th>\n",
       "      <td>X-linked adrenal hypoplasia congenita</td>\n",
       "      <td>X-linked adrenal hypoplasia congenita</td>\n",
       "      <td>MONDO:0010264</td>\n",
       "      <td>X-linked adrenal hypoplasia congenita</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>X-linked adrenal hypoplasia congenita</td>\n",
       "      <td>X-linked adrenal hypoplasia congenita</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028738</td>\n",
       "      <td>0.028738</td>\n",
       "      <td>0.925323</td>\n",
       "      <td>0.017201</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1552</th>\n",
       "      <td>X-linked hypohidrotic ectodermal dysplasia</td>\n",
       "      <td>X-linked hypohidrotic ectodermal dysplasia</td>\n",
       "      <td>MONDO:0010585</td>\n",
       "      <td>X-linked hypohidrotic ectodermal dysplasia</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>X-linked hypohidrotic ectodermal dysplasia</td>\n",
       "      <td>X-linked hypohidrotic ectodermal dysplasia</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028738</td>\n",
       "      <td>0.028738</td>\n",
       "      <td>0.925323</td>\n",
       "      <td>0.017201</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3900</th>\n",
       "      <td>X-linked ichthyosis</td>\n",
       "      <td>X-linked ichthyosis</td>\n",
       "      <td>MONDO:0010622</td>\n",
       "      <td>recessive X-linked ichthyosis</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>X-linked ichthyosis</td>\n",
       "      <td>X-linked ichthyosis</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.029886</td>\n",
       "      <td>0.029886</td>\n",
       "      <td>0.916224</td>\n",
       "      <td>0.024003</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1968</th>\n",
       "      <td>X-linked severe combined immunodeficiency</td>\n",
       "      <td>X-linked severe combined immunodeficiency</td>\n",
       "      <td>MONDO:0010315</td>\n",
       "      <td>gamma chain deficiency</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>X-linked severe combined immunodeficiency</td>\n",
       "      <td>X-Linked Severe Combined Immunodeficiency</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.029969</td>\n",
       "      <td>0.918763</td>\n",
       "      <td>0.021299</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2543</th>\n",
       "      <td>XFE progeroid syndrome</td>\n",
       "      <td>XFE progeroid syndrome</td>\n",
       "      <td>MONDO:0012590</td>\n",
       "      <td>XFE progeroid syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>XFE progeroid syndrome</td>\n",
       "      <td>XFE progeroid syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3037</th>\n",
       "      <td>XK aprosencephaly</td>\n",
       "      <td>XK aprosencephaly</td>\n",
       "      <td>MONDO:0008811</td>\n",
       "      <td>XK aprosencephaly</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>XK aprosencephaly</td>\n",
       "      <td>XK aprosencephaly</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2070</th>\n",
       "      <td>Xanthinuria type 1</td>\n",
       "      <td>Xanthinuria type 1</td>\n",
       "      <td>MONDO:0010209</td>\n",
       "      <td>xanthinuria type I</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Xanthinuria type 1</td>\n",
       "      <td>xanthinuria type I</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2414</th>\n",
       "      <td>Xanthinuria type 2</td>\n",
       "      <td>Xanthinuria type 2</td>\n",
       "      <td>MONDO:0011346</td>\n",
       "      <td>xanthinuria type II</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Xanthinuria type 2</td>\n",
       "      <td>xanthinuria type II</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1509</th>\n",
       "      <td>Xanthogranulomatous cholecystitis</td>\n",
       "      <td>Xanthogranulomatous cholecystitis</td>\n",
       "      <td>MONDO:0004875</td>\n",
       "      <td>xanthogranulomatous cholecystitis</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Xanthogranulomatous cholecystitis</td>\n",
       "      <td>xanthogranulomatous cholecystitis</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.028795</td>\n",
       "      <td>0.927169</td>\n",
       "      <td>0.015241</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2867</th>\n",
       "      <td>Xeroderma pigmentosum</td>\n",
       "      <td>Xeroderma pigmentosum</td>\n",
       "      <td>MONDO:0019600</td>\n",
       "      <td>xeroderma pigmentosum</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Xeroderma pigmentosum</td>\n",
       "      <td>xeroderma pigmentosum</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2077</th>\n",
       "      <td>Xeroderma pigmentosum variant type</td>\n",
       "      <td>Xeroderma pigmentosum variant type</td>\n",
       "      <td>MONDO:0010214</td>\n",
       "      <td>xeroderma pigmentosum variant type</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Xeroderma pigmentosum variant type</td>\n",
       "      <td>xeroderma pigmentosum variant type</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3151</th>\n",
       "      <td>Yaws</td>\n",
       "      <td>Yaws</td>\n",
       "      <td>MONDO:0006019</td>\n",
       "      <td>yaws</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Yaws</td>\n",
       "      <td>yaws</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.051830</td>\n",
       "      <td>0.051830</td>\n",
       "      <td>0.874531</td>\n",
       "      <td>0.021809</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3080</th>\n",
       "      <td>Yellow fever</td>\n",
       "      <td>Yellow fever</td>\n",
       "      <td>MONDO:0020502</td>\n",
       "      <td>yellow fever</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Yellow fever</td>\n",
       "      <td>yellow fever</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4539</th>\n",
       "      <td>Yellow nail syndrome</td>\n",
       "      <td>Yellow nail syndrome</td>\n",
       "      <td>MONDO:0007921</td>\n",
       "      <td>yellow nail syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Yellow nail syndrome</td>\n",
       "      <td>yellow nail syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2555</th>\n",
       "      <td>Yemenite deaf-blind hypopigmentation syndrome</td>\n",
       "      <td>Yemenite deaf-blind hypopigmentation syndrome</td>\n",
       "      <td>MONDO:0011133</td>\n",
       "      <td>Deaf blind hypopigmentation syndrome, Yemenite...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>Yemenite deaf-blind hypopigmentation syndrome</td>\n",
       "      <td>Yemenite deaf-blind hypopigmentation syndrome</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.030109</td>\n",
       "      <td>0.923042</td>\n",
       "      <td>0.016740</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4262</th>\n",
       "      <td>Yolk sac tumor</td>\n",
       "      <td>Yolk sac tumor</td>\n",
       "      <td>MONDO:0005744</td>\n",
       "      <td>yolk sac tumor</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Yolk sac tumor</td>\n",
       "      <td>yolk sac tumor</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3775</th>\n",
       "      <td>Yorifuji Okuno syndrome</td>\n",
       "      <td>Yorifuji Okuno syndrome</td>\n",
       "      <td>MONDO:0010802</td>\n",
       "      <td>pancreatic hypoplasia-diabetes-congenital hear...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>Yorifuji Okuno syndrome</td>\n",
       "      <td>Yorifuji-Okuno syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4330</th>\n",
       "      <td>Young Hughes syndrome</td>\n",
       "      <td>Young Hughes syndrome</td>\n",
       "      <td>MONDO:0017614</td>\n",
       "      <td>X-linked intellectual disability-hypogonadism-...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>Young Hughes syndrome</td>\n",
       "      <td>Young-Hughes syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.382559</td>\n",
       "      <td>0.215835</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2384</th>\n",
       "      <td>Young Simpson syndrome</td>\n",
       "      <td>Young Simpson syndrome</td>\n",
       "      <td>MONDO:0011365</td>\n",
       "      <td>blepharophimosis-intellectual disability syndr...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>Young Simpson syndrome</td>\n",
       "      <td>Young-Simpson Syndrome</td>\n",
       "      <td>32.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.200803</td>\n",
       "      <td>0.382559</td>\n",
       "      <td>0.215835</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2059</th>\n",
       "      <td>Young syndrome</td>\n",
       "      <td>Young syndrome</td>\n",
       "      <td>MONDO:0010220</td>\n",
       "      <td>young syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Young syndrome</td>\n",
       "      <td>young syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2892</th>\n",
       "      <td>Yunis Varon syndrome</td>\n",
       "      <td>Yunis Varon syndrome</td>\n",
       "      <td>MONDO:0008995</td>\n",
       "      <td>Yunis-Varon syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Yunis Varon syndrome</td>\n",
       "      <td>Yunis-Varon syndrome</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.062922</td>\n",
       "      <td>0.062922</td>\n",
       "      <td>0.817066</td>\n",
       "      <td>0.057090</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1473</th>\n",
       "      <td>Zechi Ceide syndrome</td>\n",
       "      <td>Zechi Ceide syndrome</td>\n",
       "      <td>MONDO:0013036</td>\n",
       "      <td>Zechi-Ceide syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Zechi Ceide syndrome</td>\n",
       "      <td>Zechi-Ceide syndrome</td>\n",
       "      <td>64.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2866</th>\n",
       "      <td>Zellweger syndrome</td>\n",
       "      <td>Zellweger syndrome</td>\n",
       "      <td>MONDO:0019609</td>\n",
       "      <td>Zellweger syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Zellweger syndrome</td>\n",
       "      <td>Zellweger syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.028758</td>\n",
       "      <td>0.925963</td>\n",
       "      <td>0.016522</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>657</th>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>MONDO:0006020</td>\n",
       "      <td>Zollinger-Ellison syndrome (disease)</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison Syndrome</td>\n",
       "      <td>90.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.473684</td>\n",
       "      <td>0.075251</td>\n",
       "      <td>0.062185</td>\n",
       "      <td>0.839062</td>\n",
       "      <td>0.023503</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>11</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>655</th>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>HP:0002044</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.028891</td>\n",
       "      <td>0.930268</td>\n",
       "      <td>0.011949</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>11</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>656</th>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>MONDO:0019610</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>Zollinger-Ellison syndrome</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>0.526316</td>\n",
       "      <td>0.055295</td>\n",
       "      <td>0.045694</td>\n",
       "      <td>0.882570</td>\n",
       "      <td>0.016441</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>11</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3377</th>\n",
       "      <td>Zori Stalker Williams syndrome</td>\n",
       "      <td>Zori Stalker Williams syndrome</td>\n",
       "      <td>MONDO:0010883</td>\n",
       "      <td>pectus excavatum-macrocephaly-dysplastic nails...</td>\n",
       "      <td>label</td>\n",
       "      <td>hasExactSynonym</td>\n",
       "      <td>Zori Stalker Williams syndrome</td>\n",
       "      <td>Zori-Stalker-Williams syndrome</td>\n",
       "      <td>58.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.205965</td>\n",
       "      <td>0.392394</td>\n",
       "      <td>0.195675</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2061</th>\n",
       "      <td>Zunich neuroectodermal syndrome</td>\n",
       "      <td>Zunich neuroectodermal syndrome</td>\n",
       "      <td>MONDO:0010221</td>\n",
       "      <td>CHIME syndrome</td>\n",
       "      <td>label</td>\n",
       "      <td>hasRelatedSynonym</td>\n",
       "      <td>Zunich neuroectodermal syndrome</td>\n",
       "      <td>Zunich Neuroectodermal Syndrome</td>\n",
       "      <td>50.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.061951</td>\n",
       "      <td>0.061951</td>\n",
       "      <td>0.804454</td>\n",
       "      <td>0.071645</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3649</th>\n",
       "      <td>Zygomycosis</td>\n",
       "      <td>Zygomycosis</td>\n",
       "      <td>MONDO:0019136</td>\n",
       "      <td>zygomycosis</td>\n",
       "      <td>label</td>\n",
       "      <td>label</td>\n",
       "      <td>Zygomycosis</td>\n",
       "      <td>zygomycosis</td>\n",
       "      <td>100.0</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>...</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.051830</td>\n",
       "      <td>0.051830</td>\n",
       "      <td>0.874531</td>\n",
       "      <td>0.021809</td>\n",
       "      <td>True</td>\n",
       "      <td>True</td>\n",
       "      <td>False</td>\n",
       "      <td>False</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>4558 rows × 22 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                   left  \\\n",
       "3287                     11-beta-hydroxylase deficiency   \n",
       "2199                     15q13.3 microdeletion syndrome   \n",
       "3339                    17-alpha-hydroxylase deficiency   \n",
       "3481  17-beta hydroxysteroid dehydrogenase 3 deficiency   \n",
       "2592                    17q21.31 microdeletion syndrome   \n",
       "2593                    17q21.31 microdeletion syndrome   \n",
       "2987                          18 Hydroxylase deficiency   \n",
       "2986                          18 Hydroxylase deficiency   \n",
       "1960                      1q21.1 microdeletion syndrome   \n",
       "1428               2 4-Dienoyl-CoA reductase deficiency   \n",
       "4514                         2-Hydroxyglutaric aciduria   \n",
       "1888                 2-methyl-3-hydroxybutyric aciduria   \n",
       "1202       2-methylbutyryl-CoA dehydrogenase deficiency   \n",
       "3288                          21-hydroxylase deficiency   \n",
       "3507                          22q11.2 deletion syndrome   \n",
       "2964                          22q11.2 deletion syndrome   \n",
       "1721                 3 methylglutaconic aciduria type I   \n",
       "1720                3 methylglutaconic aciduria type IV   \n",
       "2580                 3 methylglutaconic aciduria type V   \n",
       "1877                       3-Hydroxyisobutyric aciduria   \n",
       "3289     3-beta-hydroxysteroid dehydrogenase deficiency   \n",
       "3670               3-methylglutaconic aciduria type III   \n",
       "755                      4-hydroxyphenylacetic aciduria   \n",
       "3680       46 XX testicular disorder of sex development   \n",
       "3136                                    47 XXX syndrome   \n",
       "3166                                    47 XYY syndrome   \n",
       "4164                                  49 XXXXX syndrome   \n",
       "4531                                  49 XXXXY syndrome   \n",
       "710                           5-oxoprolinase deficiency   \n",
       "709                           5-oxoprolinase deficiency   \n",
       "...                                                 ...   \n",
       "2067                              Wrinkly skin syndrome   \n",
       "2105              X-linked adrenal hypoplasia congenita   \n",
       "1552         X-linked hypohidrotic ectodermal dysplasia   \n",
       "3900                                X-linked ichthyosis   \n",
       "1968          X-linked severe combined immunodeficiency   \n",
       "2543                             XFE progeroid syndrome   \n",
       "3037                                  XK aprosencephaly   \n",
       "2070                                 Xanthinuria type 1   \n",
       "2414                                 Xanthinuria type 2   \n",
       "1509                  Xanthogranulomatous cholecystitis   \n",
       "2867                              Xeroderma pigmentosum   \n",
       "2077                 Xeroderma pigmentosum variant type   \n",
       "3151                                               Yaws   \n",
       "3080                                       Yellow fever   \n",
       "4539                               Yellow nail syndrome   \n",
       "2555      Yemenite deaf-blind hypopigmentation syndrome   \n",
       "4262                                     Yolk sac tumor   \n",
       "3775                            Yorifuji Okuno syndrome   \n",
       "4330                              Young Hughes syndrome   \n",
       "2384                             Young Simpson syndrome   \n",
       "2059                                     Young syndrome   \n",
       "2892                               Yunis Varon syndrome   \n",
       "1473                               Zechi Ceide syndrome   \n",
       "2866                                 Zellweger syndrome   \n",
       "657                          Zollinger-Ellison syndrome   \n",
       "655                          Zollinger-Ellison syndrome   \n",
       "656                          Zollinger-Ellison syndrome   \n",
       "3377                     Zori Stalker Williams syndrome   \n",
       "2061                    Zunich neuroectodermal syndrome   \n",
       "3649                                        Zygomycosis   \n",
       "\n",
       "                                             left_label          right  \\\n",
       "3287                     11-beta-hydroxylase deficiency  MONDO:0008729   \n",
       "2199                     15q13.3 microdeletion syndrome  MONDO:0012774   \n",
       "3339                    17-alpha-hydroxylase deficiency  MONDO:0008730   \n",
       "3481  17-beta hydroxysteroid dehydrogenase 3 deficiency  MONDO:0009916   \n",
       "2592                    17q21.31 microdeletion syndrome  MONDO:0012496   \n",
       "2593                    17q21.31 microdeletion syndrome  MONDO:0018216   \n",
       "2987                          18 Hydroxylase deficiency  MONDO:0008751   \n",
       "2986                          18 Hydroxylase deficiency  MONDO:0020489   \n",
       "1960                      1q21.1 microdeletion syndrome  MONDO:0012914   \n",
       "1428               2 4-Dienoyl-CoA reductase deficiency  MONDO:0014464   \n",
       "4514                         2-Hydroxyglutaric aciduria  MONDO:0016001   \n",
       "1888                 2-methyl-3-hydroxybutyric aciduria  MONDO:0010327   \n",
       "1202       2-methylbutyryl-CoA dehydrogenase deficiency  MONDO:0012392   \n",
       "3288                          21-hydroxylase deficiency  MONDO:0008728   \n",
       "3507                          22q11.2 deletion syndrome  MONDO:0008644   \n",
       "2964                          22q11.2 deletion syndrome  MONDO:0018923   \n",
       "1721                 3 methylglutaconic aciduria type I  MONDO:0009610   \n",
       "1720                3 methylglutaconic aciduria type IV  MONDO:0009611   \n",
       "2580                 3 methylglutaconic aciduria type V  MONDO:0012435   \n",
       "1877                       3-Hydroxyisobutyric aciduria  MONDO:0009371   \n",
       "3289     3-beta-hydroxysteroid dehydrogenase deficiency  MONDO:0008727   \n",
       "3670               3-methylglutaconic aciduria type III  MONDO:0009787   \n",
       "755                      4-hydroxyphenylacetic aciduria     HP:0003607   \n",
       "3680       46 XX testicular disorder of sex development  MONDO:0010766   \n",
       "3136                                    47 XXX syndrome  MONDO:0018066   \n",
       "3166                                    47 XYY syndrome  MONDO:0019339   \n",
       "4164                                  49 XXXXX syndrome  MONDO:0015228   \n",
       "4531                                  49 XXXXY syndrome  MONDO:0019929   \n",
       "710                           5-oxoprolinase deficiency  MONDO:0009825   \n",
       "709                           5-oxoprolinase deficiency     HP:0040142   \n",
       "...                                                 ...            ...   \n",
       "2067                              Wrinkly skin syndrome  MONDO:0010208   \n",
       "2105              X-linked adrenal hypoplasia congenita  MONDO:0010264   \n",
       "1552         X-linked hypohidrotic ectodermal dysplasia  MONDO:0010585   \n",
       "3900                                X-linked ichthyosis  MONDO:0010622   \n",
       "1968          X-linked severe combined immunodeficiency  MONDO:0010315   \n",
       "2543                             XFE progeroid syndrome  MONDO:0012590   \n",
       "3037                                  XK aprosencephaly  MONDO:0008811   \n",
       "2070                                 Xanthinuria type 1  MONDO:0010209   \n",
       "2414                                 Xanthinuria type 2  MONDO:0011346   \n",
       "1509                  Xanthogranulomatous cholecystitis  MONDO:0004875   \n",
       "2867                              Xeroderma pigmentosum  MONDO:0019600   \n",
       "2077                 Xeroderma pigmentosum variant type  MONDO:0010214   \n",
       "3151                                               Yaws  MONDO:0006019   \n",
       "3080                                       Yellow fever  MONDO:0020502   \n",
       "4539                               Yellow nail syndrome  MONDO:0007921   \n",
       "2555      Yemenite deaf-blind hypopigmentation syndrome  MONDO:0011133   \n",
       "4262                                     Yolk sac tumor  MONDO:0005744   \n",
       "3775                            Yorifuji Okuno syndrome  MONDO:0010802   \n",
       "4330                              Young Hughes syndrome  MONDO:0017614   \n",
       "2384                             Young Simpson syndrome  MONDO:0011365   \n",
       "2059                                     Young syndrome  MONDO:0010220   \n",
       "2892                               Yunis Varon syndrome  MONDO:0008995   \n",
       "1473                               Zechi Ceide syndrome  MONDO:0013036   \n",
       "2866                                 Zellweger syndrome  MONDO:0019609   \n",
       "657                          Zollinger-Ellison syndrome  MONDO:0006020   \n",
       "655                          Zollinger-Ellison syndrome     HP:0002044   \n",
       "656                          Zollinger-Ellison syndrome  MONDO:0019610   \n",
       "3377                     Zori Stalker Williams syndrome  MONDO:0010883   \n",
       "2061                    Zunich neuroectodermal syndrome  MONDO:0010221   \n",
       "3649                                        Zygomycosis  MONDO:0019136   \n",
       "\n",
       "                                            right_label left_match_type  \\\n",
       "3287  congenital adrenal hyperplasia due to 11-beta-...           label   \n",
       "2199          chromosome 15q13.3 microdeletion syndrome           label   \n",
       "3339  congenital adrenal hyperplasia due to 17-alpha...           label   \n",
       "3481  46,XY disorder of sex development due to 17-be...           label   \n",
       "2592                           Koolen de Vries syndrome           label   \n",
       "2593                    17q21.31 microdeletion syndrome           label   \n",
       "2987     Corticosterone methyloxidase type 1 deficiency           label   \n",
       "2986   familial hyperreninemic hypoaldosteronism type 1           label   \n",
       "1960                chromosome 1q21.1 deletion syndrome           label   \n",
       "1428  progressive encephalopathy with leukodystrophy...           label   \n",
       "4514                         2-hydroxyglutaric aciduria           label   \n",
       "1888                                      HSD10 disease           label   \n",
       "1202       2-methylbutyryl-CoA dehydrogenase deficiency           label   \n",
       "3288  classic congenital adrenal hyperplasia due to ...           label   \n",
       "3507                          velocardiofacial syndrome           label   \n",
       "2964                          22q11.2 deletion syndrome           label   \n",
       "1721                 3-methylglutaconic aciduria type 1           label   \n",
       "1720                 3-methylglutaconic aciduria type 4           label   \n",
       "2580                 3-methylglutaconic aciduria type 5           label   \n",
       "1877                       3-hydroxyisobutyric aciduria           label   \n",
       "3289  congenital adrenal hyperplasia due to 3-beta-h...           label   \n",
       "3670                 3-methylglutaconic aciduria type 3           label   \n",
       "755                      4-Hydroxyphenylacetic aciduria           label   \n",
       "3680       46,XX testicular disorder of sex development           label   \n",
       "3136                                          trisomy X           label   \n",
       "3166                                    47,XYY syndrome           label   \n",
       "4164                                        pentasomy X           label   \n",
       "4531                                  49,XXXXY syndrome           label   \n",
       "710                 5-oxoprolinase deficiency (disease)           label   \n",
       "709                           5-oxoprolinase deficiency           label   \n",
       "...                                                 ...             ...   \n",
       "2067                              Wrinkly skin syndrome           label   \n",
       "2105              X-linked adrenal hypoplasia congenita           label   \n",
       "1552         X-linked hypohidrotic ectodermal dysplasia           label   \n",
       "3900                      recessive X-linked ichthyosis           label   \n",
       "1968                             gamma chain deficiency           label   \n",
       "2543                             XFE progeroid syndrome           label   \n",
       "3037                                  XK aprosencephaly           label   \n",
       "2070                                 xanthinuria type I           label   \n",
       "2414                                xanthinuria type II           label   \n",
       "1509                  xanthogranulomatous cholecystitis           label   \n",
       "2867                              xeroderma pigmentosum           label   \n",
       "2077                 xeroderma pigmentosum variant type           label   \n",
       "3151                                               yaws           label   \n",
       "3080                                       yellow fever           label   \n",
       "4539                               yellow nail syndrome           label   \n",
       "2555  Deaf blind hypopigmentation syndrome, Yemenite...           label   \n",
       "4262                                     yolk sac tumor           label   \n",
       "3775  pancreatic hypoplasia-diabetes-congenital hear...           label   \n",
       "4330  X-linked intellectual disability-hypogonadism-...           label   \n",
       "2384  blepharophimosis-intellectual disability syndr...           label   \n",
       "2059                                     young syndrome           label   \n",
       "2892                               Yunis-Varon syndrome           label   \n",
       "1473                               Zechi-Ceide syndrome           label   \n",
       "2866                                 Zellweger syndrome           label   \n",
       "657                Zollinger-Ellison syndrome (disease)           label   \n",
       "655                          Zollinger-Ellison syndrome           label   \n",
       "656                          Zollinger-Ellison syndrome           label   \n",
       "3377  pectus excavatum-macrocephaly-dysplastic nails...           label   \n",
       "2061                                     CHIME syndrome           label   \n",
       "3649                                        zygomycosis           label   \n",
       "\n",
       "       right_match_type                                     left_match_val  \\\n",
       "3287  hasRelatedSynonym                     11-beta-hydroxylase deficiency   \n",
       "2199    hasExactSynonym                     15q13.3 microdeletion syndrome   \n",
       "3339  hasRelatedSynonym                    17-alpha-hydroxylase deficiency   \n",
       "3481    hasExactSynonym  17-beta hydroxysteroid dehydrogenase 3 deficiency   \n",
       "2592    hasExactSynonym                    17q21.31 microdeletion syndrome   \n",
       "2593              label                    17q21.31 microdeletion syndrome   \n",
       "2987  hasRelatedSynonym                          18 Hydroxylase deficiency   \n",
       "2986    hasExactSynonym                          18 Hydroxylase deficiency   \n",
       "1960    hasExactSynonym                      1q21.1 microdeletion syndrome   \n",
       "1428    hasExactSynonym               2 4-Dienoyl-CoA reductase deficiency   \n",
       "4514              label                         2-Hydroxyglutaric aciduria   \n",
       "1888    hasExactSynonym                 2-methyl-3-hydroxybutyric aciduria   \n",
       "1202              label       2-methylbutyryl-CoA dehydrogenase deficiency   \n",
       "3288  hasRelatedSynonym                          21-hydroxylase deficiency   \n",
       "3507    hasExactSynonym                          22q11.2 deletion syndrome   \n",
       "2964              label                          22q11.2 deletion syndrome   \n",
       "1721              label                 3 methylglutaconic aciduria type I   \n",
       "1720              label                3 methylglutaconic aciduria type IV   \n",
       "2580              label                 3 methylglutaconic aciduria type V   \n",
       "1877              label                       3-Hydroxyisobutyric aciduria   \n",
       "3289  hasRelatedSynonym     3-beta-hydroxysteroid dehydrogenase deficiency   \n",
       "3670    hasExactSynonym               3-methylglutaconic aciduria type III   \n",
       "755               label                     4-hydroxyphenylacetic aciduria   \n",
       "3680              label       46 XX testicular disorder of sex development   \n",
       "3136    hasExactSynonym                                    47 XXX syndrome   \n",
       "3166              label                                    47 XYY syndrome   \n",
       "4164    hasExactSynonym                                  49 XXXXX syndrome   \n",
       "4531              label                                  49 XXXXY syndrome   \n",
       "710     hasExactSynonym                          5-oxoprolinase deficiency   \n",
       "709               label                          5-oxoprolinase deficiency   \n",
       "...                 ...                                                ...   \n",
       "2067              label                              Wrinkly skin syndrome   \n",
       "2105              label              X-linked adrenal hypoplasia congenita   \n",
       "1552              label         X-linked hypohidrotic ectodermal dysplasia   \n",
       "3900    hasExactSynonym                                X-linked ichthyosis   \n",
       "1968    hasExactSynonym          X-linked severe combined immunodeficiency   \n",
       "2543              label                             XFE progeroid syndrome   \n",
       "3037              label                                  XK aprosencephaly   \n",
       "2070              label                                 Xanthinuria type 1   \n",
       "2414              label                                 Xanthinuria type 2   \n",
       "1509              label                  Xanthogranulomatous cholecystitis   \n",
       "2867              label                              Xeroderma pigmentosum   \n",
       "2077              label                 Xeroderma pigmentosum variant type   \n",
       "3151              label                                               Yaws   \n",
       "3080              label                                       Yellow fever   \n",
       "4539              label                               Yellow nail syndrome   \n",
       "2555    hasExactSynonym      Yemenite deaf-blind hypopigmentation syndrome   \n",
       "4262              label                                     Yolk sac tumor   \n",
       "3775    hasExactSynonym                            Yorifuji Okuno syndrome   \n",
       "4330    hasExactSynonym                              Young Hughes syndrome   \n",
       "2384  hasRelatedSynonym                             Young Simpson syndrome   \n",
       "2059              label                                     Young syndrome   \n",
       "2892              label                               Yunis Varon syndrome   \n",
       "1473              label                               Zechi Ceide syndrome   \n",
       "2866              label                                 Zellweger syndrome   \n",
       "657     hasExactSynonym                         Zollinger-Ellison syndrome   \n",
       "655               label                         Zollinger-Ellison syndrome   \n",
       "656               label                         Zollinger-Ellison syndrome   \n",
       "3377    hasExactSynonym                     Zori Stalker Williams syndrome   \n",
       "2061  hasRelatedSynonym                    Zunich neuroectodermal syndrome   \n",
       "3649              label                                        Zygomycosis   \n",
       "\n",
       "                                        right_match_val  score  left_simscore  \\\n",
       "3287                     11-Beta-Hydroxylase Deficiency   50.0       1.000000   \n",
       "2199                     15q13.3 microdeletion syndrome   90.0       1.000000   \n",
       "3339                    17-Alpha-Hydroxylase Deficiency   50.0       1.000000   \n",
       "3481  17-beta-hydroxysteroid dehydrogenase 3 deficiency   58.0       1.000000   \n",
       "2592                    17q21.31 microdeletion syndrome   90.0       1.000000   \n",
       "2593                    17q21.31 microdeletion syndrome  100.0       1.000000   \n",
       "2987                          18-Hydroxylase Deficiency   32.0       1.000000   \n",
       "2986                          18-hydroxylase deficiency   58.0       1.000000   \n",
       "1960                      1q21.1 microdeletion syndrome   90.0       1.000000   \n",
       "1428               2,4-dienoyl-CoA reductase deficiency   58.0       1.000000   \n",
       "4514                         2-hydroxyglutaric aciduria  100.0       1.000000   \n",
       "1888                 2-methyl-3-hydroxybutyric aciduria   90.0       1.000000   \n",
       "1202       2-methylbutyryl-CoA dehydrogenase deficiency  100.0       1.000000   \n",
       "3288                          21-Hydroxylase Deficiency   50.0       1.000000   \n",
       "3507                          deletion 22q11.2 syndrome   58.0       1.000000   \n",
       "2964                          22q11.2 deletion syndrome  100.0       0.166667   \n",
       "1721                 3-methylglutaconic aciduria type 1   64.0       1.000000   \n",
       "1720                 3-methylglutaconic aciduria type 4   64.0       1.000000   \n",
       "2580                 3-methylglutaconic aciduria type 5   64.0       1.000000   \n",
       "1877                       3-hydroxyisobutyric aciduria  100.0       1.000000   \n",
       "3289     3-Beta-Hydroxysteroid Dehydrogenase Deficiency   50.0       1.000000   \n",
       "3670               3-methylglutaconic aciduria type III   90.0       1.000000   \n",
       "755                      4-Hydroxyphenylacetic aciduria  100.0       1.000000   \n",
       "3680       46,XX testicular disorder of sex development   64.0       1.000000   \n",
       "3136                                    47,XXX syndrome   58.0       1.000000   \n",
       "3166                                    47,XYY syndrome   64.0       1.000000   \n",
       "4164                                  49,XXXXX syndrome   58.0       1.000000   \n",
       "4531                                  49,XXXXY syndrome   64.0       1.000000   \n",
       "710                           5-oxoprolinase deficiency   90.0       1.000000   \n",
       "709                           5-oxoprolinase deficiency  100.0       1.000000   \n",
       "...                                                 ...    ...            ...   \n",
       "2067                              Wrinkly skin syndrome  100.0       1.000000   \n",
       "2105              X-linked adrenal hypoplasia congenita  100.0       1.000000   \n",
       "1552         X-linked hypohidrotic ectodermal dysplasia  100.0       1.000000   \n",
       "3900                                X-linked ichthyosis   90.0       1.000000   \n",
       "1968          X-Linked Severe Combined Immunodeficiency   90.0       1.000000   \n",
       "2543                             XFE progeroid syndrome  100.0       1.000000   \n",
       "3037                                  XK aprosencephaly  100.0       1.000000   \n",
       "2070                                 xanthinuria type I   64.0       1.000000   \n",
       "2414                                xanthinuria type II   64.0       1.000000   \n",
       "1509                  xanthogranulomatous cholecystitis  100.0       1.000000   \n",
       "2867                              xeroderma pigmentosum  100.0       1.000000   \n",
       "2077                 xeroderma pigmentosum variant type  100.0       1.000000   \n",
       "3151                                               yaws  100.0       1.000000   \n",
       "3080                                       yellow fever  100.0       1.000000   \n",
       "4539                               yellow nail syndrome  100.0       1.000000   \n",
       "2555      Yemenite deaf-blind hypopigmentation syndrome   90.0       1.000000   \n",
       "4262                                     yolk sac tumor  100.0       1.000000   \n",
       "3775                            Yorifuji-Okuno syndrome   58.0       1.000000   \n",
       "4330                              Young-Hughes syndrome   58.0       1.000000   \n",
       "2384                             Young-Simpson Syndrome   32.0       1.000000   \n",
       "2059                                     young syndrome  100.0       1.000000   \n",
       "2892                               Yunis-Varon syndrome   64.0       1.000000   \n",
       "1473                               Zechi-Ceide syndrome   64.0       1.000000   \n",
       "2866                                 Zellweger syndrome  100.0       1.000000   \n",
       "657                          Zollinger-Ellison Syndrome   90.0       1.000000   \n",
       "655                          Zollinger-Ellison syndrome  100.0       1.000000   \n",
       "656                          Zollinger-Ellison syndrome  100.0       1.000000   \n",
       "3377                     Zori-Stalker-Williams syndrome   58.0       1.000000   \n",
       "2061                    Zunich Neuroectodermal Syndrome   50.0       1.000000   \n",
       "3649                                        zygomycosis  100.0       1.000000   \n",
       "\n",
       "            ...          conditional_pr_equiv  pr_subClassOf  pr_superClassOf  \\\n",
       "3287        ...                      1.000000       0.061581         0.061581   \n",
       "2199        ...                      1.000000       0.029969         0.029969   \n",
       "3339        ...                      1.000000       0.061581         0.061581   \n",
       "3481        ...                      1.000000       0.205965         0.205965   \n",
       "2592        ...                      0.473684       0.168017         0.055554   \n",
       "2593        ...                      0.526316       0.051671         0.108232   \n",
       "2987        ...                      0.355556       0.232996         0.289482   \n",
       "2986        ...                      0.644444       0.292046         0.210145   \n",
       "1960        ...                      1.000000       0.030109         0.030109   \n",
       "1428        ...                      1.000000       0.200803         0.200803   \n",
       "4514        ...                      1.000000       0.028758         0.028758   \n",
       "1888        ...                      1.000000       0.029969         0.029969   \n",
       "1202        ...                      1.000000       0.028795         0.028795   \n",
       "3288        ...                      1.000000       0.061581         0.061581   \n",
       "3507        ...                      0.134754       0.179472         0.287938   \n",
       "2964        ...                      0.115075       0.092223         0.035954   \n",
       "1721        ...                      1.000000       0.200803         0.200803   \n",
       "1720        ...                      1.000000       0.200803         0.200803   \n",
       "2580        ...                      1.000000       0.198342         0.198342   \n",
       "1877        ...                      1.000000       0.028795         0.028795   \n",
       "3289        ...                      1.000000       0.061581         0.061581   \n",
       "3670        ...                      1.000000       0.029969         0.029969   \n",
       "755         ...                      1.000000       0.028891         0.028891   \n",
       "3680        ...                      1.000000       0.198342         0.198342   \n",
       "3136        ...                      1.000000       0.226493         0.185437   \n",
       "3166        ...                      1.000000       0.226493         0.185437   \n",
       "4164        ...                      1.000000       0.205965         0.205965   \n",
       "4531        ...                      1.000000       0.219001         0.179303   \n",
       "710         ...                      1.000000       0.030109         0.030109   \n",
       "709         ...                      1.000000       0.028891         0.028891   \n",
       "...         ...                           ...            ...              ...   \n",
       "2067        ...                      1.000000       0.028758         0.028758   \n",
       "2105        ...                      1.000000       0.028738         0.028738   \n",
       "1552        ...                      1.000000       0.028738         0.028738   \n",
       "3900        ...                      1.000000       0.029886         0.029886   \n",
       "1968        ...                      1.000000       0.029969         0.029969   \n",
       "2543        ...                      1.000000       0.028891         0.028891   \n",
       "3037        ...                      1.000000       0.028891         0.028891   \n",
       "2070        ...                      1.000000       0.205965         0.205965   \n",
       "2414        ...                      1.000000       0.205965         0.205965   \n",
       "1509        ...                      1.000000       0.028795         0.028795   \n",
       "2867        ...                      1.000000       0.028758         0.028758   \n",
       "2077        ...                      1.000000       0.028758         0.028758   \n",
       "3151        ...                      1.000000       0.051830         0.051830   \n",
       "3080        ...                      1.000000       0.028891         0.028891   \n",
       "4539        ...                      1.000000       0.028891         0.028891   \n",
       "2555        ...                      1.000000       0.030109         0.030109   \n",
       "4262        ...                      1.000000       0.028758         0.028758   \n",
       "3775        ...                      1.000000       0.205965         0.205965   \n",
       "4330        ...                      1.000000       0.200803         0.200803   \n",
       "2384        ...                      1.000000       0.200803         0.200803   \n",
       "2059        ...                      1.000000       0.028891         0.028891   \n",
       "2892        ...                      1.000000       0.062922         0.062922   \n",
       "1473        ...                      1.000000       0.205965         0.205965   \n",
       "2866        ...                      1.000000       0.028758         0.028758   \n",
       "657         ...                      0.473684       0.075251         0.062185   \n",
       "655         ...                      1.000000       0.028891         0.028891   \n",
       "656         ...                      0.526316       0.055295         0.045694   \n",
       "3377        ...                      1.000000       0.205965         0.205965   \n",
       "2061        ...                      1.000000       0.061951         0.061951   \n",
       "3649        ...                      1.000000       0.051830         0.051830   \n",
       "\n",
       "      pr_equivalentTo  pr_other  left_novel  right_novel  left_consistent  \\\n",
       "3287         0.799654  0.077184        True         True            False   \n",
       "2199         0.918763  0.021299        True         True            False   \n",
       "3339         0.799654  0.077184        True         True            False   \n",
       "3481         0.392394  0.195675        True         True            False   \n",
       "2592         0.749591  0.026839        True         True            False   \n",
       "2593         0.824734  0.015363        True         True            False   \n",
       "2987         0.283582  0.193941        True         True            False   \n",
       "2986         0.309167  0.188643        True         True            False   \n",
       "1960         0.923042  0.016740        True         True            False   \n",
       "1428         0.382559  0.215835        True         True            False   \n",
       "4514         0.925963  0.016522        True         True            False   \n",
       "1888         0.918763  0.021299        True         True            False   \n",
       "1202         0.927169  0.015241        True         True            False   \n",
       "3288         0.799654  0.077184        True         True            False   \n",
       "3507         0.282070  0.250520        True         True            False   \n",
       "2964         0.841716  0.030107        True         True            False   \n",
       "1721         0.382559  0.215835        True         True            False   \n",
       "1720         0.382559  0.215835        True         True            False   \n",
       "2580         0.377872  0.225444        True         True            False   \n",
       "1877         0.927169  0.015241        True         True            False   \n",
       "3289         0.799654  0.077184        True         True            False   \n",
       "3670         0.918763  0.021299        True         True            False   \n",
       "755          0.930268  0.011949        True         True            False   \n",
       "3680         0.377872  0.225444        True         True            False   \n",
       "3136         0.392394  0.195675        True         True            False   \n",
       "3166         0.392394  0.195675        True         True            False   \n",
       "4164         0.392394  0.195675        True         True            False   \n",
       "4531         0.379414  0.222282        True         True            False   \n",
       "710          0.923042  0.016740        True         True            False   \n",
       "709          0.930268  0.011949        True         True            False   \n",
       "...               ...       ...         ...          ...              ...   \n",
       "2067         0.925963  0.016522        True         True            False   \n",
       "2105         0.925323  0.017201        True         True            False   \n",
       "1552         0.925323  0.017201        True         True            False   \n",
       "3900         0.916224  0.024003        True         True            False   \n",
       "1968         0.918763  0.021299        True         True            False   \n",
       "2543         0.930268  0.011949        True         True            False   \n",
       "3037         0.930268  0.011949        True         True            False   \n",
       "2070         0.392394  0.195675        True         True            False   \n",
       "2414         0.392394  0.195675        True         True            False   \n",
       "1509         0.927169  0.015241        True         True            False   \n",
       "2867         0.925963  0.016522        True         True            False   \n",
       "2077         0.925963  0.016522        True         True            False   \n",
       "3151         0.874531  0.021809        True         True            False   \n",
       "3080         0.930268  0.011949        True         True            False   \n",
       "4539         0.930268  0.011949        True         True            False   \n",
       "2555         0.923042  0.016740        True         True            False   \n",
       "4262         0.925963  0.016522        True         True            False   \n",
       "3775         0.392394  0.195675        True         True            False   \n",
       "4330         0.382559  0.215835        True         True            False   \n",
       "2384         0.382559  0.215835        True         True            False   \n",
       "2059         0.930268  0.011949        True         True            False   \n",
       "2892         0.817066  0.057090        True         True            False   \n",
       "1473         0.392394  0.195675        True         True            False   \n",
       "2866         0.925963  0.016522        True         True            False   \n",
       "657          0.839062  0.023503        True         True            False   \n",
       "655          0.930268  0.011949        True         True            False   \n",
       "656          0.882570  0.016441        True         True            False   \n",
       "3377         0.392394  0.195675        True         True            False   \n",
       "2061         0.804454  0.071645        True         True            False   \n",
       "3649         0.874531  0.021809        True         True            False   \n",
       "\n",
       "      right_consistent  equiv_clique_size  \n",
       "3287             False                  7  \n",
       "2199             False                  6  \n",
       "3339             False                  5  \n",
       "3481             False                  7  \n",
       "2592             False                  8  \n",
       "2593             False                  8  \n",
       "2987             False                  6  \n",
       "2986             False                  6  \n",
       "1960             False                  6  \n",
       "1428             False                  5  \n",
       "4514             False                  7  \n",
       "1888             False                  5  \n",
       "1202             False                  7  \n",
       "3288             False                  5  \n",
       "3507             False                 41  \n",
       "2964             False                 41  \n",
       "1721             False                  9  \n",
       "1720             False                  8  \n",
       "2580             False                  7  \n",
       "1877             False                  8  \n",
       "3289             False                  5  \n",
       "3670             False                  8  \n",
       "755              False                  2  \n",
       "3680             False                  6  \n",
       "3136             False                  5  \n",
       "3166             False                  5  \n",
       "4164             False                  5  \n",
       "4531             False                  6  \n",
       "710              False                  7  \n",
       "709              False                  7  \n",
       "...                ...                ...  \n",
       "2067             False                  7  \n",
       "2105             False                  7  \n",
       "1552             False                  4  \n",
       "3900             False                  7  \n",
       "1968             False                  8  \n",
       "2543             False                  7  \n",
       "3037             False                  8  \n",
       "2070             False                  5  \n",
       "2414             False                  6  \n",
       "1509             False                  8  \n",
       "2867             False                  8  \n",
       "2077             False                  8  \n",
       "3151             False                 10  \n",
       "3080             False                  8  \n",
       "4539             False                  9  \n",
       "2555             False                  6  \n",
       "4262             False                  7  \n",
       "3775             False                  5  \n",
       "4330             False                  4  \n",
       "2384             False                  7  \n",
       "2059             False                  7  \n",
       "2892             False                  7  \n",
       "1473             False                  6  \n",
       "2866             False                  6  \n",
       "657              False                 11  \n",
       "655              False                 11  \n",
       "656              False                 11  \n",
       "3377             False                  5  \n",
       "2061             False                  6  \n",
       "3649             False                  9  \n",
       "\n",
       "[4558 rows x 22 columns]"
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# get a dataframe from the mapping graph\n",
    "df=lexmap.as_dataframe(g)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "## write to file (not used here but can be examined separately)\n",
    "df.to_csv('rare-matches.tsv', sep=\"\\t\", index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "udf = lexmap.unmapped_dataframe(g)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style>\n",
       "    .dataframe thead tr:only-child th {\n",
       "        text-align: right;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: left;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>id</th>\n",
       "      <th>label</th>\n",
       "      <th>mapped_equivs</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>18057</th>\n",
       "      <td>16p11.2 deletion syndrome</td>\n",
       "      <td>16p11.2 deletion syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105646</th>\n",
       "      <td>2-Methylacetoacetyl CoA thiolase deficiency</td>\n",
       "      <td>2-Methylacetoacetyl CoA thiolase deficiency</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41905</th>\n",
       "      <td>2-hydroxyethyl methacrylate sensitization</td>\n",
       "      <td>2-hydroxyethyl methacrylate sensitization</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29133</th>\n",
       "      <td>22q11.2 duplication syndrome</td>\n",
       "      <td>22q11.2 duplication syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100428</th>\n",
       "      <td>22q13.3 deletion syndrome</td>\n",
       "      <td>22q13.3 deletion syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>96122</th>\n",
       "      <td>2q37 deletion syndrome</td>\n",
       "      <td>2q37 deletion syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>88482</th>\n",
       "      <td>3 Methylcrotonyl-CoA carboxylase 1 deficiency</td>\n",
       "      <td>3 Methylcrotonyl-CoA carboxylase 1 deficiency</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34501</th>\n",
       "      <td>3 alpha methylcrotonyl-CoA carboxylase 2 defic...</td>\n",
       "      <td>3 alpha methylcrotonyl-CoA carboxylase 2 defic...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>85670</th>\n",
       "      <td>3-alpha hydroxyacyl-CoA dehydrogenase deficiency</td>\n",
       "      <td>3-alpha hydroxyacyl-CoA dehydrogenase deficiency</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>77929</th>\n",
       "      <td>3p deletion syndrome</td>\n",
       "      <td>3p deletion syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>95095</th>\n",
       "      <td>46 XX Gonadal dysgenesis epibulbar dermoid</td>\n",
       "      <td>46 XX Gonadal dysgenesis epibulbar dermoid</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>90032</th>\n",
       "      <td>5-Nucleotidase syndrome</td>\n",
       "      <td>5-Nucleotidase syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>74374</th>\n",
       "      <td>6 alpha mercaptopurine sensitivity</td>\n",
       "      <td>6 alpha mercaptopurine sensitivity</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51486</th>\n",
       "      <td>ACTH-independent macronodular adrenal hyperplasia</td>\n",
       "      <td>ACTH-independent macronodular adrenal hyperplasia</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26334</th>\n",
       "      <td>AIDS Dementia Complex</td>\n",
       "      <td>AIDS Dementia Complex</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12881</th>\n",
       "      <td>AIDS dysmorphic syndrome</td>\n",
       "      <td>AIDS dysmorphic syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>77859</th>\n",
       "      <td>ALK+ histiocytosis</td>\n",
       "      <td>ALK+ histiocytosis</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26275</th>\n",
       "      <td>ALS-like syndrome of encephalomyopathy</td>\n",
       "      <td>ALS-like syndrome of encephalomyopathy</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>60831</th>\n",
       "      <td>Abderhalden Kaufmann Lignac syndrome</td>\n",
       "      <td>Abderhalden Kaufmann Lignac syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10975</th>\n",
       "      <td>Abdominal chemodectomas with cutaneous angioli...</td>\n",
       "      <td>Abdominal chemodectomas with cutaneous angioli...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>108580</th>\n",
       "      <td>Abdominal cystic lymphangioma</td>\n",
       "      <td>Abdominal cystic lymphangioma</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>94496</th>\n",
       "      <td>Aberrant subclavian artery</td>\n",
       "      <td>Aberrant subclavian artery</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>93116</th>\n",
       "      <td>Abidi X-linked mental retardation syndrome</td>\n",
       "      <td>Abidi X-linked mental retardation syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40555</th>\n",
       "      <td>Absence of fingerprints congenital milia</td>\n",
       "      <td>Absence of fingerprints congenital milia</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7562</th>\n",
       "      <td>Absence of gluteal muscle</td>\n",
       "      <td>Absence of gluteal muscle</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6259</th>\n",
       "      <td>Absence of tibia with polydactyly</td>\n",
       "      <td>Absence of tibia with polydactyly</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75137</th>\n",
       "      <td>Absent T lymphocytes</td>\n",
       "      <td>Absent T lymphocytes</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49480</th>\n",
       "      <td>Absent breasts and nipples</td>\n",
       "      <td>Absent breasts and nipples</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>56640</th>\n",
       "      <td>Abuse dwarfism syndrome</td>\n",
       "      <td>Abuse dwarfism syndrome</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8138</th>\n",
       "      <td>Acanthamoeba infection</td>\n",
       "      <td>Acanthamoeba infection</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25120</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99948</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0008961]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21037</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99949</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011113]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17454</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99950</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011085]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20779</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99951</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011527]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70495</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99952</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>94070</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99953</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011534]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>82089</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99954</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>106842</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99955</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011066]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>99610</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99956</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0011475]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10190</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99960</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100192</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99961</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30752</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99965</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51288</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99966</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24502</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99967</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>102919</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99969</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>79112</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99970</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17426</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99971</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15059</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99976</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>65846</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99977</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6381</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99978</td>\n",
       "      <td>None</td>\n",
       "      <td>[MONDO:0003345]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3759</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99981</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3847</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99983</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>85668</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99989</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4382</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99990</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45866</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99991</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21041</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99994</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>65561</th>\n",
       "      <td>http://www.orpha.net/ORDO/Orphanet_99995</td>\n",
       "      <td>None</td>\n",
       "      <td>[]</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43256</th>\n",
       "      <td>http://www.w3.org/2000/01/rdf-schema#seeAlso</td>\n",
       "      <td>seeAlso</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21673</th>\n",
       "      <td>http://www.w3.org/2002/07/owl#Thing</td>\n",
       "      <td>None</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15400</th>\n",
       "      <td>http://www.w3.org/2002/07/owl#topObjectProperty</td>\n",
       "      <td>None</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>110240 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                       id  \\\n",
       "18057                           16p11.2 deletion syndrome   \n",
       "105646        2-Methylacetoacetyl CoA thiolase deficiency   \n",
       "41905           2-hydroxyethyl methacrylate sensitization   \n",
       "29133                        22q11.2 duplication syndrome   \n",
       "100428                          22q13.3 deletion syndrome   \n",
       "96122                              2q37 deletion syndrome   \n",
       "88482       3 Methylcrotonyl-CoA carboxylase 1 deficiency   \n",
       "34501   3 alpha methylcrotonyl-CoA carboxylase 2 defic...   \n",
       "85670    3-alpha hydroxyacyl-CoA dehydrogenase deficiency   \n",
       "77929                                3p deletion syndrome   \n",
       "95095          46 XX Gonadal dysgenesis epibulbar dermoid   \n",
       "90032                             5-Nucleotidase syndrome   \n",
       "74374                  6 alpha mercaptopurine sensitivity   \n",
       "51486   ACTH-independent macronodular adrenal hyperplasia   \n",
       "26334                               AIDS Dementia Complex   \n",
       "12881                            AIDS dysmorphic syndrome   \n",
       "77859                                  ALK+ histiocytosis   \n",
       "26275              ALS-like syndrome of encephalomyopathy   \n",
       "60831                Abderhalden Kaufmann Lignac syndrome   \n",
       "10975   Abdominal chemodectomas with cutaneous angioli...   \n",
       "108580                      Abdominal cystic lymphangioma   \n",
       "94496                          Aberrant subclavian artery   \n",
       "93116          Abidi X-linked mental retardation syndrome   \n",
       "40555            Absence of fingerprints congenital milia   \n",
       "7562                            Absence of gluteal muscle   \n",
       "6259                    Absence of tibia with polydactyly   \n",
       "75137                                Absent T lymphocytes   \n",
       "49480                          Absent breasts and nipples   \n",
       "56640                             Abuse dwarfism syndrome   \n",
       "8138                               Acanthamoeba infection   \n",
       "...                                                   ...   \n",
       "25120            http://www.orpha.net/ORDO/Orphanet_99948   \n",
       "21037            http://www.orpha.net/ORDO/Orphanet_99949   \n",
       "17454            http://www.orpha.net/ORDO/Orphanet_99950   \n",
       "20779            http://www.orpha.net/ORDO/Orphanet_99951   \n",
       "70495            http://www.orpha.net/ORDO/Orphanet_99952   \n",
       "94070            http://www.orpha.net/ORDO/Orphanet_99953   \n",
       "82089            http://www.orpha.net/ORDO/Orphanet_99954   \n",
       "106842           http://www.orpha.net/ORDO/Orphanet_99955   \n",
       "99610            http://www.orpha.net/ORDO/Orphanet_99956   \n",
       "10190            http://www.orpha.net/ORDO/Orphanet_99960   \n",
       "100192           http://www.orpha.net/ORDO/Orphanet_99961   \n",
       "30752            http://www.orpha.net/ORDO/Orphanet_99965   \n",
       "51288            http://www.orpha.net/ORDO/Orphanet_99966   \n",
       "24502            http://www.orpha.net/ORDO/Orphanet_99967   \n",
       "102919           http://www.orpha.net/ORDO/Orphanet_99969   \n",
       "79112            http://www.orpha.net/ORDO/Orphanet_99970   \n",
       "17426            http://www.orpha.net/ORDO/Orphanet_99971   \n",
       "15059            http://www.orpha.net/ORDO/Orphanet_99976   \n",
       "65846            http://www.orpha.net/ORDO/Orphanet_99977   \n",
       "6381             http://www.orpha.net/ORDO/Orphanet_99978   \n",
       "3759             http://www.orpha.net/ORDO/Orphanet_99981   \n",
       "3847             http://www.orpha.net/ORDO/Orphanet_99983   \n",
       "85668            http://www.orpha.net/ORDO/Orphanet_99989   \n",
       "4382             http://www.orpha.net/ORDO/Orphanet_99990   \n",
       "45866            http://www.orpha.net/ORDO/Orphanet_99991   \n",
       "21041            http://www.orpha.net/ORDO/Orphanet_99994   \n",
       "65561            http://www.orpha.net/ORDO/Orphanet_99995   \n",
       "43256        http://www.w3.org/2000/01/rdf-schema#seeAlso   \n",
       "21673                 http://www.w3.org/2002/07/owl#Thing   \n",
       "15400     http://www.w3.org/2002/07/owl#topObjectProperty   \n",
       "\n",
       "                                                    label    mapped_equivs  \n",
       "18057                           16p11.2 deletion syndrome                   \n",
       "105646        2-Methylacetoacetyl CoA thiolase deficiency                   \n",
       "41905           2-hydroxyethyl methacrylate sensitization                   \n",
       "29133                        22q11.2 duplication syndrome                   \n",
       "100428                          22q13.3 deletion syndrome                   \n",
       "96122                              2q37 deletion syndrome                   \n",
       "88482       3 Methylcrotonyl-CoA carboxylase 1 deficiency                   \n",
       "34501   3 alpha methylcrotonyl-CoA carboxylase 2 defic...                   \n",
       "85670    3-alpha hydroxyacyl-CoA dehydrogenase deficiency                   \n",
       "77929                                3p deletion syndrome                   \n",
       "95095          46 XX Gonadal dysgenesis epibulbar dermoid                   \n",
       "90032                             5-Nucleotidase syndrome                   \n",
       "74374                  6 alpha mercaptopurine sensitivity                   \n",
       "51486   ACTH-independent macronodular adrenal hyperplasia                   \n",
       "26334                               AIDS Dementia Complex                   \n",
       "12881                            AIDS dysmorphic syndrome                   \n",
       "77859                                  ALK+ histiocytosis                   \n",
       "26275              ALS-like syndrome of encephalomyopathy                   \n",
       "60831                Abderhalden Kaufmann Lignac syndrome                   \n",
       "10975   Abdominal chemodectomas with cutaneous angioli...                   \n",
       "108580                      Abdominal cystic lymphangioma                   \n",
       "94496                          Aberrant subclavian artery                   \n",
       "93116          Abidi X-linked mental retardation syndrome                   \n",
       "40555            Absence of fingerprints congenital milia                   \n",
       "7562                            Absence of gluteal muscle                   \n",
       "6259                    Absence of tibia with polydactyly                   \n",
       "75137                                Absent T lymphocytes                   \n",
       "49480                          Absent breasts and nipples                   \n",
       "56640                             Abuse dwarfism syndrome                   \n",
       "8138                               Acanthamoeba infection                   \n",
       "...                                                   ...              ...  \n",
       "25120                                                None  [MONDO:0008961]  \n",
       "21037                                                None  [MONDO:0011113]  \n",
       "17454                                                None  [MONDO:0011085]  \n",
       "20779                                                None  [MONDO:0011527]  \n",
       "70495                                                None               []  \n",
       "94070                                                None  [MONDO:0011534]  \n",
       "82089                                                None               []  \n",
       "106842                                               None  [MONDO:0011066]  \n",
       "99610                                                None  [MONDO:0011475]  \n",
       "10190                                                None               []  \n",
       "100192                                               None               []  \n",
       "30752                                                None               []  \n",
       "51288                                                None               []  \n",
       "24502                                                None               []  \n",
       "102919                                               None               []  \n",
       "79112                                                None               []  \n",
       "17426                                                None               []  \n",
       "15059                                                None               []  \n",
       "65846                                                None               []  \n",
       "6381                                                 None  [MONDO:0003345]  \n",
       "3759                                                 None               []  \n",
       "3847                                                 None               []  \n",
       "85668                                                None               []  \n",
       "4382                                                 None               []  \n",
       "45866                                                None               []  \n",
       "21041                                                None               []  \n",
       "65561                                                None               []  \n",
       "43256                                             seeAlso                   \n",
       "21673                                                None                   \n",
       "15400                                                None                   \n",
       "\n",
       "[110240 rows x 3 columns]"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Save the unmapped rows to a tab-separated file (index column omitted),\n",
    "# then leave the frame as the last expression so it is shown as the cell result.\n",
    "# TODO: this includes unmapped from MONDO/HP to R, which we don't care about so much.\n",
    "udf.to_csv(\n",
    "    'rare-no-matches.tsv',\n",
    "    index=False,\n",
    "    sep=\"\\t\",\n",
    ")\n",
    "udf"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}