{ "cells": [ { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import re\n", "import sys\n", "import operator\n", "import collections\n", "import os" ] }, { "cell_type": "code", "execution_count": 7, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | Entry | \n", "Entry name | \n", "Status | \n", "Protein names | \n", "Gene names | \n", "Organism | \n", "Length | \n", "
|---|---|---|---|---|---|---|---|
| 0 | \n", "P78410 | \n", "BT3A2_HUMAN | \n", "reviewed | \n", "Butyrophilin subfamily 3 member A2 | \n", "BTN3A2 BT3.2 BTF3 BTF4 | \n", "Homo sapiens (Human) | \n", "334 | \n", "
| 1 | \n", "Q8TDQ1 | \n", "CLM1_HUMAN | \n", "reviewed | \n", "CMRF35-like molecule 1 (CLM-1) (CD300 antigen-... | \n", "CD300LF CD300F CLM1 IGSF13 IREM1 NKIR UNQ3105/... | \n", "Homo sapiens (Human) | \n", "290 | \n", "
| 2 | \n", "Q7Z624 | \n", "CMKMT_HUMAN | \n", "reviewed | \n", "Calmodulin-lysine N-methyltransferase (CLNMT) ... | \n", "CAMKMT C2orf34 CLNMT | \n", "Homo sapiens (Human) | \n", "323 | \n", "
| 3 | \n", "O75208 | \n", "COQ9_HUMAN | \n", "reviewed | \n", "Ubiquinone biosynthesis protein COQ9, mitochon... | \n", "COQ9 C16orf49 HSPC326 PSEC0129 | \n", "Homo sapiens (Human) | \n", "318 | \n", "
| 4 | \n", "Q8NEV1 | \n", "CSK23_HUMAN | \n", "reviewed | \n", "Casein kinase II subunit alpha 3 (CK II alpha ... | \n", "CSNK2A3 CSNK2A1P | \n", "Homo sapiens (Human) | \n", "391 | \n", "
| 5 | \n", "P33681 | \n", "CD80_HUMAN | \n", "reviewed | \n", "T-lymphocyte activation antigen CD80 (Activati... | \n", "CD80 CD28LG CD28LG1 LAB7 | \n", "Homo sapiens (Human) | \n", "288 | \n", "
| 6 | \n", "P02511 | \n", "CRYAB_HUMAN | \n", "reviewed | \n", "Alpha-crystallin B chain (Alpha(B)-crystallin)... | \n", "CRYAB CRYA2 HSPB5 | \n", "Homo sapiens (Human) | \n", "175 | \n", "
| 7 | \n", "Q8N4T0 | \n", "CBPA6_HUMAN | \n", "reviewed | \n", "Carboxypeptidase A6 (EC 3.4.17.-) | \n", "CPA6 CPAH | \n", "Homo sapiens (Human) | \n", "437 | \n", "
| 8 | \n", "P20933 | \n", "ASPG_HUMAN | \n", "reviewed | \n", "N(4)-(beta-N-acetylglucosaminyl)-L-asparaginas... | \n", "AGA | \n", "Homo sapiens (Human) | \n", "346 | \n", "
| 9 | \n", "Q86VB7 | \n", "C163A_HUMAN | \n", "reviewed | \n", "Scavenger receptor cysteine-rich type 1 protei... | \n", "CD163 M130 | \n", "Homo sapiens (Human) | \n", "1156 | \n", "
| 10 | \n", "P53420 | \n", "CO4A4_HUMAN | \n", "reviewed | \n", "Collagen alpha-4(IV) chain | \n", "COL4A4 | \n", "Homo sapiens (Human) | \n", "1690 | \n", "
| 11 | \n", "A2IDD5 | \n", "CCD78_HUMAN | \n", "reviewed | \n", "Coiled-coil domain-containing protein 78 (hsCC... | \n", "CCDC78 C16orf25 JFP10 | \n", "Homo sapiens (Human) | \n", "438 | \n", "
| 12 | \n", "Q02952 | \n", "AKA12_HUMAN | \n", "reviewed | \n", "A-kinase anchor protein 12 (AKAP-12) (A-kinase... | \n", "AKAP12 AKAP250 | \n", "Homo sapiens (Human) | \n", "1782 | \n", "
| 13 | \n", "O15194 | \n", "CTDSL_HUMAN | \n", "reviewed | \n", "CTD small phosphatase-like protein (CTDSP-like... | \n", "CTDSPL C3orf8 NIF1 NIFL SCP3 YA22 | \n", "Homo sapiens (Human) | \n", "276 | \n", "
| 14 | \n", "O14613 | \n", "BORG1_HUMAN | \n", "reviewed | \n", "Cdc42 effector protein 2 (Binder of Rho GTPase... | \n", "CDC42EP2 BORG1 CEP2 | \n", "Homo sapiens (Human) | \n", "210 | \n", "
| 15 | \n", "P30260 | \n", "CDC27_HUMAN | \n", "reviewed | \n", "Cell division cycle protein 27 homolog (Anapha... | \n", "CDC27 ANAPC3 D0S1430E D17S978E | \n", "Homo sapiens (Human) | \n", "824 | \n", "
| 16 | \n", "O75175 | \n", "CNOT3_HUMAN | \n", "reviewed | \n", "CCR4-NOT transcription complex subunit 3 (CCR4... | \n", "CNOT3 KIAA0691 LENG2 NOT3 | \n", "Homo sapiens (Human) | \n", "753 | \n", "
| 17 | \n", "Q16611 | \n", "BAK_HUMAN | \n", "reviewed | \n", "Bcl-2 homologous antagonist/killer (Apoptosis ... | \n", "BAK1 BAK BCL2L7 CDN1 | \n", "Homo sapiens (Human) | \n", "211 | \n", "
| 18 | \n", "Q07065 | \n", "CKAP4_HUMAN | \n", "reviewed | \n", "Cytoskeleton-associated protein 4 (63-kDa cyto... | \n", "CKAP4 | \n", "Homo sapiens (Human) | \n", "602 | \n", "
| 19 | \n", "Q96B67 | \n", "ARRD3_HUMAN | \n", "reviewed | \n", "Arrestin domain-containing protein 3 (TBP-2-li... | \n", "ARRDC3 KIAA1376 | \n", "Homo sapiens (Human) | \n", "414 | \n", "
| 20 | \n", "Q15327 | \n", "ANKR1_HUMAN | \n", "reviewed | \n", "Ankyrin repeat domain-containing protein 1 (Ca... | \n", "ANKRD1 C193 CARP HA1A2 | \n", "Homo sapiens (Human) | \n", "319 | \n", "
| 21 | \n", "Q99653 | \n", "CHP1_HUMAN | \n", "reviewed | \n", "Calcineurin B homologous protein 1 (Calcineuri... | \n", "CHP1 CHP | \n", "Homo sapiens (Human) | \n", "195 | \n", "
| 22 | \n", "P0CG37 | \n", "CFC1_HUMAN | \n", "reviewed | \n", "Cryptic protein (Cryptic family protein 1) | \n", "CFC1 | \n", "Homo sapiens (Human) | \n", "223 | \n", "
| 23 | \n", "P17544 | \n", "ATF7_HUMAN | \n", "reviewed | \n", "Cyclic AMP-dependent transcription factor ATF-... | \n", "ATF7 ATFA | \n", "Homo sapiens (Human) | \n", "494 | \n", "
| 24 | \n", "Q8N5B7 | \n", "CERS5_HUMAN | \n", "reviewed | \n", "Ceramide synthase 5 (CerS5) (EC 2.3.1.-) (LAG1... | \n", "CERS5 LASS5 | \n", "Homo sapiens (Human) | \n", "392 | \n", "
| 25 | \n", "Q6ZMG9 | \n", "CERS6_HUMAN | \n", "reviewed | \n", "Ceramide synthase 6 (CerS6) (EC 2.3.1.-) (LAG1... | \n", "CERS6 LASS6 | \n", "Homo sapiens (Human) | \n", "384 | \n", "
| 26 | \n", "A0A1B0GW15 | \n", "A0A1B0GW15_HUMAN | \n", "unreviewed | \n", "Uncharacterized protein | \n", "NaN | \n", "Homo sapiens (Human) | \n", "77 | \n", "
| 27 | \n", "A0A0A0MRX4 | \n", "A0A0A0MRX4_HUMAN | \n", "unreviewed | \n", "Ral guanine nucleotide dissociation stimulator... | \n", "RGL3 | \n", "Homo sapiens (Human) | \n", "710 | \n", "
| 28 | \n", "F5H052 | \n", "F5H052_HUMAN | \n", "unreviewed | \n", "Armadillo repeat-containing protein 6 (Fragment) | \n", "ARMC6 | \n", "Homo sapiens (Human) | \n", "103 | \n", "
| 29 | \n", "B1AMT0 | \n", "B1AMT0_HUMAN | \n", "unreviewed | \n", "Cohesin subunit SA-2 (Fragment) | \n", "STAG2 | \n", "Homo sapiens (Human) | \n", "115 | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 74004 | \n", "O14775 | \n", "GNB5_HUMAN | \n", "reviewed | \n", "Guanine nucleotide-binding protein subunit bet... | \n", "GNB5 | \n", "Homo sapiens (Human) | \n", "395 | \n", "
| 74005 | \n", "O43716 | \n", "GATC_HUMAN | \n", "reviewed | \n", "Glutamyl-tRNA(Gln) amidotransferase subunit C,... | \n", "GATC 15E1.2 | \n", "Homo sapiens (Human) | \n", "136 | \n", "
| 74006 | \n", "P03372 | \n", "ESR1_HUMAN | \n", "reviewed | \n", "Estrogen receptor (ER) (ER-alpha) (Estradiol r... | \n", "ESR1 ESR NR3A1 | \n", "Homo sapiens (Human) | \n", "595 | \n", "
| 74007 | \n", "Q6NT32 | \n", "EST5A_HUMAN | \n", "reviewed | \n", "Carboxylesterase 5A (EC 3.1.1.1) (Carboxyleste... | \n", "CES5A CES7 | \n", "Homo sapiens (Human) | \n", "575 | \n", "
| 74008 | \n", "P30793 | \n", "GCH1_HUMAN | \n", "reviewed | \n", "GTP cyclohydrolase 1 (EC 3.5.4.16) (GTP cycloh... | \n", "GCH1 DYT5 GCH | \n", "Homo sapiens (Human) | \n", "250 | \n", "
| 74009 | \n", "Q9HAH7 | \n", "FBRS_HUMAN | \n", "reviewed | \n", "Probable fibrosin-1 | \n", "FBRS FBS FBS1 | \n", "Homo sapiens (Human) | \n", "460 | \n", "
| 74010 | \n", "O00461 | \n", "GOLI4_HUMAN | \n", "reviewed | \n", "Golgi integral membrane protein 4 (Golgi integ... | \n", "GOLIM4 GIMPC GOLPH4 GPP130 | \n", "Homo sapiens (Human) | \n", "696 | \n", "
| 74011 | \n", "Q9UI32 | \n", "GLSL_HUMAN | \n", "reviewed | \n", "Glutaminase liver isoform, mitochondrial (GLS)... | \n", "GLS2 GA | \n", "Homo sapiens (Human) | \n", "602 | \n", "
| 74012 | \n", "Q9UBI6 | \n", "GBG12_HUMAN | \n", "reviewed | \n", "Guanine nucleotide-binding protein G(I)/G(S)/G... | \n", "GNG12 | \n", "Homo sapiens (Human) | \n", "72 | \n", "
| 74013 | \n", "P63215 | \n", "GBG3_HUMAN | \n", "reviewed | \n", "Guanine nucleotide-binding protein G(I)/G(S)/G... | \n", "GNG3 GNGT3 | \n", "Homo sapiens (Human) | \n", "75 | \n", "
| 74014 | \n", "Q8WUU5 | \n", "GATD1_HUMAN | \n", "reviewed | \n", "GATA zinc finger domain-containing protein 1 (... | \n", "GATAD1 ODAG | \n", "Homo sapiens (Human) | \n", "269 | \n", "
| 74015 | \n", "Q8NBI3 | \n", "DRAXI_HUMAN | \n", "reviewed | \n", "Draxin (Dorsal inhibitory axon guidance protei... | \n", "DRAXIN C1orf187 PSEC0258 UNQ3119/PRO10268 | \n", "Homo sapiens (Human) | \n", "349 | \n", "
| 74016 | \n", "Q8IUC8 | \n", "GLT13_HUMAN | \n", "reviewed | \n", "Polypeptide N-acetylgalactosaminyltransferase ... | \n", "GALNT13 KIAA1918 | \n", "Homo sapiens (Human) | \n", "556 | \n", "
| 74017 | \n", "Q7Z2K6 | \n", "ERMP1_HUMAN | \n", "reviewed | \n", "Endoplasmic reticulum metallopeptidase 1 (EC 3... | \n", "ERMP1 FXNA KIAA1815 | \n", "Homo sapiens (Human) | \n", "904 | \n", "
| 74018 | \n", "Q9UM22 | \n", "EPDR1_HUMAN | \n", "reviewed | \n", "Mammalian ependymin-related protein 1 (MERP-1)... | \n", "EPDR1 MERP1 UCC1 | \n", "Homo sapiens (Human) | \n", "224 | \n", "
| 74019 | \n", "P05160 | \n", "F13B_HUMAN | \n", "reviewed | \n", "Coagulation factor XIII B chain (Fibrin-stabil... | \n", "F13B | \n", "Homo sapiens (Human) | \n", "661 | \n", "
| 74020 | \n", "P37059 | \n", "DHB2_HUMAN | \n", "reviewed | \n", "Estradiol 17-beta-dehydrogenase 2 (EC 1.1.1.62... | \n", "HSD17B2 EDH17B2 SDR9C2 | \n", "Homo sapiens (Human) | \n", "387 | \n", "
| 74021 | \n", "A8K855 | \n", "EFCB7_HUMAN | \n", "reviewed | \n", "EF-hand calcium-binding domain-containing prot... | \n", "EFCAB7 KIAA1799 | \n", "Homo sapiens (Human) | \n", "629 | \n", "
| 74022 | \n", "Q16099 | \n", "GRIK4_HUMAN | \n", "reviewed | \n", "Glutamate receptor ionotropic, kainate 4 (GluK... | \n", "GRIK4 GRIK | \n", "Homo sapiens (Human) | \n", "956 | \n", "
| 74023 | \n", "P0DPD8 | \n", "EFCE2_HUMAN | \n", "reviewed | \n", "EEF1AKMT4-ECE2 readthrough transcript protein ... | \n", "EEF1AKMT4-ECE2 | \n", "Homo sapiens (Human) | \n", "883 | \n", "
| 74024 | \n", "P56937 | \n", "DHB7_HUMAN | \n", "reviewed | \n", "3-keto-steroid reductase (EC 1.1.1.270) (17-be... | \n", "HSD17B7 SDR37C1 UNQ2563/PRO6243 | \n", "Homo sapiens (Human) | \n", "341 | \n", "
| 74025 | \n", "Q9NYF3 | \n", "FA53C_HUMAN | \n", "reviewed | \n", "Protein FAM53C | \n", "FAM53C C5orf6 | \n", "Homo sapiens (Human) | \n", "392 | \n", "
| 74026 | \n", "Q6UY11 | \n", "DLK2_HUMAN | \n", "reviewed | \n", "Protein delta homolog 2 (DLK-2) (Epidermal gro... | \n", "DLK2 EGFL9 UNQ2903/PRO28633 | \n", "Homo sapiens (Human) | \n", "383 | \n", "
| 74027 | \n", "Q99504 | \n", "EYA3_HUMAN | \n", "reviewed | \n", "Eyes absent homolog 3 (EC 3.1.3.48) | \n", "EYA3 | \n", "Homo sapiens (Human) | \n", "573 | \n", "
| 74028 | \n", "Q01459 | \n", "DIAC_HUMAN | \n", "reviewed | \n", "Di-N-acetylchitobiase (EC 3.2.1.-) | \n", "CTBS CTB | \n", "Homo sapiens (Human) | \n", "385 | \n", "
| 74029 | \n", "O60610 | \n", "DIAP1_HUMAN | \n", "reviewed | \n", "Protein diaphanous homolog 1 (Diaphanous-relat... | \n", "DIAPH1 DIAP1 | \n", "Homo sapiens (Human) | \n", "1272 | \n", "
| 74030 | \n", "O60269 | \n", "GRIN2_HUMAN | \n", "reviewed | \n", "G protein-regulated inducer of neurite outgrow... | \n", "GPRIN2 KIAA0514 | \n", "Homo sapiens (Human) | \n", "458 | \n", "
| 74031 | \n", "Q6P3S1 | \n", "DEN1B_HUMAN | \n", "reviewed | \n", "DENN domain-containing protein 1B (Connecdenn ... | \n", "DENND1B C1orf218 FAM31B | \n", "Homo sapiens (Human) | \n", "775 | \n", "
| 74032 | \n", "P09958 | \n", "FURIN_HUMAN | \n", "reviewed | \n", "Furin (EC 3.4.21.75) (Dibasic-processing enzym... | \n", "FURIN FUR PACE PCSK3 | \n", "Homo sapiens (Human) | \n", "794 | \n", "
| 74033 | \n", "Q8IUX8 | \n", "EGFL6_HUMAN | \n", "reviewed | \n", "Epidermal growth factor-like protein 6 (EGF-li... | \n", "EGFL6 MAEG PP648 UNQ281/PRO320 | \n", "Homo sapiens (Human) | \n", "553 | \n", "
74034 rows × 7 columns
\n", "