Created
December 8, 2023 23:00
-
-
Save agitter/579db8aae2b95cd51338031d211908b9 to your computer and use it in GitHub Desktop.
wikicrow-unexplored
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"cells": [ | |
{ | |
"cell_type": "markdown", | |
"metadata": {}, | |
"source": [ | |
"# Exploring the unexplored WikiCrow genes\n", | |
"Checks when the 669 genes from https://gist.github.com/whitead/e20c4c9e484fad32d8df6f9a610b8dbd last had their symbol modified.  \n", | |
"By [@agitter](https://github.com/agitter)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 38, | |
"metadata": {}, | |
"outputs": [], | |
"source": [ | |
"import pandas as pd\n", | |
"import seaborn as sns" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 2, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"name": "stderr", | |
"output_type": "stream", | |
"text": [ | |
"C:\\ProgramData\\Anaconda3\\lib\\site-packages\\IPython\\core\\interactiveshell.py:3049: DtypeWarning: Columns (32,34,38,40,50) have mixed types. Specify dtype option on import or set low_memory=False.\n", | |
" interactivity=interactivity, compiler=compiler, result=result)\n" | |
] | |
} | |
], | |
"source": [ | |
"# Download HGNC data attributes\n", | |
"hgnc_df = pd.read_csv('https://ftp.ebi.ac.uk/pub/databases/genenames/hgnc/tsv/hgnc_complete_set.txt', sep='\\t')" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 6, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"(43736, 54)" | |
] | |
}, | |
"execution_count": 6, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"# Genes by data attributes\n", | |
"hgnc_df.shape" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 8, | |
"metadata": {}, | |
"outputs": [], | |
"source": [ | |
"# Download unexplored gene list from https://gist.github.com/whitead/e20c4c9e484fad32d8df6f9a610b8dbd\n", | |
"unexp_df = pd.read_csv('https://gist.githubusercontent.com/whitead/e20c4c9e484fad32d8df6f9a610b8dbd/raw/b56bcafb681838320ff03f5ec84731e42acca701/unexplored.txt', header=None)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 9, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<style scoped>\n", | |
" .dataframe tbody tr th:only-of-type {\n", | |
" vertical-align: middle;\n", | |
" }\n", | |
"\n", | |
" .dataframe tbody tr th {\n", | |
" vertical-align: top;\n", | |
" }\n", | |
"\n", | |
" .dataframe thead th {\n", | |
" text-align: right;\n", | |
" }\n", | |
"</style>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>0</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>0</th>\n", | |
" <td>AADACL4</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1</th>\n", | |
" <td>ACCSL</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2</th>\n", | |
" <td>ACTR3C</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>3</th>\n", | |
" <td>ACTRT3</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4</th>\n", | |
" <td>ANHX</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>5</th>\n", | |
" <td>ANKMY1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>6</th>\n", | |
" <td>ANKRD10</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>7</th>\n", | |
" <td>ANKRD30BL</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8</th>\n", | |
" <td>ANKRD34A</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9</th>\n", | |
" <td>ANKRD39</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10</th>\n", | |
" <td>ANKRD40CL</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>11</th>\n", | |
" <td>ANKRD60</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>12</th>\n", | |
" <td>ANKRD61</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>13</th>\n", | |
" <td>ANKRD63</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>14</th>\n", | |
" <td>ANKRD65</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>15</th>\n", | |
" <td>ANKRD66</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>16</th>\n", | |
" <td>AP1AR</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>17</th>\n", | |
" <td>ARB2A</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>18</th>\n", | |
" <td>ARL14EPL</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>19</th>\n", | |
" <td>ARMH1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>20</th>\n", | |
" <td>ARMH2</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>21</th>\n", | |
" <td>AVPI1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>22</th>\n", | |
" <td>BCLAF3</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23</th>\n", | |
" <td>BEAN1</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24</th>\n", | |
" <td>BRD3OS</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>25</th>\n", | |
" <td>BTBD17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>26</th>\n", | |
" <td>C10orf105</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>27</th>\n", | |
" <td>C10orf120</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>28</th>\n", | |
" <td>C10orf126</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>29</th>\n", | |
" <td>C10orf143</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>...</th>\n", | |
" <td>...</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>639</th>\n", | |
" <td>ZNF716</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>640</th>\n", | |
" <td>ZNF722</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>641</th>\n", | |
" <td>ZNF723</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>642</th>\n", | |
" <td>ZNF724</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>643</th>\n", | |
" <td>ZNF730</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>644</th>\n", | |
" <td>ZNF740</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>645</th>\n", | |
" <td>ZNF75D</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>646</th>\n", | |
" <td>ZNF761</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>647</th>\n", | |
" <td>ZNF763</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>648</th>\n", | |
" <td>ZNF766</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>649</th>\n", | |
" <td>ZNF771</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>650</th>\n", | |
" <td>ZNF773</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>651</th>\n", | |
" <td>ZNF781</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>652</th>\n", | |
" <td>ZNF783</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>653</th>\n", | |
" <td>ZNF786</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>654</th>\n", | |
" <td>ZNF787</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>655</th>\n", | |
" <td>ZNF790</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>656</th>\n", | |
" <td>ZNF814</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>657</th>\n", | |
" <td>ZNF829</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>658</th>\n", | |
" <td>ZNF830</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>659</th>\n", | |
" <td>ZNF841</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>660</th>\n", | |
" <td>ZNF843</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>661</th>\n", | |
" <td>ZNF845</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>662</th>\n", | |
" <td>ZNF852</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>663</th>\n", | |
" <td>ZNF860</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>664</th>\n", | |
" <td>ZNF892</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>665</th>\n", | |
" <td>ZSCAN26</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>666</th>\n", | |
" <td>ZSCAN30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>667</th>\n", | |
" <td>ZSCAN32</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>668</th>\n", | |
" <td>ZSCAN9</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"<p>669 rows × 1 columns</p>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" 0\n", | |
"0 AADACL4\n", | |
"1 ACCSL\n", | |
"2 ACTR3C\n", | |
"3 ACTRT3\n", | |
"4 ANHX\n", | |
"5 ANKMY1\n", | |
"6 ANKRD10\n", | |
"7 ANKRD30BL\n", | |
"8 ANKRD34A\n", | |
"9 ANKRD39\n", | |
"10 ANKRD40CL\n", | |
"11 ANKRD60\n", | |
"12 ANKRD61\n", | |
"13 ANKRD63\n", | |
"14 ANKRD65\n", | |
"15 ANKRD66\n", | |
"16 AP1AR\n", | |
"17 ARB2A\n", | |
"18 ARL14EPL\n", | |
"19 ARMH1\n", | |
"20 ARMH2\n", | |
"21 AVPI1\n", | |
"22 BCLAF3\n", | |
"23 BEAN1\n", | |
"24 BRD3OS\n", | |
"25 BTBD17\n", | |
"26 C10orf105\n", | |
"27 C10orf120\n", | |
"28 C10orf126\n", | |
"29 C10orf143\n", | |
".. ...\n", | |
"639 ZNF716\n", | |
"640 ZNF722\n", | |
"641 ZNF723\n", | |
"642 ZNF724\n", | |
"643 ZNF730\n", | |
"644 ZNF740\n", | |
"645 ZNF75D\n", | |
"646 ZNF761\n", | |
"647 ZNF763\n", | |
"648 ZNF766\n", | |
"649 ZNF771\n", | |
"650 ZNF773\n", | |
"651 ZNF781\n", | |
"652 ZNF783\n", | |
"653 ZNF786\n", | |
"654 ZNF787\n", | |
"655 ZNF790\n", | |
"656 ZNF814\n", | |
"657 ZNF829\n", | |
"658 ZNF830\n", | |
"659 ZNF841\n", | |
"660 ZNF843\n", | |
"661 ZNF845\n", | |
"662 ZNF852\n", | |
"663 ZNF860\n", | |
"664 ZNF892\n", | |
"665 ZSCAN26\n", | |
"666 ZSCAN30\n", | |
"667 ZSCAN32\n", | |
"668 ZSCAN9\n", | |
"\n", | |
"[669 rows x 1 columns]" | |
] | |
}, | |
"execution_count": 9, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"# Inspect the first and last few, confirm there are 669\n", | |
"unexp_df" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 24, | |
"metadata": {}, | |
"outputs": [], | |
"source": [ | |
"# Keep the HGNC rows whose symbol matches one of the 669 unexplored genes\n", | |
"hgnc_unexp_df = hgnc_df[hgnc_df['symbol'].isin(unexp_df[0].values.tolist())]" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 25, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<style scoped>\n", | |
" .dataframe tbody tr th:only-of-type {\n", | |
" vertical-align: middle;\n", | |
" }\n", | |
"\n", | |
" .dataframe tbody tr th {\n", | |
" vertical-align: top;\n", | |
" }\n", | |
"\n", | |
" .dataframe thead th {\n", | |
" text-align: right;\n", | |
" }\n", | |
"</style>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>hgnc_id</th>\n", | |
" <th>symbol</th>\n", | |
" <th>name</th>\n", | |
" <th>locus_group</th>\n", | |
" <th>locus_type</th>\n", | |
" <th>status</th>\n", | |
" <th>location</th>\n", | |
" <th>location_sortable</th>\n", | |
" <th>alias_symbol</th>\n", | |
" <th>alias_name</th>\n", | |
" <th>...</th>\n", | |
" <th>cd</th>\n", | |
" <th>lncrnadb</th>\n", | |
" <th>enzyme_id</th>\n", | |
" <th>intermediate_filament_db</th>\n", | |
" <th>rna_central_ids</th>\n", | |
" <th>lncipedia</th>\n", | |
" <th>gtrnadb</th>\n", | |
" <th>agr</th>\n", | |
" <th>mane_select</th>\n", | |
" <th>gencc</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>19</th>\n", | |
" <td>HGNC:32038</td>\n", | |
" <td>AADACL4</td>\n", | |
" <td>arylacetamide deacetylase like 4</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1p36.21</td>\n", | |
" <td>01p36.21</td>\n", | |
" <td>OTTHUMG00000001889</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32038</td>\n", | |
" <td>ENST00000376221.2|NM_001013630.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>195</th>\n", | |
" <td>HGNC:34391</td>\n", | |
" <td>ACCSL</td>\n", | |
" <td>1-aminocyclopropane-1-carboxylate synthase hom...</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>11p11.2</td>\n", | |
" <td>11p11.2</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:34391</td>\n", | |
" <td>ENST00000378832.1|NM_001031854.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>346</th>\n", | |
" <td>HGNC:37282</td>\n", | |
" <td>ACTR3C</td>\n", | |
" <td>actin related protein 3C</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7q36.1</td>\n", | |
" <td>07q36.1</td>\n", | |
" <td>ARP11</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:37282</td>\n", | |
" <td>ENST00000683684.1|NM_001164458.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>358</th>\n", | |
" <td>HGNC:24022</td>\n", | |
" <td>ACTRT3</td>\n", | |
" <td>actin related protein T3</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>3q26.2</td>\n", | |
" <td>03q26.2</td>\n", | |
" <td>ARPM1</td>\n", | |
" <td>actin related protein M1</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:24022</td>\n", | |
" <td>ENST00000330368.3|NM_032487.5</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1015</th>\n", | |
" <td>HGNC:40024</td>\n", | |
" <td>ANHX</td>\n", | |
" <td>anomalous homeobox</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>12q24.33</td>\n", | |
" <td>12q24.33</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:40024</td>\n", | |
" <td>ENST00000545940.6|NM_001372060.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1036</th>\n", | |
" <td>HGNC:20987</td>\n", | |
" <td>ANKMY1</td>\n", | |
" <td>ankyrin repeat and MYND domain containing 1</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>2q37.3</td>\n", | |
" <td>02q37.3</td>\n", | |
" <td>FLJ20499|ZMYND13</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:20987</td>\n", | |
" <td>ENST00000401804.6|NM_001282771.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1044</th>\n", | |
" <td>HGNC:20265</td>\n", | |
" <td>ANKRD10</td>\n", | |
" <td>ankyrin repeat domain 10</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>13q34</td>\n", | |
" <td>13q34</td>\n", | |
" <td>FLJ20093</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:20265</td>\n", | |
" <td>ENST00000267339.6|NM_017664.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1099</th>\n", | |
" <td>HGNC:35167</td>\n", | |
" <td>ANKRD30BL</td>\n", | |
" <td>ankyrin repeat domain 30B like</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>2q21.2</td>\n", | |
" <td>02q21.2</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:35167</td>\n", | |
" <td>ENST00000409867.6|NM_001358416.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1117</th>\n", | |
" <td>HGNC:27639</td>\n", | |
" <td>ANKRD34A</td>\n", | |
" <td>ankyrin repeat domain 34A</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1q21.1</td>\n", | |
" <td>01q21.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27639</td>\n", | |
" <td>ENST00000606888.3|NM_001039888.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1129</th>\n", | |
" <td>HGNC:28640</td>\n", | |
" <td>ANKRD39</td>\n", | |
" <td>ankyrin repeat domain 39</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>2q11.2</td>\n", | |
" <td>02q11.2</td>\n", | |
" <td>MGC41816</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28640</td>\n", | |
" <td>ENST00000393537.5|NM_016466.6</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1132</th>\n", | |
" <td>HGNC:26080</td>\n", | |
" <td>ANKRD40CL</td>\n", | |
" <td>ANKRD40 C-terminal like</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>17q21.33</td>\n", | |
" <td>17q21.33</td>\n", | |
" <td>FLJ20694</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>LINC00483</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:26080</td>\n", | |
" <td>ENST00000450727.6|NM_001358683.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1152</th>\n", | |
" <td>HGNC:16217</td>\n", | |
" <td>ANKRD60</td>\n", | |
" <td>ankyrin repeat domain 60</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>20q13.32</td>\n", | |
" <td>20q13.32</td>\n", | |
" <td>bA196N14.3</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:16217</td>\n", | |
" <td>ENST00000457363.2|NM_001304369.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1153</th>\n", | |
" <td>HGNC:22467</td>\n", | |
" <td>ANKRD61</td>\n", | |
" <td>ankyrin repeat domain 61</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7p22.1</td>\n", | |
" <td>07p22.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:22467</td>\n", | |
" <td>ENST00000409061.2|NM_001271700.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1157</th>\n", | |
" <td>HGNC:40027</td>\n", | |
" <td>ANKRD63</td>\n", | |
" <td>ankyrin repeat domain 63</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>15q15.1</td>\n", | |
" <td>15q15.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:40027</td>\n", | |
" <td>ENST00000434396.2|NM_001190479.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1158</th>\n", | |
" <td>HGNC:42950</td>\n", | |
" <td>ANKRD65</td>\n", | |
" <td>ankyrin repeat domain 65</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1p36.33</td>\n", | |
" <td>01p36.33</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:42950</td>\n", | |
" <td>ENST00000537107.6|NM_001145210.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1160</th>\n", | |
" <td>HGNC:44669</td>\n", | |
" <td>ANKRD66</td>\n", | |
" <td>ankyrin repeat domain 66</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>6p12.3</td>\n", | |
" <td>06p12.3</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:44669</td>\n", | |
" <td>ENST00000565422.3|NM_001162435.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1230</th>\n", | |
" <td>HGNC:28808</td>\n", | |
" <td>AP1AR</td>\n", | |
" <td>adaptor related protein complex 1 associated r...</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>4q25</td>\n", | |
" <td>04q25</td>\n", | |
" <td>PRO0971|2C18|gamma-BAR</td>\n", | |
" <td>gamma1-adaptin brefeldin A resistance</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28808</td>\n", | |
" <td>ENST00000274000.10|NM_018569.6</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1386</th>\n", | |
" <td>HGNC:25365</td>\n", | |
" <td>ARB2A</td>\n", | |
" <td>ARB2 cotranscriptional regulator A</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>5q15</td>\n", | |
" <td>05q15</td>\n", | |
" <td>DKFZP564D172|Toupee</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:25365</td>\n", | |
" <td>ENST00000395965.8|NM_032042.6</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1596</th>\n", | |
" <td>HGNC:44201</td>\n", | |
" <td>ARL14EPL</td>\n", | |
" <td>ADP ribosylation factor like GTPase 14 effecto...</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>5q23.1</td>\n", | |
" <td>05q23.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:44201</td>\n", | |
" <td>ENST00000686077.1|NM_001195581.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1625</th>\n", | |
" <td>HGNC:34345</td>\n", | |
" <td>ARMH1</td>\n", | |
" <td>armadillo like helical domain containing 1</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1p34.1</td>\n", | |
" <td>01p34.1</td>\n", | |
" <td>MGC33556|p40</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:34345</td>\n", | |
" <td>ENST00000535358.6|NM_001145636.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1626</th>\n", | |
" <td>HGNC:49394</td>\n", | |
" <td>ARMH2</td>\n", | |
" <td>armadillo like helical domain containing 2</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>6p22.3</td>\n", | |
" <td>06p22.3</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:49394</td>\n", | |
" <td>ENST00000565469.4|NM_001282492.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2100</th>\n", | |
" <td>HGNC:30898</td>\n", | |
" <td>AVPI1</td>\n", | |
" <td>arginine vasopressin induced 1</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>10q24.2</td>\n", | |
" <td>10q24.2</td>\n", | |
" <td>VIP32|PP5395|VIT32</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:30898</td>\n", | |
" <td>ENST00000370626.4|NM_021732.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2319</th>\n", | |
" <td>HGNC:27413</td>\n", | |
" <td>BCLAF3</td>\n", | |
" <td>BCLAF1 and THRAP3 family member 3</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>Xp22.12</td>\n", | |
" <td>Xp22.12</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27413</td>\n", | |
" <td>ENST00000379682.9|NM_001367774.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2349</th>\n", | |
" <td>HGNC:24160</td>\n", | |
" <td>BEAN1</td>\n", | |
" <td>brain expressed associated with NEDD4 1</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>16q21</td>\n", | |
" <td>16q21</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:24160</td>\n", | |
" <td>ENST00000536005.7|NM_001178020.3</td>\n", | |
" <td>HGNC:24160</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2638</th>\n", | |
" <td>HGNC:24742</td>\n", | |
" <td>BRD3OS</td>\n", | |
" <td>BRD3 opposite strand</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>9q34.2</td>\n", | |
" <td>09q34.2</td>\n", | |
" <td>FLJ35348|bA374P20.3|SERLOC</td>\n", | |
" <td>Super enhancer and ERK1/2 Regulated Long Inter...</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>LINC00094</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:24742</td>\n", | |
" <td>ENST00000603928.3|NM_001355256.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2726</th>\n", | |
" <td>HGNC:33758</td>\n", | |
" <td>BTBD17</td>\n", | |
" <td>BTB domain containing 17</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>17q25.1</td>\n", | |
" <td>17q25.1</td>\n", | |
" <td>LGALS3BPL|BTBD17A|TANGO10A</td>\n", | |
" <td>transport and golgi organization 10 homolog A ...</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:33758</td>\n", | |
" <td>ENST00000375366.4|NM_001080466.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2831</th>\n", | |
" <td>HGNC:28667</td>\n", | |
" <td>C1orf116</td>\n", | |
" <td>chromosome 1 open reading frame 116</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1q32.1</td>\n", | |
" <td>01q32.1</td>\n", | |
" <td>SARG|FLJ36507|MGC2742|MGC4309</td>\n", | |
" <td>specifically androgen-regulated gene</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28667</td>\n", | |
" <td>ENST00000359470.6|NM_023938.6</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2839</th>\n", | |
" <td>HGNC:25262</td>\n", | |
" <td>C1orf167</td>\n", | |
" <td>chromosome 1 open reading frame 167</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1p36.22</td>\n", | |
" <td>01p36.22</td>\n", | |
" <td>DKFZp434E1410|RP11-56N19.2</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:25262</td>\n", | |
" <td>ENST00000688073.1|NM_001010881.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2841</th>\n", | |
" <td>HGNC:27915</td>\n", | |
" <td>C1orf174</td>\n", | |
" <td>chromosome 1 open reading frame 174</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1p36.32</td>\n", | |
" <td>01p36.32</td>\n", | |
" <td>RP13-531C17.2</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27915</td>\n", | |
" <td>ENST00000361605.4|NM_207356.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2844</th>\n", | |
" <td>HGNC:56760</td>\n", | |
" <td>C1orf202</td>\n", | |
" <td>chromosome 1 open reading frame 202</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>1q44</td>\n", | |
" <td>01q44</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>ENST00000640271.3|NM_001395959.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>...</th>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43483</th>\n", | |
" <td>HGNC:32284</td>\n", | |
" <td>ZNF705B</td>\n", | |
" <td>zinc finger protein 705B</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>8p23.1</td>\n", | |
" <td>08p23.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32284</td>\n", | |
" <td>ENST00000400120.3|NM_001193630.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43497</th>\n", | |
" <td>HGNC:32458</td>\n", | |
" <td>ZNF716</td>\n", | |
" <td>zinc finger protein 716</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7p11.2</td>\n", | |
" <td>07p11.2</td>\n", | |
" <td>FLJ46189</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32458</td>\n", | |
" <td>ENST00000420713.2|NM_001159279.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43501</th>\n", | |
" <td>HGNC:22571</td>\n", | |
" <td>ZNF722</td>\n", | |
" <td>zinc finger protein 722</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7q11.21</td>\n", | |
" <td>07q11.21</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:22571</td>\n", | |
" <td>ENST00000330020.5|NM_001396012.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43502</th>\n", | |
" <td>HGNC:32286</td>\n", | |
" <td>ZNF723</td>\n", | |
" <td>zinc finger protein 723</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19p12</td>\n", | |
" <td>19p12</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32286</td>\n", | |
" <td>ENST00000600766.3|NM_001349726.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43503</th>\n", | |
" <td>HGNC:32460</td>\n", | |
" <td>ZNF724</td>\n", | |
" <td>zinc finger protein 724</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19p12</td>\n", | |
" <td>19p12</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32460</td>\n", | |
" <td>ENST00000418100.6|NM_001355404.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43510</th>\n", | |
" <td>HGNC:32470</td>\n", | |
" <td>ZNF730</td>\n", | |
" <td>zinc finger protein 730</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19p12</td>\n", | |
" <td>19p12</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:32470</td>\n", | |
" <td>ENST00000597761.7|NM_001277403.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43531</th>\n", | |
" <td>HGNC:27465</td>\n", | |
" <td>ZNF740</td>\n", | |
" <td>zinc finger protein 740</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>12q13.13</td>\n", | |
" <td>12q13.13</td>\n", | |
" <td>Zfp740</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27465</td>\n", | |
" <td>ENST00000416904.5|NM_001004304.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43537</th>\n", | |
" <td>HGNC:23179</td>\n", | |
" <td>ZNF761</td>\n", | |
" <td>zinc finger protein 761</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.42</td>\n", | |
" <td>19q13.42</td>\n", | |
" <td>KIAA2033|FLJ16231|FLJ35333</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:23179</td>\n", | |
" <td>ENST00000684525.1|NM_001289951.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43538</th>\n", | |
" <td>HGNC:27614</td>\n", | |
" <td>ZNF763</td>\n", | |
" <td>zinc finger protein 763</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19p13.2</td>\n", | |
" <td>19p13.2</td>\n", | |
" <td>ZNF440L</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27614</td>\n", | |
" <td>ENST00000358987.8|NM_001367172.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43541</th>\n", | |
" <td>HGNC:28063</td>\n", | |
" <td>ZNF766</td>\n", | |
" <td>zinc finger protein 766</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.41</td>\n", | |
" <td>19q13.41</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28063</td>\n", | |
" <td>ENST00000439461.6|NM_001010851.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43545</th>\n", | |
" <td>HGNC:29653</td>\n", | |
" <td>ZNF771</td>\n", | |
" <td>zinc finger protein 771</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>16p11.2</td>\n", | |
" <td>16p11.2</td>\n", | |
" <td>DSC43</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:29653</td>\n", | |
" <td>ENST00000319296.10|NM_001142305.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43547</th>\n", | |
" <td>HGNC:30487</td>\n", | |
" <td>ZNF773</td>\n", | |
" <td>zinc finger protein 773</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>MGC4728</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:30487</td>\n", | |
" <td>ENST00000282292.9|NM_198542.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43557</th>\n", | |
" <td>HGNC:26745</td>\n", | |
" <td>ZNF781</td>\n", | |
" <td>zinc finger protein 781</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>FLJ37549</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:26745</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43559</th>\n", | |
" <td>HGNC:27222</td>\n", | |
" <td>ZNF783</td>\n", | |
" <td>zinc finger protein 783</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7q36.1</td>\n", | |
" <td>07q36.1</td>\n", | |
" <td>DKFZp667J212</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27222</td>\n", | |
" <td>ENST00000434415.6|NM_001195220.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43562</th>\n", | |
" <td>HGNC:21806</td>\n", | |
" <td>ZNF786</td>\n", | |
" <td>zinc finger protein 786</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>7q36.1</td>\n", | |
" <td>07q36.1</td>\n", | |
" <td>DKFZp762I137</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:21806</td>\n", | |
" <td>ENST00000491431.2|NM_152411.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43563</th>\n", | |
" <td>HGNC:26998</td>\n", | |
" <td>ZNF787</td>\n", | |
" <td>zinc finger protein 787</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:26998</td>\n", | |
" <td>ENST00000610935.2|NM_001002836.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43566</th>\n", | |
" <td>HGNC:33114</td>\n", | |
" <td>ZNF790</td>\n", | |
" <td>zinc finger protein 790</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>MGC62100|FLJ20350</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:33114</td>\n", | |
" <td>ENST00000356725.9|NM_206894.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43581</th>\n", | |
" <td>HGNC:33258</td>\n", | |
" <td>ZNF814</td>\n", | |
" <td>zinc finger protein 814</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>19q13.43</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:33258</td>\n", | |
" <td>ENST00000435989.7|NM_001144989.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43590</th>\n", | |
" <td>HGNC:34032</td>\n", | |
" <td>ZNF829</td>\n", | |
" <td>zinc finger protein 829</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>19q13.12</td>\n", | |
" <td>DKFZp779O175</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:34032</td>\n", | |
" <td>ENST00000391711.8|NM_001037232.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43591</th>\n", | |
" <td>HGNC:28291</td>\n", | |
" <td>ZNF830</td>\n", | |
" <td>zinc finger protein 830</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>17q12</td>\n", | |
" <td>17q12</td>\n", | |
" <td>MGC20398|OMCG1</td>\n", | |
" <td>orphan maintenance of genome 1</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28291</td>\n", | |
" <td>ENST00000361952.5|NM_052857.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43600</th>\n", | |
" <td>HGNC:27611</td>\n", | |
" <td>ZNF841</td>\n", | |
" <td>zinc finger protein 841</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.41</td>\n", | |
" <td>19q13.41</td>\n", | |
" <td>LOC284371</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27611</td>\n", | |
" <td>ENST00000594440.6|NM_001136499.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43601</th>\n", | |
" <td>HGNC:28710</td>\n", | |
" <td>ZNF843</td>\n", | |
" <td>zinc finger protein 843</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>16p11.2</td>\n", | |
" <td>16p11.2</td>\n", | |
" <td>MGC46336</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:28710</td>\n", | |
" <td>ENST00000315678.10|NM_001136509.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43603</th>\n", | |
" <td>HGNC:25112</td>\n", | |
" <td>ZNF845</td>\n", | |
" <td>zinc finger protein 845</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>19q13.42</td>\n", | |
" <td>19q13.42</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:25112</td>\n", | |
" <td>ENST00000458035.3|NM_138374.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43609</th>\n", | |
" <td>HGNC:27713</td>\n", | |
" <td>ZNF852</td>\n", | |
" <td>zinc finger protein 852</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>3p21.31</td>\n", | |
" <td>03p21.31</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:27713</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43612</th>\n", | |
" <td>HGNC:34513</td>\n", | |
" <td>ZNF860</td>\n", | |
" <td>zinc finger protein 860</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>3p24.1</td>\n", | |
" <td>03p24.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:34513</td>\n", | |
" <td>ENST00000360311.5|NM_001137674.3</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43632</th>\n", | |
" <td>HGNC:38707</td>\n", | |
" <td>ZNF892</td>\n", | |
" <td>zinc finger protein 892</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>2q11.1</td>\n", | |
" <td>02q11.1</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>ENST00000425953.6|NM_001395961.1</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43692</th>\n", | |
" <td>HGNC:12984</td>\n", | |
" <td>ZSCAN9</td>\n", | |
" <td>zinc finger and SCAN domain containing 9</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>6p22.1</td>\n", | |
" <td>06p22.1</td>\n", | |
" <td>PRD51</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:12984</td>\n", | |
" <td>ENST00000252207.10|NM_006299.5</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43704</th>\n", | |
" <td>HGNC:12978</td>\n", | |
" <td>ZSCAN26</td>\n", | |
" <td>zinc finger and SCAN domain containing 26</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>6p22.1</td>\n", | |
" <td>06p22.1</td>\n", | |
" <td>SRE-ZBP</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:12978</td>\n", | |
" <td>ENST00000421553.7|NM_001023560.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43706</th>\n", | |
" <td>HGNC:33517</td>\n", | |
" <td>ZSCAN30</td>\n", | |
" <td>zinc finger and SCAN domain containing 30</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>18q12.2</td>\n", | |
" <td>18q12.2</td>\n", | |
" <td>ZNF917</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:33517</td>\n", | |
" <td>ENST00000333206.10|NM_001112734.4</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43708</th>\n", | |
" <td>HGNC:20812</td>\n", | |
" <td>ZSCAN32</td>\n", | |
" <td>zinc finger and SCAN domain containing 32</td>\n", | |
" <td>protein-coding gene</td>\n", | |
" <td>gene with protein product</td>\n", | |
" <td>Approved</td>\n", | |
" <td>16p13.3</td>\n", | |
" <td>16p13.3</td>\n", | |
" <td>FLJ20417</td>\n", | |
" <td>NaN</td>\n", | |
" <td>...</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>NaN</td>\n", | |
" <td>HGNC:20812</td>\n", | |
" <td>ENST00000396852.9|NM_001284527.2</td>\n", | |
" <td>NaN</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"<p>669 rows × 54 columns</p>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" hgnc_id symbol \\\n", | |
"19 HGNC:32038 AADACL4 \n", | |
"195 HGNC:34391 ACCSL \n", | |
"346 HGNC:37282 ACTR3C \n", | |
"358 HGNC:24022 ACTRT3 \n", | |
"1015 HGNC:40024 ANHX \n", | |
"1036 HGNC:20987 ANKMY1 \n", | |
"1044 HGNC:20265 ANKRD10 \n", | |
"1099 HGNC:35167 ANKRD30BL \n", | |
"1117 HGNC:27639 ANKRD34A \n", | |
"1129 HGNC:28640 ANKRD39 \n", | |
"1132 HGNC:26080 ANKRD40CL \n", | |
"1152 HGNC:16217 ANKRD60 \n", | |
"1153 HGNC:22467 ANKRD61 \n", | |
"1157 HGNC:40027 ANKRD63 \n", | |
"1158 HGNC:42950 ANKRD65 \n", | |
"1160 HGNC:44669 ANKRD66 \n", | |
"1230 HGNC:28808 AP1AR \n", | |
"1386 HGNC:25365 ARB2A \n", | |
"1596 HGNC:44201 ARL14EPL \n", | |
"1625 HGNC:34345 ARMH1 \n", | |
"1626 HGNC:49394 ARMH2 \n", | |
"2100 HGNC:30898 AVPI1 \n", | |
"2319 HGNC:27413 BCLAF3 \n", | |
"2349 HGNC:24160 BEAN1 \n", | |
"2638 HGNC:24742 BRD3OS \n", | |
"2726 HGNC:33758 BTBD17 \n", | |
"2831 HGNC:28667 C1orf116 \n", | |
"2839 HGNC:25262 C1orf167 \n", | |
"2841 HGNC:27915 C1orf174 \n", | |
"2844 HGNC:56760 C1orf202 \n", | |
"... ... ... \n", | |
"43483 HGNC:32284 ZNF705B \n", | |
"43497 HGNC:32458 ZNF716 \n", | |
"43501 HGNC:22571 ZNF722 \n", | |
"43502 HGNC:32286 ZNF723 \n", | |
"43503 HGNC:32460 ZNF724 \n", | |
"43510 HGNC:32470 ZNF730 \n", | |
"43531 HGNC:27465 ZNF740 \n", | |
"43537 HGNC:23179 ZNF761 \n", | |
"43538 HGNC:27614 ZNF763 \n", | |
"43541 HGNC:28063 ZNF766 \n", | |
"43545 HGNC:29653 ZNF771 \n", | |
"43547 HGNC:30487 ZNF773 \n", | |
"43557 HGNC:26745 ZNF781 \n", | |
"43559 HGNC:27222 ZNF783 \n", | |
"43562 HGNC:21806 ZNF786 \n", | |
"43563 HGNC:26998 ZNF787 \n", | |
"43566 HGNC:33114 ZNF790 \n", | |
"43581 HGNC:33258 ZNF814 \n", | |
"43590 HGNC:34032 ZNF829 \n", | |
"43591 HGNC:28291 ZNF830 \n", | |
"43600 HGNC:27611 ZNF841 \n", | |
"43601 HGNC:28710 ZNF843 \n", | |
"43603 HGNC:25112 ZNF845 \n", | |
"43609 HGNC:27713 ZNF852 \n", | |
"43612 HGNC:34513 ZNF860 \n", | |
"43632 HGNC:38707 ZNF892 \n", | |
"43692 HGNC:12984 ZSCAN9 \n", | |
"43704 HGNC:12978 ZSCAN26 \n", | |
"43706 HGNC:33517 ZSCAN30 \n", | |
"43708 HGNC:20812 ZSCAN32 \n", | |
"\n", | |
" name locus_group \\\n", | |
"19 arylacetamide deacetylase like 4 protein-coding gene \n", | |
"195 1-aminocyclopropane-1-carboxylate synthase hom... protein-coding gene \n", | |
"346 actin related protein 3C protein-coding gene \n", | |
"358 actin related protein T3 protein-coding gene \n", | |
"1015 anomalous homeobox protein-coding gene \n", | |
"1036 ankyrin repeat and MYND domain containing 1 protein-coding gene \n", | |
"1044 ankyrin repeat domain 10 protein-coding gene \n", | |
"1099 ankyrin repeat domain 30B like protein-coding gene \n", | |
"1117 ankyrin repeat domain 34A protein-coding gene \n", | |
"1129 ankyrin repeat domain 39 protein-coding gene \n", | |
"1132 ANKRD40 C-terminal like protein-coding gene \n", | |
"1152 ankyrin repeat domain 60 protein-coding gene \n", | |
"1153 ankyrin repeat domain 61 protein-coding gene \n", | |
"1157 ankyrin repeat domain 63 protein-coding gene \n", | |
"1158 ankyrin repeat domain 65 protein-coding gene \n", | |
"1160 ankyrin repeat domain 66 protein-coding gene \n", | |
"1230 adaptor related protein complex 1 associated r... protein-coding gene \n", | |
"1386 ARB2 cotranscriptional regulator A protein-coding gene \n", | |
"1596 ADP ribosylation factor like GTPase 14 effecto... protein-coding gene \n", | |
"1625 armadillo like helical domain containing 1 protein-coding gene \n", | |
"1626 armadillo like helical domain containing 2 protein-coding gene \n", | |
"2100 arginine vasopressin induced 1 protein-coding gene \n", | |
"2319 BCLAF1 and THRAP3 family member 3 protein-coding gene \n", | |
"2349 brain expressed associated with NEDD4 1 protein-coding gene \n", | |
"2638 BRD3 opposite strand protein-coding gene \n", | |
"2726 BTB domain containing 17 protein-coding gene \n", | |
"2831 chromosome 1 open reading frame 116 protein-coding gene \n", | |
"2839 chromosome 1 open reading frame 167 protein-coding gene \n", | |
"2841 chromosome 1 open reading frame 174 protein-coding gene \n", | |
"2844 chromosome 1 open reading frame 202 protein-coding gene \n", | |
"... ... ... \n", | |
"43483 zinc finger protein 705B protein-coding gene \n", | |
"43497 zinc finger protein 716 protein-coding gene \n", | |
"43501 zinc finger protein 722 protein-coding gene \n", | |
"43502 zinc finger protein 723 protein-coding gene \n", | |
"43503 zinc finger protein 724 protein-coding gene \n", | |
"43510 zinc finger protein 730 protein-coding gene \n", | |
"43531 zinc finger protein 740 protein-coding gene \n", | |
"43537 zinc finger protein 761 protein-coding gene \n", | |
"43538 zinc finger protein 763 protein-coding gene \n", | |
"43541 zinc finger protein 766 protein-coding gene \n", | |
"43545 zinc finger protein 771 protein-coding gene \n", | |
"43547 zinc finger protein 773 protein-coding gene \n", | |
"43557 zinc finger protein 781 protein-coding gene \n", | |
"43559 zinc finger protein 783 protein-coding gene \n", | |
"43562 zinc finger protein 786 protein-coding gene \n", | |
"43563 zinc finger protein 787 protein-coding gene \n", | |
"43566 zinc finger protein 790 protein-coding gene \n", | |
"43581 zinc finger protein 814 protein-coding gene \n", | |
"43590 zinc finger protein 829 protein-coding gene \n", | |
"43591 zinc finger protein 830 protein-coding gene \n", | |
"43600 zinc finger protein 841 protein-coding gene \n", | |
"43601 zinc finger protein 843 protein-coding gene \n", | |
"43603 zinc finger protein 845 protein-coding gene \n", | |
"43609 zinc finger protein 852 protein-coding gene \n", | |
"43612 zinc finger protein 860 protein-coding gene \n", | |
"43632 zinc finger protein 892 protein-coding gene \n", | |
"43692 zinc finger and SCAN domain containing 9 protein-coding gene \n", | |
"43704 zinc finger and SCAN domain containing 26 protein-coding gene \n", | |
"43706 zinc finger and SCAN domain containing 30 protein-coding gene \n", | |
"43708 zinc finger and SCAN domain containing 32 protein-coding gene \n", | |
"\n", | |
" locus_type status location location_sortable \\\n", | |
"19 gene with protein product Approved 1p36.21 01p36.21 \n", | |
"195 gene with protein product Approved 11p11.2 11p11.2 \n", | |
"346 gene with protein product Approved 7q36.1 07q36.1 \n", | |
"358 gene with protein product Approved 3q26.2 03q26.2 \n", | |
"1015 gene with protein product Approved 12q24.33 12q24.33 \n", | |
"1036 gene with protein product Approved 2q37.3 02q37.3 \n", | |
"1044 gene with protein product Approved 13q34 13q34 \n", | |
"1099 gene with protein product Approved 2q21.2 02q21.2 \n", | |
"1117 gene with protein product Approved 1q21.1 01q21.1 \n", | |
"1129 gene with protein product Approved 2q11.2 02q11.2 \n", | |
"1132 gene with protein product Approved 17q21.33 17q21.33 \n", | |
"1152 gene with protein product Approved 20q13.32 20q13.32 \n", | |
"1153 gene with protein product Approved 7p22.1 07p22.1 \n", | |
"1157 gene with protein product Approved 15q15.1 15q15.1 \n", | |
"1158 gene with protein product Approved 1p36.33 01p36.33 \n", | |
"1160 gene with protein product Approved 6p12.3 06p12.3 \n", | |
"1230 gene with protein product Approved 4q25 04q25 \n", | |
"1386 gene with protein product Approved 5q15 05q15 \n", | |
"1596 gene with protein product Approved 5q23.1 05q23.1 \n", | |
"1625 gene with protein product Approved 1p34.1 01p34.1 \n", | |
"1626 gene with protein product Approved 6p22.3 06p22.3 \n", | |
"2100 gene with protein product Approved 10q24.2 10q24.2 \n", | |
"2319 gene with protein product Approved Xp22.12 Xp22.12 \n", | |
"2349 gene with protein product Approved 16q21 16q21 \n", | |
"2638 gene with protein product Approved 9q34.2 09q34.2 \n", | |
"2726 gene with protein product Approved 17q25.1 17q25.1 \n", | |
"2831 gene with protein product Approved 1q32.1 01q32.1 \n", | |
"2839 gene with protein product Approved 1p36.22 01p36.22 \n", | |
"2841 gene with protein product Approved 1p36.32 01p36.32 \n", | |
"2844 gene with protein product Approved 1q44 01q44 \n", | |
"... ... ... ... ... \n", | |
"43483 gene with protein product Approved 8p23.1 08p23.1 \n", | |
"43497 gene with protein product Approved 7p11.2 07p11.2 \n", | |
"43501 gene with protein product Approved 7q11.21 07q11.21 \n", | |
"43502 gene with protein product Approved 19p12 19p12 \n", | |
"43503 gene with protein product Approved 19p12 19p12 \n", | |
"43510 gene with protein product Approved 19p12 19p12 \n", | |
"43531 gene with protein product Approved 12q13.13 12q13.13 \n", | |
"43537 gene with protein product Approved 19q13.42 19q13.42 \n", | |
"43538 gene with protein product Approved 19p13.2 19p13.2 \n", | |
"43541 gene with protein product Approved 19q13.41 19q13.41 \n", | |
"43545 gene with protein product Approved 16p11.2 16p11.2 \n", | |
"43547 gene with protein product Approved 19q13.43 19q13.43 \n", | |
"43557 gene with protein product Approved 19q13.12 19q13.12 \n", | |
"43559 gene with protein product Approved 7q36.1 07q36.1 \n", | |
"43562 gene with protein product Approved 7q36.1 07q36.1 \n", | |
"43563 gene with protein product Approved 19q13.43 19q13.43 \n", | |
"43566 gene with protein product Approved 19q13.12 19q13.12 \n", | |
"43581 gene with protein product Approved 19q13.43 19q13.43 \n", | |
"43590 gene with protein product Approved 19q13.12 19q13.12 \n", | |
"43591 gene with protein product Approved 17q12 17q12 \n", | |
"43600 gene with protein product Approved 19q13.41 19q13.41 \n", | |
"43601 gene with protein product Approved 16p11.2 16p11.2 \n", | |
"43603 gene with protein product Approved 19q13.42 19q13.42 \n", | |
"43609 gene with protein product Approved 3p21.31 03p21.31 \n", | |
"43612 gene with protein product Approved 3p24.1 03p24.1 \n", | |
"43632 gene with protein product Approved 2q11.1 02q11.1 \n", | |
"43692 gene with protein product Approved 6p22.1 06p22.1 \n", | |
"43704 gene with protein product Approved 6p22.1 06p22.1 \n", | |
"43706 gene with protein product Approved 18q12.2 18q12.2 \n", | |
"43708 gene with protein product Approved 16p13.3 16p13.3 \n", | |
"\n", | |
" alias_symbol \\\n", | |
"19 OTTHUMG00000001889 \n", | |
"195 NaN \n", | |
"346 ARP11 \n", | |
"358 ARPM1 \n", | |
"1015 NaN \n", | |
"1036 FLJ20499|ZMYND13 \n", | |
"1044 FLJ20093 \n", | |
"1099 NaN \n", | |
"1117 NaN \n", | |
"1129 MGC41816 \n", | |
"1132 FLJ20694 \n", | |
"1152 bA196N14.3 \n", | |
"1153 NaN \n", | |
"1157 NaN \n", | |
"1158 NaN \n", | |
"1160 NaN \n", | |
"1230 PRO0971|2C18|gamma-BAR \n", | |
"1386 DKFZP564D172|Toupee \n", | |
"1596 NaN \n", | |
"1625 MGC33556|p40 \n", | |
"1626 NaN \n", | |
"2100 VIP32|PP5395|VIT32 \n", | |
"2319 NaN \n", | |
"2349 NaN \n", | |
"2638 FLJ35348|bA374P20.3|SERLOC \n", | |
"2726 LGALS3BPL|BTBD17A|TANGO10A \n", | |
"2831 SARG|FLJ36507|MGC2742|MGC4309 \n", | |
"2839 DKFZp434E1410|RP11-56N19.2 \n", | |
"2841 RP13-531C17.2 \n", | |
"2844 NaN \n", | |
"... ... \n", | |
"43483 NaN \n", | |
"43497 FLJ46189 \n", | |
"43501 NaN \n", | |
"43502 NaN \n", | |
"43503 NaN \n", | |
"43510 NaN \n", | |
"43531 Zfp740 \n", | |
"43537 KIAA2033|FLJ16231|FLJ35333 \n", | |
"43538 ZNF440L \n", | |
"43541 NaN \n", | |
"43545 DSC43 \n", | |
"43547 MGC4728 \n", | |
"43557 FLJ37549 \n", | |
"43559 DKFZp667J212 \n", | |
"43562 DKFZp762I137 \n", | |
"43563 NaN \n", | |
"43566 MGC62100|FLJ20350 \n", | |
"43581 NaN \n", | |
"43590 DKFZp779O175 \n", | |
"43591 MGC20398|OMCG1 \n", | |
"43600 LOC284371 \n", | |
"43601 MGC46336 \n", | |
"43603 NaN \n", | |
"43609 NaN \n", | |
"43612 NaN \n", | |
"43632 NaN \n", | |
"43692 PRD51 \n", | |
"43704 SRE-ZBP \n", | |
"43706 ZNF917 \n", | |
"43708 FLJ20417 \n", | |
"\n", | |
" alias_name ... cd lncrnadb \\\n", | |
"19 NaN ... NaN NaN \n", | |
"195 NaN ... NaN NaN \n", | |
"346 NaN ... NaN NaN \n", | |
"358 actin related protein M1 ... NaN NaN \n", | |
"1015 NaN ... NaN NaN \n", | |
"1036 NaN ... NaN NaN \n", | |
"1044 NaN ... NaN NaN \n", | |
"1099 NaN ... NaN NaN \n", | |
"1117 NaN ... NaN NaN \n", | |
"1129 NaN ... NaN NaN \n", | |
"1132 NaN ... NaN NaN \n", | |
"1152 NaN ... NaN NaN \n", | |
"1153 NaN ... NaN NaN \n", | |
"1157 NaN ... NaN NaN \n", | |
"1158 NaN ... NaN NaN \n", | |
"1160 NaN ... NaN NaN \n", | |
"1230 gamma1-adaptin brefeldin A resistance ... NaN NaN \n", | |
"1386 NaN ... NaN NaN \n", | |
"1596 NaN ... NaN NaN \n", | |
"1625 NaN ... NaN NaN \n", | |
"1626 NaN ... NaN NaN \n", | |
"2100 NaN ... NaN NaN \n", | |
"2319 NaN ... NaN NaN \n", | |
"2349 NaN ... NaN NaN \n", | |
"2638 Super enhancer and ERK1/2 Regulated Long Inter... ... NaN NaN \n", | |
"2726 transport and golgi organization 10 homolog A ... ... NaN NaN \n", | |
"2831 specifically androgen-regulated gene ... NaN NaN \n", | |
"2839 NaN ... NaN NaN \n", | |
"2841 NaN ... NaN NaN \n", | |
"2844 NaN ... NaN NaN \n", | |
"... ... ... ... ... \n", | |
"43483 NaN ... NaN NaN \n", | |
"43497 NaN ... NaN NaN \n", | |
"43501 NaN ... NaN NaN \n", | |
"43502 NaN ... NaN NaN \n", | |
"43503 NaN ... NaN NaN \n", | |
"43510 NaN ... NaN NaN \n", | |
"43531 NaN ... NaN NaN \n", | |
"43537 NaN ... NaN NaN \n", | |
"43538 NaN ... NaN NaN \n", | |
"43541 NaN ... NaN NaN \n", | |
"43545 NaN ... NaN NaN \n", | |
"43547 NaN ... NaN NaN \n", | |
"43557 NaN ... NaN NaN \n", | |
"43559 NaN ... NaN NaN \n", | |
"43562 NaN ... NaN NaN \n", | |
"43563 NaN ... NaN NaN \n", | |
"43566 NaN ... NaN NaN \n", | |
"43581 NaN ... NaN NaN \n", | |
"43590 NaN ... NaN NaN \n", | |
"43591 orphan maintenance of genome 1 ... NaN NaN \n", | |
"43600 NaN ... NaN NaN \n", | |
"43601 NaN ... NaN NaN \n", | |
"43603 NaN ... NaN NaN \n", | |
"43609 NaN ... NaN NaN \n", | |
"43612 NaN ... NaN NaN \n", | |
"43632 NaN ... NaN NaN \n", | |
"43692 NaN ... NaN NaN \n", | |
"43704 NaN ... NaN NaN \n", | |
"43706 NaN ... NaN NaN \n", | |
"43708 NaN ... NaN NaN \n", | |
"\n", | |
" enzyme_id intermediate_filament_db rna_central_ids lncipedia gtrnadb \\\n", | |
"19 NaN NaN NaN NaN NaN \n", | |
"195 NaN NaN NaN NaN NaN \n", | |
"346 NaN NaN NaN NaN NaN \n", | |
"358 NaN NaN NaN NaN NaN \n", | |
"1015 NaN NaN NaN NaN NaN \n", | |
"1036 NaN NaN NaN NaN NaN \n", | |
"1044 NaN NaN NaN NaN NaN \n", | |
"1099 NaN NaN NaN NaN NaN \n", | |
"1117 NaN NaN NaN NaN NaN \n", | |
"1129 NaN NaN NaN NaN NaN \n", | |
"1132 NaN NaN NaN LINC00483 NaN \n", | |
"1152 NaN NaN NaN NaN NaN \n", | |
"1153 NaN NaN NaN NaN NaN \n", | |
"1157 NaN NaN NaN NaN NaN \n", | |
"1158 NaN NaN NaN NaN NaN \n", | |
"1160 NaN NaN NaN NaN NaN \n", | |
"1230 NaN NaN NaN NaN NaN \n", | |
"1386 NaN NaN NaN NaN NaN \n", | |
"1596 NaN NaN NaN NaN NaN \n", | |
"1625 NaN NaN NaN NaN NaN \n", | |
"1626 NaN NaN NaN NaN NaN \n", | |
"2100 NaN NaN NaN NaN NaN \n", | |
"2319 NaN NaN NaN NaN NaN \n", | |
"2349 NaN NaN NaN NaN NaN \n", | |
"2638 NaN NaN NaN LINC00094 NaN \n", | |
"2726 NaN NaN NaN NaN NaN \n", | |
"2831 NaN NaN NaN NaN NaN \n", | |
"2839 NaN NaN NaN NaN NaN \n", | |
"2841 NaN NaN NaN NaN NaN \n", | |
"2844 NaN NaN NaN NaN NaN \n", | |
"... ... ... ... ... ... \n", | |
"43483 NaN NaN NaN NaN NaN \n", | |
"43497 NaN NaN NaN NaN NaN \n", | |
"43501 NaN NaN NaN NaN NaN \n", | |
"43502 NaN NaN NaN NaN NaN \n", | |
"43503 NaN NaN NaN NaN NaN \n", | |
"43510 NaN NaN NaN NaN NaN \n", | |
"43531 NaN NaN NaN NaN NaN \n", | |
"43537 NaN NaN NaN NaN NaN \n", | |
"43538 NaN NaN NaN NaN NaN \n", | |
"43541 NaN NaN NaN NaN NaN \n", | |
"43545 NaN NaN NaN NaN NaN \n", | |
"43547 NaN NaN NaN NaN NaN \n", | |
"43557 NaN NaN NaN NaN NaN \n", | |
"43559 NaN NaN NaN NaN NaN \n", | |
"43562 NaN NaN NaN NaN NaN \n", | |
"43563 NaN NaN NaN NaN NaN \n", | |
"43566 NaN NaN NaN NaN NaN \n", | |
"43581 NaN NaN NaN NaN NaN \n", | |
"43590 NaN NaN NaN NaN NaN \n", | |
"43591 NaN NaN NaN NaN NaN \n", | |
"43600 NaN NaN NaN NaN NaN \n", | |
"43601 NaN NaN NaN NaN NaN \n", | |
"43603 NaN NaN NaN NaN NaN \n", | |
"43609 NaN NaN NaN NaN NaN \n", | |
"43612 NaN NaN NaN NaN NaN \n", | |
"43632 NaN NaN NaN NaN NaN \n", | |
"43692 NaN NaN NaN NaN NaN \n", | |
"43704 NaN NaN NaN NaN NaN \n", | |
"43706 NaN NaN NaN NaN NaN \n", | |
"43708 NaN NaN NaN NaN NaN \n", | |
"\n", | |
" agr mane_select gencc \n", | |
"19 HGNC:32038 ENST00000376221.2|NM_001013630.2 NaN \n", | |
"195 HGNC:34391 ENST00000378832.1|NM_001031854.2 NaN \n", | |
"346 HGNC:37282 ENST00000683684.1|NM_001164458.2 NaN \n", | |
"358 HGNC:24022 ENST00000330368.3|NM_032487.5 NaN \n", | |
"1015 HGNC:40024 ENST00000545940.6|NM_001372060.1 NaN \n", | |
"1036 HGNC:20987 ENST00000401804.6|NM_001282771.3 NaN \n", | |
"1044 HGNC:20265 ENST00000267339.6|NM_017664.4 NaN \n", | |
"1099 HGNC:35167 ENST00000409867.6|NM_001358416.1 NaN \n", | |
"1117 HGNC:27639 ENST00000606888.3|NM_001039888.4 NaN \n", | |
"1129 HGNC:28640 ENST00000393537.5|NM_016466.6 NaN \n", | |
"1132 HGNC:26080 ENST00000450727.6|NM_001358683.3 NaN \n", | |
"1152 HGNC:16217 ENST00000457363.2|NM_001304369.2 NaN \n", | |
"1153 HGNC:22467 ENST00000409061.2|NM_001271700.2 NaN \n", | |
"1157 HGNC:40027 ENST00000434396.2|NM_001190479.3 NaN \n", | |
"1158 HGNC:42950 ENST00000537107.6|NM_001145210.3 NaN \n", | |
"1160 HGNC:44669 ENST00000565422.3|NM_001162435.3 NaN \n", | |
"1230 HGNC:28808 ENST00000274000.10|NM_018569.6 NaN \n", | |
"1386 HGNC:25365 ENST00000395965.8|NM_032042.6 NaN \n", | |
"1596 HGNC:44201 ENST00000686077.1|NM_001195581.2 NaN \n", | |
"1625 HGNC:34345 ENST00000535358.6|NM_001145636.2 NaN \n", | |
"1626 HGNC:49394 ENST00000565469.4|NM_001282492.2 NaN \n", | |
"2100 HGNC:30898 ENST00000370626.4|NM_021732.3 NaN \n", | |
"2319 HGNC:27413 ENST00000379682.9|NM_001367774.2 NaN \n", | |
"2349 HGNC:24160 ENST00000536005.7|NM_001178020.3 HGNC:24160 \n", | |
"2638 HGNC:24742 ENST00000603928.3|NM_001355256.2 NaN \n", | |
"2726 HGNC:33758 ENST00000375366.4|NM_001080466.2 NaN \n", | |
"2831 HGNC:28667 ENST00000359470.6|NM_023938.6 NaN \n", | |
"2839 HGNC:25262 ENST00000688073.1|NM_001010881.2 NaN \n", | |
"2841 HGNC:27915 ENST00000361605.4|NM_207356.3 NaN \n", | |
"2844 NaN ENST00000640271.3|NM_001395959.1 NaN \n", | |
"... ... ... ... \n", | |
"43483 HGNC:32284 ENST00000400120.3|NM_001193630.1 NaN \n", | |
"43497 HGNC:32458 ENST00000420713.2|NM_001159279.1 NaN \n", | |
"43501 HGNC:22571 ENST00000330020.5|NM_001396012.1 NaN \n", | |
"43502 HGNC:32286 ENST00000600766.3|NM_001349726.2 NaN \n", | |
"43503 HGNC:32460 ENST00000418100.6|NM_001355404.2 NaN \n", | |
"43510 HGNC:32470 ENST00000597761.7|NM_001277403.2 NaN \n", | |
"43531 HGNC:27465 ENST00000416904.5|NM_001004304.4 NaN \n", | |
"43537 HGNC:23179 ENST00000684525.1|NM_001289951.2 NaN \n", | |
"43538 HGNC:27614 ENST00000358987.8|NM_001367172.2 NaN \n", | |
"43541 HGNC:28063 ENST00000439461.6|NM_001010851.3 NaN \n", | |
"43545 HGNC:29653 ENST00000319296.10|NM_001142305.2 NaN \n", | |
"43547 HGNC:30487 ENST00000282292.9|NM_198542.3 NaN \n", | |
"43557 HGNC:26745 NaN NaN \n", | |
"43559 HGNC:27222 ENST00000434415.6|NM_001195220.2 NaN \n", | |
"43562 HGNC:21806 ENST00000491431.2|NM_152411.4 NaN \n", | |
"43563 HGNC:26998 ENST00000610935.2|NM_001002836.4 NaN \n", | |
"43566 HGNC:33114 ENST00000356725.9|NM_206894.4 NaN \n", | |
"43581 HGNC:33258 ENST00000435989.7|NM_001144989.2 NaN \n", | |
"43590 HGNC:34032 ENST00000391711.8|NM_001037232.4 NaN \n", | |
"43591 HGNC:28291 ENST00000361952.5|NM_052857.4 NaN \n", | |
"43600 HGNC:27611 ENST00000594440.6|NM_001136499.2 NaN \n", | |
"43601 HGNC:28710 ENST00000315678.10|NM_001136509.3 NaN \n", | |
"43603 HGNC:25112 ENST00000458035.3|NM_138374.3 NaN \n", | |
"43609 HGNC:27713 NaN NaN \n", | |
"43612 HGNC:34513 ENST00000360311.5|NM_001137674.3 NaN \n", | |
"43632 NaN ENST00000425953.6|NM_001395961.1 NaN \n", | |
"43692 HGNC:12984 ENST00000252207.10|NM_006299.5 NaN \n", | |
"43704 HGNC:12978 ENST00000421553.7|NM_001023560.4 NaN \n", | |
"43706 HGNC:33517 ENST00000333206.10|NM_001112734.4 NaN \n", | |
"43708 HGNC:20812 ENST00000396852.9|NM_001284527.2 NaN \n", | |
"\n", | |
"[669 rows x 54 columns]" | |
] | |
}, | |
"execution_count": 25, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"# Inspect the HGNC records for the 669 unexplored genes\n", | |
"hgnc_unexp_df" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 26, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"19 NaN\n", | |
"195 NaN\n", | |
"346 NaN\n", | |
"358 NaN\n", | |
"1015 NaN\n", | |
"1036 NaN\n", | |
"1044 NaN\n", | |
"1099 2010-06-14\n", | |
"1117 2007-11-20\n", | |
"1129 NaN\n", | |
"1132 2018-05-17\n", | |
"1152 2008-03-25\n", | |
"1153 NaN\n", | |
"1157 NaN\n", | |
"1158 NaN\n", | |
"1160 NaN\n", | |
"1230 2009-09-25\n", | |
"1386 2023-08-18\n", | |
"1596 NaN\n", | |
"1625 2018-01-31\n", | |
"1626 2018-01-31\n", | |
"2100 NaN\n", | |
"2319 2017-06-09\n", | |
"2349 NaN\n", | |
"2638 2017-08-11\n", | |
"2726 NaN\n", | |
"2831 NaN\n", | |
"2839 NaN\n", | |
"2841 NaN\n", | |
"2844 NaN\n", | |
" ... \n", | |
"43483 NaN\n", | |
"43497 NaN\n", | |
"43501 2021-09-24\n", | |
"43502 2017-03-30\n", | |
"43503 2016-07-19\n", | |
"43510 NaN\n", | |
"43531 NaN\n", | |
"43537 2006-08-11\n", | |
"43538 NaN\n", | |
"43541 NaN\n", | |
"43545 NaN\n", | |
"43547 2006-12-15\n", | |
"43557 NaN\n", | |
"43559 NaN\n", | |
"43562 NaN\n", | |
"43563 NaN\n", | |
"43566 NaN\n", | |
"43581 NaN\n", | |
"43590 NaN\n", | |
"43591 2008-03-25\n", | |
"43600 NaN\n", | |
"43601 NaN\n", | |
"43603 NaN\n", | |
"43609 NaN\n", | |
"43612 NaN\n", | |
"43632 NaN\n", | |
"43692 2013-01-09\n", | |
"43704 2013-01-09\n", | |
"43706 2010-07-23\n", | |
"43708 2013-01-09\n", | |
"Name: date_symbol_changed, Length: 669, dtype: object" | |
] | |
}, | |
"execution_count": 26, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"hgnc_unexp_df['date_symbol_changed']" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 37, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/html": [ | |
"<div>\n", | |
"<style scoped>\n", | |
" .dataframe tbody tr th:only-of-type {\n", | |
" vertical-align: middle;\n", | |
" }\n", | |
"\n", | |
" .dataframe tbody tr th {\n", | |
" vertical-align: top;\n", | |
" }\n", | |
"\n", | |
" .dataframe thead th {\n", | |
" text-align: right;\n", | |
" }\n", | |
"</style>\n", | |
"<table border=\"1\" class=\"dataframe\">\n", | |
" <thead>\n", | |
" <tr style=\"text-align: right;\">\n", | |
" <th></th>\n", | |
" <th>symbol</th>\n", | |
" <th>date_symbol_changed</th>\n", | |
" <th>date_name_changed</th>\n", | |
" </tr>\n", | |
" </thead>\n", | |
" <tbody>\n", | |
" <tr>\n", | |
" <th>21287</th>\n", | |
" <td>MTCL3</td>\n", | |
" <td>2023-09-01</td>\n", | |
" <td>2023-09-01</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1386</th>\n", | |
" <td>ARB2A</td>\n", | |
" <td>2023-08-18</td>\n", | |
" <td>2023-08-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>22666</th>\n", | |
" <td>NHSL3</td>\n", | |
" <td>2023-08-18</td>\n", | |
" <td>2023-08-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8623</th>\n", | |
" <td>FAM90A11</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8624</th>\n", | |
" <td>FAM90A12</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8625</th>\n", | |
" <td>FAM90A13</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8627</th>\n", | |
" <td>FAM90A15</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8617</th>\n", | |
" <td>FAM90A5</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8632</th>\n", | |
" <td>FAM90A20</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8636</th>\n", | |
" <td>FAM90A24</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8615</th>\n", | |
" <td>FAM90A3</td>\n", | |
" <td>2023-08-17</td>\n", | |
" <td>2023-08-17</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4447</th>\n", | |
" <td>CFAP96</td>\n", | |
" <td>2023-05-03</td>\n", | |
" <td>2023-05-03</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4765</th>\n", | |
" <td>CIMIP2C</td>\n", | |
" <td>2023-04-27</td>\n", | |
" <td>2023-04-27</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4763</th>\n", | |
" <td>CIMIP2A</td>\n", | |
" <td>2023-04-27</td>\n", | |
" <td>2023-04-27</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4759</th>\n", | |
" <td>CIMAP1D</td>\n", | |
" <td>2023-04-27</td>\n", | |
" <td>2023-04-27</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>37293</th>\n", | |
" <td>SPMIP8</td>\n", | |
" <td>2023-04-27</td>\n", | |
" <td>2023-04-27</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>37289</th>\n", | |
" <td>SPMIP4</td>\n", | |
" <td>2023-04-27</td>\n", | |
" <td>2023-05-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8787</th>\n", | |
" <td>FAM200C</td>\n", | |
" <td>2022-10-19</td>\n", | |
" <td>2022-10-19</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>41601</th>\n", | |
" <td>UQCC5</td>\n", | |
" <td>2022-10-10</td>\n", | |
" <td>2022-10-10</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>4435</th>\n", | |
" <td>CFAP68</td>\n", | |
" <td>2022-09-29</td>\n", | |
" <td>2022-09-29</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>41600</th>\n", | |
" <td>UQCC4</td>\n", | |
" <td>2022-09-22</td>\n", | |
" <td>2022-09-22</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>26924</th>\n", | |
" <td>PRR23E</td>\n", | |
" <td>2022-09-15</td>\n", | |
" <td>2022-09-15</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>7516</th>\n", | |
" <td>EEIG2</td>\n", | |
" <td>2022-09-01</td>\n", | |
" <td>2022-09-01</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10517</th>\n", | |
" <td>GOLGA6L24</td>\n", | |
" <td>2022-08-24</td>\n", | |
" <td>2022-08-24</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10518</th>\n", | |
" <td>GOLGA6L25</td>\n", | |
" <td>2022-08-24</td>\n", | |
" <td>2022-08-24</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10647</th>\n", | |
" <td>GPR15LG</td>\n", | |
" <td>2022-05-30</td>\n", | |
" <td>2022-05-30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>25521</th>\n", | |
" <td>PIERCE2</td>\n", | |
" <td>2021-11-26</td>\n", | |
" <td>2021-11-26</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9996</th>\n", | |
" <td>GARIN6</td>\n", | |
" <td>2021-11-25</td>\n", | |
" <td>2021-11-25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9995</th>\n", | |
" <td>GARIN5B</td>\n", | |
" <td>2021-11-25</td>\n", | |
" <td>2021-11-25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>9989</th>\n", | |
" <td>GARIN1B</td>\n", | |
" <td>2021-11-25</td>\n", | |
" <td>2021-11-25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>...</th>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" <td>...</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1152</th>\n", | |
" <td>ANKRD60</td>\n", | |
" <td>2008-03-25</td>\n", | |
" <td>2008-03-25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23821</th>\n", | |
" <td>OR4K3</td>\n", | |
" <td>2008-01-23</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>18002</th>\n", | |
" <td>MAPK1IP1L</td>\n", | |
" <td>2008-01-16</td>\n", | |
" <td>2016-07-01</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24615</th>\n", | |
" <td>PABPC1L2B</td>\n", | |
" <td>2007-11-21</td>\n", | |
" <td>2016-03-30</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>1117</th>\n", | |
" <td>ANKRD34A</td>\n", | |
" <td>2007-11-20</td>\n", | |
" <td>2007-11-20</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>2984</th>\n", | |
" <td>C6orf52</td>\n", | |
" <td>2007-06-07</td>\n", | |
" <td>2007-06-07</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>10691</th>\n", | |
" <td>GPR89B</td>\n", | |
" <td>2007-06-06</td>\n", | |
" <td>2007-06-06</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>42907</th>\n", | |
" <td>ZKSCAN2</td>\n", | |
" <td>2007-02-20</td>\n", | |
" <td>2007-02-20</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>39164</th>\n", | |
" <td>TMEM185B</td>\n", | |
" <td>2007-02-05</td>\n", | |
" <td>2011-05-27</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>39148</th>\n", | |
" <td>TMEM183A</td>\n", | |
" <td>2006-12-18</td>\n", | |
" <td>2006-12-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43547</th>\n", | |
" <td>ZNF773</td>\n", | |
" <td>2006-12-15</td>\n", | |
" <td>2006-12-15</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43537</th>\n", | |
" <td>ZNF761</td>\n", | |
" <td>2006-08-11</td>\n", | |
" <td>2006-08-11</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43227</th>\n", | |
" <td>ZNF428</td>\n", | |
" <td>2006-07-04</td>\n", | |
" <td>2006-07-04</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8670</th>\n", | |
" <td>FAM118A</td>\n", | |
" <td>2006-04-26</td>\n", | |
" <td>2015-11-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>13461</th>\n", | |
" <td>IRGQ</td>\n", | |
" <td>2005-10-31</td>\n", | |
" <td>2016-06-13</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>35134</th>\n", | |
" <td>SFT2D1</td>\n", | |
" <td>2005-07-25</td>\n", | |
" <td>2005-07-25</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>8571</th>\n", | |
" <td>FAM78A</td>\n", | |
" <td>2005-07-18</td>\n", | |
" <td>2015-11-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>25953</th>\n", | |
" <td>PLGLB2</td>\n", | |
" <td>2005-03-31</td>\n", | |
" <td>2019-02-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24674</th>\n", | |
" <td>PAGE3</td>\n", | |
" <td>2005-01-27</td>\n", | |
" <td>2015-11-18</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>11450</th>\n", | |
" <td>HDHD3</td>\n", | |
" <td>2004-08-12</td>\n", | |
" <td>2015-12-01</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>34493</th>\n", | |
" <td>SAMD10</td>\n", | |
" <td>2004-07-16</td>\n", | |
" <td>2004-07-15</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>42579</th>\n", | |
" <td>YLPM1</td>\n", | |
" <td>2004-07-15</td>\n", | |
" <td>2004-07-15</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23973</th>\n", | |
" <td>OR5W2</td>\n", | |
" <td>2004-03-10</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23968</th>\n", | |
" <td>OR5T1</td>\n", | |
" <td>2004-03-10</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24361</th>\n", | |
" <td>OR51F1</td>\n", | |
" <td>2004-03-10</td>\n", | |
" <td>2020-05-01</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>24276</th>\n", | |
" <td>OR10W1</td>\n", | |
" <td>2004-03-05</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23630</th>\n", | |
" <td>OR2AJ1</td>\n", | |
" <td>2004-03-05</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>43271</th>\n", | |
" <td>ZNF486</td>\n", | |
" <td>2003-12-17</td>\n", | |
" <td>2003-12-16</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>13713</th>\n", | |
" <td>KBTBD3</td>\n", | |
" <td>2003-12-17</td>\n", | |
" <td>2016-02-12</td>\n", | |
" </tr>\n", | |
" <tr>\n", | |
" <th>23615</th>\n", | |
" <td>OR2A12</td>\n", | |
" <td>2002-11-13</td>\n", | |
" <td>2015-12-09</td>\n", | |
" </tr>\n", | |
" </tbody>\n", | |
"</table>\n", | |
"<p>273 rows × 3 columns</p>\n", | |
"</div>" | |
], | |
"text/plain": [ | |
" symbol date_symbol_changed date_name_changed\n", | |
"21287 MTCL3 2023-09-01 2023-09-01\n", | |
"1386 ARB2A 2023-08-18 2023-08-18\n", | |
"22666 NHSL3 2023-08-18 2023-08-18\n", | |
"8623 FAM90A11 2023-08-17 2023-08-17\n", | |
"8624 FAM90A12 2023-08-17 2023-08-17\n", | |
"8625 FAM90A13 2023-08-17 2023-08-17\n", | |
"8627 FAM90A15 2023-08-17 2023-08-17\n", | |
"8617 FAM90A5 2023-08-17 2023-08-17\n", | |
"8632 FAM90A20 2023-08-17 2023-08-17\n", | |
"8636 FAM90A24 2023-08-17 2023-08-17\n", | |
"8615 FAM90A3 2023-08-17 2023-08-17\n", | |
"4447 CFAP96 2023-05-03 2023-05-03\n", | |
"4765 CIMIP2C 2023-04-27 2023-04-27\n", | |
"4763 CIMIP2A 2023-04-27 2023-04-27\n", | |
"4759 CIMAP1D 2023-04-27 2023-04-27\n", | |
"37293 SPMIP8 2023-04-27 2023-04-27\n", | |
"37289 SPMIP4 2023-04-27 2023-05-18\n", | |
"8787 FAM200C 2022-10-19 2022-10-19\n", | |
"41601 UQCC5 2022-10-10 2022-10-10\n", | |
"4435 CFAP68 2022-09-29 2022-09-29\n", | |
"41600 UQCC4 2022-09-22 2022-09-22\n", | |
"26924 PRR23E 2022-09-15 2022-09-15\n", | |
"7516 EEIG2 2022-09-01 2022-09-01\n", | |
"10517 GOLGA6L24 2022-08-24 2022-08-24\n", | |
"10518 GOLGA6L25 2022-08-24 2022-08-24\n", | |
"10647 GPR15LG 2022-05-30 2022-05-30\n", | |
"25521 PIERCE2 2021-11-26 2021-11-26\n", | |
"9996 GARIN6 2021-11-25 2021-11-25\n", | |
"9995 GARIN5B 2021-11-25 2021-11-25\n", | |
"9989 GARIN1B 2021-11-25 2021-11-25\n", | |
"... ... ... ...\n", | |
"1152 ANKRD60 2008-03-25 2008-03-25\n", | |
"23821 OR4K3 2008-01-23 2015-12-09\n", | |
"18002 MAPK1IP1L 2008-01-16 2016-07-01\n", | |
"24615 PABPC1L2B 2007-11-21 2016-03-30\n", | |
"1117 ANKRD34A 2007-11-20 2007-11-20\n", | |
"2984 C6orf52 2007-06-07 2007-06-07\n", | |
"10691 GPR89B 2007-06-06 2007-06-06\n", | |
"42907 ZKSCAN2 2007-02-20 2007-02-20\n", | |
"39164 TMEM185B 2007-02-05 2011-05-27\n", | |
"39148 TMEM183A 2006-12-18 2006-12-18\n", | |
"43547 ZNF773 2006-12-15 2006-12-15\n", | |
"43537 ZNF761 2006-08-11 2006-08-11\n", | |
"43227 ZNF428 2006-07-04 2006-07-04\n", | |
"8670 FAM118A 2006-04-26 2015-11-18\n", | |
"13461 IRGQ 2005-10-31 2016-06-13\n", | |
"35134 SFT2D1 2005-07-25 2005-07-25\n", | |
"8571 FAM78A 2005-07-18 2015-11-18\n", | |
"25953 PLGLB2 2005-03-31 2019-02-18\n", | |
"24674 PAGE3 2005-01-27 2015-11-18\n", | |
"11450 HDHD3 2004-08-12 2015-12-01\n", | |
"34493 SAMD10 2004-07-16 2004-07-15\n", | |
"42579 YLPM1 2004-07-15 2004-07-15\n", | |
"23973 OR5W2 2004-03-10 2015-12-09\n", | |
"23968 OR5T1 2004-03-10 2015-12-09\n", | |
"24361 OR51F1 2004-03-10 2020-05-01\n", | |
"24276 OR10W1 2004-03-05 2015-12-09\n", | |
"23630 OR2AJ1 2004-03-05 2015-12-09\n", | |
"43271 ZNF486 2003-12-17 2003-12-16\n", | |
"13713 KBTBD3 2003-12-17 2016-02-12\n", | |
"23615 OR2A12 2002-11-13 2015-12-09\n", | |
"\n", | |
"[273 rows x 3 columns]" | |
] | |
}, | |
"execution_count": 37, | |
"metadata": {}, | |
"output_type": "execute_result" | |
} | |
], | |
"source": [ | |
"# Inspect the most recent dates the symbols were changed\n", | |
"# Most of them were not changed as recently as ARB2A\n", | |
"hgnc_unexp_df = hgnc_unexp_df[['symbol', 'date_symbol_changed', 'date_name_changed']]\n", | |
"hgnc_unexp_df = hgnc_unexp_df.dropna(axis=0, subset=['date_symbol_changed'])\n", | |
"hgnc_unexp_df.sort_values(by='date_symbol_changed', ascending=False)" | |
] | |
}, | |
{ | |
"cell_type": "code", | |
"execution_count": 46, | |
"metadata": {}, | |
"outputs": [ | |
{ | |
"data": { | |
"text/plain": [ | |
"<matplotlib.axes._subplots.AxesSubplot at 0x14108a2aba8>" | |
] | |
}, | |
"execution_count": 46, | |
"metadata": {}, | |
"output_type": "execute_result" | |
}, | |
{ | |
"data": { | |
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAXQAAAEaCAYAAAABnax5AAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4zLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvnQurowAAGVlJREFUeJzt3XvUJHV54PHvwwwCI8pFJoAgDIsgahSMcxAEE0RNUAzgBSPh4HiDbG5oXBWMG+OeE12I2Wg8R7NBiWC8IHhBVqKCCKLcZ7jN4IAoorAijAKicb0Az/5Rv5GeN/N29dv19tT0b76fc/p0dVU9/Xuq3nqf/nXdOjITSdL026zvBCRJ88OCLkmVsKBLUiUs6JJUCQu6JFXCgi5JlbCgS1IlLOiSVAkLuiRVYuGGbGyHHXbIJUuWbMgmJWnqrVix4keZubhtvg1a0JcsWcLy5cs3ZJOSNPUi4nujzOcuF0mqhAVdkiphQZekSljQJakSFnRJqoQFXZIqYUGXpEpY0CWpEhv0wiJpQ1py8vmzTrv9lMM3YCbShmEPXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRIWdEmqhAVdkiphQZekSljQJakSFnRJqoQFXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRIjF/SIWBAR10XEF8rrPSLiqoi4NSI+FRGPmlyakqQ2c+mhvwFYPfD6VOC9mbkXcB/wuvlMTJI0NyMV9IjYFTgc+HB5HcChwKfLLGcCR00iQUnSaEbtob8PeCvwcHn9OOD+zHywvL4T2GV9gRFxQkQsj4jla9as6ZSsJGl2rQU9Il4M3JOZKwZHr2fWXF98Zp6WmUszc+nixYvHTFOS1GbhCPMcBBwRES8CtgQeS9Nj3zYiFpZe+q7ADyaXpiSpTWsPPTPflpm7ZuYS4JXAVzPzWOBi4OVltmXA5yeWpSSpVZfz0E8C3hQR36bZp376/KQkSRrHKLtcfiMzLwEuKcO3AfvPf0qSpHF4pagkVcKCLkmVsKBLUiUs6JJUCQu6JFXCgi5JlbCgS1IlLOiSVAkLuiRVwoIuSZWwoEtSJSzoklQJC7okVcKCLkmVsKBLUiUs6JJUCQu6JFXCgi5JlbCgS1IlLOiSVAkLuiRVwoIuSZWwoEtSJSzoklQJC7okVcKCLkmVsKBLUiUW9p2ApI3DkpPPHzr99lMO30CZaFz20CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRIWdEmqhAVdkiphQZekSljQJakSrQU9IraMiKsj4oaIuCki/kcZv0dEXBURt0bEpyLiUZNPV5I0m1F66L8EDs3MfYH9gMMi4gDgVOC9mbkXcB/wusmlKUlq01rQs/Gz8nLz8kjgUODTZfyZwFETyVCSNJKRbs4VEQuAFcATgQ8A3wHuz8wHyyx3ArvMEnsCcALAbrvt1jVfSZo3w25INo03IxvpoGhmPpSZ+wG7AvsDT17fbLPEnpaZSzNz6eLFi8fPVJI01JzOcsnM+4FLgAOAbSNibQ9/V+AH85uaJGkuRjnLZXFEbFuGtwKeD6wGLgZeXmZbBnx+UklKktqNsg99Z+DMsh99M+DszPxCRHwTOCsi/g64Djh9gnlKklq0FvTMvBF4xnrG30azP12StBHwSlFJqoQFXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRIWdEmqhAVdkiphQZekSljQJakSFnRJqoQFXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRIWdEmqhAVdkiphQZekSljQJakSFnRJqoQFXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKLOw7Aak2S04+f+j02085fANlok2NPXRJqoQFXZIqYUGXpEpY0CWpEhZ0SapEa0GPiCdExMURsToiboqIN5Tx20fEhRFxa3nebvLpSpJmM0oP/U
Hgv2Xmk4EDgD+PiKcAJwMXZeZewEXltSSpJ60FPTPvysxry/BPgdXALsCRwJlltjOBoyaVpCSp3Zz2oUfEEuAZwFXAjpl5FzRFH/itWWJOiIjlEbF8zZo13bKVJM1q5IIeEVsDnwHemJkPjBqXmadl5tLMXLp48eJxcpQkjWCkgh4Rm9MU849n5mfL6LsjYucyfWfgnsmkKEkaxShnuQRwOrA6M/9xYNJ5wLIyvAz4/PynJ0ka1Sg35zoIOA5YGRHXl3F/DZwCnB0RrwO+Dxw9mRQlSaNoLeiZ+Q0gZpn8vPlNR5I0Lq8UlaRKWNAlqRIWdEmqhAVdkiphQZekSljQJakSFnRJqoQFXZIqMcqVotImZ8nJ5w+dfvsph2+gTFSjSW1f9tAlqRIWdEmqhAVdkiphQZekSljQJakSFnRJqoQFXZIqYUGXpEp4YdEmwgtlNEluXxsHe+iSVAkLuiRVwoIuSZWwoEtSJSzoklQJC7okVcKCLkmVsKBLUiUs6JJUCa8UldQrrzKdP/bQJakSFnRJqoQFXZIqYUGXpEpY0CWpEhZ0SaqEBV2SKmFBl6RKWNAlqRKtBT0i/jUi7omIVQPjto+ICyPi1vK83WTTlCS1GaWHfgZw2IxxJwMXZeZewEXltSSpR60FPTMvBe6dMfpI4MwyfCZw1DznJUmao3H3oe+YmXcBlOffmm3GiDghIpZHxPI1a9aM2Zwkqc3ED4pm5mmZuTQzly5evHjSzUnSJmvcgn53ROwMUJ7vmb+UJEnjGLegnwcsK8PLgM/PTzqSpHGNctriJ4ErgCdFxJ0R8TrgFOAFEXEr8ILyWpLUo9ZfLMrMY2aZ9Lx5zkWSpsbG+EtLXikqSZWwoEtSJSzoklQJC7okVaL1oGiNNsaDGZLUlT10SaqEBV2SKmFBl6RKbJL70DU9hh3v8FiHtC576JJUCQu6JFXCgi5JlbCgS1IlPCg6RabxAKEXcc2N60td2EOXpEpY0CWpEhZ0SaqEBV2SKuFB0TnqetBqGg9sanq4fW3a7KFLUiUs6JJUCQu6JFXCgi5JlbCgS1IlLOiSVAkLuiRVwoIuSZXwwiK18g6A2ph5MdUj7KFLUiUs6JJUCQu6JFViavehu99MktZlD12SKmFBl6RKWNAlqRIWdEmqRK8HRT2wKUnzp1MPPSIOi4hbIuLbEXHyfCUlSZq7sQt6RCwAPgC8EHgKcExEPGW+EpMkzU2XHvr+wLcz87bM/BVwFnDk/KQlSZqrLgV9F+COgdd3lnGSpB5EZo4XGHE08AeZ+fry+jhg/8z8yxnznQCcUF4+CbhllrfcAfjRWMl0j5/G2D7bnsbYPtuextg+23aZ/7PdM3Nx67tk5lgP4EDgywOv3wa8rcP7LR83tmv8NMZOa96ur+mInda8N8VlHnx02eVyDbBXROwREY8CXgmc1+H9JEkdjH0eemY+GBF/AXwZWAD8a2beNG+ZSZLmpNOFRZn578C/z1Mup/UYP42xfbY9jbF9tj2NsX227TKPaeyDopKkjYv3cpGkSljQJakSFnRJqkRvd1uMiMcCizPzOzPGPz0zb2yJ3QkgM38YEYuB5wC3jHuWTUS8OzP/eoy4PYBnAN/MzJtb5t0NuCczfxERAbwa+B3gm8CHMvPBIbFHABdk5i/mmmOJ/13g7sy8JSIOBg4AVmfm7Le7XDd+a+Aw4AnAg8CtJZ+HR4jdh+aWELsACfwAOC8zV4+zLBtKROwPZGZeU+5RdBhwczkRYK7v9dHMfNW8J7mRGDht+QeZ+ZWI+GPg2cBq4LTM/PUE297kt6913rePg6IR8QrgfcA9wObAqzPzmjLt2sz8nSGxfwKcDARwKk1hvAk4CPj7zDy9pe33zxwFHAd8FCAzTxwSe25mHlWGjyzLcAnNxvs/M/OMIbGraK6k/XlEnArsCZwLHFrafe2Q2P8H/AfwReCTNBd0PTRsOQdi30dz352FNKeYPq+8z+8B12XmW1riXwG8Bb
gBeC5wOc03u6cBx2bmyiGxJwHH0Nzn584yeleaf/6zMvOUUZZhPe/7msz8SMs8+9D8k1+VmT8bGH9YZn6pJfZvaW46txC4EHgWzd/5+TTr/l1DYmdeixE06+2rAJl5xLC2Z7zXwTR/u1WZeUHLvM+i+ZB+ICK2ovkfWdtheHdm/mRI7InA5zLzjtnmaWn74zTrahFwP7A18FmabS0yc1lL/J7AS1i3w/DJYTmXuN62rzLfWNtYl+2r1XxcnTTGVVHXAzuX4f2Bm4GXltfXtcSupNlwHgf8DNipjN8OuH6Etu8EPga8ClhWHmvWDrfEXjcwfDmwRxneAbihJfabA8MrgM0GXrfFXleW73jgIuBu4H8DvzfC8t5EU1QWAfcBi8r4zWkKRVv8jQMxO5QNDuDpwOUtsd8CNl/P+EcBt3bYfr7fMv1EmltMnAvcDhw5MO3aEd5/Jc21FYuAB4DHlvFbATe2xF5btq9DaD40DwHuKsND/17A1QPDx5f/k78FLgNOHuHvvLAMn0bT2Ti4xH+2JfYnND3brwN/RvPNeS5/jxvL88KybS4or2OE9XUiTVH77+V/6oPAu2g+iA7ZGLevrttYl+2rNa8uwR1W2MoZr3emKXInjrAyrh0YvmHGtKEfBmWex5SN/RPALmXcbSPmPdj21XNpm6Z3fGgZ/gzNvRmg+WBqK+jXzni9U1lXVwB3tMSuKs9b0hT0rcrrBQx8yLRsfGu/yW3Fuh9qQz8QaD6od1/P+N1pdpENi71xlsdK4Jcj5Lx1GV4CLAfeMIdt5Lr1DZfXQzsNNN9e/qoUqf3muH0NtnsNpbACj575P7Oe2NVDtpe2nK8ref8+cDpNB+dLNJ2cx4yQ9yqaIrod8FNg+4FtbnVL7Eoe+QBYBFxShncb4X+ql+2r6zbWZftqe/S1D/2nEbFnlv3nmXlXRBxC82n31JbYhyNi82z2y/3mZ40iYktGOMibmT8F3hgRzwQ+FhHnjxJX7BsRD9D0PLaIiJ2y2Y//KJoCOczrgY9GxDtpekTXR8TanvebWmJjxjL8EHg/8P6I2L0l9vyI+DrNP9eHgbMj4kqaHuOlLbHQXDj2pYj4Gs3XxHMAImL7mXmtxxuBiyLiVh65M+duwBOBv2iJ3RH4A5oPoUFB05MbZkGWr8CZeXvZtj5d1lVbzgC/iohFmflz4Jm/aThiG2DocYNsjiu8NyLOKc93M/qxqs0iYjua7TEyc015z/+IiFmPsRSrBnYV3BARSzNzeUTsDbTtw86S9wXABRGxOc3f+hjgH4C2m0KdTlNcFwBvB86JiNtojtWc1RILzfp5CNiCpsNFZn6/5DFMX9sXdNvGxt6+WnX5NBj3AewL7LWe8ZvT7JcdFrsb6/+atQvw/DnmEcCfAx/ruDzbAgeOOO+TaQ7ivIxm39lmI8Qc0jG/A4EDyvCewJuBV4zSdol5UYl5wcC4zYAtRojdjOYf+2XAy8vwghHiTgcOnmXaJ1piv0rpHQ+MW0hznOShEdpe73LR7HJ62hzX/eE0+7BHmfd24Dbgu+V57e7ErWnvZW8DnAF8B7iKpojfBnwN2LcldtYeJeUb3Qi5Px54fBnetvyt9x8h7g00PePTaD4UXlPGLwYu3Ri3r67b2HxuXzMfvV4pGhE7MnB0OjPv3hCxfbY9jbHzEb+e99s6Bw4kzaeI2BV4MJtvMjOnHZSZl3V477HzHjc2IhYBO2bmd0eY9zHAf6EpLneO8neKiL0z81tzzWsUoyxzRDyVpqOzKlvOFttYTHIb66Kvs1z2ozmotw3wf8voXWmOkP9pZl43idgR4v8sM68dEvsM4J8nkHdbu73Ezkf8kPf9fmbuNmbsBi+qA/Fd8p66Ze55fQ1tOyKeTtOz34XmzK2TMvO+Mu3qzNx/nHYnbZJ597UP/QzgTzLzqsGREXFAmbbvhGLb4j/SEv+RCeXd1m5fsZ3iI2K2YwNBsxthXN+k2fU2kdgueU/rMneJ7XGZPwi8E7
iS5hjVNyLiiGyOzQ3d/961qEbE04APjRk/dt5t+iroj55ZIAAy88qIePQEY/tsexpju8a/G3gPzbnFMw09EN1zUR077y6xfS1zn+urY9tb5yPne/9DRKygOYB/HM2uwWG6FtV/7hDfJe+h+iroXyxnl3yUR45OP4Hm3PChF310jO2z7WmM7Rp/LXBuZq6YOSEiXt8S20tRLbrkPY3L3Of66tJ2RMQ2WS5AysyLI+JlNKcFb98S27WodonvkvfwN+7roGhEvJBHLtkNmgt+zssRLn3tEttn29MY2yU+Ip4E3Jvl9LsZ03YcdsAuIi4H/nKWInFHZj5hErHzkPfULXPP66tL3n9Mc47/lTPG7wb8TWYePyT2BuB3c+Bq1LIb5jM059E/brbYrvFd8m7j/dC1UeqrqPapxw+S3tZXX213LaqTLMqdZIdzHsd90JwxcQrNzXt+XB6ry7htJxXbZ9vTGDuPbd88Ttt9PbrkPa3L3Nf6msZ2N+a8+7p97tk0V2g9NzMfl83Xk+fSnAp3zgRj+2x7GmPnq+1DZsTe1xYbEdtExCkRcXNE/Lg8Vpdx204qtmve07jMfa6vjm331W5vebfq6RNq1vssDJvWNbbPtqcxtue8vwycRLlasozbqYy7cFKxm+Iy97y+uuTdS7t95t2aV5fgsRtt7hnxVpqr39aO27GsjK9MKrbPtqcxtue8+/wQ26SWuef11SXvXtrtM++2R1+7XP6I5i6DX4uI+yLiXpr7AW9Pc4+RScX22fY0xvbZ9vci4q3R3HIAaA6SRXMP7Lb7dneJ7Zr3NC5zn+urS9t9tdtn3sN1+TTo8gD2obmh+9Yzxh82ydg+257G2L7aprkL5ak0B47uA+6lOXB0KuX2rJOI3RSXuc/11bXtHtvtJe/W9+0SPHaj3W4O3/XHC3ppexpjN4K2+/oA3BSXuZf11aXtPtd1n3kPfe8uwWM32u3m8F1/vKCXtqcxtue8+yyqm9Qy97y+uv7yzwZvt8+82x59Xfrf5ebwXX+8oK+2pzG2z7aPB56ZmT+LiCUlbklm/tOEY7vmPY3L3Of66tJ2X+32mfdQfR0U/WE0t2UFoCzciyk3eJ9gbJ9tT2Nsn22vs9HT/DbnCyPiH5njP8wcY7vmPY3L3Of66tJ2X+32mfdwXbr34z5o7qe90yzTDppUbJ9tT2Nsz3l3+UWYrr9YtEktc8/rq0vevbTbZ95tD+/loo1SdPhFmC6xfeprmftcX3213bXdjXUbs6BLUiX62ocuSZpnFnRJqoQFXWOLiHdGxJuHTD8qIp6yIXMaJiJuj4gd5jD/0OWbJeaQiPjC3LObfxtTLtowLOiapKOAjaagS7WzoGtOIuLtEXFLRHwFeFIZd3xEXBMRN0TEZyJiUUQ8GzgCeE9EXB8Re5bHlyJiRUR8PSL2GdLO0RGxqrznpWXc1wfP342IyyLi6aUnfWZEXFB64S+NiL+PiJWlvcEf7X1LRFxdHk8s77N7RFwUETeW56G/cj/Q/hMj4islx2sjYs8yaeuI+HQ098r+eEREmf8dZT2tiojTBsZfEhGnlpy+FRHPKeMXRcTZJa9PRcRVEbG0TPv9iLiitHtORGxdxh9W2v0G8NJRlkMV6XLOo49N6wE8k+ay5UXAY4FvA28GHjcwz9/R/EYkwBnAywemXQTsVYafBXx1SFsrgV3K8LbleRnwvjK8N7C8DL8T+AbNr63vC/wceGGZ9jngqDJ8O/D2Mvwq4Atl+P8Ay8rwa2l+8Hjt+755SI5XAS8pw1uW9XII8BOac403A64ADi7zbD8Q+2/AH5bhS4D/VYZfRLmFalm3/1KGf5vmh5SX0lyAcinw6DLtJOAdJYc7gL1oLm45e+0y+tg0HvbQNRfPAT6XmT/PzAeA88r43y6955XAscBTZwaWHuSzgXMi4nrgX4Cdh7R1GXBGRBwPLCjjzgFeXHrcr6X5wFjri5n5a5oPggXA2l9kX0lzv4y1PjnwfGAZPh
D4RBn+N+DgIXmtXZ7H0HzgfA4gM3+RmT8vk6/OzDsz82Hg+oH2n1t62SuBQ1l3PX22PK8YmP9g4Kzy/quAG8v4A2h2ZV1W1uUyYHeam0V9NzNvzcwEPta2HKpLX/dy0fRa34ULZ9D0gm+IiFfT9FJn2gy4PzP3W8+0/9xI5n+NiGcBhwPXR8R+mfnjiLgQOJLmvtFLB0J+WeIejohfl4IG8DDrbuc5yzAjjB807PLuXw4MPwQsjIgtgQ8CSzPzjoh4J02PembMQwP5ztZG0PwqzjHrjGx2R3lhySbMHrrm4lLgJRGxVemh/mEZ/xjgrtJzPnZg/p+WaZQe/Xcj4miAaOw7W0MRsWdmXpWZ7wB+BDyhTPow8H7gmsy8d4xl+KOB5yvK8OXAK8vwsTS7b4Yqy3NnRBxV8t0iIhYNCVlbvH9Uvq28fIRcv0H5wYNyttDa+3xcCRw0cAxgUUTsTXNv7j0G9uUfgzYpFnSNLDOvBT5FsxvhM8DXy6S/odmffCFNUVnrLJqDkNeVInMs8LqIuAG4iaanPZv3lIOaq2g+SG4oOawAHgA+MuZibBERVwFvAP6qjDsReE1E3AgcV6aN4jjgxBJ3Oc1vSq5XZt4PfIhmF9C5wDUjvP8HgcXl/U+i2eXyk8xcA7wa+GSZdiWwT2b+AjgBOL8cFP3eiMuhSnjpv6ZKRDye5iDiPmUfdbUiYgGweWb+onwgXgTsnZm/6jk1baTch66pERGvAt4FvKn2Yl4sAi4uu7IC+FOLuYaxh65eRcTbgaNnjD4nM9/VRz7rExEfAA6aMfqfMnPc3T7SRFjQJakSHhSVpEpY0CWpEhZ0SaqEBV2SKmFBl6RK/H+t9PAFXkYYWgAAAABJRU5ErkJggg==\n", | |
"text/plain": [ | |
"<Figure size 432x288 with 1 Axes>" | |
] | |
}, | |
"metadata": { | |
"needs_background": "light" | |
}, | |
"output_type": "display_data" | |
} | |
], | |
"source": [ | |
"# Plot the histogram of the years the symbols were changed for the 273 with changes\n", | |
"hgnc_unexp_df['date_symbol_changed'] = pd.to_datetime(hgnc_unexp_df['date_symbol_changed'])\n", | |
"hgnc_unexp_df['date_symbol_changed'].groupby([hgnc_unexp_df['date_symbol_changed'].dt.year]).count().plot(kind='bar')" | |
] | |
} | |
], | |
"metadata": { | |
"kernelspec": { | |
"display_name": "Python 3", | |
"language": "python", | |
"name": "python3" | |
}, | |
"language_info": { | |
"codemirror_mode": { | |
"name": "ipython", | |
"version": 3 | |
}, | |
"file_extension": ".py", | |
"mimetype": "text/x-python", | |
"name": "python", | |
"nbconvert_exporter": "python", | |
"pygments_lexer": "ipython3", | |
"version": "3.7.3" | |
} | |
}, | |
"nbformat": 4, | |
"nbformat_minor": 2 | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment