{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "import pandas as pd\n", "import numpy as np\n", "import seaborn as sns\n", "import matplotlib.pyplot as plt\n", "from sqlalchemy import create_engine\n", "from sklearn import preprocessing\n", "import mysql.connector\n", "from pandas import DataFrame\n", "from sklearn.metrics import jaccard_score\n", "from numpy import logical_and as l_and, logical_not as l_not" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [], "source": [ "disnet_db_ares = mysql.connector.connect(\n", " host=\"138.4.130.153\",\n", " port = \"30602\",\n", " user=\"disnet_user\",\n", " password=\"tYkX4JxV8p79\",\n", " database=\"disnet_drugslayer\"\n", ")\n", "\n", " \n", "\n", "disnet_mysql_cursor = disnet_db_ares.cursor()" ] }, { "cell_type": "code", "execution_count": 14, "metadata": {}, "outputs": [], "source": [ "def get_dummies(data,col_index,col_col):\n", " \n", " df_final= pd.get_dummies(data.set_index(col_index),col_col).reset_index()\n", " df_final=df_final.drop_duplicates()\n", " df_final=df_final.groupby(col_index).sum().reset_index()\n", " \n", " return df_final\n", "\n", "def convert(lista):\n", " return tuple(i for i in lista)\n", "\n", "\n", "def get_normal_diseases(rare_disease):\n", " '''\n", " Esta funcion devuelve un dataframe con la enfermedad, los medicamentos y los targets que son utiles\n", " para la enfermedad rara que se le pase como parametro'''\n", " \n", " \n", " q= f'''SELECT DISTINCT\n", " d.disease_id, drug_name,dg.gene_id\n", " FROM\n", " disnet_biolayer.disease_variant dv\n", " JOIN disnet_biolayer.disease d on dv.disease_id = d.disease_id\n", " JOIN disnet_biolayer.variant v on v.variant_id = dv.variant_id\n", " JOIN disnet_biolayer.disease_gene dg ON d.disease_id = dg.disease_id\n", " JOIN disnet_biolayer.encodes e ON dg.gene_id = e.gene_id\n", " JOIN disnet_drugslayer.has_code hc ON hc.code = e.protein_id\n", " JOIN disnet_drugslayer.drug_target dt ON hc.id = dt.target_id\n", " JOIN disnet_drugslayer.drug d ON dt.drug_id = d.drug_id\n", " WHERE\n", " hc.entity_id = 3\n", " and v.chromosome is not null\n", " and d.ddf_type = \"disease\"\n", " AND dg.gene_id in (SELECT distinct(gene_id) FROM disnet_biolayer.disease_gene\n", " where disease_id = \"{rare_disease}\")\n", " ;'''\n", " \n", " df = pd.read_sql(q, con=disnet_db_ares)\n", " \n", " return df" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "scrolled": false }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
rare_dis_idC0000744C0000846C0000889C0001080C0001127C0001193C0001206C0001311C0001339...C4540135C4540251C4540293C4540389C4540439C4540496C4540534C4540536C4540602C4543822
0C0011195000000000...0000000000
1C0027877000000000...0000000000
2C0036391000000000...0000000000
3C0549463000000000...0000000000
4C0751337000000000...0000000000
5C1852146000000000...0000000000
\n", "

6 rows × 6953 columns

\n", "
" ], "text/plain": [ " rare_dis_id C0000744 C0000846 C0000889 C0001080 C0001127 C0001193 \\\n", "0 C0011195 0 0 0 0 0 0 \n", "1 C0027877 0 0 0 0 0 0 \n", "2 C0036391 0 0 0 0 0 0 \n", "3 C0549463 0 0 0 0 0 0 \n", "4 C0751337 0 0 0 0 0 0 \n", "5 C1852146 0 0 0 0 0 0 \n", "\n", " C0001206 C0001311 C0001339 ... C4540135 C4540251 C4540293 C4540389 \\\n", "0 0 0 0 ... 0 0 0 0 \n", "1 0 0 0 ... 0 0 0 0 \n", "2 0 0 0 ... 0 0 0 0 \n", "3 0 0 0 ... 0 0 0 0 \n", "4 0 0 0 ... 0 0 0 0 \n", "5 0 0 0 ... 0 0 0 0 \n", "\n", " C4540439 C4540496 C4540534 C4540536 C4540602 C4543822 \n", "0 0 0 0 0 0 0 \n", "1 0 0 0 0 0 0 \n", "2 0 0 0 0 0 0 \n", "3 0 0 0 0 0 0 \n", "4 0 0 0 0 0 0 \n", "5 0 0 0 0 0 0 \n", "\n", "[6 rows x 6953 columns]" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "rare_diseases= ['C0011195', 'C0023944', 'C0024054', 'C0024901', 'C0027877', 'C0036391', 'C0265202', 'C0268059', 'C0549463', 'C0751337', 'C0869083', 'C1852146', 'C0796280']\n", "\n", "matrix_jac_gen = pd.read_excel((\"mat_jacc_variant.xlsx\"),engine='openpyxl')\n", "matrix_jac_gen" ] }, { "cell_type": "code", "execution_count": 85, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_iddrug_namegene_id
\n", "
" ], "text/plain": [ "Empty DataFrame\n", "Columns: [disease_id, drug_name, gene_id]\n", "Index: []" ] }, "execution_count": 85, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df_useful_diseases = get_normal_diseases(\"C1852146\")\n", "df_useful_diseases" ] }, { "cell_type": "code", "execution_count": 66, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "358" ] }, "execution_count": 66, "metadata": {}, "output_type": "execute_result" } ], "source": [ "useful_diseases = get_normal_diseases(\"C1852146\")['disease_id'].drop_duplicates().tolist()\n", "len(useful_diseases)" ] }, { "cell_type": "code", "execution_count": 67, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
rare_dis_idC0000744C0000846C0000889C0001080C0001127C0001193C0001206C0001311C0001339...C4540135C4540251C4540293C4540389C4540439C4540496C4540534C4540536C4540602C4543822
3C0549463000000000...0000000000
\n", "

1 rows × 6953 columns

\n", "
" ], "text/plain": [ " rare_dis_id C0000744 C0000846 C0000889 C0001080 C0001127 C0001193 \\\n", "3 C0549463 0 0 0 0 0 0 \n", "\n", " C0001206 C0001311 C0001339 ... C4540135 C4540251 C4540293 C4540389 \\\n", "3 0 0 0 ... 0 0 0 0 \n", "\n", " C4540439 C4540496 C4540534 C4540536 C4540602 C4543822 \n", "3 0 0 0 0 0 0 \n", "\n", "[1 rows x 6953 columns]" ] }, "execution_count": 67, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df = matrix_jac_gen[matrix_jac_gen.rare_dis_id == 'C1852146']\n", "df.head(2)" ] }, { "cell_type": "code", "execution_count": 68, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
rare_dis_idC0549463
C05494631.0
C00028710.0
C01499250.0
C00857860.0
C00854350.0
......
C08124130.0
C07517810.0
C07404570.0
C06998850.0
C40829370.0
\n", "

358 rows × 1 columns

\n", "
" ], "text/plain": [ "rare_dis_id C0549463\n", "C0549463 1.0\n", "C0002871 0.0\n", "C0149925 0.0\n", "C0085786 0.0\n", "C0085435 0.0\n", "... ...\n", "C0812413 0.0\n", "C0751781 0.0\n", "C0740457 0.0\n", "C0699885 0.0\n", "C4082937 0.0\n", "\n", "[358 rows x 1 columns]" ] }, "execution_count": 68, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df_useful = df[['rare_dis_id'] + useful_diseases].set_index('rare_dis_id').transpose()\n", "df_useful.sort_values(by='C1852146', ascending=False)" ] }, { "cell_type": "code", "execution_count": 70, "metadata": {}, "outputs": [], "source": [ "df_normal_dis_jacc=pd.DataFrame(df_useful['C1852146'].nlargest(5)).reset_index().rename(columns={'index':'disease_id', 'C1852146':'jacc_idx'})" ] }, { "cell_type": "code", "execution_count": 71, "metadata": {}, "outputs": [], "source": [ "df_normal_dis_jacc.to_excel(\"dis_jacc_C1852146_v.xlsx\")" ] }, { "cell_type": "code", "execution_count": 72, "metadata": {}, "outputs": [], "source": [ "df_normal_rare_drug=pd.merge(df_useful_diseases,df_normal_dis_jacc,on=\"disease_id\",how=\"inner\")" ] }, { "cell_type": "code", "execution_count": 73, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_iddrug_namegene_idjacc_idx
0C0002871MERCAPTOPURINE32510.0
1C0002871PAZOPANIB HYDROCHLORIDE37020.0
2C0002871FOSTAMATINIB37020.0
3C0002871PAZOPANIB37020.0
4C0002871DEQUALINIUM3310.0
5C0002871EMAPALUMAB34580.0
6C0002871OLSALAZINE34580.0
7C0002871GLUCOSAMINE34580.0
8C0003868MERCAPTOPURINE32510.0
9C0004135MERCAPTOPURINE32510.0
10C0006142MERCAPTOPURINE32510.0
11C0006142PAZOPANIB HYDROCHLORIDE37020.0
12C0006142FOSTAMATINIB37020.0
13C0006142PAZOPANIB37020.0
14C0006142ZINC ACETATE3250.0
15C0006142DEQUALINIUM3310.0
16C0006142EMAPALUMAB34580.0
17C0006142OLSALAZINE34580.0
18C0006142GLUCOSAMINE34580.0
19C0006142IXEKIZUMAB36050.0
20C0006142SECUKINUMAB36050.0
21C0549463MERCAPTOPURINE32511.0
22C0549463PAZOPANIB HYDROCHLORIDE37021.0
23C0549463FOSTAMATINIB37021.0
24C0549463PAZOPANIB37021.0
25C0549463ZINC ACETATE3251.0
26C0549463DEQUALINIUM3311.0
27C0549463EMAPALUMAB34581.0
28C0549463OLSALAZINE34581.0
29C0549463GLUCOSAMINE34581.0
30C0549463IXEKIZUMAB36051.0
31C0549463SECUKINUMAB36051.0
\n", "
" ], "text/plain": [ " disease_id drug_name gene_id jacc_idx\n", "0 C0002871 MERCAPTOPURINE 3251 0.0\n", "1 C0002871 PAZOPANIB HYDROCHLORIDE 3702 0.0\n", "2 C0002871 FOSTAMATINIB 3702 0.0\n", "3 C0002871 PAZOPANIB 3702 0.0\n", "4 C0002871 DEQUALINIUM 331 0.0\n", "5 C0002871 EMAPALUMAB 3458 0.0\n", "6 C0002871 OLSALAZINE 3458 0.0\n", "7 C0002871 GLUCOSAMINE 3458 0.0\n", "8 C0003868 MERCAPTOPURINE 3251 0.0\n", "9 C0004135 MERCAPTOPURINE 3251 0.0\n", "10 C0006142 MERCAPTOPURINE 3251 0.0\n", "11 C0006142 PAZOPANIB HYDROCHLORIDE 3702 0.0\n", "12 C0006142 FOSTAMATINIB 3702 0.0\n", "13 C0006142 PAZOPANIB 3702 0.0\n", "14 C0006142 ZINC ACETATE 325 0.0\n", "15 C0006142 DEQUALINIUM 331 0.0\n", "16 C0006142 EMAPALUMAB 3458 0.0\n", "17 C0006142 OLSALAZINE 3458 0.0\n", "18 C0006142 GLUCOSAMINE 3458 0.0\n", "19 C0006142 IXEKIZUMAB 3605 0.0\n", "20 C0006142 SECUKINUMAB 3605 0.0\n", "21 C0549463 MERCAPTOPURINE 3251 1.0\n", "22 C0549463 PAZOPANIB HYDROCHLORIDE 3702 1.0\n", "23 C0549463 FOSTAMATINIB 3702 1.0\n", "24 C0549463 PAZOPANIB 3702 1.0\n", "25 C0549463 ZINC ACETATE 325 1.0\n", "26 C0549463 DEQUALINIUM 331 1.0\n", "27 C0549463 EMAPALUMAB 3458 1.0\n", "28 C0549463 OLSALAZINE 3458 1.0\n", "29 C0549463 GLUCOSAMINE 3458 1.0\n", "30 C0549463 IXEKIZUMAB 3605 1.0\n", "31 C0549463 SECUKINUMAB 3605 1.0" ] }, "execution_count": 73, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df_normal_rare_drug" ] }, { "cell_type": "code", "execution_count": 74, "metadata": {}, "outputs": [], "source": [ "df_normal_rare_drug=df_normal_rare_drug.drop_duplicates()" ] }, { "cell_type": "code", "execution_count": 75, "metadata": {}, "outputs": [], "source": [ "prueba=df_normal_rare_drug.groupby('drug_name').count()" ] }, { "cell_type": "code", "execution_count": 76, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_idgene_idjacc_idx
drug_name
DEQUALINIUM333
EMAPALUMAB333
FOSTAMATINIB333
GLUCOSAMINE333
IXEKIZUMAB222
MERCAPTOPURINE555
OLSALAZINE333
PAZOPANIB333
PAZOPANIB HYDROCHLORIDE333
SECUKINUMAB222
ZINC ACETATE222
\n", "
" ], "text/plain": [ " disease_id gene_id jacc_idx\n", "drug_name \n", "DEQUALINIUM 3 3 3\n", "EMAPALUMAB 3 3 3\n", "FOSTAMATINIB 3 3 3\n", "GLUCOSAMINE 3 3 3\n", "IXEKIZUMAB 2 2 2\n", "MERCAPTOPURINE 5 5 5\n", "OLSALAZINE 3 3 3\n", "PAZOPANIB 3 3 3\n", "PAZOPANIB HYDROCHLORIDE 3 3 3\n", "SECUKINUMAB 2 2 2\n", "ZINC ACETATE 2 2 2" ] }, "execution_count": 76, "metadata": {}, "output_type": "execute_result" } ], "source": [ "prueba" ] }, { "cell_type": "code", "execution_count": 77, "metadata": {}, "outputs": [], "source": [ "drug=prueba[prueba[\"disease_id\"]>4]" ] }, { "cell_type": "code", "execution_count": 78, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_idgene_idjacc_idx
drug_name
MERCAPTOPURINE555
\n", "
" ], "text/plain": [ " disease_id gene_id jacc_idx\n", "drug_name \n", "MERCAPTOPURINE 5 5 5" ] }, "execution_count": 78, "metadata": {}, "output_type": "execute_result" } ], "source": [ "drug" ] }, { "cell_type": "code", "execution_count": 80, "metadata": {}, "outputs": [], "source": [ "drug.to_excel(\"drugs_C0549463_V.xlsx\")" ] }, { "cell_type": "code", "execution_count": 79, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_iddrug_namegene_idjacc_idx
0C0002871MERCAPTOPURINE32510.0
8C0003868MERCAPTOPURINE32510.0
9C0004135MERCAPTOPURINE32510.0
10C0006142MERCAPTOPURINE32510.0
21C0549463MERCAPTOPURINE32511.0
\n", "
" ], "text/plain": [ " disease_id drug_name gene_id jacc_idx\n", "0 C0002871 MERCAPTOPURINE 3251 0.0\n", "8 C0003868 MERCAPTOPURINE 3251 0.0\n", "9 C0004135 MERCAPTOPURINE 3251 0.0\n", "10 C0006142 MERCAPTOPURINE 3251 0.0\n", "21 C0549463 MERCAPTOPURINE 3251 1.0" ] }, "execution_count": 79, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df_normal_rare_drug[df_normal_rare_drug[\"drug_name\"]==\"MERCAPTOPURINE\"]" ] }, { "cell_type": "code", "execution_count": 81, "metadata": {}, "outputs": [], "source": [ "drug_all=df_normal_rare_drug[df_normal_rare_drug[\"disease_id\"]==\"C0549463\"]" ] }, { "cell_type": "code", "execution_count": 82, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
disease_iddrug_namegene_idjacc_idx
21C0549463MERCAPTOPURINE32511.0
22C0549463PAZOPANIB HYDROCHLORIDE37021.0
23C0549463FOSTAMATINIB37021.0
24C0549463PAZOPANIB37021.0
25C0549463ZINC ACETATE3251.0
26C0549463DEQUALINIUM3311.0
27C0549463EMAPALUMAB34581.0
28C0549463OLSALAZINE34581.0
29C0549463GLUCOSAMINE34581.0
30C0549463IXEKIZUMAB36051.0
31C0549463SECUKINUMAB36051.0
\n", "
" ], "text/plain": [ " disease_id drug_name gene_id jacc_idx\n", "21 C0549463 MERCAPTOPURINE 3251 1.0\n", "22 C0549463 PAZOPANIB HYDROCHLORIDE 3702 1.0\n", "23 C0549463 FOSTAMATINIB 3702 1.0\n", "24 C0549463 PAZOPANIB 3702 1.0\n", "25 C0549463 ZINC ACETATE 325 1.0\n", "26 C0549463 DEQUALINIUM 331 1.0\n", "27 C0549463 EMAPALUMAB 3458 1.0\n", "28 C0549463 OLSALAZINE 3458 1.0\n", "29 C0549463 GLUCOSAMINE 3458 1.0\n", "30 C0549463 IXEKIZUMAB 3605 1.0\n", "31 C0549463 SECUKINUMAB 3605 1.0" ] }, "execution_count": 82, "metadata": {}, "output_type": "execute_result" } ], "source": [ "drug_all" ] }, { "cell_type": "code", "execution_count": 83, "metadata": {}, "outputs": [], "source": [ "drug_all.to_excel(\"drugs_all_C0549463_v.xlsx\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.9" } }, "nbformat": 4, "nbformat_minor": 4 }