{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "**In this notebook, data from the MarkerDB database on associations between chemical diagnostic markers and diseases is processed, inserted into SQL tables, and analysed.**" ] }, { "cell_type": "code", "execution_count": 65, "metadata": {}, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "**Operations with data from the MarkerDB database**" ] }, { "cell_type": "code", "execution_count": 66, "metadata": { "scrolled": true }, "outputs": [ { "data": { "text/html": [ "
\n", " | marker_id | \n", "marker | \n", "name_id | \n", "name | \n", "patient | \n", "gender | \n", "sample | \n", "concentration | \n", "Column9 | \n", "reference | \n", "\n", " | Column12 | \n", "type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "1-Methylhistidine | \n", "251 | \n", "Obesity | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "NaN | \n", "Tuma, P., Samcova, E. & Balinova, P. Determina... | \n", "15899597.0 | \n", "2 | \n", "Diagnostic | \n", "
1 | \n", "1 | \n", "1-Methylhistidine | \n", "1 | \n", "Normal | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "85.8 (17.7-153.8) umol/mmol creatinine | \n", "NaN | \n", "David F. Putnam Composition and Concentrative ... | \n", "NaN | \n", "2 | \n", "Diagnostic | \n", "
2 | \n", "1 | \n", "1-Methylhistidine | \n", "33 | \n", "Alzheimer's Disease | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "15.7 (11.7-19.7) umol/mmol creatinine | \n", "NaN | \n", "Fonteh, A. N., Harrington, R. J., Tsai, A., Li... | \n", "17031479.0 | \n", "2 | \n", "Diagnostic | \n", "
3 | \n", "1 | \n", "1-Methylhistidine | \n", "34 | \n", "Pregnancy | \n", "Adult: >=18 yrs old | \n", "Female | \n", "Blood | \n", "50.0 uM | \n", "NaN | \n", "NaN | \n", "22494326.0 | \n", "2 | \n", "Diagnostic | \n", "
4 | \n", "1 | \n", "1-Methylhistidine | \n", "1 | \n", "Normal | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Blood | \n", "12.7 uM | \n", "NaN | \n", "Dohm, G. L., Williams, R. T., Kasperek, G. J. ... | \n", "7061274.0 | \n", "2 | \n", "Diagnostic | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3389 | \n", "4961 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "1 | \n", "Normal | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "0.0023 (0.00090-0.0058) umol/mmol creatinine | \n", "NaN | \n", "NaN | \n", "24023812.0 | \n", "2 | \n", "Diagnostic | \n", "
3390 | \n", "4961 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "34 | \n", "Pregnancy | \n", "Adult: >=18 yrs old | \n", "Female | \n", "Blood | \n", "4.4 uM | \n", "NaN | \n", "NaN | \n", "24704061.0 | \n", "2 | \n", "Diagnostic | \n", "
3391 | \n", "4961 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "1 | \n", "Normal | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Blood | \n", "15.4 uM | \n", "NaN | \n", "Molecular You | \n", "NaN | \n", "2 | \n", "Diagnostic | \n", "
3392 | \n", "4973 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "6245 | \n", "Vertebral Osteoporosis | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", ">63 nmol/mmol creatine | \n", "NaN | \n", "Seibel, M. J., Woitge, H., Scheidt-Nave, C., L... | \n", "7817828.0 | \n", "2 | \n", "Diagnostic | \n", "
3393 | \n", "4973 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "1 | \n", "Normal | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "<63 nmol/mmol creatine | \n", "NaN | \n", "<63 | \n", "NaN | \n", "2 | \n", "Diagnostic | \n", "
3394 rows × 13 columns
\n", "\n", " | marker_id | \n", "marker | \n", "name_id | \n", "name | \n", "patient | \n", "gender | \n", "sample | \n", "concentration | \n", "Column9 | \n", "reference | \n", "\n", " | Column12 | \n", "type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1 | \n", "1-Methylhistidine | \n", "251 | \n", "Obesity | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "NaN | \n", "Tuma, P., Samcova, E. & Balinova, P. Determina... | \n", "15899597.0 | \n", "2 | \n", "Diagnostic | \n", "
2 | \n", "1 | \n", "1-Methylhistidine | \n", "33 | \n", "Alzheimer's Disease | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "15.7 (11.7-19.7) umol/mmol creatinine | \n", "NaN | \n", "Fonteh, A. N., Harrington, R. J., Tsai, A., Li... | \n", "17031479.0 | \n", "2 | \n", "Diagnostic | \n", "
5 | \n", "1 | \n", "1-Methylhistidine | \n", "5988 | \n", "Preeclampsia/Eclampsia | \n", "Adult: >=18 yrs old | \n", "Female | \n", "Blood | \n", "50.7 uM | \n", "NaN | \n", "NaN | \n", "22494326.0 | \n", "2 | \n", "Diagnostic | \n", "
6 | \n", "1 | \n", "1-Methylhistidine | \n", "83 | \n", "Chronic Kidney Disease | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Blood | \n", "28.8 (10.6-47.0) uM | \n", "NaN | \n", "Raj, D. S., Ouwendyk, M., Francoeur, R. & Pier... | \n", "10838467.0 | \n", "2 | \n", "Diagnostic | \n", "
7 | \n", "2 | \n", "1,3-Diaminopropane | \n", "207 | \n", "Leukemia | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", "0.96 (0.12-2.1) umol/mmol creatinine | \n", "NaN | \n", "Lee, S. H., Suh, J. W., Chung, B. C. & Kim, S.... | \n", "9464484.0 | \n", "2 | \n", "Diagnostic | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3356 | \n", "4931 | \n", "PC(o-18:1(11Z)/18:2(9Z,12Z)) | \n", "251 | \n", "Obesity | \n", "Children: 2-17 yrs old | \n", "Both | \n", "Blood | \n", "8.4 (5.7-11.1) uM | \n", "NaN | \n", "NaN | \n", "24740590.0 | \n", "2 | \n", "Diagnostic | \n", "
3358 | \n", "4934 | \n", "PC(o-18:1(9Z)/18:2(9Z,12Z)) | \n", "251 | \n", "Obesity | \n", "Children: 2-17 yrs old | \n", "Both | \n", "Blood | \n", "8.4 (5.7-11.1) uM | \n", "NaN | \n", "NaN | \n", "24740590.0 | \n", "2 | \n", "Diagnostic | \n", "
3386 | \n", "4957 | \n", "SM(d18:0/14:1(9Z)(OH)) | \n", "251 | \n", "Obesity | \n", "Adolescent:13-18 yrs old | \n", "Both | \n", "Urine | \n", "0.36 (0.32-0.40) umol/mmol creatinine | \n", "NaN | \n", "NaN | \n", "26910390.0 | \n", "2 | \n", "Diagnostic | \n", "
3388 | \n", "4961 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "251 | \n", "Obesity | \n", "Adolescent:13-18 yrs old | \n", "Both | \n", "Urine | \n", "2.2 (2.1-2.3) umol/mmol creatinine | \n", "NaN | \n", "NaN | \n", "26910390.0 | \n", "2 | \n", "Diagnostic | \n", "
3392 | \n", "4973 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "6245 | \n", "Vertebral Osteoporosis | \n", "Adult: >=18 yrs old | \n", "Both | \n", "Urine | \n", ">63 nmol/mmol creatine | \n", "NaN | \n", "Seibel, M. J., Woitge, H., Scheidt-Nave, C., L... | \n", "7817828.0 | \n", "2 | \n", "Diagnostic | \n", "
1545 rows × 13 columns
\n", "\n", " | marker | \n", "name | \n", "concentration | \n", "sample | \n", "
---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "Obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "
2 | \n", "1-Methylhistidine | \n", "Alzheimer's Disease | \n", "15.7 (11.7-19.7) umol/mmol creatinine | \n", "Urine | \n", "
5 | \n", "1-Methylhistidine | \n", "Preeclampsia/Eclampsia | \n", "50.7 uM | \n", "Blood | \n", "
6 | \n", "1-Methylhistidine | \n", "Chronic Kidney Disease | \n", "28.8 (10.6-47.0) uM | \n", "Blood | \n", "
7 | \n", "1,3-Diaminopropane | \n", "Leukemia | \n", "0.96 (0.12-2.1) umol/mmol creatinine | \n", "Urine | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3356 | \n", "PC(o-18:1(11Z)/18:2(9Z,12Z)) | \n", "Obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "
3358 | \n", "PC(o-18:1(9Z)/18:2(9Z,12Z)) | \n", "Obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "
3386 | \n", "SM(d18:0/14:1(9Z)(OH)) | \n", "Obesity | \n", "0.36 (0.32-0.40) umol/mmol creatinine | \n", "Urine | \n", "
3388 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "Obesity | \n", "2.2 (2.1-2.3) umol/mmol creatinine | \n", "Urine | \n", "
3392 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "Vertebral Osteoporosis | \n", ">63 nmol/mmol creatine | \n", "Urine | \n", "
1545 rows × 4 columns
\n", "\n", " | marker | \n", "name | \n", "concentration | \n", "sample | \n", "source_id | \n", "source_name | \n", "
---|---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "Obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
2 | \n", "1-Methylhistidine | \n", "Alzheimer's Disease | \n", "15.7 (11.7-19.7) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
5 | \n", "1-Methylhistidine | \n", "Preeclampsia/Eclampsia | \n", "50.7 uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
6 | \n", "1-Methylhistidine | \n", "Chronic Kidney Disease | \n", "28.8 (10.6-47.0) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
7 | \n", "1,3-Diaminopropane | \n", "Leukemia | \n", "0.96 (0.12-2.1) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3356 | \n", "PC(o-18:1(11Z)/18:2(9Z,12Z)) | \n", "Obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
3358 | \n", "PC(o-18:1(9Z)/18:2(9Z,12Z)) | \n", "Obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
3386 | \n", "SM(d18:0/14:1(9Z)(OH)) | \n", "Obesity | \n", "0.36 (0.32-0.40) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
3388 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "Obesity | \n", "2.2 (2.1-2.3) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
3392 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "Vertebral Osteoporosis | \n", ">63 nmol/mmol creatine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
1545 rows × 6 columns
\n", "\n", " | marker | \n", "name | \n", "concentration | \n", "sample | \n", "source_id | \n", "source_name | \n", "
---|---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
2 | \n", "1-Methylhistidine | \n", "alzheimer's disease | \n", "15.7 (11.7-19.7) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
5 | \n", "1-Methylhistidine | \n", "preeclampsia/eclampsia | \n", "50.7 uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
6 | \n", "1-Methylhistidine | \n", "chronic kidney disease | \n", "28.8 (10.6-47.0) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
7 | \n", "1,3-Diaminopropane | \n", "leukemia | \n", "0.96 (0.12-2.1) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3356 | \n", "PC(o-18:1(11Z)/18:2(9Z,12Z)) | \n", "obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
3358 | \n", "PC(o-18:1(9Z)/18:2(9Z,12Z)) | \n", "obesity | \n", "8.4 (5.7-11.1) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "
3386 | \n", "SM(d18:0/14:1(9Z)(OH)) | \n", "obesity | \n", "0.36 (0.32-0.40) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
3388 | \n", "SM(d18:0/22:1(13Z)(OH)) | \n", "obesity | \n", "2.2 (2.1-2.3) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
3392 | \n", "Carboxyterminal telopeptide of collagen 1 | \n", "vertebral osteoporosis | \n", ">63 nmol/mmol creatine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "
1545 rows × 6 columns
\n", "\n", " | disease_id | \n", "disease_name | \n", "name | \n", "vocab | \n", "
---|---|---|---|---|
0 | \n", "C0000735 | \n", "Abdominal Neoplasms | \n", "Abdominal Neoplasms | \n", "MSH | \n", "
1 | \n", "C0000737 | \n", "Abdominal Pain | \n", "Colicky Pain | \n", "MSH | \n", "
2 | \n", "C0000744 | \n", "Abetalipoproteinemia | \n", "abetalipoproteinemia | \n", "DO | \n", "
3 | \n", "C0000744 | \n", "Abetalipoproteinemia | \n", "Abetalipoproteinemia | \n", "MSH | \n", "
4 | \n", "C0000744 | \n", "Abetalipoproteinemia | \n", "hypolipoproteinemia | \n", "DO | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
22229 | \n", "C4540400 | \n", "SPINOCEREBELLAR ATAXIA 45 | \n", "spinocerebellar ataxia 45 | \n", "DO | \n", "
22230 | \n", "C4540404 | \n", "SPINOCEREBELLAR ATAXIA 46 | \n", "spinocerebellar ataxia 46 | \n", "DO | \n", "
22231 | \n", "C4540411 | \n", "EPILEPTIC ENCEPHALOPATHY, EARLY INFANTILE, 57 | \n", "early infantile epileptic encephalopathy 57 | \n", "DO | \n", "
22232 | \n", "C4540470 | \n", "MENTAL RETARDATION, AUTOSOMAL DOMINANT 50 | \n", "autosomal dominant mental retardation 50 | \n", "DO | \n", "
22233 | \n", "C4540499 | \n", "COFFIN-SIRIS SYNDROME 6 | \n", "Coffin-Siris syndrome 6 | \n", "DO | \n", "
22234 rows × 4 columns
\n", "\n", " | marker | \n", "name | \n", "concentration | \n", "sample | \n", "source_id | \n", "source_name | \n", "disease_id | \n", "disease_name | \n", "vocab | \n", "
---|---|---|---|---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "C0028754 | \n", "Obesity | \n", "DO | \n", "
1 | \n", "1-Methylhistidine | \n", "obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "C0028754 | \n", "Obesity | \n", "MSH | \n", "
2 | \n", "1-Methylhistidine | \n", "obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "C0039870 | \n", "Thinness | \n", "DO | \n", "
3 | \n", "1-Methylhistidine | \n", "obesity | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "Markerdb | \n", "C0451819 | \n", "Simple obesity | \n", "DO | \n", "
4 | \n", "(R)-3-Hydroxybutyric acid | \n", "obesity | \n", "235.0 (218.0-252.0) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0028754 | \n", "Obesity | \n", "DO | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3292 | \n", "Trihexosylceramide (d18:1/26:1(17Z)) | \n", "hypobetalipoproteinemia | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0020597 | \n", "Hypobetalipoproteinemias | \n", "DO | \n", "
3293 | \n", "Trihexosylceramide (d18:1/24:0) | \n", "hypobetalipoproteinemia | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0020597 | \n", "Hypobetalipoproteinemias | \n", "DO | \n", "
3294 | \n", "Tetrahexosylceramide (d18:1/12:0) | \n", "hypobetalipoproteinemia | \n", "1.00 (1.00-1.1) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0020597 | \n", "Hypobetalipoproteinemias | \n", "DO | \n", "
3295 | \n", "5-HETE | \n", "rhinitis | \n", "0.79 (0.73-0.84) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0035455 | \n", "Rhinitis | \n", "DO | \n", "
3296 | \n", "5-HETE | \n", "rhinitis | \n", "0.79 (0.73-0.84) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0035455 | \n", "Rhinitis | \n", "MSH | \n", "
3297 rows × 9 columns
\n", "\n", " | marker | \n", "disease_id | \n", "concentration | \n", "sample | \n", "source_id | \n", "
---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "C0028754 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
2 | \n", "1-Methylhistidine | \n", "C0039870 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
3 | \n", "1-Methylhistidine | \n", "C0451819 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
4 | \n", "(R)-3-Hydroxybutyric acid | \n", "C0028754 | \n", "235.0 (218.0-252.0) uM | \n", "Blood | \n", "7 | \n", "
6 | \n", "(R)-3-Hydroxybutyric acid | \n", "C0039870 | \n", "235.0 (218.0-252.0) uM | \n", "Blood | \n", "7 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3291 | \n", "Trihexosylceramide (d18:1/22:0) | \n", "C0020597 | \n", "0.90 (1.00-0.90) uM | \n", "Blood | \n", "7 | \n", "
3292 | \n", "Trihexosylceramide (d18:1/26:1(17Z)) | \n", "C0020597 | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "
3293 | \n", "Trihexosylceramide (d18:1/24:0) | \n", "C0020597 | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "
3294 | \n", "Tetrahexosylceramide (d18:1/12:0) | \n", "C0020597 | \n", "1.00 (1.00-1.1) uM | \n", "Blood | \n", "7 | \n", "
3295 | \n", "5-HETE | \n", "C0035455 | \n", "0.79 (0.73-0.84) uM | \n", "Blood | \n", "7 | \n", "
2763 rows × 5 columns
\n", "\n", " | source_id | \n", "
---|---|
count | \n", "2763.0 | \n", "
mean | \n", "7.0 | \n", "
std | \n", "0.0 | \n", "
min | \n", "7.0 | \n", "
25% | \n", "7.0 | \n", "
50% | \n", "7.0 | \n", "
75% | \n", "7.0 | \n", "
max | \n", "7.0 | \n", "
\n", " | disease_id | \n", "
---|---|
count | \n", "341.000000 | \n", "
mean | \n", "8.102639 | \n", "
std | \n", "24.981959 | \n", "
min | \n", "1.000000 | \n", "
25% | \n", "1.000000 | \n", "
50% | \n", "2.000000 | \n", "
75% | \n", "7.000000 | \n", "
max | \n", "252.000000 | \n", "
\n", " | marker | \n", "
---|---|
count | \n", "618.000000 | \n", "
mean | \n", "4.470874 | \n", "
std | \n", "4.225410 | \n", "
min | \n", "1.000000 | \n", "
25% | \n", "2.000000 | \n", "
50% | \n", "3.000000 | \n", "
75% | \n", "5.000000 | \n", "
max | \n", "31.000000 | \n", "
\n", " | biomarker appereances | \n", "
---|---|
L-Phenylalanine | \n", "31 | \n", "
L-Arginine | \n", "30 | \n", "
L-Valine | \n", "27 | \n", "
Pipecolic acid | \n", "24 | \n", "
Glycine | \n", "23 | \n", "
... | \n", "... | \n", "
Gamma-Linolenic acid | \n", "1 | \n", "
Stearic acid | \n", "1 | \n", "
Glycerol | \n", "1 | \n", "
Thymine | \n", "1 | \n", "
Trihexosylceramide (d18:1/18:0) | \n", "1 | \n", "
618 rows × 1 columns
\n", "\n", " | disease appereances | \n", "
---|---|
C0039870 | \n", "252 | \n", "
C0028754 | \n", "252 | \n", "
C0451819 | \n", "252 | \n", "
C0002395 | \n", "82 | \n", "
C0154671 | \n", "82 | \n", "
... | \n", "... | \n", "
C0699791 | \n", "1 | \n", "
C0238052 | \n", "1 | \n", "
C1708349 | \n", "1 | \n", "
C0014038 | \n", "1 | \n", "
C0220993 | \n", "1 | \n", "
341 rows × 1 columns
\n", "\n", " | marker | \n", "disease_id | \n", "concentration | \n", "sample | \n", "source_id | \n", "
---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "C0028754 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
2 | \n", "1-Methylhistidine | \n", "C0039870 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
3 | \n", "1-Methylhistidine | \n", "C0451819 | \n", "10.9 (0.80-21.0) umol/mmol creatinine | \n", "Urine | \n", "7 | \n", "
4 | \n", "(R)-3-Hydroxybutyric acid | \n", "C0028754 | \n", "235.0 (218.0-252.0) uM | \n", "Blood | \n", "7 | \n", "
6 | \n", "(R)-3-Hydroxybutyric acid | \n", "C0039870 | \n", "235.0 (218.0-252.0) uM | \n", "Blood | \n", "7 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
3291 | \n", "Trihexosylceramide (d18:1/22:0) | \n", "C0020597 | \n", "0.90 (1.00-0.90) uM | \n", "Blood | \n", "7 | \n", "
3292 | \n", "Trihexosylceramide (d18:1/26:1(17Z)) | \n", "C0020597 | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "
3293 | \n", "Trihexosylceramide (d18:1/24:0) | \n", "C0020597 | \n", "0.90 (0.90-1.00) uM | \n", "Blood | \n", "7 | \n", "
3294 | \n", "Tetrahexosylceramide (d18:1/12:0) | \n", "C0020597 | \n", "1.00 (1.00-1.1) uM | \n", "Blood | \n", "7 | \n", "
3295 | \n", "5-HETE | \n", "C0035455 | \n", "0.79 (0.73-0.84) uM | \n", "Blood | \n", "7 | \n", "
2763 rows × 5 columns
\n", "\n", " | marker | \n", "name | \n", "concentration | \n", "sample | \n", "source_id | \n", "source_name | \n", "disease_id | \n", "disease_name | \n", "vocab | \n", "
---|---|---|---|---|---|---|---|---|---|
0 | \n", "L-Valine | \n", "obesity | \n", "1.4 (0.79-2.0) uM | \n", "Blood | \n", "7 | \n", "Markerdb | \n", "C0028754 | \n", "Obesity | \n", "MSH | \n", "
\n", " | marker | \n", "name | \n", "disease_id | \n", "
---|---|---|---|
468 | \n", "L-Leucine | \n", "maple syrup urine disease | \n", "20 | \n", "
129 | \n", "Alpha-ketoisovaleric acid | \n", "maple syrup urine disease | \n", "20 | \n", "
66 | \n", "3-Methyl-2-oxovaleric acid | \n", "maple syrup urine disease | \n", "20 | \n", "
39 | \n", "2-Hydroxy-3-methylbutyric acid | \n", "maple syrup urine disease | \n", "20 | \n", "
508 | \n", "L-Valine | \n", "maple syrup urine disease | \n", "20 | \n", "
368 | \n", "Hydroxyisocaproic acid | \n", "maple syrup urine disease | \n", "20 | \n", "
558 | \n", "Mevalonic acid | \n", "mevalonic aciduria | \n", "18 | \n", "
528 | \n", "Lipoxin A4 | \n", "coronary artery disease | \n", "12 | \n", "
454 | \n", "L-Homocystine | \n", "homocystinuria | \n", "10 | \n", "
135 | \n", "Androstenedione | \n", "congenital adrenal hyperplasia | \n", "10 | \n", "
418 | \n", "L-Arginine | \n", "maple syrup urine disease | \n", "10 | \n", "
405 | \n", "L-Alanine | \n", "lung cancer | \n", "10 | \n", "
159 | \n", "Betaine | \n", "lung cancer | \n", "10 | \n", "
999 | \n", "trans-Aconitic acid | \n", "lung cancer | \n", "10 | \n", "
32 | \n", "17-Hydroxyprogesterone | \n", "congenital adrenal hyperplasia | \n", "10 | \n", "
281 | \n", "Ethanolamine | \n", "maple syrup urine disease | \n", "10 | \n", "
194 | \n", "Citric acid | \n", "maple syrup urine disease | \n", "10 | \n", "
849 | \n", "Putrescine | \n", "pancreatic cancer | \n", "10 | \n", "
320 | \n", "Glycolic acid | \n", "lung cancer | \n", "10 | \n", "
242 | \n", "D-Xylose | \n", "lung cancer | \n", "10 | \n", "
\n", " | disease_id | \n", "class_name | \n", "class_range | \n", "
---|---|---|---|
0 | \n", "C0008354 | \n", "Certain infectious and parasitic diseases | \n", "A00-B99 | \n", "
1 | \n", "C0178238 | \n", "Certain infectious and parasitic diseases | \n", "A00-B99 | \n", "
2 | \n", "C0041466 | \n", "Certain infectious and parasitic diseases | \n", "A00-B99 | \n", "
3 | \n", "C0030528 | \n", "Certain infectious and parasitic diseases | \n", "A00-B99 | \n", "
4 | \n", "C0152491 | \n", "Certain infectious and parasitic diseases | \n", "A00-B99 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "
3613 | \n", "C0013182 | \n", "Injury, poisoning and certain other consequenc... | \n", "S00-T98 | \n", "
3614 | \n", "C0041755 | \n", "Injury, poisoning and certain other consequenc... | \n", "S00-T98 | \n", "
3615 | \n", "C0085639 | \n", "External causes of morbidity and mortality | \n", "V01-Y98 | \n", "
3616 | \n", "C0019699 | \n", "Factors influencing health status and contact ... | \n", "Z00-Z99 | \n", "
3617 | \n", "C0037316 | \n", "Factors influencing health status and contact ... | \n", "Z00-Z99 | \n", "
3618 rows × 3 columns
\n", "\n", " | disease_id | \n", "gene_id | \n", "source_id | \n", "score | \n", "sio_id | \n", "
---|---|---|---|---|---|
0 | \n", "C0000731 | \n", "72 | \n", "1 | \n", "0.10 | \n", "SIO_001121 | \n", "
1 | \n", "C0000731 | \n", "672 | \n", "1 | \n", "0.10 | \n", "SIO_001121 | \n", "
2 | \n", "C0000731 | \n", "1280 | \n", "1 | \n", "0.10 | \n", "SIO_001121 | \n", "
3 | \n", "C0000731 | \n", "1482 | \n", "1 | \n", "0.10 | \n", "SIO_001121 | \n", "
4 | \n", "C0000731 | \n", "1811 | \n", "1 | \n", "0.10 | \n", "SIO_001121 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
358204 | \n", "C4540535 | \n", "2778 | \n", "1 | \n", "0.30 | \n", "SIO_001122 | \n", "
358205 | \n", "C4540536 | \n", "2778 | \n", "1 | \n", "0.30 | \n", "SIO_001122 | \n", "
358206 | \n", "C4540602 | \n", "2778 | \n", "1 | \n", "0.30 | \n", "SIO_001122 | \n", "
358207 | \n", "C4543926 | \n", "3060 | \n", "1 | \n", "0.03 | \n", "SIO_001121 | \n", "
358208 | \n", "C4545381 | \n", "5156 | \n", "1 | \n", "0.30 | \n", "SIO_001348 | \n", "
358209 rows × 5 columns
\n", "\n", " | disease_id | \n", "gene_id | \n", "class_range | \n", "icd_class_name | \n", "class_name | \n", "
---|---|---|---|---|---|
0 | \n", "C0000744 | \n", "25 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
1 | \n", "C0000744 | \n", "27 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
2 | \n", "C0000744 | \n", "238 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
3 | \n", "C0000744 | \n", "338 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
4 | \n", "C0000744 | \n", "348 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
118041 | \n", "C1691779 | \n", "2707 | \n", "H60-H95 | \n", "Diseases of the ear and mastoid process | \n", "Ear | \n", "
118042 | \n", "C1691779 | \n", "4036 | \n", "H60-H95 | \n", "Diseases of the ear and mastoid process | \n", "Ear | \n", "
118043 | \n", "C1691779 | \n", "5172 | \n", "H60-H95 | \n", "Diseases of the ear and mastoid process | \n", "Ear | \n", "
118044 | \n", "C1691779 | \n", "8772 | \n", "H60-H95 | \n", "Diseases of the ear and mastoid process | \n", "Ear | \n", "
118045 | \n", "C1691779 | \n", "10265 | \n", "H60-H95 | \n", "Diseases of the ear and mastoid process | \n", "Ear | \n", "
118046 rows × 5 columns
\n", "\n", " | class_name | \n", "disease_id | \n", "num_feature_disease | \n", "feature | \n", "
---|---|---|---|---|
0 | \n", "Circulatory | \n", "C0002940 | \n", "56 | \n", "genes | \n", "
1 | \n", "Circulatory | \n", "C0002962 | \n", "54 | \n", "genes | \n", "
2 | \n", "Circulatory | \n", "C0002963 | \n", "1 | \n", "genes | \n", "
3 | \n", "Circulatory | \n", "C0002965 | \n", "19 | \n", "genes | \n", "
4 | \n", "Circulatory | \n", "C0003486 | \n", "95 | \n", "genes | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2796 | \n", "Skin | \n", "C0702166 | \n", "44 | \n", "genes | \n", "
2797 | \n", "Skin | \n", "C1112570 | \n", "4 | \n", "genes | \n", "
2798 | \n", "Skin | \n", "C1260874 | \n", "1 | \n", "genes | \n", "
2799 | \n", "Skin | \n", "C2936846 | \n", "1 | \n", "genes | \n", "
2800 | \n", "Skin | \n", "C4083212 | \n", "19 | \n", "genes | \n", "
2801 rows × 4 columns
\n", "\n", " | disease_id | \n", "variant_id | \n", "source_id | \n", "score | \n", "
---|---|---|---|---|
0 | \n", "C0000737 | \n", "rs1057518806 | \n", "1 | \n", "0.70 | \n", "
1 | \n", "C0000737 | \n", "rs1057518886 | \n", "1 | \n", "0.70 | \n", "
2 | \n", "C0000744 | \n", "rs146064714 | \n", "1 | \n", "0.70 | \n", "
3 | \n", "C0000744 | \n", "rs199422219 | \n", "1 | \n", "0.70 | \n", "
4 | \n", "C0000744 | \n", "rs199422220 | \n", "1 | \n", "0.80 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
210493 | \n", "C4540536 | \n", "rs148033592 | \n", "1 | \n", "0.70 | \n", "
210494 | \n", "C4540536 | \n", "rs61749698 | \n", "1 | \n", "0.70 | \n", "
210495 | \n", "C4540602 | \n", "rs148033592 | \n", "1 | \n", "0.70 | \n", "
210496 | \n", "C4540602 | \n", "rs61749698 | \n", "1 | \n", "0.70 | \n", "
210497 | \n", "C4543822 | \n", "rs1044396 | \n", "1 | \n", "0.01 | \n", "
210498 rows × 4 columns
\n", "\n", " | class_name | \n", "disease_id | \n", "num_feature_disease | \n", "feature | \n", "
---|---|---|---|---|
0 | \n", "Circulatory | \n", "C0002940 | \n", "7 | \n", "variants | \n", "
1 | \n", "Circulatory | \n", "C0002962 | \n", "64 | \n", "variants | \n", "
2 | \n", "Circulatory | \n", "C0002963 | \n", "2 | \n", "variants | \n", "
3 | \n", "Circulatory | \n", "C0002965 | \n", "4 | \n", "variants | \n", "
4 | \n", "Circulatory | \n", "C0003486 | \n", "9 | \n", "variants | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1623 | \n", "Skin | \n", "C0406317 | \n", "1 | \n", "variants | \n", "
1624 | \n", "Skin | \n", "C0409974 | \n", "17 | \n", "variants | \n", "
1625 | \n", "Skin | \n", "C0477474 | \n", "1 | \n", "variants | \n", "
1626 | \n", "Skin | \n", "C0702166 | \n", "8 | \n", "variants | \n", "
1627 | \n", "Skin | \n", "C4083212 | \n", "2 | \n", "variants | \n", "
1628 rows × 4 columns
\n", "\n", " | disease_id | \n", "pathway_id | \n", "
---|---|---|
0 | \n", "C0000731 | \n", "WP117 | \n", "
1 | \n", "C0000731 | \n", "WP138 | \n", "
2 | \n", "C0000731 | \n", "WP15 | \n", "
3 | \n", "C0000731 | \n", "WP1533 | \n", "
4 | \n", "C0000731 | \n", "WP1544 | \n", "
... | \n", "... | \n", "... | \n", "
400696 | \n", "C4540602 | \n", "WP734 | \n", "
400697 | \n", "C4545381 | \n", "WP306 | \n", "
400698 | \n", "C4545381 | \n", "WP322 | \n", "
400699 | \n", "C4545381 | \n", "WP3611 | \n", "
400700 | \n", "C4545381 | \n", "WP51 | \n", "
400701 rows × 2 columns
\n", "\n", " | class_name | \n", "disease_id | \n", "num_feature_disease | \n", "feature | \n", "
---|---|---|---|---|
0 | \n", "Circulatory | \n", "C0002940 | \n", "120 | \n", "pathway | \n", "
1 | \n", "Circulatory | \n", "C0002962 | \n", "96 | \n", "pathway | \n", "
2 | \n", "Circulatory | \n", "C0002963 | \n", "8 | \n", "pathway | \n", "
3 | \n", "Circulatory | \n", "C0002965 | \n", "79 | \n", "pathway | \n", "
4 | \n", "Circulatory | \n", "C0003486 | \n", "139 | \n", "pathway | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2423 | \n", "Skin | \n", "C0549567 | \n", "9 | \n", "pathway | \n", "
2424 | \n", "Skin | \n", "C0600336 | \n", "1 | \n", "pathway | \n", "
2425 | \n", "Skin | \n", "C0702166 | \n", "81 | \n", "pathway | \n", "
2426 | \n", "Skin | \n", "C1112570 | \n", "4 | \n", "pathway | \n", "
2427 | \n", "Skin | \n", "C4083212 | \n", "31 | \n", "pathway | \n", "
2428 rows × 4 columns
\n", "\n", " | marker | \n", "disease_id | \n", "class_range | \n", "icd_class_name | \n", "class_name | \n", "
---|---|---|---|---|---|
0 | \n", "1-Methylhistidine | \n", "C0028754 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
1 | \n", "(R)-3-Hydroxybutyric acid | \n", "C0028754 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
2 | \n", "L-Carnitine | \n", "C0028754 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
3 | \n", "L-Threonine | \n", "C0028754 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
4 | \n", "Ornithine | \n", "C0028754 | \n", "E00-E90 | \n", "Endocrine, nutritional and metabolic diseases | \n", "Metabolic | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
1712 | \n", "Theophylline | \n", "C1319018 | \n", "J00-J99 | \n", "Diseases of the respiratory system | \n", "Respiratory | \n", "
1713 | \n", "Theobromine | \n", "C1319018 | \n", "J00-J99 | \n", "Diseases of the respiratory system | \n", "Respiratory | \n", "
1714 | \n", "11b-PGF2a | \n", "C1319018 | \n", "J00-J99 | \n", "Diseases of the respiratory system | \n", "Respiratory | \n", "
1715 | \n", "1,7-Dimethyluric acid | \n", "C1319018 | \n", "J00-J99 | \n", "Diseases of the respiratory system | \n", "Respiratory | \n", "
1716 | \n", "5-HETE | \n", "C1319018 | \n", "J00-J99 | \n", "Diseases of the respiratory system | \n", "Respiratory | \n", "
1717 rows × 5 columns
\n", "\n", " | class_name | \n", "disease_id | \n", "num_feature_disease | \n", "class_range | \n", "icd_class_name | \n", "feature | \n", "
---|---|---|---|---|---|---|
0 | \n", "Circulatory | \n", "C0004153 | \n", "1 | \n", "1 | \n", "1 | \n", "biomarker | \n", "
1 | \n", "Circulatory | \n", "C0010054 | \n", "1 | \n", "1 | \n", "1 | \n", "biomarker | \n", "
2 | \n", "Circulatory | \n", "C0010068 | \n", "1 | \n", "1 | \n", "1 | \n", "biomarker | \n", "
3 | \n", "Circulatory | \n", "C0010072 | \n", "3 | \n", "3 | \n", "3 | \n", "biomarker | \n", "
4 | \n", "Circulatory | \n", "C0020538 | \n", "9 | \n", "9 | \n", "9 | \n", "biomarker | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
175 | \n", "Respiratory | \n", "C0264413 | \n", "8 | \n", "8 | \n", "8 | \n", "biomarker | \n", "
176 | \n", "Respiratory | \n", "C1260881 | \n", "8 | \n", "8 | \n", "8 | \n", "biomarker | \n", "
177 | \n", "Respiratory | \n", "C1319018 | \n", "8 | \n", "8 | \n", "8 | \n", "biomarker | \n", "
178 | \n", "Skin | \n", "C0013595 | \n", "2 | \n", "2 | \n", "2 | \n", "biomarker | \n", "
179 | \n", "Skin | \n", "C0042900 | \n", "1 | \n", "1 | \n", "1 | \n", "biomarker | \n", "
180 rows × 6 columns
\n", "