{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "28a48d50", "metadata": { "scrolled": true }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: biopython in /home/lmasa/miniconda3/lib/python3.12/site-packages (1.83)\n", "Requirement already satisfied: numpy in /home/lmasa/miniconda3/lib/python3.12/site-packages (from biopython) (1.26.4)\n" ] } ], "source": [ "!pip install biopython" ] }, { "cell_type": "code", "execution_count": 2, "id": "322cad3f", "metadata": { "scrolled": true }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: geoparse in /home/lmasa/miniconda3/lib/python3.12/site-packages (2.0.4)\n", "Requirement already satisfied: numpy>=1.7 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geoparse) (1.26.4)\n", "Requirement already satisfied: pandas>=0.17 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geoparse) (2.2.2)\n", "Requirement already satisfied: requests>=2.21.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geoparse) (2.31.0)\n", "Requirement already satisfied: tqdm>=4.31.1 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geoparse) (4.65.0)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=0.17->geoparse) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=0.17->geoparse) (2023.3.post1)\n", "Requirement already satisfied: tzdata>=2022.7 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=0.17->geoparse) (2024.1)\n", "Requirement already satisfied: charset-normalizer<4,>=2 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from requests>=2.21.0->geoparse) (2.0.4)\n", "Requirement already satisfied: idna<4,>=2.5 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from requests>=2.21.0->geoparse) (3.4)\n", "Requirement already satisfied: urllib3<3,>=1.21.1 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from requests>=2.21.0->geoparse) (2.1.0)\n", "Requirement already satisfied: certifi>=2017.4.17 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from requests>=2.21.0->geoparse) (2024.2.2)\n", "Requirement already satisfied: six>=1.5 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from python-dateutil>=2.8.2->pandas>=0.17->geoparse) (1.16.0)\n" ] } ], "source": [ "!pip install geoparse" ] }, { "cell_type": "code", "execution_count": 3, "id": "a84213b2", "metadata": { "scrolled": true }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: geopandas in /home/lmasa/miniconda3/lib/python3.12/site-packages (0.14.4)\n", "Requirement already satisfied: fiona>=1.8.21 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (1.9.6)\n", "Requirement already satisfied: numpy>=1.22 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (1.26.4)\n", "Requirement already satisfied: packaging in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (23.1)\n", "Requirement already satisfied: pandas>=1.4.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (2.2.2)\n", "Requirement already satisfied: pyproj>=3.3.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (3.6.1)\n", "Requirement already satisfied: shapely>=1.8.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from geopandas) (2.0.4)\n", "Requirement already satisfied: attrs>=19.2.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (23.1.0)\n", "Requirement already satisfied: certifi in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (2024.2.2)\n", "Requirement already satisfied: click~=8.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (8.1.7)\n", "Requirement already satisfied: click-plugins>=1.0 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (1.1.1)\n", "Requirement already satisfied: cligj>=0.5 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (0.7.2)\n", "Requirement already satisfied: six in /home/lmasa/miniconda3/lib/python3.12/site-packages (from fiona>=1.8.21->geopandas) (1.16.0)\n", "Requirement already satisfied: python-dateutil>=2.8.2 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=1.4.0->geopandas) (2.8.2)\n", "Requirement already satisfied: pytz>=2020.1 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=1.4.0->geopandas) (2023.3.post1)\n", "Requirement already satisfied: tzdata>=2022.7 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pandas>=1.4.0->geopandas) (2024.1)\n" ] } ], "source": [ "!pip install geopandas" ] }, { "cell_type": "code", "execution_count": 4, "id": "b0ac0c04-168b-4183-abb4-412383f9db05", "metadata": { "scrolled": true }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Requirement already satisfied: pyspark in /home/lmasa/miniconda3/lib/python3.12/site-packages (3.5.1)\n", "Requirement already satisfied: py4j==0.10.9.7 in /home/lmasa/miniconda3/lib/python3.12/site-packages (from pyspark) (0.10.9.7)\n" ] } ], "source": [ "!pip install pyspark" ] }, { "cell_type": "code", "execution_count": 1, "id": "8e7956d3", "metadata": {}, "outputs": [], "source": [ "import requests\n", "from Bio import Entrez\n", "import GEOparse\n", "import os\n", "import gzip\n", "import shutil\n", "import pandas as pd\n", "from os.path import join\n", "from collections import defaultdict\n", "import numpy as np\n", "import csv\n", "import download_files\n", "import polars as pl\n", "import mysql.connector\n", "from mysql.connector import errorcode" ] }, { "cell_type": "code", "execution_count": 2, "id": "11c53552", "metadata": { "scrolled": true }, "outputs": [], "source": [ "#disease names and ids \n", "diseases_tsv_file='../data/raw/data_01_neuro_diseases_final_disease_selected.tsv'\n", "disease_names=download_files.extract_tsv(diseases_tsv_file)" ] }, { "cell_type": "code", "execution_count": 3, "id": "0af72d99-57be-48ae-bef7-a6692cc53ff2", "metadata": { "scrolled": true }, "outputs": [], "source": [ "#email and path to store the GDS files\n", "email_request='l.masa@alumnos.upm.es'\n", "gds_path=\"../data/gds\"" ] }, { "cell_type": "code", "execution_count": null, "id": "b6361761-21a1-412a-b342-6f5b0e0af402", "metadata": { "scrolled": true }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "29-May-2024 10:08:57 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:08:57 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3864/soft/GDS3864.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3864.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 3.26M/3.26M [00:01<00:00, 1.71MB/s]\n", "29-May-2024 10:09:00 DEBUG downloader - Size validation passed\n", "29-May-2024 10:09:00 DEBUG downloader - Moving /tmp/tmp1n5w3mdb to /home/lmasa/GEO_Laura/Data/gds/GDS3864.soft.gz\n", "29-May-2024 10:09:00 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3864/soft/GDS3864.soft.gz\n", "29-May-2024 10:09:00 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3864.soft.gz: \n", "29-May-2024 10:09:00 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:09:00 DEBUG GEOparse - DATASET: GDS3864\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_1\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_2\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_3\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_4\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_5\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_6\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_7\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_8\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_9\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_10\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_11\n", "29-May-2024 10:09:00 DEBUG GEOparse - SUBSET: GDS3864_12\n", "29-May-2024 10:09:00 DEBUG GEOparse - DATASET: GDS3864\n", "29-May-2024 10:09:03 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:09:03 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS1nnn/GDS1962/soft/GDS1962.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS1962.soft.gz\n", " 28%|█████████████████████████▏ | 5.85M/20.9M [00:02<00:02, 6.26MB/s]29-May-2024 10:13:31 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:13:31 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4879/soft/GDS4879.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS4879.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 3.91M/3.91M [00:02<00:00, 1.93MB/s]\n", "29-May-2024 10:13:34 DEBUG downloader - Size validation passed\n", "29-May-2024 10:13:34 DEBUG downloader - Moving /tmp/tmpboa6aqc5 to /home/lmasa/GEO_Laura/Data/gds/GDS4879.soft.gz\n", "29-May-2024 10:13:34 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4879/soft/GDS4879.soft.gz\n", "29-May-2024 10:13:34 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS4879.soft.gz: \n", "29-May-2024 10:13:34 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:13:34 DEBUG GEOparse - DATASET: GDS4879\n", "29-May-2024 10:13:34 DEBUG GEOparse - SUBSET: GDS4879_1\n", "29-May-2024 10:13:34 DEBUG GEOparse - SUBSET: GDS4879_2\n", "29-May-2024 10:13:34 DEBUG GEOparse - SUBSET: GDS4879_3\n", "29-May-2024 10:13:34 DEBUG GEOparse - SUBSET: GDS4879_4\n", "29-May-2024 10:13:34 DEBUG GEOparse - DATASET: GDS4879\n", "29-May-2024 10:13:37 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:13:37 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3345/soft/GDS3345.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3345.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 2.11M/2.11M [00:01<00:00, 1.33MB/s]\n", "29-May-2024 10:13:39 DEBUG downloader - Size validation passed\n", "29-May-2024 10:13:39 DEBUG downloader - Moving /tmp/tmpvp5786ab to /home/lmasa/GEO_Laura/Data/gds/GDS3345.soft.gz\n", "29-May-2024 10:13:39 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3345/soft/GDS3345.soft.gz\n", "29-May-2024 10:13:39 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3345.soft.gz: \n", "29-May-2024 10:13:39 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:13:39 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:13:39 DEBUG GEOparse - SUBSET: GDS3345_1\n", "29-May-2024 10:13:39 DEBUG GEOparse - SUBSET: GDS3345_2\n", "29-May-2024 10:13:39 DEBUG GEOparse - SUBSET: GDS3345_3\n", "29-May-2024 10:13:39 DEBUG GEOparse - SUBSET: GDS3345_4\n", "29-May-2024 10:13:39 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:13:40 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:13:40 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3268/soft/GDS3268.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3268.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 25.5M/25.5M [00:03<00:00, 7.57MB/s]\n", "29-May-2024 10:13:45 DEBUG downloader - Size validation passed\n", "29-May-2024 10:13:45 DEBUG downloader - Moving /tmp/tmpldvkp0et to /home/lmasa/GEO_Laura/Data/gds/GDS3268.soft.gz\n", "29-May-2024 10:13:45 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3268/soft/GDS3268.soft.gz\n", "29-May-2024 10:13:45 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3268.soft.gz: \n", "29-May-2024 10:13:45 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:13:45 DEBUG GEOparse - DATASET: GDS3268\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_1\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_2\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_3\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_4\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_5\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_6\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_7\n", "29-May-2024 10:13:45 DEBUG GEOparse - SUBSET: GDS3268_8\n", "29-May-2024 10:13:45 DEBUG GEOparse - DATASET: GDS3268\n", "29-May-2024 10:13:46 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:13:46 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS2nnn/GDS2447/soft/GDS2447.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS2447.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 2.06M/2.06M [00:01<00:00, 1.27MB/s]\n", "29-May-2024 10:13:49 DEBUG downloader - Size validation passed\n", "29-May-2024 10:13:49 DEBUG downloader - Moving /tmp/tmp5fkb1opz to /home/lmasa/GEO_Laura/Data/gds/GDS2447.soft.gz\n", "29-May-2024 10:13:49 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS2nnn/GDS2447/soft/GDS2447.soft.gz\n", "29-May-2024 10:13:49 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS2447.soft.gz: \n", "29-May-2024 10:13:49 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:13:49 DEBUG GEOparse - DATASET: GDS2447\n", "29-May-2024 10:13:49 DEBUG GEOparse - SUBSET: GDS2447_1\n", "29-May-2024 10:13:49 DEBUG GEOparse - SUBSET: GDS2447_2\n", "29-May-2024 10:13:49 DEBUG GEOparse - DATASET: GDS2447\n", "29-May-2024 10:15:57 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:15:57 INFO GEOparse - File already exist: using local version.\n", "29-May-2024 10:15:57 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS4879.soft.gz: \n", "29-May-2024 10:15:57 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:15:57 DEBUG GEOparse - DATASET: GDS4879\n", "29-May-2024 10:15:57 DEBUG GEOparse - SUBSET: GDS4879_1\n", "29-May-2024 10:15:57 DEBUG GEOparse - SUBSET: GDS4879_2\n", "29-May-2024 10:15:57 DEBUG GEOparse - SUBSET: GDS4879_3\n", "29-May-2024 10:15:57 DEBUG GEOparse - SUBSET: GDS4879_4\n", "29-May-2024 10:15:57 DEBUG GEOparse - DATASET: GDS4879\n", "29-May-2024 10:16:00 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:00 INFO GEOparse - File already exist: using local version.\n", "29-May-2024 10:16:00 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3345.soft.gz: \n", "29-May-2024 10:16:00 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:00 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:16:00 DEBUG GEOparse - SUBSET: GDS3345_1\n", "29-May-2024 10:16:00 DEBUG GEOparse - SUBSET: GDS3345_2\n", "29-May-2024 10:16:00 DEBUG GEOparse - SUBSET: GDS3345_3\n", "29-May-2024 10:16:00 DEBUG GEOparse - SUBSET: GDS3345_4\n", "29-May-2024 10:16:00 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:16:01 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:01 INFO GEOparse - File already exist: using local version.\n", "29-May-2024 10:16:01 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3268.soft.gz: \n", "29-May-2024 10:16:01 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:01 DEBUG GEOparse - DATASET: GDS3268\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_1\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_2\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_3\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_4\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_5\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_6\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_7\n", "29-May-2024 10:16:01 DEBUG GEOparse - SUBSET: GDS3268_8\n", "29-May-2024 10:16:01 DEBUG GEOparse - DATASET: GDS3268\n", "29-May-2024 10:16:03 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:03 INFO GEOparse - File already exist: using local version.\n", "29-May-2024 10:16:03 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS2447.soft.gz: \n", "29-May-2024 10:16:03 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:03 DEBUG GEOparse - DATASET: GDS2447\n", "29-May-2024 10:16:03 DEBUG GEOparse - SUBSET: GDS2447_1\n", "29-May-2024 10:16:03 DEBUG GEOparse - SUBSET: GDS2447_2\n", "29-May-2024 10:16:03 DEBUG GEOparse - DATASET: GDS2447\n", "29-May-2024 10:16:39 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:39 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4522/soft/GDS4522.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS4522.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 7.04M/7.04M [00:02<00:00, 2.55MB/s]\n", "29-May-2024 10:16:42 DEBUG downloader - Size validation passed\n", "29-May-2024 10:16:42 DEBUG downloader - Moving /tmp/tmpvykmsiq8 to /home/lmasa/GEO_Laura/Data/gds/GDS4522.soft.gz\n", "29-May-2024 10:16:42 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4522/soft/GDS4522.soft.gz\n", "29-May-2024 10:16:42 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS4522.soft.gz: \n", "29-May-2024 10:16:42 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:42 DEBUG GEOparse - DATASET: GDS4522\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_1\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_2\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_3\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_4\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_5\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_6\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_7\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_8\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_9\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_10\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_11\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_12\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_13\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_14\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_15\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_16\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_17\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_18\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_19\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_20\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_21\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_22\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_23\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_24\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_25\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_26\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_27\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_28\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_29\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_30\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_31\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_32\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_33\n", "29-May-2024 10:16:42 DEBUG GEOparse - SUBSET: GDS4522_34\n", "29-May-2024 10:16:42 DEBUG GEOparse - DATASET: GDS4522\n", "29-May-2024 10:16:44 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:44 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3938/soft/GDS3938.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3938.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 2.88M/2.88M [00:02<00:00, 1.50MB/s]\n", "29-May-2024 10:16:47 DEBUG downloader - Size validation passed\n", "29-May-2024 10:16:47 DEBUG downloader - Moving /tmp/tmpl_rfhlfc to /home/lmasa/GEO_Laura/Data/gds/GDS3938.soft.gz\n", "29-May-2024 10:16:47 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3938/soft/GDS3938.soft.gz\n", "29-May-2024 10:16:47 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3938.soft.gz: \n", "29-May-2024 10:16:47 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:47 DEBUG GEOparse - DATASET: GDS3938\n", "29-May-2024 10:16:47 DEBUG GEOparse - SUBSET: GDS3938_1\n", "29-May-2024 10:16:47 DEBUG GEOparse - SUBSET: GDS3938_2\n", "29-May-2024 10:16:47 DEBUG GEOparse - SUBSET: GDS3938_3\n", "29-May-2024 10:16:47 DEBUG GEOparse - SUBSET: GDS3938_4\n", "29-May-2024 10:16:47 DEBUG GEOparse - DATASET: GDS3938\n", "29-May-2024 10:16:51 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:51 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4523/soft/GDS4523.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS4523.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 7.09M/7.09M [00:02<00:00, 2.80MB/s]\n", "29-May-2024 10:16:54 DEBUG downloader - Size validation passed\n", "29-May-2024 10:16:54 DEBUG downloader - Moving /tmp/tmphrrn826s to /home/lmasa/GEO_Laura/Data/gds/GDS4523.soft.gz\n", "29-May-2024 10:16:54 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4523/soft/GDS4523.soft.gz\n", "29-May-2024 10:16:54 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS4523.soft.gz: \n", "29-May-2024 10:16:54 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:54 DEBUG GEOparse - DATASET: GDS4523\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_1\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_2\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_3\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_4\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_5\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_6\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_7\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_8\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_9\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_10\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_11\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_12\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_13\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_14\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_15\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_16\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_17\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_18\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_19\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_20\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_21\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_22\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_23\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_24\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_25\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_26\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_27\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_28\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_29\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_30\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_31\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_32\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_33\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_34\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_35\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_36\n", "29-May-2024 10:16:54 DEBUG GEOparse - SUBSET: GDS4523_37\n", "29-May-2024 10:16:54 DEBUG GEOparse - DATASET: GDS4523\n", "29-May-2024 10:16:56 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:16:56 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3502/soft/GDS3502.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3502.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 6.98M/6.98M [00:03<00:00, 2.22MB/s]\n", "29-May-2024 10:16:59 DEBUG downloader - Size validation passed\n", "29-May-2024 10:16:59 DEBUG downloader - Moving /tmp/tmpjbt967em to /home/lmasa/GEO_Laura/Data/gds/GDS3502.soft.gz\n", "29-May-2024 10:16:59 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3502/soft/GDS3502.soft.gz\n", "29-May-2024 10:16:59 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3502.soft.gz: \n", "29-May-2024 10:16:59 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:16:59 DEBUG GEOparse - DATASET: GDS3502\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_1\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_2\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_3\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_4\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_5\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_6\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_7\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_8\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_9\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_10\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_11\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_12\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_13\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_14\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_15\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_16\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_17\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_18\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_19\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_20\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_21\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_22\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_23\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_24\n", "29-May-2024 10:16:59 DEBUG GEOparse - SUBSET: GDS3502_25\n", "29-May-2024 10:16:59 DEBUG GEOparse - DATASET: GDS3502\n", "29-May-2024 10:17:01 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:17:01 INFO GEOparse - File already exist: using local version.\n", "29-May-2024 10:17:01 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3345.soft.gz: \n", "29-May-2024 10:17:01 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:17:01 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:17:01 DEBUG GEOparse - SUBSET: GDS3345_1\n", "29-May-2024 10:17:01 DEBUG GEOparse - SUBSET: GDS3345_2\n", "29-May-2024 10:17:01 DEBUG GEOparse - SUBSET: GDS3345_3\n", "29-May-2024 10:17:01 DEBUG GEOparse - SUBSET: GDS3345_4\n", "29-May-2024 10:17:01 DEBUG GEOparse - DATASET: GDS3345\n", "29-May-2024 10:17:03 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:17:03 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS1nnn/GDS1917/soft/GDS1917.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS1917.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 5.75M/5.75M [00:02<00:00, 2.51MB/s]\n", "29-May-2024 10:17:06 DEBUG downloader - Size validation passed\n", "29-May-2024 10:17:06 DEBUG downloader - Moving /tmp/tmpd2_2fbex to /home/lmasa/GEO_Laura/Data/gds/GDS1917.soft.gz\n", "29-May-2024 10:17:06 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS1nnn/GDS1917/soft/GDS1917.soft.gz\n", "29-May-2024 10:17:06 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS1917.soft.gz: \n", "29-May-2024 10:17:06 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:17:06 DEBUG GEOparse - DATASET: GDS1917\n", "29-May-2024 10:17:06 DEBUG GEOparse - SUBSET: GDS1917_1\n", "29-May-2024 10:17:06 DEBUG GEOparse - SUBSET: GDS1917_2\n", "29-May-2024 10:17:06 DEBUG GEOparse - DATASET: GDS1917\n", "29-May-2024 10:23:40 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:23:40 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS1nnn/GDS1956/soft/GDS1956.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS1956.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 9.39M/9.39M [00:03<00:00, 3.26MB/s]\n", "29-May-2024 10:23:44 DEBUG downloader - Size validation passed\n", "29-May-2024 10:23:44 DEBUG downloader - Moving /tmp/tmpmcy5md5j to /home/lmasa/GEO_Laura/Data/gds/GDS1956.soft.gz\n", "29-May-2024 10:23:44 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS1nnn/GDS1956/soft/GDS1956.soft.gz\n", "29-May-2024 10:23:44 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS1956.soft.gz: \n", "29-May-2024 10:23:44 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:23:44 DEBUG GEOparse - DATASET: GDS1956\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_1\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_2\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_3\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_4\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_5\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_6\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_7\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_8\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_9\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_10\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_11\n", "29-May-2024 10:23:44 DEBUG GEOparse - SUBSET: GDS1956_12\n", "29-May-2024 10:23:44 DEBUG GEOparse - DATASET: GDS1956\n", "29-May-2024 10:23:45 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:23:45 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDSnnn/GDS412/soft/GDS412.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS412.soft.gz\n", "100%|█████████████████████████████████████████████████████████████████████████████████████████████| 184k/184k [00:00<00:00, 204kB/s]\n", "29-May-2024 10:23:47 DEBUG downloader - Size validation passed\n", "29-May-2024 10:23:47 DEBUG downloader - Moving /tmp/tmp6jbesoyo to /home/lmasa/GEO_Laura/Data/gds/GDS412.soft.gz\n", "29-May-2024 10:23:47 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDSnnn/GDS412/soft/GDS412.soft.gz\n", "29-May-2024 10:23:47 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS412.soft.gz: \n", "29-May-2024 10:23:47 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:23:47 DEBUG GEOparse - DATASET: GDS412\n", "29-May-2024 10:23:47 DEBUG GEOparse - SUBSET: GDS412_1\n", "29-May-2024 10:23:47 DEBUG GEOparse - SUBSET: GDS412_2\n", "29-May-2024 10:23:47 DEBUG GEOparse - SUBSET: GDS412_3\n", "29-May-2024 10:23:47 DEBUG GEOparse - DATASET: GDS412\n", "29-May-2024 10:25:01 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:25:01 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4218/soft/GDS4218.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS4218.soft.gz\n", "100%|███████████████████████████████████████████████████████████████████████████████████████████| 1.28M/1.28M [00:01<00:00, 875kB/s]\n", "29-May-2024 10:25:04 DEBUG downloader - Size validation passed\n", "29-May-2024 10:25:04 DEBUG downloader - Moving /tmp/tmpwxisu6m2 to /home/lmasa/GEO_Laura/Data/gds/GDS4218.soft.gz\n", "29-May-2024 10:25:04 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4218/soft/GDS4218.soft.gz\n", "29-May-2024 10:25:04 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS4218.soft.gz: \n", "29-May-2024 10:25:04 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:25:04 DEBUG GEOparse - DATASET: GDS4218\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_1\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_2\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_3\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_4\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_5\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_6\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_7\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_8\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_9\n", "29-May-2024 10:25:04 DEBUG GEOparse - SUBSET: GDS4218_10\n", "29-May-2024 10:25:04 DEBUG GEOparse - DATASET: GDS4218\n", "29-May-2024 10:25:07 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:25:07 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3920/soft/GDS3920.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS3920.soft.gz\n", "100%|██████████████████████████████████████████████████████████████████████████████████████████| 2.84M/2.84M [00:02<00:00, 1.47MB/s]\n", "29-May-2024 10:25:10 DEBUG downloader - Size validation passed\n", "29-May-2024 10:25:10 DEBUG downloader - Moving /tmp/tmpk0rzde4u to /home/lmasa/GEO_Laura/Data/gds/GDS3920.soft.gz\n", "29-May-2024 10:25:10 DEBUG downloader - Successfully downloaded ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS3nnn/GDS3920/soft/GDS3920.soft.gz\n", "29-May-2024 10:25:10 INFO GEOparse - Parsing /home/lmasa/GEO_Laura/Data/gds/GDS3920.soft.gz: \n", "29-May-2024 10:25:10 DEBUG GEOparse - DATABASE: Geo\n", "29-May-2024 10:25:10 DEBUG GEOparse - DATASET: GDS3920\n", "29-May-2024 10:25:10 DEBUG GEOparse - SUBSET: GDS3920_1\n", "29-May-2024 10:25:10 DEBUG GEOparse - SUBSET: GDS3920_2\n", "29-May-2024 10:25:10 DEBUG GEOparse - DATASET: GDS3920\n", "29-May-2024 10:25:12 DEBUG utils - Directory /home/lmasa/GEO_Laura/Data/gds already exists. Skipping.\n", "29-May-2024 10:25:12 INFO GEOparse - Downloading ftp://ftp.ncbi.nlm.nih.gov/geo/datasets/GDS4nnn/GDS4152/soft/GDS4152.soft.gz to /home/lmasa/GEO_Laura/Data/gds/GDS4152.soft.gz\n", " 0%| | 0.00/2.36M [00:00