{ "nbformat": 4, "nbformat_minor": 0, "metadata": { "colab": { "name": "05.Downloading subsets of a project.ipynb", "provenance": [], "collapsed_sections": [], "authorship_tag": "ABX9TyMwGm36+9vVPTY3ariKzrRm", "include_colab_link": true }, "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" } }, "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "[](https://colab.research.google.com/github/saketkc/pysradb/blob/develop/notebooks/05.Downloading_subsets_of_a_project.ipynb)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "# Downloading Subsets of a Project\n", "\n", "This notebook shows how to filter and download specific samples from a larger SRA project." ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Install pysradb if not already installed\n", "try:\n", " import pysradb\n", "\n", " print(f\"pysradb {pysradb.__version__} is already installed\")\n", "except ImportError:\n", " print(\"Installing pysradb from GitHub...\")\n", " import sys\n", "\n", " !{sys.executable} -m pip install -q git+https://github.com/saketkc/pysradb\n", " print(\"pysradb installed successfully!\")" ] }, { "cell_type": "code", "metadata": { "id": "ZimlPnZwF3JP", "colab_type": "code", "outputId": "25bca786-e5e1-4980-f304-8493b06c3481", "colab": { "base_uri": "https://localhost:8080/", "height": 683 } }, "source": [ "pip install git+https://github.com/saketkc/pysradb.git" ], "execution_count": 1, "outputs": [ { "output_type": "stream", "text": [ "Collecting git+https://github.com/saketkc/pysradb.git\n", " Cloning https://github.com/saketkc/pysradb.git to /tmp/pip-req-build-3dlg9hp3\n", " Running command git clone -q https://github.com/saketkc/pysradb.git /tmp/pip-req-build-3dlg9hp3\n", "Requirement already satisfied: pandas==0.25.3 in /usr/local/lib/python3.6/dist-packages (from pysradb==0.10.3.dev0) (0.25.3)\n", "Collecting tqdm==4.41.1\n", " Using cached 
https://files.pythonhosted.org/packages/72/c9/7fc20feac72e79032a7c8138fd0d395dc6d8812b5b9edf53c3afd0b31017/tqdm-4.41.1-py2.py3-none-any.whl\n", "Collecting requests==2.22.0\n", " Using cached https://files.pythonhosted.org/packages/51/bd/23c926cd341ea6b7dd0b2a00aba99ae0f828be89d72b2190f27c11d4b7fb/requests-2.22.0-py2.py3-none-any.whl\n", "Collecting xmltodict==0.12.0\n", " Using cached https://files.pythonhosted.org/packages/28/fd/30d5c1d3ac29ce229f6bdc40bbc20b28f716e8b363140c26eff19122d8a5/xmltodict-0.12.0-py2.py3-none-any.whl\n", "Requirement already satisfied: python-dateutil>=2.6.1 in /usr/local/lib/python3.6/dist-packages (from pandas==0.25.3->pysradb==0.10.3.dev0) (2.6.1)\n", "Requirement already satisfied: pytz>=2017.2 in /usr/local/lib/python3.6/dist-packages (from pandas==0.25.3->pysradb==0.10.3.dev0) (2018.9)\n", "Requirement already satisfied: numpy>=1.13.3 in /usr/local/lib/python3.6/dist-packages (from pandas==0.25.3->pysradb==0.10.3.dev0) (1.17.5)\n", "Requirement already satisfied: idna<2.9,>=2.5 in /usr/local/lib/python3.6/dist-packages (from requests==2.22.0->pysradb==0.10.3.dev0) (2.8)\n", "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.6/dist-packages (from requests==2.22.0->pysradb==0.10.3.dev0) (1.24.3)\n", "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.6/dist-packages (from requests==2.22.0->pysradb==0.10.3.dev0) (2019.11.28)\n", "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.6/dist-packages (from requests==2.22.0->pysradb==0.10.3.dev0) (3.0.4)\n", "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.6/dist-packages (from python-dateutil>=2.6.1->pandas==0.25.3->pysradb==0.10.3.dev0) (1.12.0)\n", "Building wheels for collected packages: pysradb\n", " Building wheel for pysradb (setup.py) ... 
\u001b[?25l\u001b[?25hdone\n", " Created wheel for pysradb: filename=pysradb-0.10.3.dev0-cp36-none-any.whl size=147411 sha256=6ccd6874b7cde11cb10eae96cb14e86f9cdfe5f1b02b16a3c7eb20879afd6a62\n", " Stored in directory: /tmp/pip-ephem-wheel-cache-z9xalsuu/wheels/d5/24/42/81dccabc3a4aac9757e23b7175ad7270090a4b3c203cd4fc8f\n", "Successfully built pysradb\n", "\u001b[31mERROR: google-colab 1.0.0 has requirement requests~=2.21.0, but you'll have requests 2.22.0 which is incompatible.\u001b[0m\n", "\u001b[31mERROR: datascience 0.10.6 has requirement folium==0.2.1, but you'll have folium 0.8.3 which is incompatible.\u001b[0m\n", "Installing collected packages: tqdm, requests, xmltodict, pysradb\n", " Found existing installation: tqdm 4.28.1\n", " Uninstalling tqdm-4.28.1:\n", " Successfully uninstalled tqdm-4.28.1\n", " Found existing installation: requests 2.21.0\n", " Uninstalling requests-2.21.0:\n", " Successfully uninstalled requests-2.21.0\n", "Successfully installed pysradb-0.10.3.dev0 requests-2.22.0 tqdm-4.41.1 xmltodict-0.12.0\n" ], "name": "stdout" }, { "output_type": "display_data", "data": { "application/vnd.colab-display-data+json": { "pip_warning": { "packages": [ "requests", "tqdm" ] } } }, "metadata": { "tags": [] } } ] }, { "cell_type": "code", "metadata": { "id": "Dg62g5OM_qbn", "colab_type": "code", "colab": { "base_uri": "https://localhost:8080/", "height": 34 }, "outputId": "295c4af3-0a46-4f70-b695-ab395422edec" }, "source": [ "!pysradb --version" ], "execution_count": 2, "outputs": [ { "output_type": "stream", "text": [ "pysradb 0.10.3-dev0\n" ], "name": "stdout" } ] }, { "cell_type": "code", "metadata": { "id": "Vi6ELv2KF_V4", "colab_type": "code", "colab": {} }, "source": [ "from pysradb.sraweb import SRAweb\n", "\n", "db = SRAweb()" ], "execution_count": 0, "outputs": [] }, { "cell_type": "markdown", "metadata": { "id": "xLZ431sPKJcX", "colab_type": "text" }, "source": [ "## Example of a record missing \"SAMPLE_ATTRIBUTES\" \n", "\n", "It also has 
an \"auxiliary\" contig file: https://trace.ncbi.nlm.nih.gov/Traces/sra/?run=SRR5146869" ] }, { "cell_type": "code", "metadata": { "id": "x5OmbCI-GFcA", "colab_type": "code", "outputId": "8f445628-1d50-4845-b918-7a6d9dbe636d", "colab": { "base_uri": "https://localhost:8080/", "height": 966 } }, "source": [ "df = db.sra_metadata(\"SRP096127\", detailed=True)\n", "df" ], "execution_count": 4, "outputs": [ { "output_type": "execute_result", "data": { "text/html": [ "
| \n", " | study_accession | \n", "experiment_accession | \n", "experiment_title | \n", "experiment_desc | \n", "organism_taxid | \n", "organism_name | \n", "library_strategy | \n", "library_source | \n", "library_selection | \n", "sample_accession | \n", "sample_title | \n", "instrument | \n", "total_spots | \n", "total_size | \n", "run_accession | \n", "run_total_spots | \n", "run_total_bases | \n", "run_alias | \n", "sra_url_alt | \n", "sra_url | \n", "experiment_alias | \n", "source_name | \n", "cell type | \n", "group | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "SRP096127 | \n", "SRX2467007 | \n", "GSM2448483: normal.ct-970; Homo sapiens; Bisul... | \n", "GSM2448483: normal.ct-970; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899466 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "559547 | \n", "50734487 | \n", "SRR5149059 | \n", "559547 | \n", "83216675 | \n", "GSM2448483_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448483 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 1 | \n", "SRP096127 | \n", "SRX2467006 | \n", "GSM2448482: normal.ct-969; Homo sapiens; Bisul... | \n", "GSM2448482: normal.ct-969; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899465 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "441577 | \n", "40899268 | \n", "SRR5149058 | \n", "441577 | \n", "65549383 | \n", "GSM2448482_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448482 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 2 | \n", "SRP096127 | \n", "SRX2467005 | \n", "GSM2448481: normal.ct-968; Homo sapiens; Bisul... | \n", "GSM2448481: normal.ct-968; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899464 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "563378 | \n", "50951134 | \n", "SRR5149057 | \n", "563378 | \n", "83839813 | \n", "GSM2448481_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448481 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 3 | \n", "SRP096127 | \n", "SRX2467004 | \n", "GSM2448480: normal.ct-967; Homo sapiens; Bisul... | \n", "GSM2448480: normal.ct-967; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899463 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "422878 | \n", "39223860 | \n", "SRR5149056 | \n", "422878 | \n", "62753430 | \n", "GSM2448480_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448480 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 4 | \n", "SRP096127 | \n", "SRX2467003 | \n", "GSM2448479: normal.ct-966; Homo sapiens; Bisul... | \n", "GSM2448479: normal.ct-966; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899461 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "517254 | \n", "46881651 | \n", "SRR5149055 | \n", "517254 | \n", "77004865 | \n", "GSM2448479_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448479 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2186 | \n", "SRP096127 | \n", "SRX2464821 | \n", "GSM2446284: HCC.ct-5; Homo sapiens; Bisulfite-Seq | \n", "GSM2446284: HCC.ct-5; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897280 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "1033204 | \n", "83576370 | \n", "SRR5146873 | \n", "1033204 | \n", "196635123 | \n", "GSM2446284_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446284 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2187 | \n", "SRP096127 | \n", "SRX2464820 | \n", "GSM2446283: HCC.ct-4; Homo sapiens; Bisulfite-Seq | \n", "GSM2446283: HCC.ct-4; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897279 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "840853 | \n", "68410342 | \n", "SRR5146872 | \n", "840853 | \n", "159822416 | \n", "GSM2446283_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446283 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2188 | \n", "SRP096127 | \n", "SRX2464819 | \n", "GSM2446282: HCC.ct-3; Homo sapiens; Bisulfite-Seq | \n", "GSM2446282: HCC.ct-3; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897278 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "885724 | \n", "71407675 | \n", "SRR5146871 | \n", "885724 | \n", "166270272 | \n", "GSM2446282_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446282 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2189 | \n", "SRP096127 | \n", "SRX2464818 | \n", "GSM2446281: HCC.ct-2; Homo sapiens; Bisulfite-Seq | \n", "GSM2446281: HCC.ct-2; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897277 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "775684 | \n", "62094237 | \n", "SRR5146870 | \n", "775684 | \n", "145671062 | \n", "GSM2446281_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446281 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2190 | \n", "SRP096127 | \n", "SRX2464817 | \n", "GSM2446280: HCC.ct-1; Homo sapiens; Bisulfite-Seq | \n", "GSM2446280: HCC.ct-1; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897276 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "1124031 | \n", "89769302 | \n", "SRR5146869 | \n", "1124031 | \n", "212986785 | \n", "GSM2446280_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446280 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
2191 rows × 24 columns
\n", "| \n", " | study_accession | \n", "experiment_accession | \n", "experiment_title | \n", "experiment_desc | \n", "organism_taxid | \n", "organism_name | \n", "library_strategy | \n", "library_source | \n", "library_selection | \n", "sample_accession | \n", "sample_title | \n", "instrument | \n", "total_spots | \n", "total_size | \n", "run_accession | \n", "run_total_spots | \n", "run_total_bases | \n", "run_alias | \n", "sra_url_alt | \n", "sra_url | \n", "experiment_alias | \n", "source_name | \n", "cell type | \n", "group | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "SRP096127 | \n", "SRX2467007 | \n", "GSM2448483: normal.ct-970; Homo sapiens; Bisul... | \n", "GSM2448483: normal.ct-970; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899466 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "559547 | \n", "50734487 | \n", "SRR5149059 | \n", "559547 | \n", "83216675 | \n", "GSM2448483_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448483 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 1 | \n", "SRP096127 | \n", "SRX2467006 | \n", "GSM2448482: normal.ct-969; Homo sapiens; Bisul... | \n", "GSM2448482: normal.ct-969; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899465 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "441577 | \n", "40899268 | \n", "SRR5149058 | \n", "441577 | \n", "65549383 | \n", "GSM2448482_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448482 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 2 | \n", "SRP096127 | \n", "SRX2467005 | \n", "GSM2448481: normal.ct-968; Homo sapiens; Bisul... | \n", "GSM2448481: normal.ct-968; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899464 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "563378 | \n", "50951134 | \n", "SRR5149057 | \n", "563378 | \n", "83839813 | \n", "GSM2448481_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448481 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 3 | \n", "SRP096127 | \n", "SRX2467004 | \n", "GSM2448480: normal.ct-967; Homo sapiens; Bisul... | \n", "GSM2448480: normal.ct-967; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899463 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "422878 | \n", "39223860 | \n", "SRR5149056 | \n", "422878 | \n", "62753430 | \n", "GSM2448480_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448480 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| 4 | \n", "SRP096127 | \n", "SRX2467003 | \n", "GSM2448479: normal.ct-966; Homo sapiens; Bisul... | \n", "GSM2448479: normal.ct-966; Homo sapiens; Bisul... | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1899461 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "517254 | \n", "46881651 | \n", "SRR5149055 | \n", "517254 | \n", "77004865 | \n", "GSM2448479_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2448479 | \n", "blood serum | \n", "blood serum | \n", "healthy control | \n", "
| ... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
| 2186 | \n", "SRP096127 | \n", "SRX2464821 | \n", "GSM2446284: HCC.ct-5; Homo sapiens; Bisulfite-Seq | \n", "GSM2446284: HCC.ct-5; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897280 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "1033204 | \n", "83576370 | \n", "SRR5146873 | \n", "1033204 | \n", "196635123 | \n", "GSM2446284_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446284 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2187 | \n", "SRP096127 | \n", "SRX2464820 | \n", "GSM2446283: HCC.ct-4; Homo sapiens; Bisulfite-Seq | \n", "GSM2446283: HCC.ct-4; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897279 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "840853 | \n", "68410342 | \n", "SRR5146872 | \n", "840853 | \n", "159822416 | \n", "GSM2446283_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446283 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2188 | \n", "SRP096127 | \n", "SRX2464819 | \n", "GSM2446282: HCC.ct-3; Homo sapiens; Bisulfite-Seq | \n", "GSM2446282: HCC.ct-3; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897278 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "885724 | \n", "71407675 | \n", "SRR5146871 | \n", "885724 | \n", "166270272 | \n", "GSM2446282_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446282 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2189 | \n", "SRP096127 | \n", "SRX2464818 | \n", "GSM2446281: HCC.ct-2; Homo sapiens; Bisulfite-Seq | \n", "GSM2446281: HCC.ct-2; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897277 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "775684 | \n", "62094237 | \n", "SRR5146870 | \n", "775684 | \n", "145671062 | \n", "GSM2446281_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446281 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
| 2190 | \n", "SRP096127 | \n", "SRX2464817 | \n", "GSM2446280: HCC.ct-1; Homo sapiens; Bisulfite-Seq | \n", "GSM2446280: HCC.ct-1; Homo sapiens; Bisulfite-Seq | \n", "9606 | \n", "Homo sapiens | \n", "Bisulfite-Seq | \n", "GENOMIC | \n", "RANDOM | \n", "SRS1897276 | \n", "N/A | \n", "Illumina HiSeq 2500 | \n", "1124031 | \n", "89769302 | \n", "SRR5146869 | \n", "1124031 | \n", "212986785 | \n", "GSM2446280_r1 | \n", "https://sra-download.ncbi.nlm.nih.gov/traces/s... | \n", "https://sra-download.st-va.ncbi.nlm.nih.gov/so... | \n", "GSM2446280 | \n", "blood serum | \n", "blood serum | \n", "hepatocellular carcinoma patient | \n", "
1654 rows × 24 columns
\n", "