# Download data for Cool-Seq-Tool

This notebook downloads the Cool-Seq-Tool data files used throughout the analysis from a public S3 bucket and saves them in the local `data/` directory.

In [1]:
import requests
from pathlib import Path

In [2]:
def download_s3(url: str, outfile_path: Path, *, timeout: float = 60.0) -> None:
    """Download objects from public s3 bucket

    The response body is streamed to a temporary ``.part`` file next to
    ``outfile_path`` and moved into place only after it has been written
    completely, so a failed or interrupted download never leaves a truncated
    file under the final name.

    :param url: URL for file in s3 bucket
    :param outfile_path: Path where file should be saved
    :param timeout: Seconds to wait for the server to connect or to send data
        before giving up
    :raises requests.HTTPError: If the server responds with an error status
    :raises requests.Timeout: If the server does not respond within ``timeout``
    """
    outfile_path = Path(outfile_path)
    partial_path = outfile_path.with_name(f"{outfile_path.name}.part")
    try:
        # Without an explicit timeout, requests waits forever on a stalled
        # connection.
        with requests.get(url, stream=True, timeout=timeout) as r:
            r.raise_for_status()
            with open(partial_path, "wb") as h:
                for chunk in r.iter_content(chunk_size=8192):
                    if chunk:
                        h.write(chunk)
        # Move the file into place only once the whole body is on disk.
        partial_path.replace(outfile_path)
    finally:
        # After a successful replace the partial file is already gone; on
        # failure this removes the incomplete download.
        partial_path.unlink(missing_ok=True)

In [3]:
# Local directory that receives the downloaded files.
data_dir = Path("data")
data_dir.mkdir(exist_ok=True)

# Bucket location of the Cool-Seq-Tool files and the file names to fetch.
s3_prefix = "https://nch-igm-wagner-lab-public.s3.us-east-2.amazonaws.com/variation-normalizer-manuscript/cool-seq-tool"
cool_seq_tool_files = (
    "LRG_RefSeqGene_20231114",
    "MANE.GRCh38.v1.3.summary.txt",
    "transcript_mapping.tsv",
)

# Each file is saved under its original name inside the data directory.
for fn in cool_seq_tool_files:
    url = f"{s3_prefix}/{fn}"
    outfile_path = data_dir / fn
    download_s3(url, outfile_path)