## PhyloCSF Score URLs

The raw score bigWig files are available at:

In [4]:
# Root URL of the hg38 PhyloCSF track directory hosted on data.broadinstitute.org.
base_url = "http://data.broadinstitute.org/compbio1/PhyloCSFtracks/hg38/latest"

# Short track label -> URL of the corresponding raw-score bigWig file.
# The six "PhyloCSFRaw<sign><n>.bw" files are enumerated first (plus1..plus3,
# then minus1..minus3); presumably <sign> is the strand and <n> the reading
# frame -- TODO confirm against the track hub description.
raw_tracks = {
    f"{label}{frame}": f"{base_url}/PhyloCSFRaw{sign}{frame}.bw"
    for label, sign in (("plus", "+"), ("minus", "-"))
    for frame in (1, 2, 3)
}
# The "power" track has no sign/number variants, so it is added separately.
raw_tracks["power"] = f"{base_url}/PhyloCSFpower.bw"

# Example download code
import requests
from pathlib import Path


In [2]:

# Download every raw PhyloCSF track into ../data/raw/phylocsf, skipping files
# that are already present so the cell is cheap to re-run.
phylo_dir = Path("../data/raw/phylocsf")
phylo_dir.mkdir(exist_ok=True, parents=True)

for name, url in raw_tracks.items():
    out_path = phylo_dir / f"PhyloCSFRaw_{name}.bw"
    if out_path.exists():
        continue

    print(f"Downloading {name}...")
    # Stream into a sibling ".part" file and rename only once the transfer has
    # finished. Writing straight to out_path would leave a truncated bigWig
    # behind after an interrupted download, and the exists() check above would
    # then skip it on every later run.
    part_path = out_path.with_name(out_path.name + ".part")
    # timeout=(connect, read) in seconds, so a stalled server cannot hang the
    # cell; the `with` block releases the connection when streaming is done.
    with requests.get(url, stream=True, timeout=(10, 60)) as response:
        if response.status_code != 200:
            print(f"Failed to download {name} (HTTP {response.status_code})")
            continue
        try:
            with open(part_path, 'wb') as f:
                for chunk in response.iter_content(chunk_size=8192):
                    f.write(chunk)
        except BaseException:
            # Also covers KeyboardInterrupt (kernel interrupt): discard the
            # partial file, then let the error propagate.
            if part_path.exists():
                part_path.unlink()
            raise
    part_path.replace(out_path)
    print(f"Downloaded {name}")

Downloading plus1...
Downloaded plus1
Downloading plus2...
Downloaded plus2
Downloading plus3...
Downloaded plus3
Downloading minus1...
Downloaded minus1
Downloading minus2...
Downloaded minus2
Downloading minus3...
Downloaded minus3
Downloading power...
Downloaded power


# PhyloCSF Smoothed

In [2]:
# Root URL of the hg38 PhyloCSF track directory hosted on data.broadinstitute.org.
base_url = "http://data.broadinstitute.org/compbio1/PhyloCSFtracks/hg38/latest"

# Short track label -> URL of the corresponding "PhyloCSF<sign><n>.bw" file
# (the section heading calls these the smoothed tracks). Entries are generated
# in the order plus1..plus3, minus1..minus3; presumably <sign> is the strand
# and <n> the reading frame -- TODO confirm against the track hub description.
smoothed_tracks = {
    f"{label}{frame}": f"{base_url}/PhyloCSF{sign}{frame}.bw"
    for label, sign in (("plus", "+"), ("minus", "-"))
    for frame in (1, 2, 3)
}
# The "power" track has no sign/number variants, so it is added separately.
smoothed_tracks["power"] = f"{base_url}/PhyloCSFpower.bw"

# Example download code
import requests
from pathlib import Path


In [3]:

# Download every smoothed PhyloCSF track into ../data/raw/phylocsf, skipping
# files that are already present so the cell is cheap to re-run.
phylo_dir = Path("../data/raw/phylocsf")
phylo_dir.mkdir(exist_ok=True, parents=True)

for name, url in smoothed_tracks.items():
    out_path = phylo_dir / f"PhyloCSFsmooth_{name}.bw"
    if out_path.exists():
        continue

    print(f"Downloading {name}...")
    # Stream into a sibling ".part" file and rename only once the transfer has
    # finished. Writing straight to out_path would leave a truncated bigWig
    # behind after an interrupted download, and the exists() check above would
    # then skip it on every later run.
    part_path = out_path.with_name(out_path.name + ".part")
    # timeout=(connect, read) in seconds, so a stalled server cannot hang the
    # cell; the `with` block releases the connection when streaming is done.
    with requests.get(url, stream=True, timeout=(10, 60)) as response:
        if response.status_code != 200:
            print(f"Failed to download {name} (HTTP {response.status_code})")
            continue
        try:
            with open(part_path, 'wb') as f:
                for chunk in response.iter_content(chunk_size=8192):
                    f.write(chunk)
        except BaseException:
            # Also covers KeyboardInterrupt (kernel interrupt): discard the
            # partial file, then let the error propagate.
            if part_path.exists():
                part_path.unlink()
            raise
    part_path.replace(out_path)
    print(f"Downloaded {name}")

Downloading minus2...
Downloaded minus2
Downloading minus3...
Downloaded minus3
Downloading power...
Downloaded power


# PhyloP Track Hg38


In [6]:
# Single-entry mapping (label -> URL) for the hg38 phyloP 470-way bigWig on the
# UCSC download server; kept as a dict so it can be iterated with .items()
# like the other track tables.
phyloP_url = dict(
    phyloP="https://hgdownload.cse.ucsc.edu/goldenpath/hg38/phyloP470way/hg38.phyloP470way.bw",
)

In [7]:
# Download the phyloP track into ../data/raw/phyloP, skipping the download if
# the file is already present so the cell is cheap to re-run.
phylo_dir = Path("../data/raw/phyloP")
phylo_dir.mkdir(exist_ok=True, parents=True)

for name, url in phyloP_url.items():
    # The target filename is fixed and does not depend on `name`, so this loop
    # is only correct while phyloP_url holds a single entry.
    out_path = phylo_dir / "PhyloP_470way.bw"
    if out_path.exists():
        continue

    print(f"Downloading {name}...")
    # Stream into a sibling ".part" file and rename only once the transfer has
    # finished. Writing straight to out_path would leave a truncated bigWig
    # behind after an interrupted download, and the exists() check above would
    # then skip it on every later run.
    part_path = out_path.with_name(out_path.name + ".part")
    # timeout=(connect, read) in seconds, so a stalled server cannot hang the
    # cell; the `with` block releases the connection when streaming is done.
    with requests.get(url, stream=True, timeout=(10, 60)) as response:
        if response.status_code != 200:
            print(f"Failed to download {name} (HTTP {response.status_code})")
            continue
        try:
            with open(part_path, 'wb') as f:
                for chunk in response.iter_content(chunk_size=8192):
                    f.write(chunk)
        except BaseException:
            # Also covers KeyboardInterrupt (kernel interrupt): discard the
            # partial file, then let the error propagate.
            if part_path.exists():
                part_path.unlink()
            raise
    part_path.replace(out_path)
    print(f"Downloaded {name}")

Downloading phyloP...
Downloaded phyloP
