# Notebook for mapping ATAC-seq data

Raw data downloaded from [**here**](https://www.ebi.ac.uk/biostudies/arrayexpress/studies/E-MTAB-12919/sdrf)

    Developed by: Christian Eger
    Würzburg Institute for Systems Immunology - Faculty of Medicine - Julius-Maximilians-Universität Würzburg
    Created on: 240415
    Last modified: 240416

In [1]:
import os
import pandas as pd
import json
import matplotlib.pyplot as plt

## Creating input file for download and processing script

The SDRF metadata file (`E-MTAB-12919.sdrf.txt`) was downloaded from [**here**](https://www.ebi.ac.uk/biostudies/arrayexpress/studies/E-MTAB-12919)

In [2]:
# Relative path to the directory from which the SDRF metadata file is read.
data_path = '../.data/'

In [3]:
# Read the tab-separated SDRF table for E-MTAB-12919 from the data directory.
meta_data = pd.read_csv(os.path.join(data_path, 'E-MTAB-12919.sdrf.txt'), sep='\t')
# Bare trailing expression so the notebook renders the loaded table.
meta_data

Unnamed: 0,Source Name,Comment[ENA_SAMPLE],Comment[BioSD_SAMPLE],Characteristics[organism],Characteristics[age],Characteristics[developmental stage],Characteristics[sex],Characteristics[individual],Characteristics[organism part],Characteristics[disease],...,Assay Name,Technology Type,Comment[ENA_EXPERIMENT],Scan Name,Comment[SUBMITTED_FILE_NAME],Comment[ENA_RUN],Comment[FASTQ_URI],Comment[read_index],Comment[read_type],Factor Value[organism part]
0,HCAHeart9508819,ERS15408182,SAMEA113413051,Homo sapiens,55 to 60,adult,male,D3,heart left ventricle,normal,...,HCAHeart9508819,sequencing assay,ERX10811516,HCAHeart9508819_S1_L001_I1_001.fastq.gz,HCAHeart9508819_S1_L001_I1_001.fastq.gz,ERR11403725,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,index1,sample_barcode,heart left ventricle
1,HCAHeart9508819,ERS15408182,SAMEA113413051,Homo sapiens,55 to 60,adult,male,D3,heart left ventricle,normal,...,HCAHeart9508819,sequencing assay,ERX10811516,HCAHeart9508819_S1_L001_I2_001.fastq.gz,HCAHeart9508819_S1_L001_I2_001.fastq.gz,ERR11403725,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,index2,cell_barcode,heart left ventricle
2,HCAHeart9508819,ERS15408182,SAMEA113413051,Homo sapiens,55 to 60,adult,male,D3,heart left ventricle,normal,...,HCAHeart9508819,sequencing assay,ERX10811516,HCAHeart9508819_S1_L001_R1_001.fastq.gz,HCAHeart9508819_S1_L001_R1_001.fastq.gz,ERR11403725,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,read1,paired,heart left ventricle
3,HCAHeart9508819,ERS15408182,SAMEA113413051,Homo sapiens,55 to 60,adult,male,D3,heart left ventricle,normal,...,HCAHeart9508819,sequencing assay,ERX10811516,HCAHeart9508819_S1_L001_R2_001.fastq.gz,HCAHeart9508819_S1_L001_R2_001.fastq.gz,ERR11403725,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,read2,paired,heart left ventricle
4,HCAHeart9508820,ERS15408183,SAMEA113413052,Homo sapiens,60 to 65,adult,male,D7,right cardiac atrium,normal,...,HCAHeart9508820,sequencing assay,ERX10811517,HCAHeart9508820_S1_L001_I1_001.fastq.gz,HCAHeart9508820_S1_L001_I1_001.fastq.gz,ERR11403726,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,index1,sample_barcode,right cardiac atrium
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
183,HCAHeartST13188801,ERS15408227,SAMEA113413096,Homo sapiens,70 to 75,adult,female,AV13,atrioventricular node,normal,...,HCAHeartST13188801,sequencing assay,ERX10811561,HCAHeartST13188801_S1_L001_R2_001.fastq.gz,HCAHeartST13188801_S1_L001_R2_001.fastq.gz,ERR11403770,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,read2,paired,atrioventricular node
184,HCAHeartST13188802,ERS15408228,SAMEA113413097,Homo sapiens,70 to 75,adult,female,AV13,atrioventricular node,normal,...,HCAHeartST13188802,sequencing assay,ERX10811562,HCAHeartST13188802_S1_L001_I1_001.fastq.gz,HCAHeartST13188802_S1_L001_I1_001.fastq.gz,ERR11403771,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,index1,sample_barcode,atrioventricular node
185,HCAHeartST13188802,ERS15408228,SAMEA113413097,Homo sapiens,70 to 75,adult,female,AV13,atrioventricular node,normal,...,HCAHeartST13188802,sequencing assay,ERX10811562,HCAHeartST13188802_S1_L001_I2_001.fastq.gz,HCAHeartST13188802_S1_L001_I2_001.fastq.gz,ERR11403771,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,index2,cell_barcode,atrioventricular node
186,HCAHeartST13188802,ERS15408228,SAMEA113413097,Homo sapiens,70 to 75,adult,female,AV13,atrioventricular node,normal,...,HCAHeartST13188802,sequencing assay,ERX10811562,HCAHeartST13188802_S1_L001_R1_001.fastq.gz,HCAHeartST13188802_S1_L001_R1_001.fastq.gz,ERR11403771,ftp://ftp.sra.ebi.ac.uk/vol1/run/ERR114/ERR114...,read1,paired,atrioventricular node
