# Fragment file creation with SnapATAC2

This notebook converts the filtered BAM files into gzipped fragment files (`.tsv.gz`) with SnapATAC2, for use in downstream ATAC analysis.

In [1]:
import os
import pandas as pd
import numpy as np

import snapatac2 as snap

snap.__version__

'2.6.4'

In [None]:
!ls /bamfiles_filtered

D0.filtered.bam      Q1.filtered.bam.csi  Q3.filtered.bam
D0.filtered.bam.csi  Q2.filtered.bam	  Q3.filtered.bam.csi
Q1.filtered.bam      Q2.filtered.bam.csi


In [None]:
# Directory that is scanned for the filtered BAM inputs.
bam_path = "/bamfiles_filtered/"
# Directory that receives the generated fragment files.
tsv_path = "/fragments/"

In [None]:
# Convert each BAM file found in `bam_path` into a gzipped fragment file in `tsv_path`.
# A failure on one file is reported and recorded, then the loop continues, so the
# remaining samples are still processed and no error disappears silently.
os.makedirs(tsv_path, exist_ok=True)  # make sure the output directory exists before writing

failed_bams = {}  # BAM path -> error description, summarised after the loop
for filename in sorted(os.listdir(bam_path)):  # sorted for a reproducible processing order
    if not filename.endswith(".bam"):
        continue  # skips the .bam.csi index files and anything else in the directory

    file_path = os.path.join(bam_path, filename)
    print(f"Processing {file_path}")

    # Strip the suffix from the end of the name only, so a BAM without the
    # ".filtered" infix still maps to "<sample>.tsv.gz" instead of keeping
    # its ".bam" name for the fragment output.
    if filename.endswith(".filtered.bam"):
        sample = filename[: -len(".filtered.bam")]
    else:
        sample = filename[: -len(".bam")]
    tsv_full = os.path.join(tsv_path, sample + ".tsv.gz")
    print(f"Creating tsv file {tsv_full}")

    try:
        # is_paired=False: reads are handled as single-end.
        # barcode_tag="CB": the cell barcode is read from the CB tag of each record.
        # min_mapq=30: MAPQ threshold used for read filtering.
        # NOTE(review): confirm these settings match the library type of the BAM files.
        snap.pp.make_fragment_file(
            file_path,
            tsv_full,
            is_paired=False,
            barcode_tag="CB",
            min_mapq=30,
        )
    except Exception as err:
        # `Exception` rather than a bare `except:` so that interrupting the kernel
        # (KeyboardInterrupt) still stops the loop.
        failed_bams[file_path] = f"{type(err).__name__}: {err}"
        print(f"FAILED {file_path}: {failed_bams[file_path]}")
    print("\n")

# Final summary so failed conversions are visible at the end of the cell output.
if failed_bams:
    print(f"{len(failed_bams)} BAM file(s) could not be converted:")
    for failed_path, reason in failed_bams.items():
        print(f"  {failed_path}: {reason}")

## Environment

```
pip list
Package                  Version
------------------------ -----------
absl-py                  2.1.0
aiohttp                  3.9.5
aiosignal                1.3.1
anndata                  0.10.8
annoy                    1.17.3
array_api_compat         1.8
asttokens                2.4.1
attrs                    23.2.0
certifi                  2024.7.4
charset-normalizer       3.3.2
chex                     0.1.86
comm                     0.2.2
contextlib2              21.6.0
contourpy                1.2.1
cycler                   0.12.1
cykhash                  2.0.1
debugpy                  1.8.2
decorator                5.1.1
Deprecated               1.2.14
dill                     0.3.8
docrep                   0.3.2
etils                    1.9.2
exceptiongroup           1.2.2
executing                2.0.1
fbpca                    1.0
filelock                 3.15.4
flax                     0.8.5
fonttools                4.53.1
frozenlist               1.4.1
fsspec                   2024.6.1
future                   1.0.0
geosketch                1.2
graphtools               1.5.3
h5py                     3.11.0
harmonypy                0.0.10
hmmlearn                 0.3.2
idna                     3.7
igraph                   0.11.6
importlib_metadata       8.2.0
importlib_resources      6.4.0
intervaltree             3.1.0
ipykernel                6.29.5
ipython                  8.26.0
jax                      0.4.30
jaxlib                   0.4.30
jedi                     0.19.1
Jinja2                   3.1.4
joblib                   1.4.2
jupyter_client           8.6.2
jupyter_core             5.7.2
kaleido                  0.2.1
kiwisolver               1.4.5
legacy-api-wrap          1.4
lightning                2.1.4
lightning-utilities      0.11.6
llvmlite                 0.43.0
MACS3                    3.0.1
magic-impute             3.0.0
markdown-it-py           3.0.0
MarkupSafe               2.1.5
matplotlib               3.9.1
matplotlib-inline        0.1.7
mdurl                    0.1.2
ml_collections           0.1.1
ml-dtypes                0.4.0
mpmath                   1.3.0
msgpack                  1.0.8
mudata                   0.2.4
multidict                6.0.5
multipledispatch         1.0.0
multiprocess             0.70.16
natsort                  8.4.0
nest_asyncio             1.6.0
networkx                 3.3
numba                    0.60.0
numpy                    1.26.4
numpyro                  0.15.1
nvidia-cublas-cu12       12.1.3.1
nvidia-cuda-cupti-cu12   12.1.105
nvidia-cuda-nvrtc-cu12   12.1.105
nvidia-cuda-runtime-cu12 12.1.105
nvidia-cudnn-cu12        9.1.0.70
nvidia-cufft-cu12        11.0.2.54
nvidia-curand-cu12       10.3.2.106
nvidia-cusolver-cu12     11.4.5.107
nvidia-cusparse-cu12     12.1.0.106
nvidia-nccl-cu12         2.20.5
nvidia-nvjitlink-cu12    12.5.82
nvidia-nvtx-cu12         12.1.105
opt-einsum               3.3.0
optax                    0.2.3
orbax-checkpoint         0.5.23
packaging                24.1
pandas                   2.0.3
parso                    0.8.4
patsy                    0.5.6
pexpect                  4.9.0
pickleshare              0.7.5
pillow                   10.4.0
pip                      24.0
platformdirs             4.2.2
plotly                   5.23.0
polars                   0.20.31
pooch                    1.8.2
prompt_toolkit           3.0.47
protobuf                 5.27.2
psutil                   6.0.0
ptyprocess               0.7.0
pure_eval                0.2.3
pyarrow                  17.0.0
pyfaidx                  0.7.2.2
Pygments                 2.18.0
PyGSP                    0.5.1
pynndescent              0.5.13
pyparsing                3.1.2
pyro-api                 0.1.2
pyro-ppl                 1.9.1
python-dateutil          2.9.0
pytorch-lightning        2.3.3
pytz                     2024.1
PyYAML                   6.0.1
pyzmq                    26.0.3
requests                 2.32.3
rich                     13.7.1
rustworkx                0.15.1
scanorama                1.7.4
scanpy                   1.10.2
scikit-learn             1.5.1
scikit-misc              0.5.1
scipy                    1.14.0
scprep                   1.2.3
scvi-tools               1.1.5
seaborn                  0.13.2
session_info             1.0.0
setuptools               71.0.4
six                      1.16.0
snapatac2                2.6.4
sortedcontainers         2.4.0
stack-data               0.6.2
statsmodels              0.14.2
stdlib-list              0.10.0
sympy                    1.13.1
tasklogger               1.2.0
tenacity                 8.5.0
tensorstore              0.1.63
texttable                1.7.0
threadpoolctl            3.5.0
toolz                    0.12.1
torch                    2.4.0
torchmetrics             1.4.0.post0
tornado                  6.4.1
tqdm                     4.66.4
traitlets                5.14.3
triton                   3.0.0
typing_extensions        4.12.2
tzdata                   2024.1
umap-learn               0.5.6
urllib3                  2.2.2
wcwidth                  0.2.13
wheel                    0.43.0
wrapt                    1.16.0
xgboost                  2.1.0
yarl                     1.9.4
zipp                     3.19.2
```