In [1]:
import pandas as pd
pd.set_option('display.max_colwidth', None)
import os
from biodata.bed import BEDGraphReader
import itertools
import numpy as np
import encode_utils as eu
from encode_utils.connection import Connection
from biodata.baseio import BaseReader

In [2]:
PROJECT_DIR_d = "/fs/cbsuhy02/storage/yc2553/yc2553/projects/TRE_directionality/"

# Data preparation

In [3]:
# Do we still use this award???

lab = "/labs/haiyuan-yu/"
award = "/awards/UM1HG009393/"
submitter_comment = "Experiment performed by Sagar R. Shah and preprocessed by Alden Leung"
assembly = "GRCh38"

In [4]:
encode_ontologies = {"C1": "encode:K562"
					}

In [5]:
lib_names = {"C1": ["C1a", "C1b"]}

In [6]:
procap_info = pd.read_excel(f"{PROJECT_DIR_d}output/supp_tables/suppTable1.xlsx")

In [7]:
# RNA length

rnalens = {}
for sample_id in lib_names:
	for lib_name in lib_names[sample_id]:
		df = pd.read_table(f"{PROJECT_DIR_d}PROcap/QC/RNALen/{lib_name}_RNALen_stat.txt", header=None, index_col=0)
		rnalens[lib_name] = int(df.loc["mean"].iloc[0])

# Data submission

In [33]:
# Sagar will get a new key under his name

# %env DCC_API_KEY=Q3BTI4I7
# %env DCC_SECRET_KEY=rbrmcsulnpvcvr7d

In [29]:
# Confirm with data wrangler after submitting to test server
# Submit to real server
# Fill out ENCODE ID in suppTable and 1-1.ipynb

# conn = Connection("dev")
# conn = Connection("prod")

2024-10-11 22:08:43,019:eu_debug:	submission=False: In non-submission mode.


In [8]:
cd $PROJECT_DIR_d/PROcap

/NFS4/storage/yc2553/yc2553/projects/TRE_directionality/PROcap


## Document

In [23]:
# payload = {
# 			"document_type": "general protocol",
# 			"lab": lab,
# 			"award": award,
# 			"attachment": {"path":"20220128_PROcap_Experimental_Protocol.pdf"},
# 			"aliases": ["haiyuan-yu:PROcap-Protocols"],
# 		}
# payload[Connection.PROFILE_KEY] = "document"
# conn.post(payload)

In [24]:
# payload = {
# 			"document_type": "pipeline protocol",
# 			"lab": lab,
# 			"award": award,
# 			"attachment": {"path":"20240501_PROcap_Computational_Pipeline.pdf"},
# 			"aliases": ["haiyuan-yu:PROcap-Pipelines"],
# 		}
# payload[Connection.PROFILE_KEY] = "document"
# conn.post(payload)

## Library

In [9]:
nucleic_acid_term_name = "RNA"
strand_specificity = "reverse"
construction_method = ["capped RNA enrichment"]
library_size_selection_method = "Streptavidin magnetic beads"

contents = []
header = ["lab", "award", "aliases", "nucleic_acid_term_name", "strand_specificity", "biosample", "average_fragment_size", "construction_method", "library_size_selection_method"]
for sample_id in lib_names:
	biosample = encode_ontologies[sample_id].split(":")[1]
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		aliases = [f"haiyuan-yu:procap-library-{sample_id}-{biological_replicate_number}_{technical_replicate_number}"]
		average_fragment_size = rnalens[lib_name]
		contents.append([lab, award, aliases, nucleic_acid_term_name, strand_specificity, biosample, average_fragment_size, construction_method, library_size_selection_method])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_library.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,aliases,nucleic_acid_term_name,strand_specificity,biosample,average_fragment_size,construction_method,library_size_selection_method
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,[haiyuan-yu:procap-library-C1-1_1],RNA,reverse,K562,17,[capped RNA enrichment],Streptavidin magnetic beads
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,[haiyuan-yu:procap-library-C1-1_2],RNA,reverse,K562,17,[capped RNA enrichment],Streptavidin magnetic beads


In [55]:
# library_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "library"
# 	library_logs.append(conn.post(payload))

## Experiment

In [94]:
contents =[]
header=["lab", "award", "biosample_ontology", "assay_term_name", "description", "documents", "aliases"]
for sample_id in lib_names:
	description = f"A run-on assay that precisely maps the transcription start sites genome-wide with high sensitivity and specificity in {sample_id}."
	biosample_ontology = encode_ontologies[sample_id]
	assay_term_name = "PRO-cap"
	documents = ["haiyuan-yu:PROcap-Pipelines", "haiyuan-yu:PROcap-Protocols"]
	aliases = [f"haiyuan-yu:procap-experiment-{sample_id}"]
	contents.append([lab, award, biosample_ontology, assay_term_name, description, documents, aliases])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_experiment.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,biosample_ontology,assay_term_name,description,documents,aliases
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,encode:K562,PRO-cap,A run-on assay that precisely maps the transcription start sites genome-wide with high sensitivity and specificity in C1.,"[haiyuan-yu:PROcap-Pipelines, haiyuan-yu:PROcap-Protocols]",[haiyuan-yu:procap-experiment-C1]


In [54]:
# experiment_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "experiment"
# 	experiment_logs.append(conn.post(payload))

## Replicate

In [70]:
contents = []
header = ["aliases", "experiment", "biological_replicate_number", "technical_replicate_number", "library"]
for sample_id in lib_names:
	experiment = f"haiyuan-yu:procap-experiment-{sample_id}"
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		suffix = f"{lib_name}-{biological_replicate_number}_{technical_replicate_number}"
		library = f"haiyuan-yu:procap-library-{suffix}"
		aliases = [f"haiyuan-yu:procap-replicate-{suffix}"]
		contents.append([aliases, experiment, biological_replicate_number, technical_replicate_number, library])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_replicate.txt", sep="\t", index=False)
df

Unnamed: 0,aliases,experiment,biological_replicate_number,technical_replicate_number,library
0,[haiyuan-yu:procap-replicate-C1a-1_1],haiyuan-yu:procap-experiment-C1,1,1,haiyuan-yu:procap-library-C1a-1_1
1,[haiyuan-yu:procap-replicate-C1b-1_2],haiyuan-yu:procap-experiment-C1,1,2,haiyuan-yu:procap-library-C1b-1_2


In [53]:
# replicate_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "replicate"
# 	replicate_logs.append(conn.post(payload))

## File

### fastq

In [71]:
def get_read_length(f):
	with BaseReader(f) as br:
		br.read()
		s1 = br.read()
		br.read()
		s2 = br.read()
		if len(s1) != len(s2):
			raise Exception()
		return len(s1)

In [95]:
run_type = "paired-ended"
platform = "encode:NovaSeq6000"
file_format = "fastq"
output_type = "reads"

contents = []
header = ["lab", "award", "dataset", "file_format", "run_type", "platform", "output_type", "replicate", "submitted_file_name", "paired_end", "paired_with", "aliases", "read_length"]
for sample_id in lib_names:
	dataset = f"haiyuan-yu:procap-experiment-{sample_id}"
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		replicate = f"haiyuan-yu:procap-replicate-{lib_name}-{biological_replicate_number}_{technical_replicate_number}"
		for row in procap_info.loc[procap_info["Library Name"] == lib_name].iterrows():
			r1, r2 = "RawData/" + row[1]["Sequencing Read 1"], "RawData/" + row[1]["Sequencing Read 2"]
			suffix = f"{sample_id}-{biological_replicate_number}_{technical_replicate_number}"
			submitted_file_name = r1
			paired_end = "1"
			paired_with = ""
			aliases = [f"haiyuan-yu:procap-read1-{suffix}"]
			read_length = get_read_length(r1)
			contents.append([lab, award, dataset, file_format, run_type, platform, output_type, replicate, submitted_file_name, paired_end, paired_with, aliases, read_length])

			submitted_file_name = r2 
			paired_end = "2"
			paired_with = f"haiyuan-yu:procap-read1-{suffix}"
			aliases = [f"haiyuan-yu:procap-read2-{suffix}"]
			read_length = get_read_length(r2)
			contents.append([lab, award, dataset, file_format, run_type, platform, output_type, replicate, submitted_file_name, paired_end, paired_with, aliases, read_length])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_file_fastq.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,dataset,file_format,run_type,platform,output_type,replicate,submitted_file_name,paired_end,paired_with,aliases,read_length
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,fastq,paired-ended,encode:NovaSeq6000,reads,haiyuan-yu:procap-replicate-C1a-1_1,RawData/C1a_CKDL220028609-1A_HLJNNDSX5_L4_1.fq.gz,1,,[haiyuan-yu:procap-read1-C1-1_1],150
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,fastq,paired-ended,encode:NovaSeq6000,reads,haiyuan-yu:procap-replicate-C1a-1_1,RawData/C1a_CKDL220028609-1A_HLJNNDSX5_L4_2.fq.gz,2,haiyuan-yu:procap-read1-C1-1_1,[haiyuan-yu:procap-read2-C1-1_1],150
2,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,fastq,paired-ended,encode:NovaSeq6000,reads,haiyuan-yu:procap-replicate-C1b-1_2,RawData/C1b_CKDL220028609-1A_HLJNNDSX5_L4_1.fq.gz,1,,[haiyuan-yu:procap-read1-C1-1_2],150
3,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,fastq,paired-ended,encode:NovaSeq6000,reads,haiyuan-yu:procap-replicate-C1b-1_2,RawData/C1b_CKDL220028609-1A_HLJNNDSX5_L4_2.fq.gz,2,haiyuan-yu:procap-read1-C1-1_2,[haiyuan-yu:procap-read2-C1-1_2],150


In [57]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	if payload["paired_with"] == '':
# 		payload.pop('paired_with')
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.post(payload))

### bam (unfiltered alignments)

In [96]:
step_run = "haiyuan-yu:pro-cap-run-step-1"
file_format = "bam"
output_type = "unfiltered alignments"

contents = []
header = ["lab", "award", "dataset", "file_format", "output_type", "submitted_file_name", "aliases", "derived_from", "assembly", "step_run"]
for sample_id in lib_names:
	dataset = f"haiyuan-yu:procap-experiment-{sample_id}"
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		suffix = f"{sample_id}-{biological_replicate_number}_{technical_replicate_number}"
		aliases = [f"haiyuan-yu:test-procap-unfiltered_alignment-{suffix}"]
		derived_from = ["john-lis:procap-rdna", "dnanexus:file-BjB0pV00Qy5PzkzfX1Gy6pYy",
						f"haiyuan-yu:procap-read1-{suffix}",
						f"haiyuan-yu:procap-read2-{suffix}"
						]
		submitted_file_name = f"RawAlignments/{lib_name}_Aligned.sortedByCoord.out.bam"
		contents.append([lab, award, dataset, file_format, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_file_unfiltered_alignment.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,dataset,file_format,output_type,submitted_file_name,aliases,derived_from,assembly,step_run
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bam,unfiltered alignments,RawAlignments/C1a_Aligned.sortedByCoord.out.bam,[haiyuan-yu:test-procap-unfiltered_alignment-C1-1_1],"[john-lis:procap-rdna, dnanexus:file-BjB0pV00Qy5PzkzfX1Gy6pYy, haiyuan-yu:procap-read1-C1-1_1, haiyuan-yu:procap-read2-C1-1_1]",GRCh38,haiyuan-yu:pro-cap-run-step-1
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bam,unfiltered alignments,RawAlignments/C1b_Aligned.sortedByCoord.out.bam,[haiyuan-yu:test-procap-unfiltered_alignment-C1-1_2],"[john-lis:procap-rdna, dnanexus:file-BjB0pV00Qy5PzkzfX1Gy6pYy, haiyuan-yu:procap-read1-C1-1_2, haiyuan-yu:procap-read2-C1-1_2]",GRCh38,haiyuan-yu:pro-cap-run-step-1


In [60]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.post(payload))

In [58]:
# file_logs = []
# for content in contents:	
# 	payload = OrderedDict(zip(header, content))
# 	payload["_enc_id"] = payload["aliases"][0]
# 	payload[Connection.PROFILE_KEY] = "file"
# 	payload.pop("derived_from")
# 	file_logs.append(conn.patch(payload))

In [59]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload["_enc_id"] = payload["aliases"][0]
# 	if payload["paired_with"] == '':
# 		payload.pop('paired_with')
# 	payload.pop('submitted_file_name')
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.patch(payload))

### bam (alignments)

In [97]:
step_run = "haiyuan-yu:pro-cap-run-step-2"
file_format = "bam"
output_type = "alignments"

contents = []
header = ["lab", "award", "dataset", "file_format", "output_type", "submitted_file_name", "aliases", "derived_from", "assembly", "step_run"]
for sample_id in lib_names:
	dataset = f"haiyuan-yu:procap-experiment-{sample_id}"
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		suffix = f"{sample_id}-{biological_replicate_number}_{technical_replicate_number}"
		aliases = [f"haiyuan-yu:procap-alignment-{suffix}"]
		derived_from = [f"haiyuan-yu:procap-unfiltered_alignment-{suffix}"]
		submitted_file_name = f"RawAlignments/{lib_name}_dedup.bam"
		contents.append([lab, award, dataset, file_format, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_file_alignment.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,dataset,file_format,output_type,submitted_file_name,aliases,derived_from,assembly,step_run
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bam,alignments,RawAlignments/C1a_dedup.bam,[haiyuan-yu:procap-alignment-C1-1_1],[haiyuan-yu:procap-unfiltered_alignment-C1-1_1],GRCh38,haiyuan-yu:pro-cap-run-step-2
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bam,alignments,RawAlignments/C1b_dedup.bam,[haiyuan-yu:procap-alignment-C1-1_2],[haiyuan-yu:procap-unfiltered_alignment-C1-1_2],GRCh38,haiyuan-yu:pro-cap-run-step-2


In [61]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.post(payload))

### bigwig

In [98]:
step_run = "haiyuan-yu:pro-cap-run-step-3"
file_format = "bigWig"

header=["lab", "award", "dataset", "file_format", "output_type", "submitted_file_name", "aliases", "derived_from", "assembly", "step_run"]
contents = []

for sample_id in lib_names:
	dataset = f"haiyuan-yu:procap-experiment-{sample_id}"
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		suffix = f"{sample_id}-{biological_replicate_number}_{technical_replicate_number}"
		derived_from = [f"haiyuan-yu:procap-alignment-{suffix}"]
		
		output_type = "plus strand signal of unique reads"
		aliases = [f"haiyuan-yu:procap-bigwig-plus-{suffix}"]
		submitted_file_name=f"Alignments/{lib_name}_pl.bw"
		contents.append([lab, award, dataset, file_format, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])
		
		output_type = "minus strand signal of unique reads"
		aliases = [f"haiyuan-yu:procap-bigwig-minus-{suffix}"]
		submitted_file_name = f"Alignments/{lib_name}_mn.bw"
		contents.append([lab, award, dataset, file_format, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_file_bigwig_patch.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,dataset,file_format,output_type,submitted_file_name,aliases,derived_from,assembly,step_run
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bigWig,plus strand signal of unique reads,Alignments/C1a_pl.bw,[haiyuan-yu:procap-bigwig-plus-C1-1_1],[haiyuan-yu:procap-alignment-C1-1_1],GRCh38,haiyuan-yu:pro-cap-run-step-3
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bigWig,minus strand signal of unique reads,Alignments/C1a_mn.bw,[haiyuan-yu:procap-bigwig-minus-C1-1_1],[haiyuan-yu:procap-alignment-C1-1_1],GRCh38,haiyuan-yu:pro-cap-run-step-3
2,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bigWig,plus strand signal of unique reads,Alignments/C1b_pl.bw,[haiyuan-yu:procap-bigwig-plus-C1-1_2],[haiyuan-yu:procap-alignment-C1-1_2],GRCh38,haiyuan-yu:pro-cap-run-step-3
3,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bigWig,minus strand signal of unique reads,Alignments/C1b_mn.bw,[haiyuan-yu:procap-bigwig-minus-C1-1_2],[haiyuan-yu:procap-alignment-C1-1_2],GRCh38,haiyuan-yu:pro-cap-run-step-3


In [62]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.post(payload))

### bed

In [34]:
step_run = "haiyuan-yu:pro-cap-run-step-4"
file_format = "bed"
file_format_type = "bed3+"

contents = []
header=["lab", "award", "dataset", "file_format", "file_format_type", "output_type", "submitted_file_name", "aliases", "derived_from", "assembly", "step_run"]
for sample_id in lib_names:
	dataset=f"haiyuan-yu:procap-experiment-{sample_id}"
	suffice = []
	slibs = []
	for lib_name in lib_names[sample_id]:
		biological_replicate_number = 1
		technical_replicate_number = lib_names[sample_id].index(lib_name)+1
		slibs.append(lib_name)
		suffice.append(f"{sample_id}-{biological_replicate_number}_{technical_replicate_number}")
	derived_from = ([f"haiyuan-yu:procap-bigwig-plus-{suffix}" for suffix in suffice]
					+ [f"haiyuan-yu:procap-bigwig-minus-{suffix}" for suffix in suffice])

	output_type = "bidirectional peaks"
	output_type_str = "bidirectional_peaks"
	aliases = [f"haiyuan-yu:procap-{output_type_str}-{sample_id}"]
	submitted_file_name=f"Peaks/PINTS/alignmentmerge_{'_and_'.join(slibs)}_1_bidirectional_peaks.bed.gz"
	contents.append([lab, award, dataset, file_format, file_format_type, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])

	output_type = "divergent peaks"
	output_type_str = "divergent_peaks"
	aliases = [f"haiyuan-yu:procap-{output_type_str}-{sample_id}"]
	submitted_file_name=f"Peaks/PINTS/alignmentmerge_{'_and_'.join(slibs)}_1_bidirectional_peaks.bed.gz"
	contents.append([lab, award, dataset, file_format, file_format_type, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])

	output_type = "unidirectional peaks"
	output_type_str = "unidirectional_peaks"
	aliases = [f"haiyuan-yu:procap-{output_type_str}-{sample_id}"]
	submitted_file_name=f"Peaks/PINTS/alignmentmerge_{'_and_'.join(slibs)}_1_unidirectional_peaks.bed.gz"
	contents.append([lab, award, dataset, file_format, file_format_type, output_type, submitted_file_name, aliases, derived_from, assembly, step_run])
df = pd.DataFrame(contents, columns=header)
df.to_csv(f"{PROJECT_DIR_d}/PROcap/ENCODE_submission/submit_file_bed.txt", sep="\t", index=False)
df

Unnamed: 0,lab,award,dataset,file_format,file_format_type,output_type,submitted_file_name,aliases,derived_from,assembly,step_run
0,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bed,bed3+,bidirectional peaks,Peaks/PINTS/alignmentmerge_C1a_and_C1b_1_bidirectional_peaks.bed.gz,[haiyuan-yu:procap-bidirectional_peaks-C1],"[haiyuan-yu:procap-bigwig-plus-C1-1_1, haiyuan-yu:procap-bigwig-plus-C1-1_2, haiyuan-yu:procap-bigwig-minus-C1-1_1, haiyuan-yu:procap-bigwig-minus-C1-1_2]",GRCh38,haiyuan-yu:pro-cap-run-step-4
1,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bed,bed3+,divergent peaks,Peaks/PINTS/alignmentmerge_C1a_and_C1b_1_bidirectional_peaks.bed.gz,[haiyuan-yu:procap-divergent_peaks-C1],"[haiyuan-yu:procap-bigwig-plus-C1-1_1, haiyuan-yu:procap-bigwig-plus-C1-1_2, haiyuan-yu:procap-bigwig-minus-C1-1_1, haiyuan-yu:procap-bigwig-minus-C1-1_2]",GRCh38,haiyuan-yu:pro-cap-run-step-4
2,/labs/haiyuan-yu/,/awards/UM1HG009393/,haiyuan-yu:procap-experiment-C1,bed,bed3+,unidirectional peaks,Peaks/PINTS/alignmentmerge_C1a_and_C1b_1_unidirectional_peaks.bed.gz,[haiyuan-yu:procap-unidirectional_peaks-C1],"[haiyuan-yu:procap-bigwig-plus-C1-1_1, haiyuan-yu:procap-bigwig-plus-C1-1_2, haiyuan-yu:procap-bigwig-minus-C1-1_1, haiyuan-yu:procap-bigwig-minus-C1-1_2]",GRCh38,haiyuan-yu:pro-cap-run-step-4


In [63]:
# file_logs = []
# for content in contents:
# 	payload = OrderedDict(zip(header, content))
# 	payload[Connection.PROFILE_KEY] = "file"
# 	file_logs.append(conn.post(payload))