<h1 align='center'>Sanity Checks on Gateway</h1>

<h4 align='center'>iReceptor $\mid$ Laura Gutierrez Funderburk $\mid$ October 14</h4>

<h4 align='center'>Supervised by Dr. Felix Breden, Dr. Jamie Scott, Dr. Brian Corrie</h4>

<h2 align='center'>Abstract</h2>

In this notebook I parse the V-gene, D-gene and J-gene entries, categorised per lab, as they appear on https://gateway.ireceptor.org.

In [6]:
# Test 1: Check that len(Junction Sequence) and Junction length match
# Test 2: Check that no entry contains words other than 'IG' words, 'TC' words or 'or'
# Test 3: Verify entries are consistent within each row, i.e. the 3 letters should be
#   the same in all of the V-, D- and J-gene columns

In [1]:
# NOTE: Missing complete name for Gastroenterology clinic, Oslo University Hospital-Rikshospitalet

# Full lab names. Entry i of this list is paired with entry i of lab_alias below,
# so the two lists must be kept in the same order.
lab_names = [
    "Institute of Molecular and Genomic Medicine, National Health Research Institutes",
    "Von Budingen Lab",
    "The Wellcome Trust Sanger Institute",
    # NOTE(review): "Standford" is kept verbatim -- presumably it has to match the
    # source data; confirm before correcting the spelling.
    "Department of Pathology, Standford University",
    "Kwong Lab",
    "Vaccine Research Centre",
    "Shemyakin-Ovchinnikov institute of Bioorganic Chemistry",
    "Ramit Mehr's Computational Immunology Lab",
    "Department of Immunology and Microbiology",
    "Department of Immunology",
    "Immunogenomics Lab",
    "Georgiou Lab",
    "Department of Medicine",
]

# Short aliases, one per lab, in the same order as lab_names.
lab_alias = [
    "IMGM",
    "VBL",
    "WTSI",
    "DPS",
    "KL",
    "VRC",
    "SOIBC",
    "RMCIL",
    "DIM",
    "DI",
    "IL",
    "GL",
    "DM",
]

# Build the alias -> full-name lookup only when both lists line up one-to-one;
# otherwise report the problem and leave the lookup undefined.
if len(lab_names) != len(lab_alias):
    print("Check lengths of arrays and look for abnormalities, duplicates, missing names/aliases ...")
else:
    lab_alias_name_dic = dict(zip(lab_alias, lab_names))

In [2]:
import json
import pandas as pd

In [3]:
#IMGM= json.loads('[{"_id":4,"collapsing_method":null,"collection_time_point_relative":"Week 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278153_filtered_1.fastq -r ERR1278153_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278153.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"35","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278153.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A2wk1","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278153_aa.txz, ERR1278153_ab.txz, ERR1278153_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278153","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 
2","igblast_file_name":"ERR1278153.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,463,721","cell_number":"2,369,736","ir_sequence_count":1000000,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":35,"ir_subject_age_max":35,"ir_project_sample_id":4},{"_id":43,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875289_filtered_1.fastq -r ERR875289_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875289.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"13","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875290.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F1Cpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research 
Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875290_aa.txz, ERR875290_ab.txz, ERR875290_ac.txz, ERR875290_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875290","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 1 Carrier","igblast_file_name":"ERR875290.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":null,"cell_number":"4,401,648","ir_sequence_count":1928616,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier vaccinated","ir_subject_age_min":13,"ir_subject_age_max":13,"ir_project_sample_id":43},{"_id":77,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875304_filtered_1.fastq -r ERR875304_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875304.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"42","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J 
gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278149.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A1pre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278149_aa.txz, ERR1278149_ab.txz, ERR1278149_ac.txz, ERR1278149_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278149","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 1","igblast_file_name":"ERR1278149.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,617,248","cell_number":"3,207,806","ir_sequence_count":1821655,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with 
HBV","ir_subject_age_min":42,"ir_subject_age_max":42,"ir_project_sample_id":77},{"_id":111,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875298_filtered_1.fastq -r ERR875298_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875298.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"4","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875299.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F3NCpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875299_aa.txz, ERR875299_ab.txz, ERR875299_ac.txz, ERR875299_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875299","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, 
H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 3 Non-carrier","igblast_file_name":"ERR875299.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"3,400,216","cell_number":"2,634,244","ir_sequence_count":1633051,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier unvaccinated","ir_subject_age_min":4,"ir_subject_age_max":4,"ir_project_sample_id":111},{"_id":114,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875294_filtered_1.fastq -r ERR875294_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875294.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"12","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875295.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F2Cpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875295_aa.txz, ERR875295_ab.txz, ERR875295_ac.txz, ERR875295_ad.txz, ERR875295_ae.txz, ERR875295_af.txz, ERR875295_ag.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875295","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 2 Carrier","igblast_file_name":"ERR875295.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"3,364,283","cell_number":"5,274,181","ir_sequence_count":3261822,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier 
unvaccinated","ir_subject_age_min":12,"ir_subject_age_max":12,"ir_project_sample_id":114},{"_id":119,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875293_filtered_1.fastq -r ERR875293_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875293.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"14","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875294.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F2NCpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875294_aa.txz, ERR875294_ab.txz, ERR875294_ac.txz, ERR875294_ad.txz, ERR875294_ae.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875294","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, 
H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 2 Non-carrier","igblast_file_name":"ERR875294.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,904,961","cell_number":"3,735,856","ir_sequence_count":2257018,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier vaccinated","ir_subject_age_min":14,"ir_subject_age_max":14,"ir_project_sample_id":119},{"_id":147,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278155_filtered_1.fastq -r ERR1278155_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278155.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"47","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J 
gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278155.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A3pre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278155_aa.txz, ERR1278155_ab.txz, ERR1278155_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278155","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 3","igblast_file_name":"ERR1278155.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,316,424","cell_number":"2,830,403","ir_sequence_count":1091249,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":47,"ir_subject_age_max":47,"ir_project_sample_id":147},{"_id":154,"collapsing_method":null,"collection_time_point_relative":"Day 
0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875302_filtered_1.fastq -r ERR875302_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875302.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"3","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875303.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F4Cpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875303_aa.txz, ERR875303_ab.txz, ERR875303_ac.txz, ERR875303_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875303","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 4 
Carrier","igblast_file_name":"ERR875303.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,485,869","cell_number":"2,706,342","ir_sequence_count":1617248,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier unvaccinated","ir_subject_age_min":3,"ir_subject_age_max":3,"ir_project_sample_id":154},{"_id":181,"collapsing_method":null,"collection_time_point_relative":"Week 2 ","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278160_filtered_1.fastq -r ERR1278160_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278160.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"37","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278160.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A4wk2","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research 
Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278160_aa.txz, ERR1278160_ab.txz, ERR1278160_ac.txz, ERR1278160_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278160","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 4","igblast_file_name":"ERR1278160.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,420,729","cell_number":"2,033,064","ir_sequence_count":1855317,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":37,"ir_subject_age_max":37,"ir_project_sample_id":181},{"_id":185,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875295_filtered_1.fastq -r ERR875295_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875295.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"12","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875296.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F2Cpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875296_aa.txz, ERR875296_ab.txz, ERR875296_ac.txz, ERR875296_ad.txz, ERR875296_ae.txz, ERR875296_af.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875296","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 2 Carrier","igblast_file_name":"ERR875296.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,257,018","cell_number":"4,373,440","ir_sequence_count":2782921,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier 
vaccinated","ir_subject_age_min":12,"ir_subject_age_max":12,"ir_project_sample_id":185},{"_id":211,"collapsing_method":null,"collection_time_point_relative":"Week 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278150_filtered_1.fastq -r ERR1278150_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278150.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"42","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278150.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A1wk1","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278150_aa.txz, ERR1278150_ab.txz, ERR1278150_ac.txz, ERR1278150_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278150","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, 
H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 1","igblast_file_name":"ERR1278150.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,784,287","cell_number":"3,303,418","ir_sequence_count":1951899,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":42,"ir_subject_age_max":42,"ir_project_sample_id":211},{"_id":279,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875300_filtered_1.fastq -r ERR875300_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875300.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"5","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875301.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F4NCpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875301_aa.txz, ERR875301_ab.txz, ERR875301_ac.txz, ERR875301_ad.txz, ERR875301_ae.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875301","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 4 Non-carrier","igblast_file_name":"ERR875301.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,633,051","cell_number":"3,841,175","ir_sequence_count":2485869,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier 
unvaccinated","ir_subject_age_min":5,"ir_subject_age_max":5,"ir_project_sample_id":279},{"_id":301,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875297_filtered_1.fastq -r ERR875297_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875297.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"10","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875298.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F3Cpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875298_aa.txz, ERR875298_ab.txz, ERR875298_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875298","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 3 
Carrier","igblast_file_name":"ERR875298.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,782,921","cell_number":"3,110,161","ir_sequence_count":1394920,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier vaccinated","ir_subject_age_min":10,"ir_subject_age_max":10,"ir_project_sample_id":301},{"_id":308,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":null,"ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"13","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":null,"prior_therapies":null,"fasta_file_name":"paired_ERR875289.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F1Cpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875289_aa.txz, 
ERR875289_ab.txz, ERR875289_ac.txz, ERR875289_ad.txz, ERR875289_ae.txz, ERR875289_af.txz, ERR875289_ag.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875289","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 1 Carrier","igblast_file_name":"ERR875289.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":null,"cell_number":"4,821,880","ir_sequence_count":3111452,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier unvaccinated","ir_subject_age_min":13,"ir_subject_age_max":13,"ir_project_sample_id":308},{"_id":317,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875301_filtered_1.fastq -r ERR875301_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875301.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"5","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875302.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F4NCpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875302_aa.txz, ERR875302_ab.txz, ERR875302_ac.txz, ERR875302_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875302","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 4 Non-carrier","igblast_file_name":"ERR875302.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,188,780","cell_number":"2,997,090","ir_sequence_count":1880567,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier vaccinated","ir_subject_age_min":5,"ir_subject_age_max":5,"ir_project_sample_id":317},{"_id":327,"collapsing_method":null,"collection_time_point_relative":"Week 2 
","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278151_filtered_1.fastq -r ERR1278151_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278151.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"42","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278151.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A1wk2","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278151_aa.txz, ERR1278151_ab.txz, ERR1278151_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278151","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 
1","igblast_file_name":"ERR1278151.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,821,655","cell_number":"2,868,249","ir_sequence_count":1463721,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":42,"ir_subject_age_max":42,"ir_project_sample_id":327},{"_id":368,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875292_filtered_1.fastq -r ERR875292_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875292.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"14","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875293.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F2NCpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research 
Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875293_aa.txz, ERR875293_ab.txz, ERR875293_ac.txz, ERR875293_ad.txz, ERR875293_ae.txz, ERR875293_af.txz, ERR875293_ag.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875293 ","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 2 Non-carrier","igblast_file_name":"ERR875293.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"4,260,441","cell_number":"5,891,225","ir_sequence_count":3364283,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier unvaccinated","ir_subject_age_min":14,"ir_subject_age_max":14,"ir_project_sample_id":368},{"_id":370,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875290_filtered_1.fastq -r ERR875290_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875290.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"11","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J 
gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875291.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F1NCpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875291_aa.txz, ERR875291_ab.txz, ERR875291_ac.txz, ERR875291_ad.txz, ERR875291_ae.txz, ERR875291_af.txz, ERR875291_ag.txz, ERR875291_ah.txz, ERR875291_ai.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875291","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 1 Non-carrier","igblast_file_name":"ERR875291.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"3,111,452","cell_number":"6,353,773","ir_sequence_count":4260441,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier 
unvaccinated","ir_subject_age_min":11,"ir_subject_age_max":11,"ir_project_sample_id":370},{"_id":373,"collapsing_method":null,"collection_time_point_relative":"Week 2 ","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278157_filtered_1.fastq -r ERR1278157_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278157.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"47","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278157.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A3wk2","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278157_aa.txz, ERR1278157_ab.txz, ERR1278157_ac.txz, ERR1278157_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278157 ","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, 
H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 3","igblast_file_name":"ERR1278157.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,091,249","cell_number":"2,563,993","ir_sequence_count":1534270,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":47,"ir_subject_age_max":47,"ir_project_sample_id":373},{"_id":393,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875299_filtered_1.fastq -r ERR875299_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875299.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"4","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875300.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F3NCpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875300_aa.txz, ERR875300_ab.txz, ERR875300_ac.txz, ERR875300_ad.txz, ERR875300_ae.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875300","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 3 Non-carrier","igblast_file_name":"ERR875300.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,394,920","cell_number":"3,008,771","ir_sequence_count":2188780,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier 
vaccinated","ir_subject_age_min":4,"ir_subject_age_max":4,"ir_project_sample_id":393},{"_id":392,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875291_filtered_1.fastq -r ERR875291_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875291.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"11","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875292.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"F1NCpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875292_aa.txz, ERR875292_ab.txz, ERR875292_ac.txz, ERR875292_ad.txz, ERR875292_ae.txz, ERR875292_af.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875292","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, 
H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 1 Non-carrier","igblast_file_name":"ERR875292.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,928,616","cell_number":"4,762,812","ir_sequence_count":2904961,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg non-carrier vaccinated","ir_subject_age_min":11,"ir_subject_age_max":11,"ir_project_sample_id":392},{"_id":397,"collapsing_method":null,"collection_time_point_relative":"Day 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875303_filtered_1.fastq -r ERR875303_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875303.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"3","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis 
B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875304.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F4Cpost","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875304_aa.txz, ERR875304_ab.txz, ERR875304_ac.txz, ERR875304_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875304 ","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 4 Carrier","igblast_file_name":"ERR875304.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,880,567","cell_number":"2,966,573","ir_sequence_count":1784287,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier vaccinated","ir_subject_age_min":3,"ir_subject_age_max":3,"ir_project_sample_id":397},{"_id":414,"collapsing_method":null,"collection_time_point_relative":"Day 
0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR875296_filtered_1.fastq -r ERR875296_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR875296.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"10","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Hepatitis B","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR875297.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Case","sample_id":"F3Cpre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR875297_aa.txz, ERR875297_ab.txz, ERR875297_ac.txz, ERR875297_ad.txz, ERR875297_ae.txz, ERR875297_af.txz, ERR875297_ag.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR875297 ","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Family 3 
Carrier","igblast_file_name":"ERR875297.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"3,261,822","cell_number":"4,490,360","ir_sequence_count":3400216,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"M","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"HBeAg carrier unvaccinated","ir_subject_age_min":10,"ir_subject_age_max":10,"ir_project_sample_id":414},{"_id":457,"collapsing_method":null,"collection_time_point_relative":"Week 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278156_filtered_1.fastq -r ERR1278156_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278156.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"47","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278156.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A3wk1","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research 
Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278156_aa.txz, ERR1278156_ab.txz, ERR1278156_ac.txz, ERR1278156_ad.txz, ERR1278156_ae.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278156","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 3","igblast_file_name":"ERR1278156.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"3,199,488","cell_number":"2,408,132","ir_sequence_count":2148806,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":47,"ir_subject_age_max":47,"ir_project_sample_id":457},{"_id":472,"collapsing_method":null,"collection_time_point_relative":"Week 1","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278159_filtered_1.fastq -r ERR1278159_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278159.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Mature B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"37","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J 
gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278159.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A4wk1","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278159_aa.txz, ERR1278159_ab.txz, ERR1278159_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278159","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 4","igblast_file_name":"ERR1278159.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,534,270","cell_number":"2,820,131","ir_sequence_count":1493227,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":37,"ir_subject_age_max":37,"ir_project_sample_id":472},{"_id":476,"collapsing_method":null,"collection_time_point_relative":"Day 
0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278158_filtered_1.fastq -r ERR1278158_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278158.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Mature B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"37","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278158.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A4pre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278158_aa.txz, ERR1278158_ab.txz, ERR1278158_ac.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278158","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 
4","igblast_file_name":"ERR1278158.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"2,148,806","cell_number":"2,041,832","ir_sequence_count":1420729,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":37,"ir_subject_age_max":37,"ir_project_sample_id":476},{"_id":484,"collapsing_method":null,"collection_time_point_relative":"Day 0","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278152_filtered_1.fastq -r ERR1278152_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278152.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"35","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278152.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A2pre","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research 
Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278152_aa.txz, ERR1278152_ab.txz, ERR1278152_ac.txz, ERR1278152_ad.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278152","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 2","igblast_file_name":"ERR1278152.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,951,899","cell_number":"3,894,726","ir_sequence_count":1581000,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with HBV","ir_subject_age_min":35,"ir_subject_age_max":35,"ir_project_sample_id":484},{"_id":489,"collapsing_method":null,"collection_time_point_relative":"Week 2 ","sequencing_facility":null,"cell_phenotype":null,"paired_read_assembly":"pear -f ERR1278154_filtered_1.fastq -r ERR1278154_filtered_2.fastq -n 60 -t 60 -q 25 -o paired_ERR1278154.fastq","ethnicity":null,"sequencing_platform":"Illumina NextSeq","cell_subset":"Naive B cell","sequencing_kit":null,"germline_database":null,"ir_subject_age":"35","organism":"Homo sapiens","tissue":"PBMC","collected_by":"Chang, Y.H., Kuan, H.C.","link_type":null,"immunogen":null,"cell_storage":null,"age_event":null,"medical_history":null,"reverse_PCR_primer_target_location":"J 
gene","disease_state_sample":"Healthy","study_id":"PRJEB9332","sequencing_run_date":null,"grants":null,"single_cell":null,"software_versions":null,"template_quality":null,"race":null,"cell_isolation":null,"tissue_processing":null,"quality_thresholds":25,"prior_therapies":null,"fasta_file_name":"paired_ERR1278154.fasta","library_construction_method":"PCR","data_processing_protocols":null,"library_generation_protocol":null,"biomaterial_provider":null,"disease_stage":null,"library_source":"Transcriptomic","study_group_description":"Control","sample_id":"A2wk2","lab_name":"Institute of Molecular and Genomic Medicine, National Health Research Institutes","pcr_target_locus":null,"lab_address":null,"sequencing_run_id":null,"primer_match_cutoffs":null,"anatomic_site":null,"imgt_file_name":"ERR1278154_aa.txz, ERR1278154_ab.txz, ERR1278154_ac.txz, ERR1278154_ad.txz, ERR1278154_ae.txz, ERR1278154_af.txz, ERR1278154_ag.txz","complete_sequences":null,"strain_name":null,"library_generation_kit_version":null,"cell_quality":null,"cell_processing_protocol":null,"study_description":"Hepatitis B Study","ir_sra_run_id":"ERR1278154","template_amount":null,"submitted_by":"Chang, Y.H., Kuan, H.C.","mixcr_file_name":null,"collection_time_event":"Vaccination","read_length":null,"ancestry_population":null,"cells_per_reaction":null,"subject_id":"Adult 2","igblast_file_name":"ERR1278154.fmt7","intervention":null,"linked_subjects":null,"total_reads_passing_qc_filter":"1,581,000","cell_number":"5,123,678","ir_sequence_count":3199488,"forward_PCR_primer_target_location":"V gene","physical_linkage":null,"sex":"F","synthetic":null,"inclusion_exclusion_criteria":null,"sample_type":null,"disease_length":null,"template_class":"cDNA","study_title":"Network Signatures of IgG Immune Repertoires in Hepatitis B Associated Chronic Infection and Vaccination Responses.","pub_ids":null,"disease_diagnosis":"Healthy Vaccinated with 
HBV","ir_subject_age_min":35,"ir_subject_age_max":35,"ir_project_sample_id":489}]')

In [4]:
# Input locations, given relative to the notebook's working directory.

CSV_Directory = "./CSV_FILES/"
# Sequence export for the lab aliased "IMGM".
IMGM_cont = "".join((CSV_Directory, "IMGM_Seq.csv"))

In [87]:
def _split_gene_calls(cell):
    """Split one gene-call cell into its list of alternative calls.

    Alternatives inside a cell are separated by ", or ". A cell that pandas
    read as missing (NaN/None) has no ``split`` method, so it is mapped to an
    empty list instead of raising AttributeError.
    """
    if pd.isna(cell):
        return []
    return str(cell).split(", or ")


# The file is read as tab-separated even though it carries a .csv extension.
IMGM_parsed = pd.read_csv(IMGM_cont, sep="\t")

# One list of alternative gene calls per row, for each gene column.
V_genes = [_split_gene_calls(cell) for cell in IMGM_parsed['V-Gene']]
J_genes = [_split_gene_calls(cell) for cell in IMGM_parsed['J-Gene']]
D_genes = [_split_gene_calls(cell) for cell in IMGM_parsed['D-Gene']]

# Row-wise grouping; note the order inside each entry is [V, J, D].
VJD_genes = [list(row_calls) for row_calls in zip(V_genes, J_genes, D_genes)]

# Plain Python lists of the junction columns, used by the length check.
Junction_Sequence = IMGM_parsed['Junction Sequence (AA)'].tolist()
Junction_Length = IMGM_parsed['Junction Length (AA)'].tolist()

In [10]:
# Test area
# Test 1: every junction sequence must be exactly as long as its reported length.
# Each mismatch is recorded as [False, row index, sequence, reported length];
# an empty list means every row passed.
Junction_Seq_Len_Test = [
    [False, row, Junction_Sequence[row], reported_length]
    for row, reported_length in enumerate(Junction_Length)
    if len(Junction_Sequence[row]) != reported_length
]
print(Junction_Seq_Len_Test)

[]


In [13]:
# Test area
# Test 2: flag every gene call that contains neither 'IG' nor 'TC'
def test_x_gene(x_gene_array):
    x_gene_test = []
    for item in x_gene_array:
        for i in range(len(item)):
            if "IG" not in item[i] and "TC" not in item[i]:
                x_gene_test.append([item,item[i]])
    return x_gene_test
# Report the offending calls for the V, J and D columns, in that order.
for gene_column in (V_genes, J_genes, D_genes):
    print(test_x_gene(gene_column))

[]
[]
[[['IGHD4-11*01', 'ORF'], 'ORF'], [['IGHD4-11*01', 'ORF'], 'ORF']]


In [72]:
# Test 3: tally 'IG' versus 'TC' gene calls in each gene column

def test_IG_or_TC(x_gene_array):

    IG_vs_TC = []
    Nu_iterations = len(x_gene_array)
    for i in range(Nu_iterations):
        IG_vs_TC.append([sum("IG" in s for s in x_gene_array[i]),\
                         sum("TC" in s for s in x_gene_array[i])])
        
    tabulate_occurrences = pd.DataFrame(IG_vs_TC,columns=["Number of 'IG' occurrences"\
                               ,"Number of 'TC' occurrences"])
    
    IG_occurs = tabulate_occurrences["Number of 'IG' occurrences"].sum()
    TC_occurs = tabulate_occurrences["Number of 'TC' occurrences"].sum()
    
    return [[IG_occurs,TC_occurs],tabulate_occurrences]

def message_test_IG_or_TC():
    """Label the loaded data as an "IG study", a "TC study", or "huh?".

    Reads the module-level V_genes, J_genes and D_genes lists and compares
    the total 'IG' and 'TC' counts reported by test_IG_or_TC for each one.

    Returns
    -------
    str
        "IG study" when 'IG' strictly outnumbers 'TC' in all three columns,
        "TC study" when 'TC' strictly outnumbers 'IG' in all three columns,
        and "huh?" for anything else (ties or columns that disagree).
    """
    # Only the [IG_total, TC_total] pair is needed; the per-row table is dropped.
    column_totals = [test_IG_or_TC(gene_column)[0]
                     for gene_column in (V_genes, J_genes, D_genes)]

    if all(ig_total > tc_total for ig_total, tc_total in column_totals):
        return "IG study"
    if all(ig_total < tc_total for ig_total, tc_total in column_totals):
        return "TC study"
    return "huh?"

# Overall verdict first, followed by blank lines as a visual separator.
print(message_test_IG_or_TC())
print("\n")

# For the V, J and D columns in turn, print the per-row count table and then
# the [IG total, TC total] pair. Each tally is computed once and unpacked,
# rather than being rebuilt for every print.
for gene_column in (V_genes, J_genes, D_genes):
    column_totals, per_row_table = test_IG_or_TC(gene_column)
    print(per_row_table)
    print(column_totals)

IG study


    Number of 'IG' occurrences  Number of 'TC' occurrences
0                            2                           0
1                            2                           0
2                            2                           0
3                            1                           0
4                            6                           0
5                            6                           0
6                            3                           0
7                            1                           0
8                            3                           0
9                           11                           0
10                           4                           0
11                           3                           0
12                           8                           0
13                          13                           0
14                          10                           0
15                           6               

In [90]:
# Inspect the second-to-last row's [V, J, D] gene-call lists. In the recorded
# output, this row's D-gene list ends with 'ORF', the value reported by test 2.
VJD_genes[-2]

[['IGHV3-7*03',
  'IGHV3-53*03',
  'IGHV3-21*04',
  'IGHV3-71*01',
  'IGHV3-53*01',
  'IGHV3-48*02',
  'IGHV3-11*01',
  'IGHV3-11*05',
  'IGHV3-53*02',
  'IGHV3-11*03'],
 ['IGHJ4*02'],
 ['IGHD4-11*01', 'ORF']]