# DATASET 2 (Series 1 - 5 comparison)
## How it works
1) Data from 2nd dataset is included from csv file, categorise their column <br>
2) to compare 2 different sets of data, we first check using Chi-square test to see if difference between datas from a similar group are significant or not. We will only proceed if the differences are insignificant. <br>
3) We then take the average of the data in a set, and perform another Chi-square test onto the 2 dataset average we would like to know. If it's difference is significant we then check whether it has an increase or decrease in the number of genes and categorise them accordingly. <br>
4) The data obtained is then compiled into a csv file, sorted by the Chi-square values to indicated the magnitude it has changed (larger Chi-square value indicates a greater change). <br>
5) Graphs are plotted for the top 10 genes which has changed


In [1]:
#Import modules
import pandas as pd
import csv
import matplotlib.pyplot as plt
import numpy as np
from matplotlib.backends.backend_pdf import PdfPages
from scipy.stats import chisquare

#Import files (Change files if needed)
in_1 = "/Users/aldricgoh/COVID_Hackathon/Datasets/lung_cellline_infection/normalized_human_cellline_data.csv" #Normalised human cellline data
in_2 = "/Users/aldricgoh/COVID_Hackathon/Datasets/lung_cellline_infection/human_cellline_metadata.csv" #Metadata

#Read files
df_1 = pd.read_csv(in_1, usecols = ['gene_symbol', 'Series1_NHBE_Mock_1', 'Series1_NHBE_Mock_2', 'Series1_NHBE_Mock_3', 'Series1_NHBE_SARS.CoV.2_1', 'Series1_NHBE_SARS.CoV.2_2', 'Series1_NHBE_SARS.CoV.2_3', 'Series2_A549_Mock_1', 'Series2_A549_Mock_2', 'Series2_A549_Mock_3', 'Series2_A549_SARS.CoV.2_1', 'Series2_A549_SARS.CoV.2_2', 'Series2_A549_SARS.CoV.2_3', 'Series3_A549_Mock_1', 'Series3_A549_Mock_2', 'Series3_A549_RSV_1', 'Series3_A549_RSV_2', 'Series4_A549_Mock_1', 'Series4_A549_Mock_2', 'Series4_A549_IAV_1', 'Series4_A549_IAV_2', 'Series5_A549_Mock_1', 'Series5_A549_Mock_2', 'Series5_A549_Mock_3', 'Series5_A549_SARS.CoV.2_1', 'Series5_A549_SARS.CoV.2_2', 'Series5_A549_SARS.CoV.2_3', 'Series6_A549.ACE2_Mock_1', 'Series6_A549.ACE2_Mock_2', 'Series6_A549.ACE2_Mock_3', 'Series6_A549.ACE2_SARS.CoV.2_1', 'Series6_A549.ACE2_SARS.CoV.2_2', 'Series6_A549.ACE2_SARS.CoV.2_3', 'Series7_Calu3_Mock_1', 'Series7_Calu3_Mock_2', 'Series7_Calu3_Mock_3', 'Series7_Calu3_SARS.CoV.2_1', 'Series7_Calu3_SARS.CoV.2_2', 'Series7_Calu3_SARS.CoV.2_3', 'Series8_A549_Mock_1', 'Series8_A549_Mock_2', 'Series8_A549_Mock_3', 'Series8_A549_RSV_1', 'Series8_A549_RSV_2', 'Series8_A549_RSV_3', 'Series8_A549_HPIV3_3', 'Series8_A549_HPIV3_2', 'Series8_A549_HPIV3_1', 'Series9_NHBE_Mock_1', 'Series9_NHBE_Mock_2', 'Series9_NHBE_Mock_3', 'Series9_NHBE_Mock_4', 'Series9_NHBE_IAV_1', 'Series9_NHBE_IAV_2', 'Series9_NHBE_IAV_3', 'Series9_NHBE_IAV_4', 'Series9_NHBE_IAVdNS1_1', 'Series9_NHBE_IAVdNS1_2', 'Series9_NHBE_IAVdNS1_3', 'Series9_NHBE_IAVdNS1_4', 'Series9_NHBE_IFNB_4h_1', 'Series9_NHBE_IFNB_4h_2', 'Series9_NHBE_IFNB_6h_1', 'Series9_NHBE_IFNB_6h_2', 'Series9_NHBE_IFNB_12h_1', 'Series9_NHBE_IFNB_12h_2', 'Series16_A549.ACE2_Mock_1', 'Series16_A549.ACE2_Mock_2', 'Series16_A549.ACE2_Mock_3', 'Series16_A549.ACE2_SARS.CoV.2_1', 'Series16_A549.ACE2_SARS.CoV.2_2', 'Series16_A549.ACE2_SARS.CoV.2_3', 'Series16_A549.ACE2_SARS.CoV.2_Rux_1', 'Series16_A549.ACE2_SARS.CoV.2_Rux_2', 'Series16_A549.ACE2_SARS.CoV.2_Rux_3'])
df_2 = pd.read_csv(in_2, usecols = ['title', 'geo_accession', 'organism', 'description', 'cell_line', 'cell_strain', 'treatment', 'time_after_treatment_hrs',	'name_short', 'replicate', 'cell_type'])

In [2]:
#Insert values into lists
genes = df_1['gene_symbol'].values

series1_mock1 = df_1['Series1_NHBE_Mock_1'].values
series1_mock2 = df_1['Series1_NHBE_Mock_2'].values
series1_mock3 = df_1['Series1_NHBE_Mock_3'].values
series1_1 = df_1['Series1_NHBE_SARS.CoV.2_1'].values
series1_2 = df_1['Series1_NHBE_SARS.CoV.2_2'].values
series1_3 = df_1['Series1_NHBE_SARS.CoV.2_3'].values

series2_mock1 = df_1['Series2_A549_Mock_1'].values
series2_mock2 = df_1['Series2_A549_Mock_2'].values
series2_mock3 = df_1['Series2_A549_Mock_3'].values
series2_1 = df_1['Series2_A549_SARS.CoV.2_1'].values
series2_2 = df_1['Series2_A549_SARS.CoV.2_2'].values
series2_3 = df_1['Series2_A549_SARS.CoV.2_3'].values

In [18]:
#Set up empty lists
sig_diff_down_1 = []
sig_diff_up_1 = []
sig_diff_down_2 = []
sig_diff_up_2 = []

In [19]:
for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series1_mock1[i], series1_mock2[i], series1_mock3[i]])[0] < 6.635 and chisquare([series1_1[i], series1_2[i], series1_3[i]])[0] < 6.635:
        a = (series1_mock1[i] + series1_mock2[i] + series1_mock3[i])/3
        b = (series1_1[i] + series1_2[i] + series1_3[i])/3
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a < b:
                sig_diff_up_1.append([genes[i], series1_mock1[i], series1_mock2[i], series1_mock3[i], series1_1[i], series1_2[i], series1_3[i], chi])
            else:
                sig_diff_down_1.append([genes[i], series1_mock1[i], series1_mock2[i], series1_mock3[i], series1_1[i], series1_2[i], series1_3[i], chi])
        
    else:
        pass

In [17]:
#Check length of lists
print(len(sig_diff_down_1))
print(len(sig_diff_up_1))
print(len(sig_diff_down_1) + len(sig_diff_up_1))

117
130
247


In [6]:
output_filename_1 = "/Users/aldricgoh/Series1_analysis_upreg.csv"
output_filename_2 = "/Users/aldricgoh/Series1_analysis_downreg.csv"

#Function to write csv file
def write_csv(filename, header, data):
    with open(filename, 'w') as f:
        writer = csv.writer(f)
        writer.writerow(header)
        writer.writerows(data)

def take_chi(elem):
    return elem[7]
sig_diff_up_1 = sorted(sig_diff_up_1, key=take_chi,reverse=True)
sig_diff_down_1 = sorted(sig_diff_down_1, key=take_chi,reverse=True)

write_csv(filename=output_filename_1, header=['gene_symbol', 'Series1_NHBE_Mock_1', 'Series1_NHBE_Mock_2', 'Series1_NHBE_Mock_3', 'Series1_NHBE_SARS.CoV.2_1', 'Series1_NHBE_SARS.CoV.2_2', 'Series1_NHBE_SARS.CoV.2_3', 'Chisquare_Value'], data=sig_diff_up_1)
write_csv(filename=output_filename_2, header=['gene_symbol', 'Series1_NHBE_Mock_1', 'Series1_NHBE_Mock_2', 'Series1_NHBE_Mock_3', 'Series1_NHBE_SARS.CoV.2_1', 'Series1_NHBE_SARS.CoV.2_2', 'Series1_NHBE_SARS.CoV.2_3', 'Chisquare_Value'], data=sig_diff_down_1)

In [20]:
for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series2_mock1[i], series2_mock2[i], series2_mock3[i]])[0] < 6.635 and chisquare([series2_1[i], series2_2[i], series2_3[i]])[0] < 6.635:
        a = (series2_mock1[i] + series2_mock2[i] + series2_mock3[i])/3
        b = (series2_1[i] + series2_2[i] + series2_3[i])/3
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a < b:
                sig_diff_up_2.append([genes[i], a, b, chi])
            else:
                sig_diff_down_2.append([genes[i], a, b, chi])
        
    else:
        pass

In [21]:
#Check length of lists
print(len(sig_diff_down_2))
print(len(sig_diff_up_2))
print(len(sig_diff_down_2) + len(sig_diff_up_2))

75
95
170


In [22]:
output_filename_3 = "/Users/aldricgoh/COVID HACK/Series2_analysis_upreg.csv"
output_filename_4 = "/Users/aldricgoh/COVID HACK/Series2_analysis_downreg.csv"

def take_chi(elem):
    return elem[3]

sig_diff_up_2 = sorted(sig_diff_up_2, key=take_chi,reverse=True)
sig_diff_down_2 = sorted(sig_diff_down_2, key=take_chi,reverse=True)

write_csv(filename=output_filename_3, header=['gene_symbol', 'Series2_A549_Mock_average', 'Series2_A549_SARS.CoV.2_average', 'Chisquare Values'], data=sig_diff_up_2)
write_csv(filename=output_filename_4, header=['gene_symbol', 'Series2_A549_Mock_average', 'Series2_A549_SARS.CoV.2_average', 'Chisquare Values'], data=sig_diff_down_2)

In [23]:
#Make new lists
sig_diff_1_2_mock_A549_up = [] 
sig_diff_1_2_mock_A549_down = [] 

In [None]:
for i in range(len(genes)):
        #Check is there is significant difference 
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series2_mock1[i], series2_mock2[i], series2_mock3[i]])[0] < 6.635 and chisquare([series1_mock1[i], series1_mock2[i], series1_mock3[i]])[0] < 6.635:
        a = (series2_mock1[i] + series2_mock2[i] + series2_mock3[i])/3
        b = (series1_mock1[i] + series1_mock2[i] + series1_mock3[i])/3
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a > b:
                sig_diff_1_2_mock_A549_up.append([genes[i], a, b, chi])
            else:
                sig_diff_1_2_mock_A549_down.append([genes[i], series1_mock1[i], series1_mock2[i], series1_mock3[i], series2_mock1[i], series2_mock2[i], series2_mock3[i], chi])
        
    else:
        pass

In [None]:
#Check length of lists
print(len(sig_diff_1_2_mock_A549_up))
print(len(sig_diff_1_2_mock_A549_down))
print(len(sig_diff_1_2_mock_A549_up) + len(sig_diff_1_2_mock_A549_down))

In [None]:
output_filename_5 = "/Users/aldricgoh/COVID HACK/Series1v2_analysis_upreg.csv"
output_filename_6 = "/Users/aldricgoh/COVID HACK/Series1v2_analysis_downreg.csv"

sig_diff_1_2_mock_A549_up = sorted(sig_diff_1_2_mock_A549_up, key=take_chi,reverse=True)
sig_diff_1_2_mock_A549_down = sorted(sig_diff_1_2_mock_A549_down, key=take_chi,reverse=True)

write_csv(filename=output_filename_5, header=['gene_symbol', 'Series1_NHBE_Mock_1', 'Series1_NHBE_Mock_2', 'Series1_NHBE_Mock_3', 'Series2_A549_Mock_1', 'Series2_A549_Mock_2', 'Series2_A549_Mock_3', 'Chisquare Values'], data=sig_diff_1_2_mock_A549_up)
write_csv(filename=output_filename_6, header=['gene_symbol', 'Series1_NHBE_Mock_1', 'Series1_NHBE_Mock_2', 'Series1_NHBE_Mock_3', 'Series2_A549_Mock_1', 'Series2_A549_Mock_2', 'Series2_A549_Mock_3', 'Chisquare Values'], data=sig_diff_1_2_mock_A549_down)

In [24]:
#Make list of series 5
series5_mock1 = df_1['Series5_A549_Mock_1'].values
series5_mock2 = df_1['Series5_A549_Mock_2'].values
series5_mock3 = df_1['Series5_A549_Mock_3'].values
series5_1 = df_1['Series5_A549_SARS.CoV.2_1'].values
series5_2 = df_1['Series5_A549_SARS.CoV.2_2'].values
series5_3 = df_1['Series5_A549_SARS.CoV.2_3'].values

In [25]:
#Make new lists
sig_diff_2_5_mock_A549_up = [] 
sig_diff_2_5_mock_A549_down = [] 

In [26]:
for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series2_1[i], series2_2[i], series2_3[i]])[0] < 6.635 and chisquare([series5_1[i], series5_2[i], series5_3[i]])[0] < 6.635:
        a = (series2_1[i] + series2_2[i] + series2_3[i])/3
        b = (series5_1[i] + series5_2[i] + series5_3[i])/3
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a > b:
                sig_diff_2_5_mock_A549_down.append([genes[i], a, b, chi])
            else:
                sig_diff_2_5_mock_A549_up.append([genes[i], a, b, chi])
        
    else:
        pass

In [27]:
#Check length of lists
print(len(sig_diff_2_5_mock_A549_up))
print(len(sig_diff_2_5_mock_A549_down))
print(len(sig_diff_2_5_mock_A549_up) + len(sig_diff_2_5_mock_A549_down))

1165
1134
2299


In [28]:
output_filename_7 = "/Users/aldricgoh/COVID HACK/Series2v5_infected_analysis_upreg.csv"
output_filename_8 = "/Users/aldricgoh/COVID HACK/Series2v5_infected_analysis_downreg.csv"

sig_diff_2_5_mock_A549_up = sorted(sig_diff_2_5_mock_A549_up, key=take_chi,reverse=True)
sig_diff_2_5_mock_A549_down = sorted(sig_diff_2_5_mock_A549_down, key=take_chi,reverse=True)

write_csv(filename=output_filename_7, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series5_A549_SARS.CoV.2_average', 'Chisquare Values'], data=sig_diff_2_5_mock_A549_up)
write_csv(filename=output_filename_8, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series5_A549_SARS.CoV.2_average', 'Chisquare Values'], data=sig_diff_2_5_mock_A549_down)

In [29]:
series3_1 = df_1['Series3_A549_RSV_1'].values
series3_2 = df_1['Series3_A549_RSV_2'].values

In [30]:
upreg2_3 = []
downreg2_3 = []

In [31]:
for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series2_1[i], series2_2[i], series2_3[i]])[0] < 6.635 and chisquare([series3_1[i], series3_2[i]])[0] < 6.635:
        a = (series2_1[i] + series2_2[i] + series2_3[i])/3
        b = (series3_1[i] + series3_2[i])/2
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a < b:
                upreg2_3.append([genes[i], a, b, chi])
            else:
                downreg2_3.append([genes[i], a, b, chi])
        
    else:
        pass

In [32]:
#Check length of lists
print(len(upreg2_3))
print(len(downreg2_3))
print(len(upreg2_3) + len(downreg2_3))

1815
1789
3604


In [33]:
output_filename_9 = "/Users/aldricgoh/COVID HACK/Series2v3_infected_analysis_3 more than 2.csv"
output_filename_10 = "/Users/aldricgoh/COVID HACK/Series2v3_infected_analysis_3 less than 2.csv"

upreg2_3 = sorted(upreg2_3, key=take_chi,reverse=True)
downreg2_3 = sorted(downreg2_3, key=take_chi,reverse=True)

write_csv(filename=output_filename_9, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series3_A549_RSV_average', 'Chisquare Values'], data=upreg2_3)
write_csv(filename=output_filename_10, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series3_A549_RSV_average', 'Chisquare Values'], data=downreg2_3)

In [34]:
series4_1 = df_1['Series4_A549_IAV_1'].values
series4_2 = df_1['Series4_A549_IAV_2'].values

upreg2_4 = []
downreg2_4 = []

for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series2_1[i], series2_2[i], series2_3[i]])[0] < 6.635 and chisquare([series4_1[i], series4_2[i]])[0] < 6.635:
        a = (series2_1[i] + series2_2[i] + series2_3[i])/3
        b = (series4_1[i] + series4_2[i])/2
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a < b:
                upreg2_4.append([genes[i], a, b, chi])
            else:
                downreg2_4.append([genes[i], a, b, chi])
        
    else:
        pass

#Check length of lists
print(len(upreg2_4))
print(len(downreg2_4))
print(len(upreg2_4) + len(downreg2_4))

output_filename_11 = "/Users/aldricgoh/COVID HACK/Series2v4_infected_analysis_4 more than 2.csv"
output_filename_12 = "/Users/aldricgoh/COVID HACK/Series2v4_infected_analysis_4 less than 2.csv"

upreg2_4 = sorted(upreg2_4, key=take_chi,reverse=True)
downreg2_4 = sorted(downreg2_4, key=take_chi,reverse=True)

write_csv(filename=output_filename_11, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series4_A549_IAV_average', 'Chisquare Values'], data=upreg2_4)
write_csv(filename=output_filename_12, header=['gene_symbol', 'Series2_A549_SARS.CoV.2_average', 'Series4_A549_IAV_average', 'Chisquare Values'], data=downreg2_4)

637
909
1546


In [35]:
upreg3_4 = []
downreg3_4 = []

for i in range(len(genes)):
        #Check is there is significant difference
        #Only proceed when no significant differences
        #May encounter division by 0, but can be ignored
        #At a 0.1% level
    if chisquare([series3_1[i], series3_2[i]])[0] < 6.635 and chisquare([series4_1[i], series4_2[i]])[0] < 6.635:
        a = (series3_1[i] + series3_2[i])/3
        b = (series4_1[i] + series4_2[i])/2
        chi = chisquare([a, b])[0] #Degree of freedom of 1, and obtain value os chisquare

            #If difference is significant, only insert into list for monitoring
            #At a 0.5% level
        if chi > 7.879:
            if a < b:
                upreg3_4.append([genes[i], a, b, chi])
            else:
                downreg3_4.append([genes[i], a, b, chi])
        
    else:
        pass

#Check length of lists
print(len(upreg3_4))
print(len(downreg3_4))
print(len(upreg3_4) + len(downreg3_4))

output_filename_13 = "/Users/aldricgoh/COVID HACK/Series3v4_infected_analysis_4 more than 3.csv"
output_filename_14 = "/Users/aldricgoh/COVID HACK/Series3v4_infected_analysis_4 less than 3.csv"

upreg3_4 = sorted(upreg3_4, key=take_chi,reverse=True)
downreg3_4 = sorted(downreg3_4, key=take_chi,reverse=True)

write_csv(filename=output_filename_13, header=['gene_symbol', 'Series3_A549_RSV_average', 'Series4_A549_IAV_average', 'Chisquare Values'], data=upreg3_4)
write_csv(filename=output_filename_14, header=['gene_symbol', 'Series3_A549_RSV_average', 'Series4_A549_IAV_average', 'Chisquare Values'], data=downreg3_4)

1883
854
2737


In [None]:
#Function to plot graphs and compile them in a single pdf
def plotgraphs(list, c, title):
    genes = []
    chi_list = []
    for i in range(10):
        genes.append(list[i][0])
        chi_list.append(list[i][-1])

    x_pos = np.arange(len(genes))
    plt.bar(x_pos, chi_list, align='center', color= c);
    plt.xticks(x_pos, genes, rotation=90)
    plt.xlabel('Genes')
    plt.ylabel('Chisquare Count')
    plt.title(title)
    plt.tight_layout()
    pdf.savefig()
    plt.close()

    plt.bar(x_pos, chi_list, align='center', color= c)
    plt.semilogy(genes, chi_list)
    plt.xlabel('Genes')
    plt.ylabel('Chisquare Count')
    plt.xticks(x_pos, genes, rotation=90)
    plt.title(title + '(Log)')
    plt.tight_layout()
    pdf.savefig()
    plt.close()

with PdfPages('/Users/aldricgoh/COVID HACK/Dataset 2 analysis.pdf') as pdf:
    plotgraphs(sig_diff_up_1, 'r', 'Series 1: Top 10 non-COVID vs COVID infected\nlung cells up reg genes')
    plotgraphs(sig_diff_down_1, 'r', 'Series 1: Top 10 non-COVID vs COVID infected\nlung cells down reg genes')
    plotgraphs(sig_diff_up_2, 'b', 'Series 2: Top 10 non-COVID vs COVID infected\nlung cancer cells up reg genes (A549)')
    plotgraphs(sig_diff_down_2, 'b', 'Series 2: Top 10 non-COVID vs COVID infected\nlung cancer cells down reg genes (A549)')
    plotgraphs(sig_diff_2_5_mock_A549_up, 'g', 'Series 2 vs series 5 comparison\non quantity of COVID virus - up reg')
    plotgraphs(sig_diff_2_5_mock_A549_down, 'g', 'Series 2 vs series 5 comparison\non quantity of COVID virus - down reg')
    plotgraphs(upreg2_3, 'violet', 'Series 2 vs series 3 comparison\nbetween COVID and RSV virus - up reg')
    plotgraphs(downreg2_3, 'violet', 'Series 2 vs series 3 comparison\nbetween COVID and RSV virus - down reg')
    plotgraphs(upreg2_4, 'orange', 'Series 2 vs series 4 comparison\nbetween COVID and IAV virus - up reg')
    plotgraphs(downreg2_4, 'orange', 'Series 2 vs series 4 comparison\nbetween COVID and IAV virus - down reg')
    plotgraphs(upreg3_4, 'black', 'Series 3 vs series 4 comparison\nbetween RSV and IAV virus - up reg')
    plotgraphs(downreg3_4, 'black', 'Series 3 vs series 4 comparison\nbetween RSV and IAV virus - down reg')