### Two separate scripts under command line

In [None]:
import pandas as pd
# Load the differential-expression table from the Excel workbook and
# write it back out as CSV so the R script can read it.
data = pd.read_excel(io='DEG_list.xlsx')
data.to_csv(path_or_buf='DEG_list.csv')

In [None]:
# Read the converted CSV table and draw log2FoldChange against stat
# into result.pdf.
data <- read.csv(file = 'DEG_list.csv')
pdf(file = 'result.pdf')
plot(data$log2FoldChange, data$stat)
dev.off()

### Step 1: bookkeeping

In [None]:
%run

# The two stand-alone scripts, pasted unchanged into a single workflow cell:
# a python: action that converts DEG_list.xlsx to DEG_list.csv, followed by
# an R: action that plots the CSV columns into result.pdf.
python:
import pandas as pd
data = pd.read_excel('DEG_list.xlsx')
data.to_csv('DEG_list.csv')

R:
data = read.csv('DEG_list.csv')
pdf('result.pdf')
plot(data$log2FoldChange, data$stat)
dev.off()

### Step 2: indentation

In [None]:
%run -v3
# Same workflow as the previous step; the only change is that each script
# body is now indented under its python: / R: action.
python:
    # Convert the Excel DEG table to CSV.
    import pandas as pd
    data = pd.read_excel('DEG_list.xlsx')
    data.to_csv('DEG_list.csv')

R:
    # Plot log2FoldChange against stat from the CSV into result.pdf.
    data = read.csv('DEG_list.csv')
    pdf('result.pdf')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### Step 3: Separate into two steps

In [None]:
%run -v3
# The conversion and the plotting are now two numbered steps, [1] and [2],
# of the same workflow.
[1]
python:
    # Convert the Excel DEG table to CSV.
    import pandas as pd
    data = pd.read_excel('DEG_list.xlsx')
    data.to_csv('DEG_list.csv')

[2]
R:
    # Plot log2FoldChange against stat from the CSV into result.pdf.
    data = read.csv('DEG_list.csv')
    pdf('result.pdf')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### Step 4: Add some comments

In [None]:
%run -v3
# Two-step workflow; each step header now carries a short description in
# parentheses and is followed by a matching comment line.
[1 (convert data)]
# convert data
python:
    import pandas as pd
    data = pd.read_excel('DEG_list.xlsx')
    data.to_csv('DEG_list.csv')

[2 (data analysis)]
# data analysis
R:
    data = read.csv('DEG_list.csv')
    pdf('result.pdf')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### Step 5: Add parameter (use another file)

In [None]:
%run -v3 --deg-list DEG_list.xlsx

# Excel workbook holding the DEG table; override with --deg-list.
# (Default fixed: the extension was misspelled as .xslx.)
parameter: deg_list = 'DEG_list.xlsx'

[proj_1 (convert data)]
# convert data
python: expand=True
    import pandas as pd
    data = pd.read_excel('{deg_list}')
    data.to_csv('DEG_list.csv')

[proj_2 (data analysis)]
# data analysis
R:
    data = read.csv('DEG_list.csv')
    pdf('result.pdf')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### Step 6: add input and output (rerun to skip step)

In [None]:
%run -v3 --deg-list DEG_list.xlsx

# Excel workbook holding the DEG table; override with --deg-list.
# (Default fixed: the extension was misspelled as .xslx.)
parameter: deg_list = 'DEG_list.xlsx'

[proj_1 (convert data)]
input: deg_list
output: 'DEG_list.csv'
# convert data
python: expand=True
    import pandas as pd
    data = pd.read_excel('{_input}')
    data.to_csv('{_output}')

[proj_2 (data analysis)]
output: 'result.pdf'
# data analysis
R: expand=True
    data = read.csv('{_input}')
    pdf('{_output}')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### VIDEO TWO: Makefile style

In [None]:
%run -v3 --deg-list DEG_list.csv

# CSV table consumed by the analysis step; override with --deg-list.
# The default must be a .csv file because the analysis step passes it to
# read.csv; the previous default was a misspelled Excel name (.xslx).
parameter: deg_list = 'DEG_list.csv'

[convert: provides='{FILENAME}.csv']
input: f"{FILENAME}.xlsx"
# convert data
python: expand=True
    import pandas as pd
    data = pd.read_excel('{_input}')
    data.to_csv('{_output}')

[analysis (data analysis)]
input: deg_list
output: 'result.pdf'
# data analysis
R: expand=True
    data = read.csv('{_input}')
    pdf('{_output}')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### VIDEO TWO: task (sos status)

In [None]:
%run -v3 --deg-list DEG_list.csv -s force

# CSV table consumed by the analysis step; override with --deg-list.
# The default must be a .csv file because the analysis step passes it to
# read.csv; the previous default was a misspelled Excel name (.xslx).
parameter: deg_list = 'DEG_list.csv'

[convert: provides='{FILENAME}.csv']
input: f"{FILENAME}.xlsx"
# convert data
python: expand=True
    import pandas as pd
    data = pd.read_excel('{_input}')
    data.to_csv('{_output}')

[analysis (data analysis)]
input: deg_list
output: 'result.pdf'
# data analysis
task:
R: expand=True
    data = read.csv('{_input}')
    pdf('{_output}')
    plot(data$log2FoldChange, data$stat)
    dev.off()

### Video TWO.3: Remote task

In [None]:
%run -v4 --deg-list DEG_list.csv -s force -q pro -c ~/.sos/hosts.yml

# CSV table consumed by the analysis step; override with --deg-list.
# The default must be a .csv file because the analysis step passes it to
# read.csv; the previous default was a misspelled Excel name (.xslx).
parameter: deg_list = 'DEG_list.csv'

[convert: provides='{FILENAME}.csv']
input: f"{FILENAME}.xlsx"
# convert data
# The script below refers to _input and _output, matching the other cells;
# it previously used the bare names input and output.
python: expand=True
    import pandas as pd
    data = pd.read_excel('{_input}')
    data.to_csv('{_output}')

[analysis (data analysis)]
input: deg_list
output: 'result.pdf'
# data analysis
task:
R: expand=True
    data = read.csv('{_input}')
    pdf('{_output}')
    plot(data$log2FoldChange, data$stat)
    dev.off()