# project.yaml
# Generated from the opensafely/research-template repository.
# Pipeline definition: each entry under `actions` names one step, the command
# it runs, the actions it depends on (`needs`) and the files it declares as
# outputs, grouped by sensitivity level.
version: '3.0'

# presumably the size of the dummy population used for local runs -
# TODO confirm against the OpenSAFELY documentation.
expectations:
  population_size: 1000000

actions:

  # Builds the cohort from `study_definition` and writes it to input.csv.
  generate_study_population:
    run: cohortextractor:latest generate_cohort --study-definition study_definition
    outputs:
      highly_sensitive:
        cohort: input.csv

  # Runs calculate_tpp_coverage.R on the cohort and the MSOA population file.
  calc_coverage:
    needs: [generate_study_population]
    # last argument relates to MSOA TPP coverage >= X%
    run: r:latest analysis/calculate_tpp_coverage.R input.csv data/SAPE22DT15_mid_2019_msoa.csv 80
    outputs:
      moderately_sensitive:
        log: coverage_log.txt
        rds: tpp_coverage_included.rds
        rds2: tpp_coverage_all.rds
        csv: tpp_coverage_all.csv
        csv2: msoas_in_tpp.csv
        csv3: msoa_gt_100_cov.csv
        figure: total_vs_tpp_pop.png

  # Runs data_clean.R on the cohort and the coverage file from calc_coverage,
  # producing input_clean.rds for the downstream actions.
  data_clean:
    needs: [generate_study_population, calc_coverage]
    # last argument relates to MSOA TPP coverage >= X%
    # NOTE(review): the same threshold (80) is passed to calc_coverage;
    # presumably the two should be kept in step - confirm.
    run: r:latest analysis/data_clean.R input.csv tpp_coverage_included.rds 80
    outputs:
      moderately_sensitive:
        log: data_clean_log.txt
      highly_sensitive:
        input_clean: input_clean.rds

  # Runs data_check_figs.R on the cleaned data and the MSOA shapefile data,
  # declaring six figures as outputs.
  data_check_figs:
    needs: [data_clean]
    run: r:latest analysis/data_check_figs.R input_clean.rds data/msoa_shp.rds
    outputs:
      moderately_sensitive:
        figure1: tpp_coverage_msoa.png
        figure2: tpp_coverage_carehomes.png
        figure3: tpp_coverage_map.pdf
        figure4: age_dist.png
        figure5: infection_death_delays.png
        figure6: hh_size_dist.png

  # Runs data_setup.R on the cleaned data and the national rolling case counts,
  # producing the datasets consumed by the descriptive and modelling actions.
  data_setup:
    needs: [data_clean]
    # last argument relates to carehome TPP coverage >= X%
    run: r:latest analysis/data_setup.R input_clean.rds data/cases_rolling_nation.csv 90
    outputs:
      moderately_sensitive:
        log: data_setup_log.txt
      highly_sensitive:
        comm_prev: community_incidence.rds
        analysisdata: analysisdata.rds
        ch_linelist: ch_linelist.rds
        ch_agg_long: ch_agg_long.rds

  # Runs descriptive.R. The script is given no command-line arguments, so it
  # presumably reads the outputs of data_clean and data_setup by fixed path -
  # TODO confirm in analysis/descriptive.R.
  descriptive:
    needs: [data_clean, data_setup]
    run: r:latest analysis/descriptive.R
    outputs:
      moderately_sensitive:
        report: descriptive.pdf
        log: log_descriptive.txt
        data: ch_gp_permsoa.csv
        table: ch_chars_tab.csv

  # Runs run_models.R on analysisdata.rds.
  # NOTE(review): the meaning of the trailing 0.0 argument is not documented
  # here - confirm in analysis/run_models.R.
  run_models:
    needs: [data_setup]
    run: r:latest analysis/run_models.R analysisdata.rds 0.0
    outputs:
      moderately_sensitive:
        output: output_model_run.txt
        log: log_model_run.txt
        coeffs: coeffs_all.rds
        figure: model_coeffs.pdf
        table: model_comp.csv
      highly_sensitive:
        fit: model_out.rds
        test: testdata.rds

  # Disabled actions, kept for reference.
  # NOTE(review): compare_models declares coeffs_all.rds, model_coeffs.pdf and
  # model_comp.csv, which run_models already declares; validate_models reads
  # fits.rds, which no action in this file declares as an output. Both would
  # need resolving before these are re-enabled.
  #
  # compare_models:
  #   needs: [run_models]
  #   run: r:latest analysis/compare_models.R model_out.rds
  #   outputs:
  #     moderately_sensitive:
  #       log: output_model_comp.txt
  #       coeffs: coeffs_all.rds
  #       figure: model_coeffs.pdf
  #       table: model_comp.csv
  #
  # validate_models:
  #   needs: [run_models]
  #   run: r:latest analysis/validate_models.R fits.rds testdata.rds
  #   outputs:
  #     moderately_sensitive:
  #       output: output_model_val.txt
  #       report: test_pred_figs.pdf

  # Aggregate target: depends on the modelling and descriptive actions so that
  # requesting it runs the whole pipeline.
  run_all:
    needs: [run_models, descriptive]
    # In order to be valid this action needs to define a run command and
    # some output. We don't really care what these are but the below seems to
    # do the trick.
    run: cohortextractor:latest --version
    outputs:
      moderately_sensitive:
        whatever: project.yaml