# project.yaml (103 lines, 92 loc, 4.1 KB)
# Repository generated from opensafely/research-template.
---
# OpenSAFELY project pipeline.
# Each entry under `actions` names one step: `run` is the command, `needs`
# lists the actions whose outputs it depends on, and `outputs` declares the
# files it writes, grouped by sensitivity level.
version: "3.0"

expectations:
  # NOTE(review): presumably the size of the dummy population generated for
  # local runs — confirm against the OpenSAFELY pipeline documentation.
  population_size: 1000

actions:
  # --- Cohort extraction ---------------------------------------------------

  # Extracts the cohort described by study_definition_2019.
  generate_cohort_2019:
    run: cohortextractor:latest generate_cohort --study-definition study_definition_2019
    outputs:
      highly_sensitive:
        cohort: output/input_2019.csv

  # Extracts the cohort described by study_definition_2020.
  generate_cohort_2020:
    run: cohortextractor:latest generate_cohort --study-definition study_definition_2020
    outputs:
      highly_sensitive:
        cohort: output/input_2020.csv

  # Extracts one cohort file per index date over the weekly range given to
  # --index-date-range; the output glob matches all of those files.
  generate_measures_cohorts:
    # Folded scalar: the lines below are joined with single spaces into one
    # command string.
    run: >-
      cohortextractor:latest generate_cohort
      --study-definition study_definition_measures
      --index-date-range "2019-02-01 to 2020-11-30 by week"
    outputs:
      highly_sensitive:
        cohort1: output/input_measures_*.csv

  # Runs generate_measures for study_definition_measures; declares twelve
  # measure files (covid / all-cause / non-covid death, each as
  # all, sex, age and sex_age).
  generate_measures:
    run: cohortextractor:latest generate_measures --study-definition study_definition_measures
    needs: [generate_measures_cohorts]
    outputs:
      moderately_sensitive:
        measure1: output/measure_covid_death_all.csv
        measure2: output/measure_covid_death_sex.csv
        measure3: output/measure_covid_death_age.csv
        measure4: output/measure_covid_death_sex_age.csv
        measure5: output/measure_allcause_death_all.csv
        measure6: output/measure_allcause_death_sex.csv
        measure7: output/measure_allcause_death_age.csv
        measure8: output/measure_allcause_death_sex_age.csv
        measure9: output/measure_noncovid_death_all.csv
        measure10: output/measure_noncovid_death_sex.csv
        measure11: output/measure_noncovid_death_age.csv
        measure12: output/measure_noncovid_death_sex_age.csv

  # --- Data management -----------------------------------------------------

  # Runs analysis/010_data_management.R with three arguments: the 2019 input
  # CSV, the value 20190201, and the path of the study-population CSV to write.
  010_data_management_2019:
    run: r:latest analysis/010_data_management.R ./output/input_2019.csv 20190201 ./data/study_population_2019.csv
    needs: [generate_cohort_2019]
    outputs:
      highly_sensitive:
        data1: data/study_population_2019.csv

  # Same script as above, applied to the 2020 input CSV with the value 20200201.
  010_data_management_2020:
    run: r:latest analysis/010_data_management.R ./output/input_2020.csv 20200201 ./data/study_population_2020.csv
    needs: [generate_cohort_2020]
    outputs:
      highly_sensitive:
        data2: data/study_population_2020.csv

  # --- Descriptive analyses ------------------------------------------------

  # Runs analysis/020_baseline_characteristics.R on the 2019 study population
  # and writes table_1a.txt.
  020_baseline_characteristics_2019:
    run: >-
      r:latest analysis/020_baseline_characteristics.R
      ./data/study_population_2019.csv
      ./analysis/outfiles/table_1a.txt
    needs: [generate_cohort_2019, 010_data_management_2019]
    outputs:
      moderately_sensitive:
        table1a: analysis/outfiles/table_1a.txt

  # Runs analysis/020_baseline_characteristics.R on the 2020 study population
  # and writes table_1b.txt.
  020_baseline_characteristics_2020:
    run: >-
      r:latest analysis/020_baseline_characteristics.R
      ./data/study_population_2020.csv
      ./analysis/outfiles/table_1b.txt
    needs: [generate_cohort_2020, 010_data_management_2020]
    outputs:
      moderately_sensitive:
        table1b: analysis/outfiles/table_1b.txt

  # Runs analysis/025_carehome_characteristics.R on the 2020 study population.
  # The output path is not passed on the command line, so the script itself
  # must write analysis/outfiles/carehome_characteristics.txt.
  025_carehome_characteristics:
    run: r:latest analysis/025_carehome_characteristics.R ./data/study_population_2020.csv
    needs: [010_data_management_2020]
    outputs:
      moderately_sensitive:
        log: analysis/outfiles/carehome_characteristics.txt

  # Runs analysis/030_descriptive_mortality_rates.R with no arguments and
  # declares twelve tables (2a-4d) and nine plots (1a-3c) as outputs.
  # NOTE(review): this action ID ends in `.R`, unlike every other ID in the
  # file. It is kept unchanged because renaming it would change the name used
  # to invoke the action — confirm whether the suffix is intentional.
  030_descriptive_mortality_rates.R:
    run: r:latest analysis/030_descriptive_mortality_rates.R
    needs: [generate_measures_cohorts, generate_measures]
    outputs:
      moderately_sensitive:
        table_2a: analysis/outfiles/table_2a.txt
        table_2b: analysis/outfiles/table_2b.txt
        table_2c: analysis/outfiles/table_2c.txt
        table_2d: analysis/outfiles/table_2d.txt
        table_3a: analysis/outfiles/table_3a.txt
        table_3b: analysis/outfiles/table_3b.txt
        table_3c: analysis/outfiles/table_3c.txt
        table_3d: analysis/outfiles/table_3d.txt
        table_4a: analysis/outfiles/table_4a.txt
        table_4b: analysis/outfiles/table_4b.txt
        table_4c: analysis/outfiles/table_4c.txt
        table_4d: analysis/outfiles/table_4d.txt
        plot_1a: analysis/outfiles/plot_1a.png
        plot_1b: analysis/outfiles/plot_1b.png
        plot_1c: analysis/outfiles/plot_1c.png
        plot_2a: analysis/outfiles/plot_2a.png
        plot_2b: analysis/outfiles/plot_2b.png
        plot_2c: analysis/outfiles/plot_2c.png
        plot_3a: analysis/outfiles/plot_3a.png
        plot_3b: analysis/outfiles/plot_3b.png
        plot_3c: analysis/outfiles/plot_3c.png