# project.yaml
# generated from opensafely/research-template
# Pipeline definition with three actions: one dataset built with
# cohortextractor, one built with databuilder (ehrQL), and an R script that
# runs after both.
version: "3.0"

expectations:
  population_size: 1000

actions:
  # cohortextractor dataset, written as CSV under output/.
  generate_dataset_cohortextractor:
    # Folded scalar: the lines below are joined with single spaces into one
    # command line.
    run: >
      cohortextractor:latest
      generate_cohort --study-definition study_definition
      --output-dir 'output'
      --output-file "output/dataset_cohortextractor_2022-09-25.csv"
      --output-format csv
    outputs:
      highly_sensitive:
        cohort: output/dataset_cohortextractor_2022-09-25.csv

  # databuilder dataset built from analysis/dataset_definition.py, using the
  # dummy tables in dummy_data.
  generate_dataset_ehrql:
    run: >
      databuilder:v0
      generate-dataset analysis/dataset_definition.py
      --output output/dataset_ehrql_2022-09-25.csv --dummy-tables dummy_data
    outputs:
      highly_sensitive:
        cohort: output/dataset_ehrql_2022-09-25.csv

  # Runs analysis/dataset_diff.R; declared as depending on both dataset
  # actions above.
  calculate_dataset_diff:
    needs:
      - generate_dataset_cohortextractor
      - generate_dataset_ehrql
    run: >
      r:latest
      analysis/dataset_diff.R
    outputs:
      moderately_sensitive:
        cohort: output/diff/dataset_diff_summary.csv