-
Notifications
You must be signed in to change notification settings - Fork 0
/
datasets.yaml
131 lines (121 loc) · 3.71 KB
/
datasets.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
# MedNLI entry: only data_dir is populated; the per-split directory and file
# fields are empty strings.
mednli:
  training_data_dir: ''
  eval_data_dir: ''
  data_dir: /mnt/sdd/efficient_ml_data/datasets/MedNLI
  training_file: ''
  validation_file: ''
  test_file: ''
  task_type: SEQ_CLS
  label_name: ''
  # Two separate column names. Without the comma YAML reads
  # "sentence1 sentence2" as ONE plain scalar, i.e. a one-element list.
  text_column: [sentence1, sentence2]
  remove_columns: [sentence1, sentence2]
# mimic-dia entry: train and eval splits are read from the same directory,
# one CSV file name per split; data_dir is an empty string.
mimic-dia:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/dia
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/dia
  data_dir: ""
  training_file: DIA_GROUPS_3_DIGITS_adm_train.csv
  validation_file: DIA_GROUPS_3_DIGITS_adm_val.csv
  test_file: DIA_GROUPS_3_DIGITS_adm_test.csv
  task_type: SEQ_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# mimic-dia-adm-only entry: same split file names as the mimic-dia entry, but
# both directories point at the dia_adm_only folder.
mimic-dia-adm-only:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/dia_adm_only
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/dia_adm_only
  data_dir: ""
  training_file: DIA_GROUPS_3_DIGITS_adm_train.csv
  validation_file: DIA_GROUPS_3_DIGITS_adm_val.csv
  test_file: DIA_GROUPS_3_DIGITS_adm_test.csv
  task_type: SEQ_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# mimic-los entry: train and eval splits share the los directory; the label
# column is los_label.
mimic-los:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/los
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/los
  data_dir: ""
  training_file: train.csv
  validation_file: valid.csv
  # NOTE(review): the test file uses a different naming scheme from
  # train.csv / valid.csv above -- confirm this file exists in the los folder.
  test_file: LOS_WEEKS_adm_test.csv
  task_type: SEQ_CLS
  label_name: los_label
  text_column: text
  remove_columns:
    - text
# mimic-los-adm-only entry: both directories point at the los_adm_only
# folder, with one LOS_WEEKS_adm_* CSV per split.
mimic-los-adm-only:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/los_adm_only
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/los_adm_only
  data_dir: ""
  training_file: LOS_WEEKS_adm_train.csv
  validation_file: LOS_WEEKS_adm_val.csv
  test_file: LOS_WEEKS_adm_test.csv
  task_type: SEQ_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# mimic-mp entry: train and eval splits share the mp directory; the label
# column is hospital_expire_flag.
mimic-mp:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/mp
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/mimic3-clinical-outcomes/mp
  data_dir: ""
  training_file: train.csv
  validation_file: valid.csv
  test_file: test.csv
  task_type: SEQ_CLS
  label_name: hospital_expire_flag
  text_column: text
  remove_columns:
    - text
# ICD9-Triage entry: train and eval splits share the no_category_in_text
# directory; the label column is "label".
ICD9-Triage:
  training_data_dir: /mnt/sdd/efficient_ml_data/datasets/icd9-triage/no_category_in_text
  eval_data_dir: /mnt/sdd/efficient_ml_data/datasets/icd9-triage/no_category_in_text
  data_dir: ""
  training_file: train.csv
  validation_file: valid.csv
  test_file: test.csv
  task_type: SEQ_CLS
  label_name: label
  text_column: text
  # Two columns are listed for removal here, unlike the single-column entries.
  remove_columns:
    - text
    - triage-category
# i2b2-2010-NER entry: only data_dir is populated; the per-split directory
# and file fields are empty strings. task_type is TOKEN_CLS.
i2b2-2010-NER:
  training_data_dir: ""
  eval_data_dir: ""
  data_dir: /mnt/sdd/efficient_ml_data/datasets/I2B22010NER_hf_dataset
  training_file: ""
  validation_file: ""
  test_file: ""
  task_type: TOKEN_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# i2b2-2012-NER entry: only data_dir is populated; the per-split directory
# and file fields are empty strings. task_type is TOKEN_CLS.
i2b2-2012-NER:
  training_data_dir: ""
  eval_data_dir: ""
  data_dir: /mnt/sdd/efficient_ml_data/datasets/i2b2-2012_hf_dataset
  training_file: ""
  validation_file: ""
  test_file: ""
  task_type: TOKEN_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# i2b2-2014-NER entry: only data_dir is populated; the per-split directory
# and file fields are empty strings. task_type is TOKEN_CLS.
i2b2-2014-NER:
  training_data_dir: ""
  eval_data_dir: ""
  data_dir: /mnt/sdd/efficient_ml_data/datasets/i2b2-2014_hf_dataset
  training_file: ""
  validation_file: ""
  test_file: ""
  task_type: TOKEN_CLS
  # No label column is named for this entry.
  label_name: ""
  text_column: text
  remove_columns:
    - text
# i2b2-2010-RE entry: only data_dir is populated; the per-split directory
# and file fields are empty strings. task_type is SEQ_CLS.
i2b2-2010-RE:
  training_data_dir: ''
  eval_data_dir: ''
  data_dir: /mnt/sdd/efficient_ml_data/datasets/i2b2-2010-RE
  training_file: ''
  validation_file: ''
  test_file: ''
  task_type: SEQ_CLS
  # Explicit empty string: a bare `label_name:` parses as null, whereas the
  # other entries in this file that name no label use ''.
  label_name: ''
  text_column: text
  remove_columns: [text]