-
Notifications
You must be signed in to change notification settings - Fork 0
/
report.py
80 lines (61 loc) · 6.14 KB
/
report.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
data = pd.read_csv("output/input_paired.csv")
data_symptom = data[["colorectal_symptom_1_date_symp_date", "colorectal_symptom_2_date_symp_date", "colorectal_symptom_3_date_symp_date", "colorectal_symptom_4_date_symp_date", "colorectal_symptom_5_date_symp_date", "colorectal_symptom_6_date_symp_date", "colorectal_symptom_7_date_symp_date", "colorectal_symptom_8_date_symp_date", "colorectal_symptom_9_date_symp_date", "colorectal_symptom_10_date_symp_date"]]
data_referral = data[["colorectal_symptom_1_date_ref_date", "colorectal_symptom_2_date_ref_date", "colorectal_symptom_3_date_ref_date", "colorectal_symptom_4_date_ref_date", "colorectal_symptom_5_date_ref_date", "colorectal_symptom_6_date_ref_date", "colorectal_symptom_7_date_ref_date", "colorectal_symptom_8_date_ref_date", "colorectal_symptom_9_date_ref_date", "colorectal_symptom_10_date_ref_date"]]
num_symptoms = data_symptom.count(axis=1)
plt.hist(num_symptoms.values.tolist(), bins=10)
plt.savefig('output/colorectal_cancer.jpg')
plt.clf()
data_symptom['colorectal_symptom_1_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_1_date_symp_date'])
data_symptom['colorectal_symptom_2_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_2_date_symp_date'])
data_symptom['colorectal_symptom_3_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_3_date_symp_date'])
data_symptom['colorectal_symptom_4_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_4_date_symp_date'])
data_symptom['colorectal_symptom_5_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_5_date_symp_date'])
data_symptom['colorectal_symptom_6_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_6_date_symp_date'])
data_symptom['colorectal_symptom_7_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_7_date_symp_date'])
data_symptom['colorectal_symptom_8_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_8_date_symp_date'])
data_symptom['colorectal_symptom_9_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_9_date_symp_date'])
data_symptom['colorectal_symptom_10_date_symp_date'] = pd.to_datetime(data_symptom['colorectal_symptom_10_date_symp_date'])
data_month_year_1 = data_symptom['colorectal_symptom_1_date_symp_date'].dt.to_period('M')
data_month_year_2 = data_symptom['colorectal_symptom_2_date_symp_date'].dt.to_period('M')
data_month_year_3 = data_symptom['colorectal_symptom_3_date_symp_date'].dt.to_period('M')
data_month_year_4 = data_symptom['colorectal_symptom_4_date_symp_date'].dt.to_period('M')
data_month_year_5 = data_symptom['colorectal_symptom_5_date_symp_date'].dt.to_period('M')
data_month_year_6 = data_symptom['colorectal_symptom_6_date_symp_date'].dt.to_period('M')
data_month_year_7 = data_symptom['colorectal_symptom_7_date_symp_date'].dt.to_period('M')
data_month_year_8 = data_symptom['colorectal_symptom_8_date_symp_date'].dt.to_period('M')
data_month_year_9 = data_symptom['colorectal_symptom_9_date_symp_date'].dt.to_period('M')
data_month_year_10 = data_symptom['colorectal_symptom_10_date_symp_date'].dt.to_period('M')
data_month_year = pd.concat([data_month_year_1, data_month_year_2, data_month_year_3, data_month_year_4, data_month_year_5, data_month_year_6, data_month_year_7, data_month_year_8, data_month_year_9, data_month_year_10], axis=1)
counts = data_month_year.stack().value_counts()
counts = counts.sort_index()
ax = counts.plot.bar()
plt.savefig('output/colorectal_cancer_2.jpg')
plt.clf()
data_referral['colorectal_symptom_1_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_1_date_ref_date'])
data_referral['colorectal_symptom_2_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_2_date_ref_date'])
data_referral['colorectal_symptom_3_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_3_date_ref_date'])
data_referral['colorectal_symptom_4_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_4_date_ref_date'])
data_referral['colorectal_symptom_5_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_5_date_ref_date'])
data_referral['colorectal_symptom_6_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_6_date_ref_date'])
data_referral['colorectal_symptom_7_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_7_date_ref_date'])
data_referral['colorectal_symptom_8_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_8_date_ref_date'])
data_referral['colorectal_symptom_9_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_9_date_ref_date'])
data_referral['colorectal_symptom_10_date_ref_date'] = pd.to_datetime(data_referral['colorectal_symptom_10_date_ref_date'])
data_ref_month_year_1 = data_referral['colorectal_symptom_1_date_ref_date'].dt.to_period('M')
data_ref_month_year_2 = data_referral['colorectal_symptom_2_date_ref_date'].dt.to_period('M')
data_ref_month_year_3 = data_referral['colorectal_symptom_3_date_ref_date'].dt.to_period('M')
data_ref_month_year_4 = data_referral['colorectal_symptom_4_date_ref_date'].dt.to_period('M')
data_ref_month_year_5 = data_referral['colorectal_symptom_5_date_ref_date'].dt.to_period('M')
data_ref_month_year_6 = data_referral['colorectal_symptom_6_date_ref_date'].dt.to_period('M')
data_ref_month_year_7 = data_referral['colorectal_symptom_7_date_ref_date'].dt.to_period('M')
data_ref_month_year_8 = data_referral['colorectal_symptom_8_date_ref_date'].dt.to_period('M')
data_ref_month_year_9 = data_referral['colorectal_symptom_9_date_ref_date'].dt.to_period('M')
data_ref_month_year_10 = data_referral['colorectal_symptom_10_date_ref_date'].dt.to_period('M')
data_ref_month_year = pd.concat([data_ref_month_year_1, data_ref_month_year_2, data_ref_month_year_3, data_ref_month_year_4, data_ref_month_year_5, data_ref_month_year_6, data_ref_month_year_7, data_ref_month_year_8, data_ref_month_year_9, data_ref_month_year_10], axis=1)
counts_ref = data_ref_month_year.stack().value_counts()
counts_ref = counts_ref.sort_index()
ax = counts_ref.plot.bar()
plt.savefig('output/colorectal_cancer_3.jpg')