In [1]:
import pandas as pd
import numpy as np
import requests
from pandas_profiling import ProfileReport

In [2]:
response = requests.get("https://raw.githubusercontent.com/wcota/covid19br/master/cases-brazil-states.csv")
response

<Response [200]>

In [3]:
response = response.content.decode("utf-8")
result = [x.split(',') for x in response.split('\n')]
df = pd.DataFrame(result[1:], columns= result[0])

In [4]:
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 27259 entries, 0 to 27258
Data columns (total 26 columns):
 #   Column                                 Non-Null Count  Dtype 
---  ------                                 --------------  ----- 
 0   epi_week                               27259 non-null  object
 1   date                                   27258 non-null  object
 2   country                                27258 non-null  object
 3   state                                  27258 non-null  object
 4   city                                   27258 non-null  object
 5   newDeaths                              27258 non-null  object
 6   deaths                                 27258 non-null  object
 7   newCases                               27258 non-null  object
 8   totalCases                             27258 non-null  object
 9   deathsMS                               27258 non-null  object
 10  totalCasesMS                           27258 non-null  object
 11  deaths_per_100k

In [5]:
df

Unnamed: 0,epi_week,date,country,state,city,newDeaths,deaths,newCases,totalCases,deathsMS,...,tests,tests_per_100k_inhabitants,vaccinated,vaccinated_per_100_inhabitants,vaccinated_second,vaccinated_second_per_100_inhabitants,vaccinated_single,vaccinated_single_per_100_inhabitants,vaccinated_third,vaccinated_third_per_100_inhabitants
0,9,2020-02-25,Brazil,SP,TOTAL,0,0,1,1,0,...,,,,,,,,,,
1,9,2020-02-25,Brazil,TOTAL,TOTAL,0,0,1,1,0,...,,,,,,,,,,
2,9,2020-02-26,Brazil,SP,TOTAL,0,0,0,1,0,...,,,,,,,,,,
3,9,2020-02-26,Brazil,TOTAL,TOTAL,0,0,0,1,0,...,,,,,,,,,,
4,9,2020-02-27,Brazil,SP,TOTAL,0,0,0,1,0,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
27254,245,2022-11-10,Brazil,SE,TOTAL,0,6443,0,342918,6443,...,604183,26283.72782,1992913,86.69755,1834937,79.82513,42285,1.83952,1376006,59.86029
27255,245,2022-11-10,Brazil,SP,TOTAL,0,175673,0,6149751,175673,...,19501783,42469.91918,42751507,93.10190,40221220,87.59158,1280044,2.78761,27899204,60.75736
27256,245,2022-11-10,Brazil,TO,TOTAL,0,4206,0,344864,4206,...,903975,57473.10960,1167326,74.21649,1007278,64.04093,56219,3.57430,526358,33.46490
27257,245,2022-11-10,Brazil,TOTAL,TOTAL,0,688395,0,34855492,688395,...,70923215,33247.70297,181964720,85.30224,166908532,78.24413,5434803,2.54775,118811893,55.69717


> Apesar de aparentar não existirem valores nulos, percebemos que existem muitas células vazias na base de dados. Esses valores foram preenchidos por "0", por indicarem a ausência de casos.

## Data Cleaning

In [6]:
# Substituindo os valores vazios por Nan:
df = df.replace("", 0, regex=True)

In [7]:
#  Removendo colunas com valores constantes:
df.drop(["country", "city"], axis=1, inplace=True)
df = df[:-1]

In [8]:
# Transformando a coluna de data para o formato apropriado:
df["date"] = pd.to_datetime(df["date"], format="%Y-%m-%d")

In [9]:
# Como a maioria das colunas está em um formato numérico, vamos converter elas para float:
for column in df.columns:
    try:
        df[column] = df[column].astype(float)
    except:
        continue

In [10]:
df

Unnamed: 0,epi_week,date,state,newDeaths,deaths,newCases,totalCases,deathsMS,totalCasesMS,deaths_per_100k_inhabitants,...,tests,tests_per_100k_inhabitants,vaccinated,vaccinated_per_100_inhabitants,vaccinated_second,vaccinated_second_per_100_inhabitants,vaccinated_single,vaccinated_single_per_100_inhabitants,vaccinated_third,vaccinated_third_per_100_inhabitants
0,9.0,2020-02-25,SP,0.0,0.0,1.0,1.0,0.0,0.0,0.00000,...,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000
1,9.0,2020-02-25,TOTAL,0.0,0.0,1.0,1.0,0.0,0.0,0.00000,...,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000
2,9.0,2020-02-26,SP,0.0,0.0,0.0,1.0,0.0,1.0,0.00000,...,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000
3,9.0,2020-02-26,TOTAL,0.0,0.0,0.0,1.0,0.0,1.0,0.00000,...,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000
4,9.0,2020-02-27,SP,0.0,0.0,0.0,1.0,0.0,1.0,0.00000,...,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000,0.0,0.00000
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
27253,245.0,2022-11-10,SC,0.0,22413.0,0.0,1886824.0,22413.0,1886824.0,312.82154,...,2568392.0,35847.42493,6305426.0,88.00576,5789037.0,80.79844,277356.0,3.87110,3858826.0,53.85820
27254,245.0,2022-11-10,SE,0.0,6443.0,0.0,342918.0,6443.0,342918.0,280.28935,...,604183.0,26283.72782,1992913.0,86.69755,1834937.0,79.82513,42285.0,1.83952,1376006.0,59.86029
27255,245.0,2022-11-10,SP,0.0,175673.0,0.0,6149751.0,175673.0,6149751.0,382.57108,...,19501783.0,42469.91918,42751507.0,93.10190,40221220.0,87.59158,1280044.0,2.78761,27899204.0,60.75736
27256,245.0,2022-11-10,TO,0.0,4206.0,0.0,344864.0,4206.0,344864.0,267.40994,...,903975.0,57473.10960,1167326.0,74.21649,1007278.0,64.04093,56219.0,3.57430,526358.0,33.46490


In [11]:
df.epi_week.unique()

array([  9.,  10.,  11.,  12.,  13.,  14.,  15.,  16.,  17.,  18.,  19.,
        20.,  21.,  22.,  23.,  24.,  25.,  26.,  27.,  28.,  29.,  30.,
        31.,  32.,  33.,  34.,  35.,  36.,  37.,  38.,  39.,  40.,  41.,
        42.,  43.,  44.,  45.,  46.,  47.,  48.,  49.,  50.,  51.,  52.,
        53., 101., 102., 103., 104., 105., 106., 107., 108., 109., 110.,
       111., 112., 113., 114., 115., 116., 117., 118., 119., 120., 121.,
       122., 123., 124., 125., 126., 127., 128., 129., 130., 131., 132.,
       133., 134., 135., 136., 137., 138., 139., 140., 141., 142., 143.,
       144., 145., 146., 147., 148., 149., 150., 151., 152., 201., 202.,
       203., 204., 205., 206., 207., 208., 209., 210., 211., 212., 213.,
       214., 215., 216., 217., 218., 219., 220., 221., 222., 223., 224.,
       225., 226., 227., 228., 229., 230., 231., 232., 233., 234., 235.,
       236., 237., 238., 239., 240., 241., 242., 243., 244., 245.])

In [12]:
print(df.index, df["epi_week"])

RangeIndex(start=0, stop=27258, step=1) 0          9.0
1          9.0
2          9.0
3          9.0
4          9.0
         ...  
27253    245.0
27254    245.0
27255    245.0
27256    245.0
27257    245.0
Name: epi_week, Length: 27258, dtype: float64


In [13]:
for row in df.index:
    print((row, df["epi_week"][row]))



(0, 9.0)
(1, 9.0)
(2, 9.0)
(3, 9.0)
(4, 9.0)
(5, 9.0)
(6, 9.0)
(7, 9.0)
(8, 9.0)
(9, 9.0)
(10, 10.0)
(11, 10.0)
(12, 10.0)
(13, 10.0)
(14, 10.0)
(15, 10.0)
(16, 10.0)
(17, 10.0)
(18, 10.0)
(19, 10.0)
(20, 10.0)
(21, 10.0)
(22, 10.0)
(23, 10.0)
(24, 10.0)
(25, 10.0)
(26, 10.0)
(27, 10.0)
(28, 10.0)
(29, 10.0)
(30, 10.0)
(31, 10.0)
(32, 11.0)
(33, 11.0)
(34, 11.0)
(35, 11.0)
(36, 11.0)
(37, 11.0)
(38, 11.0)
(39, 11.0)
(40, 11.0)
(41, 11.0)
(42, 11.0)
(43, 11.0)
(44, 11.0)
(45, 11.0)
(46, 11.0)
(47, 11.0)
(48, 11.0)
(49, 11.0)
(50, 11.0)
(51, 11.0)
(52, 11.0)
(53, 11.0)
(54, 11.0)
(55, 11.0)
(56, 11.0)
(57, 11.0)
(58, 11.0)
(59, 11.0)
(60, 11.0)
(61, 11.0)
(62, 11.0)
(63, 11.0)
(64, 11.0)
(65, 11.0)
(66, 11.0)
(67, 11.0)
(68, 11.0)
(69, 11.0)
(70, 11.0)
(71, 11.0)
(72, 11.0)
(73, 11.0)
(74, 11.0)
(75, 11.0)
(76, 11.0)
(77, 11.0)
(78, 11.0)
(79, 11.0)
(80, 11.0)
(81, 11.0)
(82, 11.0)
(83, 11.0)
(84, 11.0)
(85, 11.0)
(86, 11.0)
(87, 11.0)
(88, 11.0)
(89, 11.0)
(90, 11.0)
(91, 11.0)
(92, 11.

(21404, 215.0)
(21405, 215.0)
(21406, 215.0)
(21407, 215.0)
(21408, 215.0)
(21409, 215.0)
(21410, 215.0)
(21411, 215.0)
(21412, 215.0)
(21413, 215.0)
(21414, 215.0)
(21415, 215.0)
(21416, 215.0)
(21417, 215.0)
(21418, 215.0)
(21419, 215.0)
(21420, 215.0)
(21421, 215.0)
(21422, 215.0)
(21423, 215.0)
(21424, 215.0)
(21425, 215.0)
(21426, 215.0)
(21427, 215.0)
(21428, 215.0)
(21429, 215.0)
(21430, 215.0)
(21431, 215.0)
(21432, 215.0)
(21433, 215.0)
(21434, 216.0)
(21435, 216.0)
(21436, 216.0)
(21437, 216.0)
(21438, 216.0)
(21439, 216.0)
(21440, 216.0)
(21441, 216.0)
(21442, 216.0)
(21443, 216.0)
(21444, 216.0)
(21445, 216.0)
(21446, 216.0)
(21447, 216.0)
(21448, 216.0)
(21449, 216.0)
(21450, 216.0)
(21451, 216.0)
(21452, 216.0)
(21453, 216.0)
(21454, 216.0)
(21455, 216.0)
(21456, 216.0)
(21457, 216.0)
(21458, 216.0)
(21459, 216.0)
(21460, 216.0)
(21461, 216.0)
(21462, 216.0)
(21463, 216.0)
(21464, 216.0)
(21465, 216.0)
(21466, 216.0)
(21467, 216.0)
(21468, 216.0)
(21469, 216.0)
(21470, 21

(22704, 222.0)
(22705, 222.0)
(22706, 222.0)
(22707, 222.0)
(22708, 222.0)
(22709, 222.0)
(22710, 222.0)
(22711, 222.0)
(22712, 222.0)
(22713, 222.0)
(22714, 222.0)
(22715, 222.0)
(22716, 222.0)
(22717, 222.0)
(22718, 222.0)
(22719, 222.0)
(22720, 222.0)
(22721, 222.0)
(22722, 222.0)
(22723, 222.0)
(22724, 222.0)
(22725, 222.0)
(22726, 222.0)
(22727, 222.0)
(22728, 222.0)
(22729, 222.0)
(22730, 222.0)
(22731, 222.0)
(22732, 222.0)
(22733, 222.0)
(22734, 222.0)
(22735, 222.0)
(22736, 222.0)
(22737, 222.0)
(22738, 222.0)
(22739, 222.0)
(22740, 222.0)
(22741, 222.0)
(22742, 222.0)
(22743, 222.0)
(22744, 222.0)
(22745, 222.0)
(22746, 222.0)
(22747, 222.0)
(22748, 222.0)
(22749, 222.0)
(22750, 222.0)
(22751, 222.0)
(22752, 222.0)
(22753, 222.0)
(22754, 222.0)
(22755, 222.0)
(22756, 222.0)
(22757, 222.0)
(22758, 222.0)
(22759, 222.0)
(22760, 222.0)
(22761, 222.0)
(22762, 222.0)
(22763, 222.0)
(22764, 222.0)
(22765, 222.0)
(22766, 222.0)
(22767, 222.0)
(22768, 222.0)
(22769, 222.0)
(22770, 22

In [14]:
for row in df.index:
    if df["epi_week"][row] > 200:
        df["epi_week"][row] = (df["epi_week"][row]-200+105)
    elif df["epi_week"][row] > 100:
        df["epi_week"][row] = (df["epi_week"][row]-100+53)
        
    print(row, df["epi_week"][row])
        

0 9.0
1 9.0
2 9.0
3 9.0
4 9.0
5 9.0
6 9.0
7 9.0
8 9.0
9 9.0
10 10.0
11 10.0
12 10.0
13 10.0
14 10.0
15 10.0
16 10.0
17 10.0
18 10.0
19 10.0
20 10.0
21 10.0
22 10.0
23 10.0
24 10.0
25 10.0
26 10.0
27 10.0
28 10.0
29 10.0
30 10.0
31 10.0
32 11.0
33 11.0
34 11.0
35 11.0
36 11.0
37 11.0
38 11.0
39 11.0
40 11.0
41 11.0
42 11.0
43 11.0
44 11.0
45 11.0
46 11.0
47 11.0
48 11.0
49 11.0
50 11.0
51 11.0
52 11.0
53 11.0
54 11.0
55 11.0
56 11.0
57 11.0
58 11.0
59 11.0
60 11.0
61 11.0
62 11.0
63 11.0
64 11.0
65 11.0
66 11.0
67 11.0
68 11.0
69 11.0
70 11.0
71 11.0
72 11.0
73 11.0
74 11.0
75 11.0
76 11.0
77 11.0
78 11.0
79 11.0
80 11.0
81 11.0
82 11.0
83 11.0
84 11.0
85 11.0
86 11.0
87 11.0
88 11.0
89 11.0
90 11.0
91 11.0
92 11.0
93 11.0
94 11.0
95 11.0
96 11.0
97 11.0
98 11.0
99 11.0
100 11.0
101 11.0
102 11.0
103 11.0
104 11.0
105 11.0
106 11.0
107 11.0
108 11.0
109 11.0
110 11.0
111 11.0
112 12.0
113 12.0
114 12.0
115 12.0
116 12.0
117 12.0
118 12.0
119 12.0
120 12.0
121 12.0
122 12.0
123 12.0
124 

6929 46.0
6930 47.0
6931 47.0
6932 47.0
6933 47.0
6934 47.0
6935 47.0
6936 47.0
6937 47.0
6938 47.0
6939 47.0
6940 47.0
6941 47.0
6942 47.0
6943 47.0
6944 47.0
6945 47.0
6946 47.0
6947 47.0
6948 47.0
6949 47.0
6950 47.0
6951 47.0
6952 47.0
6953 47.0
6954 47.0
6955 47.0
6956 47.0
6957 47.0
6958 47.0
6959 47.0
6960 47.0
6961 47.0
6962 47.0
6963 47.0
6964 47.0
6965 47.0
6966 47.0
6967 47.0
6968 47.0
6969 47.0
6970 47.0
6971 47.0
6972 47.0
6973 47.0
6974 47.0
6975 47.0
6976 47.0
6977 47.0
6978 47.0
6979 47.0
6980 47.0
6981 47.0
6982 47.0
6983 47.0
6984 47.0
6985 47.0
6986 47.0
6987 47.0
6988 47.0
6989 47.0
6990 47.0
6991 47.0
6992 47.0
6993 47.0
6994 47.0
6995 47.0
6996 47.0
6997 47.0
6998 47.0
6999 47.0
7000 47.0
7001 47.0
7002 47.0
7003 47.0
7004 47.0
7005 47.0
7006 47.0
7007 47.0
7008 47.0
7009 47.0
7010 47.0
7011 47.0
7012 47.0
7013 47.0
7014 47.0
7015 47.0
7016 47.0
7017 47.0
7018 47.0
7019 47.0
7020 47.0
7021 47.0
7022 47.0
7023 47.0
7024 47.0
7025 47.0
7026 47.0
7027 47.0
7028 47.0


8624 55.0
8625 55.0
8626 55.0
8627 55.0
8628 55.0
8629 55.0
8630 55.0
8631 55.0
8632 55.0
8633 55.0
8634 55.0
8635 55.0
8636 55.0
8637 55.0
8638 55.0
8639 55.0
8640 55.0
8641 55.0
8642 55.0
8643 55.0
8644 55.0
8645 55.0
8646 55.0
8647 55.0
8648 55.0
8649 55.0
8650 55.0
8651 55.0
8652 55.0
8653 55.0
8654 55.0
8655 55.0
8656 55.0
8657 55.0
8658 55.0
8659 55.0
8660 55.0
8661 55.0
8662 55.0
8663 55.0
8664 55.0
8665 55.0
8666 55.0
8667 55.0
8668 55.0
8669 55.0
8670 55.0
8671 55.0
8672 55.0
8673 55.0
8674 55.0
8675 55.0
8676 55.0
8677 55.0
8678 55.0
8679 55.0
8680 55.0
8681 55.0
8682 55.0
8683 55.0
8684 55.0
8685 55.0
8686 55.0
8687 55.0
8688 55.0
8689 55.0
8690 55.0
8691 55.0
8692 55.0
8693 55.0
8694 56.0
8695 56.0
8696 56.0
8697 56.0
8698 56.0
8699 56.0
8700 56.0
8701 56.0
8702 56.0
8703 56.0
8704 56.0
8705 56.0
8706 56.0
8707 56.0
8708 56.0
8709 56.0
8710 56.0
8711 56.0
8712 56.0
8713 56.0
8714 56.0
8715 56.0
8716 56.0
8717 56.0
8718 56.0
8719 56.0
8720 56.0
8721 56.0
8722 56.0
8723 56.0


A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["epi_week"][row] = (df["epi_week"][row]-100+53)


10245 63.0
10246 63.0
10247 63.0
10248 63.0
10249 63.0
10250 63.0
10251 63.0
10252 63.0
10253 63.0
10254 63.0
10255 63.0
10256 63.0
10257 63.0
10258 63.0
10259 63.0
10260 63.0
10261 63.0
10262 64.0
10263 64.0
10264 64.0
10265 64.0
10266 64.0
10267 64.0
10268 64.0
10269 64.0
10270 64.0
10271 64.0
10272 64.0
10273 64.0
10274 64.0
10275 64.0
10276 64.0
10277 64.0
10278 64.0
10279 64.0
10280 64.0
10281 64.0
10282 64.0
10283 64.0
10284 64.0
10285 64.0
10286 64.0
10287 64.0
10288 64.0
10289 64.0
10290 64.0
10291 64.0
10292 64.0
10293 64.0
10294 64.0
10295 64.0
10296 64.0
10297 64.0
10298 64.0
10299 64.0
10300 64.0
10301 64.0
10302 64.0
10303 64.0
10304 64.0
10305 64.0
10306 64.0
10307 64.0
10308 64.0
10309 64.0
10310 64.0
10311 64.0
10312 64.0
10313 64.0
10314 64.0
10315 64.0
10316 64.0
10317 64.0
10318 64.0
10319 64.0
10320 64.0
10321 64.0
10322 64.0
10323 64.0
10324 64.0
10325 64.0
10326 64.0
10327 64.0
10328 64.0
10329 64.0
10330 64.0
10331 64.0
10332 64.0
10333 64.0
10334 64.0
10335 64.0

12113 73.0
12114 73.0
12115 73.0
12116 73.0
12117 73.0
12118 73.0
12119 73.0
12120 73.0
12121 73.0
12122 73.0
12123 73.0
12124 73.0
12125 73.0
12126 73.0
12127 73.0
12128 73.0
12129 73.0
12130 73.0
12131 73.0
12132 73.0
12133 73.0
12134 73.0
12135 73.0
12136 73.0
12137 73.0
12138 73.0
12139 73.0
12140 73.0
12141 73.0
12142 73.0
12143 73.0
12144 73.0
12145 73.0
12146 73.0
12147 73.0
12148 73.0
12149 73.0
12150 73.0
12151 73.0
12152 73.0
12153 73.0
12154 73.0
12155 73.0
12156 73.0
12157 73.0
12158 73.0
12159 73.0
12160 73.0
12161 73.0
12162 73.0
12163 73.0
12164 73.0
12165 73.0
12166 73.0
12167 73.0
12168 73.0
12169 73.0
12170 73.0
12171 73.0
12172 73.0
12173 73.0
12174 73.0
12175 73.0
12176 73.0
12177 73.0
12178 73.0
12179 73.0
12180 73.0
12181 73.0
12182 73.0
12183 73.0
12184 73.0
12185 73.0
12186 73.0
12187 73.0
12188 73.0
12189 73.0
12190 73.0
12191 73.0
12192 73.0
12193 73.0
12194 73.0
12195 73.0
12196 73.0
12197 73.0
12198 73.0
12199 73.0
12200 73.0
12201 73.0
12202 73.0
12203 73.0

13616 81.0
13617 81.0
13618 81.0
13619 81.0
13620 81.0
13621 81.0
13622 81.0
13623 81.0
13624 81.0
13625 81.0
13626 81.0
13627 81.0
13628 81.0
13629 81.0
13630 81.0
13631 81.0
13632 81.0
13633 81.0
13634 81.0
13635 81.0
13636 81.0
13637 81.0
13638 81.0
13639 81.0
13640 81.0
13641 81.0
13642 81.0
13643 81.0
13644 81.0
13645 81.0
13646 81.0
13647 81.0
13648 81.0
13649 81.0
13650 81.0
13651 81.0
13652 81.0
13653 81.0
13654 81.0
13655 81.0
13656 81.0
13657 81.0
13658 81.0
13659 81.0
13660 81.0
13661 81.0
13662 81.0
13663 81.0
13664 81.0
13665 81.0
13666 81.0
13667 81.0
13668 81.0
13669 81.0
13670 81.0
13671 81.0
13672 81.0
13673 81.0
13674 81.0
13675 81.0
13676 81.0
13677 81.0
13678 81.0
13679 81.0
13680 81.0
13681 81.0
13682 81.0
13683 81.0
13684 81.0
13685 81.0
13686 81.0
13687 81.0
13688 81.0
13689 81.0
13690 81.0
13691 81.0
13692 81.0
13693 81.0
13694 81.0
13695 81.0
13696 81.0
13697 81.0
13698 81.0
13699 81.0
13700 81.0
13701 81.0
13702 81.0
13703 81.0
13704 81.0
13705 81.0
13706 81.0

14851 87.0
14852 87.0
14853 87.0
14854 87.0
14855 87.0
14856 87.0
14857 87.0
14858 87.0
14859 87.0
14860 87.0
14861 87.0
14862 87.0
14863 87.0
14864 87.0
14865 87.0
14866 87.0
14867 87.0
14868 87.0
14869 87.0
14870 87.0
14871 87.0
14872 87.0
14873 87.0
14874 87.0
14875 87.0
14876 87.0
14877 87.0
14878 87.0
14879 87.0
14880 87.0
14881 87.0
14882 87.0
14883 87.0
14884 87.0
14885 87.0
14886 87.0
14887 87.0
14888 87.0
14889 87.0
14890 87.0
14891 87.0
14892 87.0
14893 87.0
14894 87.0
14895 87.0
14896 87.0
14897 87.0
14898 87.0
14899 87.0
14900 87.0
14901 87.0
14902 87.0
14903 87.0
14904 87.0
14905 87.0
14906 87.0
14907 87.0
14908 87.0
14909 87.0
14910 87.0
14911 87.0
14912 87.0
14913 87.0
14914 87.0
14915 87.0
14916 87.0
14917 87.0
14918 87.0
14919 87.0
14920 87.0
14921 87.0
14922 87.0
14923 87.0
14924 87.0
14925 87.0
14926 87.0
14927 87.0
14928 87.0
14929 87.0
14930 87.0
14931 87.0
14932 87.0
14933 87.0
14934 87.0
14935 87.0
14936 87.0
14937 87.0
14938 87.0
14939 87.0
14940 87.0
14941 87.0

15658 91.0
15659 91.0
15660 91.0
15661 91.0
15662 91.0
15663 91.0
15664 91.0
15665 91.0
15666 91.0
15667 91.0
15668 91.0
15669 91.0
15670 91.0
15671 91.0
15672 91.0
15673 91.0
15674 91.0
15675 91.0
15676 91.0
15677 91.0
15678 91.0
15679 91.0
15680 91.0
15681 91.0
15682 91.0
15683 91.0
15684 91.0
15685 91.0
15686 91.0
15687 91.0
15688 91.0
15689 91.0
15690 91.0
15691 91.0
15692 91.0
15693 91.0
15694 91.0
15695 91.0
15696 91.0
15697 91.0
15698 91.0
15699 91.0
15700 91.0
15701 91.0
15702 91.0
15703 91.0
15704 91.0
15705 91.0
15706 91.0
15707 91.0
15708 91.0
15709 91.0
15710 91.0
15711 91.0
15712 91.0
15713 91.0
15714 91.0
15715 91.0
15716 91.0
15717 91.0
15718 91.0
15719 91.0
15720 91.0
15721 91.0
15722 91.0
15723 91.0
15724 91.0
15725 91.0
15726 91.0
15727 91.0
15728 91.0
15729 91.0
15730 91.0
15731 91.0
15732 91.0
15733 91.0
15734 91.0
15735 91.0
15736 91.0
15737 91.0
15738 91.0
15739 91.0
15740 91.0
15741 91.0
15742 91.0
15743 91.0
15744 91.0
15745 91.0
15746 91.0
15747 91.0
15748 91.0

16483 95.0
16484 95.0
16485 95.0
16486 95.0
16487 95.0
16488 95.0
16489 95.0
16490 95.0
16491 95.0
16492 95.0
16493 95.0
16494 95.0
16495 95.0
16496 95.0
16497 95.0
16498 95.0
16499 95.0
16500 95.0
16501 95.0
16502 95.0
16503 95.0
16504 95.0
16505 95.0
16506 95.0
16507 95.0
16508 95.0
16509 95.0
16510 95.0
16511 95.0
16512 95.0
16513 95.0
16514 95.0
16515 95.0
16516 95.0
16517 95.0
16518 95.0
16519 95.0
16520 95.0
16521 95.0
16522 95.0
16523 95.0
16524 95.0
16525 95.0
16526 95.0
16527 95.0
16528 95.0
16529 95.0
16530 95.0
16531 95.0
16532 95.0
16533 95.0
16534 96.0
16535 96.0
16536 96.0
16537 96.0
16538 96.0
16539 96.0
16540 96.0
16541 96.0
16542 96.0
16543 96.0
16544 96.0
16545 96.0
16546 96.0
16547 96.0
16548 96.0
16549 96.0
16550 96.0
16551 96.0
16552 96.0
16553 96.0
16554 96.0
16555 96.0
16556 96.0
16557 96.0
16558 96.0
16559 96.0
16560 96.0
16561 96.0
16562 96.0
16563 96.0
16564 96.0
16565 96.0
16566 96.0
16567 96.0
16568 96.0
16569 96.0
16570 96.0
16571 96.0
16572 96.0
16573 96.0

17678 101.0
17679 101.0
17680 101.0
17681 101.0
17682 101.0
17683 101.0
17684 101.0
17685 101.0
17686 101.0
17687 101.0
17688 101.0
17689 101.0
17690 101.0
17691 101.0
17692 101.0
17693 101.0
17694 101.0
17695 101.0
17696 101.0
17697 101.0
17698 101.0
17699 101.0
17700 101.0
17701 101.0
17702 101.0
17703 101.0
17704 101.0
17705 101.0
17706 101.0
17707 101.0
17708 101.0
17709 101.0
17710 102.0
17711 102.0
17712 102.0
17713 102.0
17714 102.0
17715 102.0
17716 102.0
17717 102.0
17718 102.0
17719 102.0
17720 102.0
17721 102.0
17722 102.0
17723 102.0
17724 102.0
17725 102.0
17726 102.0
17727 102.0
17728 102.0
17729 102.0
17730 102.0
17731 102.0
17732 102.0
17733 102.0
17734 102.0
17735 102.0
17736 102.0
17737 102.0
17738 102.0
17739 102.0
17740 102.0
17741 102.0
17742 102.0
17743 102.0
17744 102.0
17745 102.0
17746 102.0
17747 102.0
17748 102.0
17749 102.0
17750 102.0
17751 102.0
17752 102.0
17753 102.0
17754 102.0
17755 102.0
17756 102.0
17757 102.0
17758 102.0
17759 102.0
17760 102.0
1776

19470 110.0
19471 110.0
19472 110.0
19473 110.0
19474 111.0
19475 111.0
19476 111.0
19477 111.0
19478 111.0
19479 111.0
19480 111.0
19481 111.0
19482 111.0
19483 111.0
19484 111.0
19485 111.0
19486 111.0
19487 111.0
19488 111.0
19489 111.0
19490 111.0
19491 111.0
19492 111.0
19493 111.0
19494 111.0
19495 111.0
19496 111.0
19497 111.0
19498 111.0
19499 111.0
19500 111.0
19501 111.0
19502 111.0
19503 111.0
19504 111.0
19505 111.0
19506 111.0
19507 111.0
19508 111.0
19509 111.0
19510 111.0
19511 111.0
19512 111.0
19513 111.0
19514 111.0
19515 111.0
19516 111.0
19517 111.0
19518 111.0
19519 111.0
19520 111.0
19521 111.0
19522 111.0
19523 111.0
19524 111.0
19525 111.0
19526 111.0
19527 111.0
19528 111.0
19529 111.0
19530 111.0
19531 111.0
19532 111.0
19533 111.0
19534 111.0
19535 111.0
19536 111.0
19537 111.0
19538 111.0
19539 111.0
19540 111.0
19541 111.0
19542 111.0
19543 111.0
19544 111.0
19545 111.0
19546 111.0
19547 111.0
19548 111.0
19549 111.0
19550 111.0
19551 111.0
19552 111.0
1955

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["epi_week"][row] = (df["epi_week"][row]-200+105)


20653 117.0
20654 117.0
20655 117.0
20656 117.0
20657 117.0
20658 117.0
20659 117.0
20660 117.0
20661 117.0
20662 117.0
20663 117.0
20664 117.0
20665 117.0
20666 117.0
20667 117.0
20668 117.0
20669 117.0
20670 117.0
20671 117.0
20672 117.0
20673 117.0
20674 117.0
20675 117.0
20676 117.0
20677 117.0
20678 117.0
20679 117.0
20680 117.0
20681 117.0
20682 117.0
20683 117.0
20684 117.0
20685 117.0
20686 117.0
20687 117.0
20688 117.0
20689 117.0
20690 117.0
20691 117.0
20692 117.0
20693 117.0
20694 117.0
20695 117.0
20696 117.0
20697 117.0
20698 117.0
20699 117.0
20700 117.0
20701 117.0
20702 117.0
20703 117.0
20704 117.0
20705 117.0
20706 117.0
20707 117.0
20708 117.0
20709 117.0
20710 117.0
20711 117.0
20712 117.0
20713 117.0
20714 117.0
20715 117.0
20716 117.0
20717 117.0
20718 117.0
20719 117.0
20720 117.0
20721 117.0
20722 117.0
20723 117.0
20724 117.0
20725 117.0
20726 117.0
20727 117.0
20728 117.0
20729 117.0
20730 117.0
20731 117.0
20732 117.0
20733 117.0
20734 117.0
20735 117.0
2073

26942 149.0
26943 149.0
26944 149.0
26945 149.0
26946 149.0
26947 149.0
26948 149.0
26949 149.0
26950 149.0
26951 149.0
26952 149.0
26953 149.0
26954 149.0
26955 149.0
26956 149.0
26957 149.0
26958 149.0
26959 149.0
26960 149.0
26961 149.0
26962 149.0
26963 149.0
26964 149.0
26965 149.0
26966 149.0
26967 149.0
26968 149.0
26969 149.0
26970 149.0
26971 149.0
26972 149.0
26973 149.0
26974 149.0
26975 149.0
26976 149.0
26977 149.0
26978 149.0
26979 149.0
26980 149.0
26981 149.0
26982 149.0
26983 149.0
26984 149.0
26985 149.0
26986 149.0
26987 149.0
26988 149.0
26989 149.0
26990 149.0
26991 149.0
26992 149.0
26993 149.0
26994 149.0
26995 149.0
26996 149.0
26997 149.0
26998 149.0
26999 149.0
27000 149.0
27001 149.0
27002 149.0
27003 149.0
27004 149.0
27005 149.0
27006 149.0
27007 149.0
27008 149.0
27009 149.0
27010 149.0
27011 149.0
27012 149.0
27013 149.0
27014 149.0
27015 149.0
27016 149.0
27017 149.0
27018 149.0
27019 149.0
27020 149.0
27021 149.0
27022 149.0
27023 149.0
27024 149.0
2702

In [15]:
brazil = df.loc[df["state"]=="TOTAL"]

In [16]:
profile = ProfileReport(brazil.reset_index(drop=True), title="Relatório Covid Brasil", explorative = True)

In [17]:
#profile