In [1]:
import pandas as pd

# Series

In [2]:
record1 = pd.Series({"Name": "Alex",
                    "Class": "Physics",
                    "Score": 85})
record1

Name        Alex
Class    Physics
Score         85
dtype: object

In [3]:
record2 = pd.Series({"Name": "John",
                    "Class": "Math",
                    "Score": 88})
record1

Name        Alex
Class    Physics
Score         85
dtype: object

In [4]:
df = pd.DataFrame([record1, record2], index = ['school1', 'school2'])
df

Unnamed: 0,Name,Class,Score
school1,Alex,Physics,85
school2,John,Math,88


In [5]:
df.head(1)

Unnamed: 0,Name,Class,Score
school1,Alex,Physics,85


In [6]:
type(df)

pandas.core.frame.DataFrame

# Comparing Series & Dataframe

In [7]:
import numpy as np
import matplotlib.pyplot as plt

In [8]:
s = pd.Series([1, 2, 3, 4, 5])
s

0    1
1    2
2    3
3    4
4    5
dtype: int64

In [9]:
pd.Series([30, 35, 40], index = ['2015 Sales', '2016 Sales', '2017 Sales'], name = 'Product A')

2015 Sales    30
2016 Sales    35
2017 Sales    40
Name: Product A, dtype: int64

In [10]:
df = pd.DataFrame({'High': [20, 10, 40, 23, 34],
                  'Low': [14, 18, 12, 19, 25]}, 
                 index = ['Austin', 'Los Angeles', 'Seattle', 'Nashville', 'Salt Lake City'])
df

Unnamed: 0,High,Low
Austin,20,14
Los Angeles,10,18
Seattle,40,12
Nashville,23,19
Salt Lake City,34,25


In [11]:
my_dict = {'a': 1, 'aa': 2}, {'b': 3}, {'c': 4}
my_dict

({'a': 1, 'aa': 2}, {'b': 3}, {'c': 4})

In [12]:
s = pd.Series(my_dict)
s

0    {'a': 1, 'aa': 2}
1             {'b': 3}
2             {'c': 4}
dtype: object

In [13]:
df = pd.DataFrame(my_dict)
df

Unnamed: 0,a,aa,b,c
0,1.0,2.0,,
1,,,3.0,
2,,,,4.0


# Read in TSLA Dataset

In [14]:
tsla = pd.read_csv('./TSLA.csv')
tsla

Unnamed: 0,Date,Open,High,Low,Close,Adj Close,Volume
0,2020-09-21,453.130005,455.679993,407.070007,449.390015,449.390015,109476800
1,2020-09-22,429.600006,437.760010,417.600006,424.230011,424.230011,79580800
2,2020-09-23,405.160004,412.149994,375.880005,380.359985,380.359985,95074200
3,2020-09-24,363.799988,399.500000,351.299988,387.790009,387.790009,96561100
4,2020-09-25,393.470001,408.730011,391.299988,407.339996,407.339996,67208500
...,...,...,...,...,...,...,...
247,2021-09-14,742.570007,754.469971,736.400024,744.489990,744.489990,18524900
248,2021-09-15,745.000000,756.859985,738.359985,755.830017,755.830017,15357700
249,2021-09-16,752.830017,758.909973,747.609985,756.989990,756.989990,13923400
250,2021-09-17,757.150024,761.039978,750.000000,759.489990,759.489990,28186100


In [15]:
tsla.head(10)

Unnamed: 0,Date,Open,High,Low,Close,Adj Close,Volume
0,2020-09-21,453.130005,455.679993,407.070007,449.390015,449.390015,109476800
1,2020-09-22,429.600006,437.76001,417.600006,424.230011,424.230011,79580800
2,2020-09-23,405.160004,412.149994,375.880005,380.359985,380.359985,95074200
3,2020-09-24,363.799988,399.5,351.299988,387.790009,387.790009,96561100
4,2020-09-25,393.470001,408.730011,391.299988,407.339996,407.339996,67208500
5,2020-09-28,424.619995,428.079987,415.549988,421.200012,421.200012,49719600
6,2020-09-29,416.0,428.5,411.600006,419.070007,419.070007,50219300
7,2020-09-30,421.320007,433.929993,420.470001,429.01001,429.01001,48145600
8,2020-10-01,440.76001,448.880005,434.420013,448.160004,448.160004,50741500
9,2020-10-02,421.390015,439.130005,415.0,415.089996,415.089996,71430000


In [16]:
column_names = tsla.columns
column_names
tsla.dtypes

Date          object
Open         float64
High         float64
Low          float64
Close        float64
Adj Close    float64
Volume         int64
dtype: object

# Index-Based Selection (iloc)

In [17]:
tsla.iloc[0]

Date         2020-09-21
Open         453.130005
High         455.679993
Low          407.070007
Close        449.390015
Adj Close    449.390015
Volume        109476800
Name: 0, dtype: object

In [18]:
# First row, second row, fourth row - first column
tsla.iloc[[0, 1, 3], 0]

0    2020-09-21
1    2020-09-22
3    2020-09-24
Name: Date, dtype: object

# Label-Based Selection (loc)

In [19]:
tsla.loc[0]['Close']

449.390015

In [20]:
tsla.set_index('Date', inplace = True)

In [21]:
tsla.loc['2020-09-21']['Close']

449.390015

In [22]:
tsla.loc['2020-09-21', 'Close']

449.390015

In [23]:
tsla.loc['2020-09-21', ['Close', 'High']]

Close    449.390015
High     455.679993
Name: 2020-09-21, dtype: float64

# Conditional Selection

In [24]:
bc = pd.read_csv("./bcwisconsin.csv", index_col = 0)
bc

Unnamed: 0_level_0,diagnosis,radius_mean,texture_mean,perimeter_mean,area_mean,smoothness_mean,compactness_mean,concavity_mean,concave points_mean,symmetry_mean,...,texture_worst,perimeter_worst,area_worst,smoothness_worst,compactness_worst,concavity_worst,concave points_worst,symmetry_worst,fractal_dimension_worst,Unnamed: 32
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
842302,M,17.99,10.38,122.80,1001.0,0.11840,0.27760,0.30010,0.14710,0.2419,...,17.33,184.60,2019.0,0.16220,0.66560,0.7119,0.2654,0.4601,0.11890,
842517,M,20.57,17.77,132.90,1326.0,0.08474,0.07864,0.08690,0.07017,0.1812,...,23.41,158.80,1956.0,0.12380,0.18660,0.2416,0.1860,0.2750,0.08902,
84300903,M,19.69,21.25,130.00,1203.0,0.10960,0.15990,0.19740,0.12790,0.2069,...,25.53,152.50,1709.0,0.14440,0.42450,0.4504,0.2430,0.3613,0.08758,
84348301,M,11.42,20.38,77.58,386.1,0.14250,0.28390,0.24140,0.10520,0.2597,...,26.50,98.87,567.7,0.20980,0.86630,0.6869,0.2575,0.6638,0.17300,
84358402,M,20.29,14.34,135.10,1297.0,0.10030,0.13280,0.19800,0.10430,0.1809,...,16.67,152.20,1575.0,0.13740,0.20500,0.4000,0.1625,0.2364,0.07678,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
926424,M,21.56,22.39,142.00,1479.0,0.11100,0.11590,0.24390,0.13890,0.1726,...,26.40,166.10,2027.0,0.14100,0.21130,0.4107,0.2216,0.2060,0.07115,
926682,M,20.13,28.25,131.20,1261.0,0.09780,0.10340,0.14400,0.09791,0.1752,...,38.25,155.00,1731.0,0.11660,0.19220,0.3215,0.1628,0.2572,0.06637,
926954,M,16.60,28.08,108.30,858.1,0.08455,0.10230,0.09251,0.05302,0.1590,...,34.12,126.70,1124.0,0.11390,0.30940,0.3403,0.1418,0.2218,0.07820,
927241,M,20.60,29.33,140.10,1265.0,0.11780,0.27700,0.35140,0.15200,0.2397,...,39.42,184.60,1821.0,0.16500,0.86810,0.9387,0.2650,0.4087,0.12400,


In [25]:
bc.area_mean >= 1300

id
842302      False
842517       True
84300903    False
84348301    False
84358402    False
            ...  
926424       True
926682      False
926954      False
927241      False
92751       False
Name: area_mean, Length: 569, dtype: bool

In [26]:
bc.loc[bc.area_mean >= 1300]

Unnamed: 0_level_0,diagnosis,radius_mean,texture_mean,perimeter_mean,area_mean,smoothness_mean,compactness_mean,concavity_mean,concave points_mean,symmetry_mean,...,texture_worst,perimeter_worst,area_worst,smoothness_worst,compactness_worst,concavity_worst,concave points_worst,symmetry_worst,fractal_dimension_worst,Unnamed: 32
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
842517,M,20.57,17.77,132.9,1326.0,0.08474,0.07864,0.0869,0.07017,0.1812,...,23.41,158.8,1956.0,0.1238,0.1866,0.2416,0.186,0.275,0.08902,
851509,M,21.16,23.04,137.2,1404.0,0.09428,0.1022,0.1097,0.08632,0.1769,...,35.59,188.0,2615.0,0.1401,0.26,0.3155,0.2009,0.2822,0.07526,
8611555,M,25.22,24.91,171.5,1878.0,0.1063,0.2665,0.3339,0.1845,0.1829,...,33.62,211.7,2562.0,0.1573,0.6076,0.6476,0.2867,0.2355,0.1051,
86355,M,22.27,19.67,152.8,1509.0,0.1326,0.2768,0.4264,0.1823,0.2556,...,28.01,206.8,2360.0,0.1701,0.6997,0.9608,0.291,0.4055,0.09789,
865423,M,24.25,20.2,166.2,1761.0,0.1447,0.2867,0.4268,0.2012,0.2655,...,23.99,180.9,2073.0,0.1696,0.4244,0.5803,0.2248,0.3222,0.08009,
8712289,M,23.27,22.04,152.1,1686.0,0.08439,0.1145,0.1324,0.09702,0.1801,...,28.22,184.2,2403.0,0.1228,0.3583,0.3948,0.2346,0.3589,0.09187,
873592,M,27.22,21.87,182.1,2250.0,0.1094,0.1914,0.2871,0.1878,0.18,...,32.85,220.8,3216.0,0.1472,0.4034,0.534,0.2688,0.2856,0.08082,
873593,M,21.09,26.57,142.7,1311.0,0.1141,0.2832,0.2487,0.1496,0.2395,...,33.48,176.5,2089.0,0.1491,0.7584,0.678,0.2903,0.4098,0.1284,
878796,M,23.29,26.67,158.9,1685.0,0.1141,0.2084,0.3523,0.162,0.22,...,32.68,177.0,1986.0,0.1536,0.4167,0.7892,0.2733,0.3198,0.08762,
8810703,M,28.11,18.47,188.5,2499.0,0.1142,0.1516,0.3201,0.1595,0.1648,...,18.47,188.5,2499.0,0.1142,0.1516,0.3201,0.1595,0.1648,0.05525,


In [27]:
bc.loc[(bc.perimeter_mean >= 150) & (bc.radius_mean >= 25)]

Unnamed: 0_level_0,diagnosis,radius_mean,texture_mean,perimeter_mean,area_mean,smoothness_mean,compactness_mean,concavity_mean,concave points_mean,symmetry_mean,...,texture_worst,perimeter_worst,area_worst,smoothness_worst,compactness_worst,concavity_worst,concave points_worst,symmetry_worst,fractal_dimension_worst,Unnamed: 32
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
8611555,M,25.22,24.91,171.5,1878.0,0.1063,0.2665,0.3339,0.1845,0.1829,...,33.62,211.7,2562.0,0.1573,0.6076,0.6476,0.2867,0.2355,0.1051,
873592,M,27.22,21.87,182.1,2250.0,0.1094,0.1914,0.2871,0.1878,0.18,...,32.85,220.8,3216.0,0.1472,0.4034,0.534,0.2688,0.2856,0.08082,
8810703,M,28.11,18.47,188.5,2499.0,0.1142,0.1516,0.3201,0.1595,0.1648,...,18.47,188.5,2499.0,0.1142,0.1516,0.3201,0.1595,0.1648,0.05525,
899987,M,25.73,17.46,174.2,2010.0,0.1149,0.2363,0.3368,0.1913,0.1956,...,23.58,229.3,3234.0,0.153,0.5937,0.6451,0.2756,0.369,0.08815,
911296202,M,27.42,26.27,186.9,2501.0,0.1084,0.1988,0.3635,0.1689,0.2061,...,31.37,251.2,4254.0,0.1357,0.4256,0.6833,0.2625,0.2641,0.07427,


In [28]:
bc.diagnosis[bc.diagnosis.isin(['M'])]

id
842302      M
842517      M
84300903    M
84348301    M
84358402    M
           ..
926125      M
926424      M
926682      M
926954      M
927241      M
Name: diagnosis, Length: 212, dtype: object

# Summary Functions

In [29]:
bc.symmetry_mean.describe()

count    569.000000
mean       0.181162
std        0.027414
min        0.106000
25%        0.161900
50%        0.179200
75%        0.195700
max        0.304000
Name: symmetry_mean, dtype: float64

In [30]:
bc.symmetry_mean.mean()

0.18116186291739894

In [31]:
bc.symmetry_mean.unique()

array([0.2419, 0.1812, 0.2069, 0.2597, 0.1809, 0.2087, 0.1794, 0.2196,
       0.235 , 0.203 , 0.1528, 0.1842, 0.2397, 0.1847, 0.2303, 0.1586,
       0.2164, 0.1582, 0.1885, 0.1967, 0.1815, 0.2521, 0.1769, 0.1995,
       0.304 , 0.2252, 0.1697, 0.1926, 0.1739, 0.2183, 0.2301, 0.2248,
       0.1853, 0.1998, 0.1896, 0.1467, 0.1565, 0.172 , 0.1784, 0.1895,
       0.231 , 0.1974, 0.1746, 0.1907, 0.2128, 0.1675, 0.1495, 0.1353,
       0.1868, 0.2092, 0.1616, 0.192 , 0.1917, 0.2027, 0.1819, 0.1683,
       0.2743, 0.1828, 0.1949, 0.2341, 0.1905, 0.1953, 0.1717, 0.1516,
       0.2111, 0.159 , 0.1902, 0.1927, 0.1662, 0.1798, 0.2403, 0.2152,
       0.2906, 0.1718, 0.1942, 0.1829, 0.1634, 0.2079, 0.2132, 0.2075,
       0.193 , 0.2116, 0.1685, 0.1386, 0.1638, 0.1855, 0.2095, 0.19  ,
       0.135 , 0.162 , 0.1879, 0.1609, 0.1945, 0.2217, 0.1925, 0.1801,
       0.1602, 0.2556, 0.1487, 0.1584, 0.1735, 0.1704, 0.1922, 0.1649,
       0.1688, 0.1305, 0.2157, 0.2096, 0.2129, 0.1667, 0.1966, 0.2655,
      

In [32]:
bc.symmetry_mean.value_counts()

symmetry_mean
0.1714    4
0.1769    4
0.1893    4
0.1601    4
0.1717    4
         ..
0.2251    1
0.2200    1
0.1979    1
0.1950    1
0.1587    1
Name: count, Length: 432, dtype: int64

# groupby

In [33]:
bc.groupby('diagnosis').radius_mean.max()

diagnosis
B    17.85
M    28.11
Name: radius_mean, dtype: float64

In [34]:
bc.groupby('area_mean').radius_mean.min()

area_mean
143.5      6.981
170.4      7.691
178.8      7.729
181.0      7.760
201.9      8.196
           ...  
1878.0    25.220
2010.0    25.730
2250.0    27.220
2499.0    28.110
2501.0    27.420
Name: radius_mean, Length: 539, dtype: float64

In [35]:
bc.groupby('diagnosis').symmetry_mean.agg([len, 'min', 'max'])

Unnamed: 0_level_0,len,min,max
diagnosis,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
B,357,0.106,0.2743
M,212,0.1308,0.304


In [36]:
bc.sort_values('diagnosis')

Unnamed: 0_level_0,diagnosis,radius_mean,texture_mean,perimeter_mean,area_mean,smoothness_mean,compactness_mean,concavity_mean,concave points_mean,symmetry_mean,...,texture_worst,perimeter_worst,area_worst,smoothness_worst,compactness_worst,concavity_worst,concave points_worst,symmetry_worst,fractal_dimension_worst,Unnamed: 32
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
8912284,B,12.89,15.70,84.08,516.6,0.07818,0.09580,0.11150,0.03390,0.1432,...,19.69,92.12,595.6,0.09926,0.2317,0.3344,0.10170,0.1999,0.07127,
9012568,B,15.19,13.21,97.65,711.8,0.07963,0.06934,0.03393,0.02657,0.1721,...,15.73,104.50,819.1,0.11260,0.1737,0.1362,0.08178,0.2487,0.06766,
9011495,B,12.21,18.02,78.31,458.4,0.09231,0.07175,0.04392,0.02027,0.1695,...,24.04,93.85,624.6,0.13680,0.2170,0.2413,0.08829,0.3218,0.07470,
9010877,B,13.40,16.95,85.48,552.4,0.07937,0.05696,0.02181,0.01473,0.1650,...,21.70,93.76,663.5,0.12130,0.1676,0.1364,0.06987,0.2741,0.07582,
9010872,B,16.50,18.29,106.60,838.1,0.09686,0.08468,0.05862,0.04835,0.1495,...,25.45,117.20,1009.0,0.13380,0.1679,0.1663,0.09123,0.2394,0.06469,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
869691,M,11.80,16.58,78.99,432.0,0.10910,0.17000,0.16590,0.07415,0.2678,...,26.38,91.93,591.7,0.13850,0.4092,0.4504,0.18650,0.5774,0.10300,
9013838,M,11.08,18.83,73.30,361.6,0.12160,0.21540,0.16890,0.06367,0.2196,...,32.82,91.76,508.1,0.21840,0.9379,0.8402,0.25240,0.4154,0.14030,
869104,M,16.11,18.05,105.10,813.0,0.09721,0.11370,0.09447,0.05943,0.1861,...,25.27,129.00,1233.0,0.13140,0.2236,0.2802,0.12160,0.2792,0.08158,
868826,M,14.95,17.57,96.85,678.1,0.11670,0.13050,0.15390,0.08624,0.1957,...,21.43,121.40,971.4,0.14110,0.2164,0.3355,0.16670,0.3414,0.07147,


In [37]:
bc.sort_values(by=['diagnosis', 'texture_mean'])

Unnamed: 0_level_0,diagnosis,radius_mean,texture_mean,perimeter_mean,area_mean,smoothness_mean,compactness_mean,concavity_mean,concave points_mean,symmetry_mean,...,texture_worst,perimeter_worst,area_worst,smoothness_worst,compactness_worst,concavity_worst,concave points_worst,symmetry_worst,fractal_dimension_worst,Unnamed: 32
id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
87127,B,10.80,9.71,68.77,357.6,0.09594,0.05736,0.02531,0.016980,0.1381,...,12.02,73.66,414.0,0.1436,0.1257,0.10470,0.04603,0.2090,0.07699,
893988,B,11.54,10.72,73.73,409.1,0.08597,0.05969,0.01367,0.008907,0.1833,...,12.87,81.23,467.8,0.1092,0.1626,0.08324,0.04715,0.3390,0.07434,
865137,B,11.41,10.82,73.34,403.3,0.09373,0.06685,0.03512,0.026230,0.1667,...,15.97,83.74,510.5,0.1548,0.2390,0.21020,0.08958,0.3016,0.08523,
865432,B,14.50,10.89,94.28,640.7,0.11010,0.10990,0.08842,0.057780,0.1856,...,15.98,102.80,745.5,0.1313,0.1788,0.25600,0.12210,0.2889,0.08006,
904647,B,11.93,10.91,76.14,442.7,0.08872,0.05242,0.02606,0.017960,0.1601,...,20.14,87.64,589.5,0.1374,0.1575,0.15140,0.06876,0.2460,0.07262,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
925622,M,15.22,30.62,103.40,716.9,0.10480,0.20870,0.25500,0.094290,0.2128,...,42.79,128.70,915.0,0.1417,0.7917,1.17000,0.23560,0.4089,0.14090,
88995002,M,20.73,31.12,135.70,1419.0,0.09469,0.11430,0.13670,0.086460,0.1769,...,47.16,214.00,3432.0,0.1401,0.2644,0.34420,0.16590,0.2868,0.08218,
88119002,M,19.53,32.47,128.00,1223.0,0.08420,0.11300,0.11450,0.066370,0.1428,...,45.41,180.20,2477.0,0.1408,0.4097,0.39950,0.16250,0.2713,0.07568,
88725602,M,15.53,33.56,103.70,744.9,0.10630,0.16390,0.17510,0.083990,0.2091,...,49.54,126.30,1035.0,0.1883,0.5564,0.57030,0.20140,0.3512,0.12040,


In [38]:
bc.diagnosis.dtype

dtype('O')

# Missing Values

In [39]:
bc.isna().sum()

diagnosis                    0
radius_mean                  0
texture_mean                 0
perimeter_mean               0
area_mean                    0
smoothness_mean              0
compactness_mean             0
concavity_mean               0
concave points_mean          0
symmetry_mean                0
fractal_dimension_mean       0
radius_se                    0
texture_se                   0
perimeter_se                 0
area_se                      0
smoothness_se                0
compactness_se               0
concavity_se                 0
concave points_se            0
symmetry_se                  0
fractal_dimension_se         0
radius_worst                 0
texture_worst                0
perimeter_worst              0
area_worst                   0
smoothness_worst             0
compactness_worst            0
concavity_worst              0
concave points_worst         0
symmetry_worst               0
fractal_dimension_worst      0
Unnamed: 32                569
dtype: i

In [40]:
# bc.dropna(axis=1, inplace=True)
# bc

In [41]:
bc.isna().sum().sum()

569

In [44]:
bc.fillna(0, inplace=True)
bc
bc.isna().sum().sum()

0