In [1]:
### Select All Rows for a Specific Column
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# 8x4 frame of random draws; rows are labelled 'a'..'h', columns 'A'..'D'
values = np.random.randn(8, 4)
df = pd.DataFrame(values, index=list('abcdefgh'), columns=list('ABCD'))

# A bare ':' in the row position keeps every row; 'A' picks one column,
# so the result is a Series named 'A'
column_a = df.loc[:, 'A']
print(column_a)

a    0.196259
b    1.434991
c   -0.004174
d   -0.374509
e    0.331503
f    0.483656
g    1.369615
h   -0.321272
Name: A, dtype: float64


In [2]:
### Select All Rows for Multiple Columns
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# 8x4 frame of random draws; rows are labelled 'a'..'h', columns 'A'..'D'
values = np.random.randn(8, 4)
df = pd.DataFrame(values, index=list('abcdefgh'), columns=list('ABCD'))

# Passing a list of column labels keeps every row and returns a DataFrame
# containing just those columns, in the order given
columns_a_c = df.loc[:, ['A', 'C']]
print(columns_a_c)

          A         C
a -0.181934  0.212624
b  0.403990  1.217080
c -0.750694 -0.424770
d  0.436291 -0.744339
e  0.204500  0.910286
f  0.009917 -1.171323
g  0.185161  0.592968
h -1.363985 -0.091439


In [3]:
### Select Specific Rows for Multiple Columns
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# 8x4 frame of random draws; rows are labelled 'a'..'h', columns 'A'..'D'
values = np.random.randn(8, 4)
df = pd.DataFrame(values, index=list('abcdefgh'), columns=list('ABCD'))

# Two label lists: the first names the rows to keep, the second the columns
wanted_rows = ['a', 'b', 'f', 'h']
wanted_columns = ['A', 'C']
print(df.loc[wanted_rows, wanted_columns])

          A         C
a  1.051824  0.883908
b -0.174819 -0.598584
f  0.022879  1.079548
h  0.025114  1.253147


In [4]:
### Select a Range of Rows for All Columns
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# 8x4 frame of random draws; rows are labelled 'a'..'h', columns 'A'..'D'
values = np.random.randn(8, 4)
df = pd.DataFrame(values, index=list('abcdefgh'), columns=list('ABCD'))

# Label slices with .loc include BOTH endpoints, so 'a':'h' spans all eight
# rows here; omitting the column selector keeps every column
rows_a_to_h = df.loc['a':'h']
print(rows_a_to_h)


          A         B         C         D
a  0.506918  2.362317 -0.654453  0.574913
b  0.827210  0.543290  0.135855 -0.677111
c -0.222821 -0.181891 -0.176565  2.019095
d -0.780202 -0.117181  0.865895 -0.901596
e -1.013491 -0.377970  0.760280 -0.740760
f -1.733604  0.530876 -0.546408  1.147406
g  0.389700 -0.360376 -1.599787  0.085662
h  1.289178 -0.857156  0.504773 -1.087564


In [5]:
### Use Boolean Array for Selection
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# 8x4 frame of random draws; rows are labelled 'a'..'h', columns 'A'..'D'
values = np.random.randn(8, 4)
df = pd.DataFrame(values, index=list('abcdefgh'), columns=list('ABCD'))

# Compare every value in row 'a' with 0. The result is a boolean Series
# indexed by column label (True where the value is positive).
# NOTE: this only builds and prints the mask; it does not filter df.
# The mask could then be used as a selector, e.g. df.loc[:, mask].
row_a = df.loc['a']
is_positive = row_a > 0
print(is_positive)

A    False
B    False
C     True
D    False
Name: a, dtype: bool


In [7]:
### Select First Four Rows
# Load pandas under its conventional alias pd (and NumPy as np)
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Positional slice: .iloc[:4] takes positions 0, 1, 2 and 3 (stop is excluded)
first_four = df.iloc[:4]
print(first_four)

          A         B         C         D
0  0.214596 -0.523092 -0.543191 -1.022958
1 -0.091368 -0.016128  0.713424 -1.713760
2  1.103907 -0.368438 -0.169606 -0.610596
3  1.149771 -0.190553  0.567994 -1.037220


In [8]:
### Perform Integer Slicing
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Rows at positions 0..3, every column
first_four = df.iloc[:4]
print(first_four)

# Rows at positions 1..4 crossed with columns at positions 2..3 ('C', 'D');
# positional slices exclude the stop value
inner_block = df.iloc[1:5, 2:4]
print(inner_block)

          A         B         C         D
0  0.431874 -1.425459 -0.917371  0.205127
1  1.167831  0.074489 -0.965210  0.019236
2 -0.257922  0.089826 -0.782447  0.369651
3  0.091757  0.541240 -0.337417 -0.755581
          C         D
1 -0.965210  0.019236
2 -0.782447  0.369651
3 -0.337417 -0.755581
4  1.614886 -1.186342


In [9]:
### Slice Through List of Values
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Explicit position lists: rows 1, 3, 5 and columns 1, 3 ('B', 'D')
picked_rows = [1, 3, 5]
picked_columns = [1, 3]
print(df.iloc[picked_rows, picked_columns])

# Rows at positions 1..2, every column
print(df.iloc[1:3, :])

# Every row, columns at positions 1..2 ('B', 'C')
print(df.iloc[:, 1:3])

          B         D
1 -0.823307  0.865853
3  0.953122  0.201618
5 -0.003606  0.923255
          A         B         C         D
1 -0.206535 -0.823307  1.315921  0.865853
2 -0.866460  0.579018  1.332218  0.249021
          B         C
0  2.252716 -0.663053
1 -0.823307  1.315921
2  0.579018  1.332218
3  0.953122 -1.853312
4  1.365082  0.757751
5 -0.003606 -0.385228
6 -0.589695 -1.212084
7  0.687448  0.743236


In [None]:
### Use of Notations
### Select a Single Column
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Bracket notation with a single label returns that column as a Series
column_a = df['A']
print(column_a)

0    0.682317
1   -0.128628
2   -1.055731
3    1.738396
4   -0.477582
5   -0.134324
6   -1.431104
7    0.513190
Name: A, dtype: float64


In [11]:
### Select Multiple Columns
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Bracket notation with a list of labels returns a DataFrame of those columns
columns_a_b = df[['A', 'B']]
print(columns_a_b)

          A         B
0 -0.415283 -0.967988
1  0.362871  0.725250
2 -0.805102  0.397980
3 -0.092607  0.013380
4  0.191090 -0.140240
5 -0.434819 -0.642901
6 -0.345689 -0.102643
7 -0.722529  1.211096


In [12]:
### Select Rows Using Range
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# A slice inside plain brackets selects ROWS. The slice 2:2 is valid but
# empty: start equals stop and the stop is excluded, so no rows match and an
# empty DataFrame (columns preserved) is printed. Use e.g. df[2:4] to get
# rows 2 and 3.
no_rows = df[2:2]
print(no_rows)

Empty DataFrame
Columns: [A, B, C, D]
Index: []


In [13]:
###  Attribute Access
import pandas as pd
import numpy as np

# No index is supplied, so rows get the default integer labels 0..7
values = np.random.randn(8, 4)
df = pd.DataFrame(values, columns=list('ABCD'))

# Dot notation reads column 'A' as if it were an attribute of the frame.
# Per the pandas docs this shortcut only works when the column name is a
# valid Python identifier that does not collide with an existing DataFrame
# attribute or method; df['A'] is the general form.
column_a = df.A
print(column_a)

0   -1.214911
1   -1.695665
2   -0.331709
3   -1.946075
4    0.179899
5   -0.382293
6    1.526396
7    0.083577
Name: A, dtype: float64
