In [None]:
import pandas as pd

**1. Loading the dataset**

In [None]:
# Read the Indian kids screen-time CSV into the DataFrame used by every later cell.
# NOTE(review): the /content/ path looks like a hosted-notebook upload location —
# adjust it when running elsewhere.
df = pd.read_csv(filepath_or_buffer=r"/content/Indian_Kids_Screen_Time.csv")

# Preview the first five rows (the default for head()) as plain text.
print(df.head(n=5))

   Age  Gender  Avg_Daily_Screen_Time_hr Primary_Device  \
0   14    Male                      3.99     Smartphone   
1   11  Female                      4.61         Laptop   
2   18  Female                      3.73             TV   
3   15  Female                      1.21         Laptop   
4   12  Female                      5.89     Smartphone   

   Exceeded_Recommended_Limit  Educational_to_Recreational_Ratio  \
0                        True                               0.42   
1                        True                               0.30   
2                        True                               0.32   
3                       False                               0.39   
4                        True                               0.49   

           Health_Impacts Urban_or_Rural  
0  Poor Sleep, Eye Strain          Urban  
1              Poor Sleep          Urban  
2              Poor Sleep          Urban  
3                     NaN          Urban  
4     Poor Sleep, Anx

**2. Check for null values**

In [None]:
# Count missing entries per column: isna() flags each missing cell and the
# column-wise sum (axis=0) turns those flags into one total per column.
print(df.isna().sum(axis=0))


Age                                     0
Gender                                  0
Avg_Daily_Screen_Time_hr                0
Primary_Device                          0
Exceeded_Recommended_Limit              0
Educational_to_Recreational_Ratio       0
Health_Impacts                       3218
Urban_or_Rural                          0
dtype: int64


**3. Check for duplicate values**

In [None]:
# Rows that repeat an earlier row in every column; the first occurrence of
# each repeated row is not counted (keep="first").
print(
    "Number of duplicate rows:",
    df.duplicated(keep="first").sum(),
)

# Column labels that repeat an earlier label.
print(
    "Number of duplicate columns:",
    df.columns.duplicated(keep="first").sum(),
)


Number of duplicate rows: 44
Number of duplicate columns: 0


**4. Check correlation**

In [None]:
# Pairwise Pearson correlation between the columns kept by numeric_only=True;
# text (object) columns are left out of the matrix.
print(df.corr(method="pearson", numeric_only=True))

                                        Age  Avg_Daily_Screen_Time_hr  \
Age                                1.000000                  0.118328   
Avg_Daily_Screen_Time_hr           0.118328                  1.000000   
Exceeded_Recommended_Limit         0.159173                  0.664950   
Educational_to_Recreational_Ratio -0.488617                 -0.087552   

                                   Exceeded_Recommended_Limit  \
Age                                                  0.159173   
Avg_Daily_Screen_Time_hr                             0.664950   
Exceeded_Recommended_Limit                           1.000000   
Educational_to_Recreational_Ratio                   -0.126643   

                                   Educational_to_Recreational_Ratio  
Age                                                        -0.488617  
Avg_Daily_Screen_Time_hr                                   -0.087552  
Exceeded_Recommended_Limit                                 -0.126643  
Educational_to_Recreatio

**5. Check the number of columns and rows**

In [None]:
# Report the size of the dataset: one entry in df.columns per column,
# and len(df) gives the number of rows.
print("Number of columns:", len(df.columns))
print("Number of rows:", len(df))

Number of columns: 8
Number of rows: 9712


**6. Check the data type of each column**

In [None]:
# Show the dtype pandas assigned to each column when the CSV was loaded.
print(df.dtypes)

Age                                    int64
Gender                                object
Avg_Daily_Screen_Time_hr             float64
Primary_Device                        object
Exceeded_Recommended_Limit              bool
Educational_to_Recreational_Ratio    float64
Health_Impacts                        object
Urban_or_Rural                        object
dtype: object


**7. Interquartile range (IQR) of numeric columns**

In [None]:
# For each int64/float64 column, report the first and third quartiles and the
# interquartile range (IQR = Q3 - Q1).
# Iterating over a DataFrame yields its column labels.
for col in df.select_dtypes(include=['int64', 'float64']):
    # A single quantile call returns both quartiles in the order requested.
    Q1, Q3 = df[col].quantile([0.25, 0.75]).to_numpy()
    IQR = Q3 - Q1
    # One print with a newline separator; the trailing "\n" on the last line
    # leaves a blank line between columns.
    print(
        f"Column: {col}",
        f"Q1 (25th percentile): {Q1}",
        f"Q3 (75th percentile): {Q3}",
        f"IQR: {IQR}\n",
        sep="\n",
    )

Column: Age
Q1 (25th percentile): 10.0
Q3 (75th percentile): 16.0
IQR: 6.0

Column: Avg_Daily_Screen_Time_hr
Q1 (25th percentile): 3.41
Q3 (75th percentile): 5.38
IQR: 1.9699999999999998

Column: Educational_to_Recreational_Ratio
Q1 (25th percentile): 0.37
Q3 (75th percentile): 0.48
IQR: 0.10999999999999999

