# Topic: Climate-Resilient Farming Practice

In [1]:
# Import libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

In [4]:
# Import Argricultural Survey data
raw_data = pd.read_csv('C:/Users/DONKAMS/Downloads/Hamoye-Premier-Project/Dataset/data.csv', low_memory=False)
pd.set_option('display.max_columns', None)
raw_data.head

<bound method NDFrame.head of       Unnamed: 0     hhcode  gender1  gender2  gender3  gender4  gender5  \
0              0   10010601      1.0      2.0      1.0      1.0      2.0   
1              1   10010602      1.0      2.0      1.0      1.0      1.0   
2              2   10010603      2.0      1.0      2.0      2.0      2.0   
3              3   10010604      2.0      2.0      2.0      1.0      1.0   
4              4   10010605      1.0      2.0      1.0      1.0      1.0   
...          ...        ...      ...      ...      ...      ...      ...   
9592        9592  100090113      1.0      2.0      2.0      1.0      1.0   
9593        9593  100090114      1.0      2.0      2.0      2.0      1.0   
9594        9594  100090115      1.0      2.0      1.0      2.0      2.0   
9595        9595  100090116      1.0      2.0      2.0      1.0      2.0   
9596        9596  100090117      1.0      1.0      1.0      2.0      2.0   

      gender6  gender7  gender8  age1  age2  age3  age4  

In [5]:
# Store names of columns externally to select needed columns
with open('columns.txt', 'w') as file:
    for item in raw_data.columns:
        file.write('%s\n' % item)

In [6]:
# Open the txt file in read mode
with open('columns_needed.txt', 'r') as file:
    # Read lines from the file and create a list
    columns_needed = [column.strip() for column in file.readlines()]
# Print the list of columns needed    
print(columns_needed)

['farmtype', 'fplots', 'fplotarea1', 'fplotarea2', 'fplotarea3', 'plotunits', 'fsystem1', 'fsystem2', 'fsystem3', 'fsystem4', 'tenure1', 'tenure2', 'tenure3', 'tenure4', 'yearsuse1', 'yearsuse2', 'yearsuse3', 'yearsuse4', 'rentplot1', 'rentplot2', 'rentplot3', 'rentplot4', 'farmbuyv', 'farmsalev', 'season1s', 'season1e', 'season2s', 'season2e', 'season3s', 'season3e', 'seas1nam', 'seas2nam', 'seas3nam', 's1p1c1', 's1p1c1plant', 's1p1c1harv', 's1p1c1area', 's1p1c1qharv', 's1p1c1cons', 's1p1c1lives', 's1p1c1lost', 's1p1c1mkt', 's1p1c1sold', 's1p1c1cval', 's1p1c1seed', 's1p1c1sval', 's1p1c2', 's1p1c2plant', 's1p1c2harv', 's1p1c2area', 's1p1c2qharv', 's1p1c2cons', 's1p1c2lives', 's1p1c2lost', 's1p1c2mkt', 's1p1c2sold', 's1p1c2cval', 's1p1c2seed', 's1p1c2sval', 's1p1c3', 's1p1c3plant', 's1p1c3harv', 's1p1c3area', 's1p1c3qharv', 's1p1c3cons', 's1p1c3lives', 's1p1c3lost', 's1p1c3mkt', 's1p1c3sold', 's1p1c3cval', 's1p1c3seed', 's1p1c3sval', 's1p1c4', 's1p1c4plant', 's1p1c4harv', 's1p1c4area', 

In [7]:
# Filter raw data to contain columns needed
filtered_data = raw_data[columns_needed]
# Print filtered_data
print(filtered_data)

      farmtype  fplots  fplotarea1  fplotarea2  fplotarea3 plotunits  \
0          2.0     1.0         5.0        0.00         0.0        HA   
1          2.0     1.0         5.0        3.00         0.0        HA   
2          2.0     1.0         3.0        4.00         0.0        HA   
3          1.0     1.0         1.0        0.50         0.0        HA   
4          2.0     1.0         5.0        1.75         0.0        HA   
...        ...     ...         ...         ...         ...       ...   
9592       2.0     1.0         3.0        0.00         0.0        HA   
9593       2.0     1.0         3.0        0.00         0.0        HA   
9594       2.0     1.0         1.0        0.00         0.0        HA   
9595       1.0     1.0         1.0        0.00         0.0        HA   
9596       2.0     1.0         2.0        0.00         0.0        HA   

      fsystem1  fsystem2  fsystem3  fsystem4  tenure1  tenure2  tenure3  \
0          2.0       NaN       NaN       NaN      1.0      N

In [8]:
# Calculate sum of missing data in each column
filtered_data.isna().sum()

farmtype                 109
fplots                    29
fplotarea1                 0
fplotarea2                 0
fplotarea3                 0
                        ... 
adjtempshifts2_1        9554
adjtempshifts3_1        9586
adjrainfallshifts1_1    8938
adjrainfallshifts2_1    9535
adjrainfallshifts3_1    9580
Length: 823, dtype: int64

In [9]:
# Calculate the percentage of NaN values in each column
na_percentage = (filtered_data.isna().mean() * 100)

# Drop columns with more than 80% NaN values
columns_to_drop = na_percentage[na_percentage > 80].index
filtered_data = filtered_data.drop(columns=columns_to_drop)

# Store data of columns droped
with open('columns_droped.txt', 'w') as file:
    for item in columns_to_drop:
        file.write('%s\n' % item)
        
print(filtered_data.info())

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 9597 entries, 0 to 9596
Columns: 636 entries, farmtype to ad7625
dtypes: float64(519), object(117)
memory usage: 46.6+ MB
None


In [10]:
# Calculate threshold for no of na values in each row, 80%
threshold = 0.8 * len(filtered_data.columns)

# Number of rows to be dropped
dropped_indices = filtered_data.index[filtered_data.isnull().sum(axis=1) > threshold].tolist()
print(len(dropped_indices))

# Drop rows with more than 80% NaN values
filtered_data = filtered_data.dropna(thresh=threshold)

273


In [11]:
filtered_data.describe()

Unnamed: 0,farmtype,fplots,fplotarea1,fplotarea2,fplotarea3,fsystem1,fsystem2,tenure1,tenure2,yearsuse1,yearsuse2,rentplot1,rentplot2,farmbuyv,farmsalev,s1p1c1,s1p1c1area,s1p1c1qharv,s1p1c1cons,s1p1c1lives,s1p1c1lost,s1p1c1mkt,s1p1c1sold,s1p1c1cval,s1p1c2,s1p1c2area,s1p1c2qharv,s1p1c2cons,s1p1c2lives,s1p1c2lost,s1p1c2mkt,s1p1c2sold,s1p1c2cval,s1p1c3,s1p1c3area,s1p1c3qharv,s1p1c3cons,s1p1c3lives,s1p1c3lost,s1p1c3mkt,s1p1c3sold,s1p1c4,s1p1c4area,s1p1c4qharv,s1p1c4cons,s1p1c4lives,s1p1c4lost,s1p1c4mkt,s1p1c4sold,s1p1c5qharv,s1p1c5cons,s1p1c5lives,s1p1c5lost,s1p1c5mkt,s1p1c5sold,s1p1c6qharv,s1p1c6cons,s1p1c6lives,s1p1c6lost,s1p1c6mkt,s1p1c6sold,s1p2c1,s1p2c1qharv,s1p2c1cons,s1p2c1lives,s1p2c1lost,s1p2c1mkt,s1p2c1sold,s1p2c2qharv,s1p2c2cons,s1p2c2lives,s1p2c2lost,s1p2c2mkt,s1p2c2sold,s1p2c3qharv,s1p2c3cons,s1p2c3lives,s1p2c3lost,s1p2c3mkt,s1p2c3sold,s1p2c3seed,s1p2c3sval,s1p2c4qharv,s1p2c4cons,s1p2c4lives,s1p2c4lost,s1p2c4mkt,s1p2c4sold,s1p2c4seed,s1p2c4sval,s1p2c5qharv,s1p2c5cons,s1p2c5lives,s1p2c5lost,s1p2c5mkt,s1p2c5sold,s1p2c5seed,s1p2c5sval,s1p2c6qharv,s1p2c6cons,s1p2c6lives,s1p2c6lost,s1p2c6mkt,s1p2c6sold,s1p2c6seed,s1p2c6sval,s2p1c1,s2p1c1area,s2p1c1qharv,s2p1c1cons,s2p1c1lives,s2p1c1lost,s2p1c1mkt,s2p1c1sold,s2p1c2,s2p1c2area,s2p1c2qharv,s2p1c2cons,s2p1c2lives,s2p1c2lost,s2p1c2mkt,s2p1c2sold,s2p1c3qharv,s2p1c3cons,s2p1c3lives,s2p1c3lost,s2p1c3mkt,s2p1c3sold,s2p1c4qharv,s2p1c4cons,s2p1c4lives,s2p1c4lost,s2p1c4mkt,s2p1c4sold,s2p1c5qharv,s2p1c5cons,s2p1c5lives,s2p1c5lost,s2p1c5mkt,s2p1c5sold,s2p1c5seed,s2p1c5sval,s2p1c6qharv,s2p1c6cons,s2p1c6lives,s2p1c6lost,s2p1c6mkt,s2p1c6sold,s2p1c6seed,s2p1c6sval,s2p2c1qharv,s2p2c1cons,s2p2c1lives,s2p2c1lost,s2p2c1mkt,s2p2c1sold,s2p2c2qharv,s2p2c2cons,s2p2c2lives,s2p2c2lost,s2p2c2mkt,s2p2c2sold,s2p2c3qharv,s2p2c3cons,s2p2c3lives,s2p2c3lost,s2p2c3mkt,s2p2c3sold,s2p2c3seed,s2p2c3sval,s2p2c4qharv,s2p2c4cons,s2p2c4lives,s2p2c4lost,s2p2c4mkt,s2p2c4sold,s2p2c4seed,s2p2c4sval,s2p2c5qharv,s2p2c5cons,s2p2c5lives,s2p2c5lost,s2p2c5mkt,s2p2c5sold,s2p2c5seed,s2p2c5sval,s2p2c6qharv,s2p2c6cons,s2p2c6lives,s2p2c6lost,s2p2c6mkt,s2p2c6sold,s2p2c6seed,s2p2c6sval,s3p1c1qharv,s3p1c1cons,s3p1c1mkt,s3p1c1sold,s3p1c2qharv,s3p1c2cons,s3p1c2mkt,s3p1c2sold,s3p1c3mkt,s3p1c3seed,s3p1c3sval,s3p1c4mkt,s3p1c4sval,s3p1c5mkt,s3p1c6mkt,s3p2c1mkt,s3p2c2mkt,s3p2c2seed,s3p2c3mkt,s3p2c4plant,s3p2c4mkt,s3p2c5mkt,s3p2c6plant,s3p2c6harv,s3p2c6mkt,pc1,pc2,pc3,pc4,pc5,nyieldc1,nyieldc2,nyieldc3,nyieldc4,nyieldc5,s1p1fert,s1p1irrig1,s1p1irrig2,s1p1irrig3,s1p1irrig4,s1p1pest,s1p1wat1,s1p1wat2,s1p1wat3,s1p1wat4,s1p1wat5,s1p2fert,s1p2irrig1,s1p2irrig2,s1p2irrig3,s1p2irrig4,s1p2pest,s1p2wat1,s1p2wat2,s1p2wat3,s1p2wat4,s1p2wat5,s2p1fert,s2p1irrig1,s2p1irrig2,s2p1irrig3,s2p1irrig4,s2p1pest,s2p1wat1,s2p1wat2,s2p1wat3,s2p1wat4,s2p1wat5,s2p2fert,s2p2irrig1,s2p2irrig2,s2p2irrig3,s2p2irrig4,s2p2pest,s2p2wat1,s2p2wat2,s2p2wat3,s2p2wat4,s2p2wat5,s3p1fert,s3p1irrig1,s3p1irrig2,s3p1irrig3,s3p1irrig4,s3p1pest,s3p1wat1,s3p1wat2,s3p1wat3,s3p1wat4,s3p1wat5,s3p2fert,s3p2irrig1,s3p2irrig2,s3p2irrig3,s3p2irrig4,s3p2pest,s3p2wat1,s3p2wat2,s3p2wat3,s3p2wat4,s3p2wat5,lvsown,lvs1born,lvs1graze1,lvs1graze2,lvs1graze3,lvs1lost,lvs1num,lvs1pprice,lvs1purch,lvs1sold,lvs1sprice,lvs2born,lvs2graze1,lvs2graze2,lvs2graze3,lvs2lost,lvs2num,lvs2pprice,lvs2purch,lvs2sold,lvs2sprice,lvs3born,lvs3graze1,lvs3graze2,lvs3graze3,lvs3lost,lvs3num,lvs3pprice,lvs3purch,lvs3sold,lvs3sprice,lvs4born,lvs4graze1,lvs4graze2,lvs4graze3,lvs4lost,lvs4num,lvs4pprice,lvs4purch,lvs4sold,lvs4sprice,lvs5born,lvs5graze1,lvs5graze2,lvs5graze3,lvs5lost,lvs5num,lvs5pprice,lvs5purch,lvs5sold,lvs5sprice,lvs6born,lvs6graze1,lvs6graze2,lvs6graze3,lvs6lost,lvs6num,lvs6pprice,lvs6purch,lvs6sold,lvs6sprice,lvs7born,lvs7graze1,lvs7graze2,lvs7graze3,lvs7lost,lvs7num,lvs7pprice,lvs7purch,lvs7sold,lvs7sprice,lvs8born,lvs8graze1,lvs8graze2,lvs8graze3,lvs8lost,lvs8num,lvs8pprice,lvs8purch,lvs8sold,lvs8sprice,lvs9born,lvs9graze1,lvs9graze2,lvs9graze3,lvs9lost,lvs9num,lvs9pprice,lvs9purch,lvs9sold,lvs9sprice,lvsp1price,lvsp1sell,lvsp1use,lvsp2price,lvsp2sell,lvsp2use,lvsp3price,lvsp3sell,lvsp3use,lvsp4price,lvsp4sell,lvsp4use,lvsp5price,lvsp5sell,lvsp5use,lvsp6price,lvsp6sell,lvsp6use,lvsp7price,lvsp7sell,lvsp7use,lvsp8price,lvsp8sell,lvsp8use,lvsp9price,lvsp9sell,lvsp9use,cost1crop,cost1lvs,cost2crop,cost2lvs,cost3crop,cost3lvs,cost4crop,cost4lvs,cost5crop,cost5lvs,ad711,ad712,ad713,ad714,ad715,ad716,ad717,ad718,ad719,ad7110,ad7111,ad7112,ad7113,ad7114,ad7115,ad7116,ad7117,ad7118,ad7119,ad7120,ad7122,ad7123,ad7124,ad7125,ad721,ad722,ad723,ad724,ad725,ad726,ad727,ad728,ad729,ad7210,ad7212,ad731,ad732,ad733,ad734,ad735,ad736,ad741,ad742,ad743,ad744,ad745,ad746,ad747,ad751,ad752,ad753,ad754,ad755,ad756,ad757,ad758,ad759,ad7510,ad7511,ad7512,ad7513,ad7514,ad7515,ad7516,ad7517,ad7518,ad7519,ad7520,ad7522,ad7523,ad7524,ad7525,ad761,ad762,ad763,ad764,ad765,ad766,ad767,ad768,ad769,ad7610,ad7611,ad7612,ad7613,ad7614,ad7615,ad7616,ad7617,ad7618,ad7619,ad7620,ad7621,ad7622,ad7623,ad7625
count,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1655.0,1655.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,689.0,1052.0,1052.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,315.0,588.0,588.0,1798.0,1800.0,1799.0,1800.0,1800.0,1800.0,238.0,239.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,598.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1799.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,830.0,975.0,900.0,1800.0,1800.0,1800.0,1800.0,900.0,207.0,207.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,900.0,900.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1.0,1800.0,1800.0,1.0,1.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1799.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1797.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1798.0,1800.0,1798.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1770.0,1799.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1799.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1798.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1798.0,1799.0,1800.0,1800.0,1799.0,1800.0,1800.0,1799.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0,1800.0
mean,1.725556,1.885556,3.775825,1.164083,0.533577,2.403889,1.136111,1.443889,0.795,24.869167,10.847778,185.172067,215.45225,325334.3,654759.7,31.143202,63.184949,12395.3,924.509444,6559.703,130.606944,0.764444,5267.469167,30880.56,24.739544,25.46403,3921.193,198.123556,2865.899,17.060278,0.351667,872.263611,81547.86,25.931973,16.294303,1921.456,76.057778,1408.919,4.993889,0.161111,475.931667,30.630252,10.332803,235.982778,31.678722,111.705556,0.909722,0.061667,92.187222,122.86159,1.688889,5.555556,0.023333,0.018333,113.390773,83.72,2.052222,0.0,0.0,0.007778,81.311111,28.167224,3710.3725,187.591111,2001.182324,5.045,0.289444,1515.544722,978.809616,108.021111,216.524167,2.044444,0.140634,675.511117,208.397778,35.338889,12.888889,0.643333,0.066111,159.825556,2.429039,14.529094,17.777778,13.505556,0.166667,0.1,0.011667,4.006667,1.115556,4.333333,15.5,0.0,14.444444,0.0,0.002222,1.055556,0.1,0.177778,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,31.013253,55.832133,244.961111,261.699722,2208.453,3.308889,0.891667,201.756667,37.966184,34.904976,2560.846,63.491667,1557.364,1.094444,0.178889,919.01625,1070.975,14.252778,782.8667,0.166667,0.07,769.257778,102.988333,2.207778,15.611111,0.0,0.02,85.169444,20.544444,0.0,3.722222,0.0,0.002778,16.822222,0.0,0.012983,0.416667,0.138889,0.0,0.0,0.001111,0.277778,0.0,0.001333,936.249444,48.015556,201.398333,0.0,0.283889,699.737222,261.663889,16.943333,17.823611,0.0,0.106111,232.138611,70.846667,0.666667,1.597222,0.0,0.033333,63.027222,0.000556,0.0755,0.596111,0.027778,0.277778,0.0,0.002778,0.290556,0.000556,0.0,0.833333,0.222222,0.222222,0.0,0.001111,0.388889,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5966.486,22.313889,0.250556,5818.833,1667.152778,5.155556,0.046111,1659.544444,0.015564,45.886158,1.324797,0.001111,0.008206,0.0,0.0,0.038889,0.007222,4.389556,0.001111,-99.0,0.0,0.0,-99.0,-99.0,0.0,29.547778,24.688889,20.485833,12.675556,5.264444,5660.542594,4690.118789,2517.181911,1479.483239,839.465228,413.826406,0.687778,0.004444,0.041667,0.077778,1.281539,0.435242,0.002222,0.0,1.991111,0.0,145.765183,0.306667,0.011673,0.035019,0.013341,0.48395,0.269444,0.003333,0.005556,0.335556,0.002778,366.85,0.371111,0.011111,0.016667,0.016111,0.822144,0.387222,0.008333,0.0,0.017778,0.0,120.832222,0.189444,0.001111,0.01,0.006667,0.307847,0.192778,0.001113,0.0,0.0,0.014444,180.366111,0.101111,0.002222,0.033333,0.033333,0.524444,0.111667,0.017778,0.000556,0.002222,0.005556,28.028889,0.031684,0.0,0.005,0.011117,0.105333,0.033333,0.006667,0.0,0.0,0.0,1.007222,0.115,0.123889,0.638333,0.041667,0.028889,0.766667,617.351111,0.338333,0.372222,881.869299,0.480556,0.401001,1.510839,0.45,0.226111,1.818889,2407.786667,0.233333,0.268889,1698.249444,0.112778,0.186667,0.685556,0.252362,0.023333,0.78,495.166667,0.218333,0.302946,749.461111,0.377966,0.51473,1.894444,0.777098,0.811111,2.806111,730.788333,1.010556,4.820456,1768.474444,0.262222,0.437222,1.943889,0.714444,0.406111,1.994444,1758.957222,0.176111,0.490556,2403.350195,0.0,0.028349,0.038889,0.023889,22.228333,10.017222,47.228889,0.003889,0.000556,13.896609,0.0,0.147778,0.989444,0.363333,0.145,1.118889,6076.724444,27.844444,0.046111,4965.527778,1.578889,0.05,1.482778,0.061111,1.389444,494.344444,67.149878,712.262222,562.106726,43.366009,3.512222,0.086667,0.442778,0.080556,0.211111,2.335186,310.5475,0.772222,0.246111,106.838243,5.440861,1917.402,294.062222,6.958611,43.715,7.272778,0.655556,1.925,10.511667,0.242778,1.848333,5.583889,1.00485,2.91,3.665,0.474194,1159.036111,234.661389,0.228278,0.321667,0.0,0.705367,0.471111,0.005,0.366111,276.887222,2.069444,3674.656667,303.741667,2115.588333,195.448583,1387.982778,260.949444,3787.797222,10.444444,131.772778,3782.449,0.165,0.004444,0.016667,0.063333,0.0,0.001111,0.007778,0.005556,0.001111,0.0,0.005,0.342222,0.016667,0.061111,0.004444,0.002222,0.098333,0.111111,0.005,0.030556,0.117222,0.013333,0.029444,0.077778,0.077778,0.043889,0.021679,0.280556,0.001111,0.021667,0.004444,0.002778,0.002222,0.017222,0.522778,0.623889,0.062778,0.157222,0.033889,0.128889,0.050556,0.092222,0.565628,0.047804,0.047222,0.028333,0.190106,0.035,0.048889,0.010006,0.011667,0.085,0.001667,0.001667,0.051667,0.000556,0.0,0.0,0.003333,0.326111,0.027222,0.077778,0.003333,0.001111,0.047222,0.099444,0.005556,0.055556,0.121111,0.016667,0.015556,0.112778,0.171667,0.003889,0.002778,0.011667,0.0,0.0,0.08,0.005,0.001111,0.0,0.002222,0.138333,0.020556,0.056111,0.027222,0.000556,0.074444,0.066667,0.008889,0.013889,0.074444,0.286111,0.065556,0.069444
std,0.739734,1.007041,6.5085,2.204666,1.942052,0.729499,1.304129,1.314462,1.432831,24.319732,21.132319,1414.373995,5184.715254,974335.1,2100542.0,15.932655,24.126652,104133.8,1868.210249,102422.2,4427.437852,0.969268,28162.823868,97305.73,16.204704,15.152534,58230.22,581.664183,58068.5,113.386726,0.764119,4556.220956,186189.6,16.380551,10.650255,46480.18,337.88407,46342.19,55.544267,0.535186,3694.250181,14.029424,8.586376,3984.137474,228.875438,3691.509741,26.463989,0.338518,1473.35108,3506.774881,31.81717,235.70226,0.989949,0.186234,3482.53671,3394.556533,51.629076,0.0,0.0,0.124514,3394.202342,17.373774,13732.941998,852.47656,9564.28965,47.445293,0.693093,8905.163857,6170.564443,1401.213977,2463.195138,24.286808,0.485278,5352.627484,2029.480797,622.209614,322.748737,14.344662,0.353756,1814.318711,21.438967,79.012914,546.782855,542.199256,7.071068,4.242641,0.157727,65.245966,15.537379,39.951305,446.403421,0.0,444.611018,0.0,0.066648,40.343126,2.235073,3.769138,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11.984251,36.338678,1495.176923,796.020299,77869.76,39.032136,1.109331,1355.472336,13.850583,15.777916,46477.39,349.108075,45500.95,21.320289,0.591019,9565.15486,33145.9,151.595132,32998.29,4.080213,0.386817,23658.34509,1588.541368,60.956533,371.265977,0.0,0.201826,1538.631595,647.149076,0.0,111.747604,0.0,0.070676,637.526236,0.0,0.312759,17.67767,5.892557,0.0,0.0,0.04714,11.785113,0.0,0.056569,5225.136067,277.209274,3284.219435,0.0,0.736537,3252.052906,2667.700224,221.464385,187.2742,0.0,0.464847,2508.453703,880.969097,15.976637,47.599596,0.0,0.268817,828.474402,0.016667,0.702369,16.386951,1.178511,11.785113,0.0,0.084962,11.210182,0.016667,0.0,35.355339,9.42809,9.42809,0.0,0.04714,16.499158,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,49399.01,140.152557,0.707303,49371.14,26249.785473,76.558502,0.303008,26248.696212,0.185042,847.481066,36.685772,0.04714,0.345782,0.0,0.0,0.303104,0.139295,118.557103,0.04714,,0.0,0.0,,,0.0,16.922015,21.65285,26.591702,18.811704,14.249233,17151.12036,10582.003313,13641.977152,6441.891734,5961.72511,2443.223852,1.007623,0.115417,0.351187,0.552477,3.74512,0.495926,0.057708,0.0,2.000536,0.0,557.440727,0.605111,0.171292,0.31885,0.230683,2.019874,0.456148,0.081604,0.137363,1.108691,0.117851,2547.259655,0.49009,0.148698,0.223047,0.258843,3.06451,0.497412,0.122225,0.0,0.266147,0.0,560.77078,0.39197,0.04714,0.172964,0.163209,1.444553,0.39459,0.04718,0.0,0.0,0.210382,2291.233478,0.30156,0.094281,0.314553,0.363725,2.966108,0.315043,0.187774,0.02357,0.094281,0.16662,237.159575,0.175207,0.0,0.122406,0.210642,1.280067,0.179555,0.115309,0.0,0.0,0.0,0.485994,0.853074,1.00454,2.177447,0.568721,0.381986,2.741808,6288.844396,1.755948,1.665564,10692.232697,2.133316,1.870885,3.183971,1.973631,1.089893,5.30037,18782.735872,1.159824,1.067447,11468.899672,1.127282,1.300635,2.20112,1.509965,0.273958,3.74944,6606.294813,2.213104,2.150341,10167.581512,1.624456,2.022862,3.796955,2.485063,2.494215,6.011076,2868.438567,35.361885,165.62832,7919.61095,1.600485,1.893041,3.955796,2.386643,1.522142,6.937982,9044.572513,0.706978,3.893085,11620.896984,0.0,0.425517,0.516153,0.385949,942.808909,424.263745,1531.76212,0.126905,0.02357,589.419401,0.0,1.153743,3.161996,1.828132,1.281231,23.717821,26569.633999,1178.509801,0.270026,28722.838522,26.53573,0.740138,3.907026,0.847872,6.429763,8667.549682,333.305017,11247.864689,10248.611063,429.91188,141.45016,0.901015,2.167539,0.85181,2.962784,27.119835,6222.702673,5.844122,3.596983,2520.09442,42.586865,27407.63,588.008492,282.843337,734.223505,102.470199,12.691544,36.522739,34.112684,2.109681,28.562168,31.411463,35.384747,35.126559,62.218549,3.628393,23877.894962,590.976716,1.729345,2.251151,0.0,29.480472,16.674774,0.097081,3.362294,6594.986692,27.040479,18065.785202,3227.463241,17514.683807,2743.505112,7098.631886,5928.05535,18996.106138,237.533701,2539.806686,60203.91,0.371284,0.066537,0.128055,0.243629,0.0,0.033324,0.087872,0.074349,0.033324,0.0,0.070553,0.474585,0.128055,0.239601,0.066537,0.047101,0.297848,0.314357,0.070553,0.172158,0.321774,0.11473,0.169096,0.267896,0.267896,0.204905,0.145673,0.449396,0.033324,0.145633,0.066537,0.052646,0.047101,0.130135,0.49962,0.484543,0.24263,0.364111,0.180993,0.33517,0.219149,0.28942,0.495812,0.213411,0.212173,0.165969,0.392493,0.183831,0.215696,0.099554,0.10741,0.278959,0.040802,0.040802,0.221415,0.02357,0.0,0.0,0.057655,0.468919,0.162776,0.267896,0.057655,0.033324,0.212173,0.299341,0.074349,0.229125,0.326347,0.128055,0.123782,0.316409,0.377195,0.062257,0.052646,0.10741,0.0,0.0,0.271369,0.070553,0.033324,0.0,0.047101,0.345345,0.14193,0.2302,0.162776,0.02357,0.262566,0.249513,0.093887,0.117062,0.262566,0.452068,0.247572,0.254279
min,1.0,1.0,0.0001,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,4.55,0.0,0.0,0.0,0.0,0.0,0.0,75.0,3.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,25.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,1.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-99.0,0.0,0.0,-99.0,-99.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
25%,1.0,1.0,0.625,0.0,0.0,2.0,0.0,1.0,0.0,10.0,0.0,0.0,0.0,0.0,50450.0,27.0,50.0,548.25,0.0,0.0,0.0,0.0,0.0,1100.0,12.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,2500.0,12.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,22.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26.0,28.57,0.0,0.0,0.0,0.0,0.0,0.0,26.0,22.665,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-99.0,0.0,0.0,-99.0,-99.0,0.0,14.0,12.0,0.0,0.0,0.0,400.0,197.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
50%,2.0,2.0,2.0833,0.208,0.0,2.0,0.0,1.0,0.0,20.0,0.0,0.0,0.0,0.0,186250.0,27.0,60.0,1777.5,450.0,0.0,0.0,0.0,0.0,2441.0,12.0,20.0,50.0,0.0,0.0,0.0,0.0,0.0,25000.0,14.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,29.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,27.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,26.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,39.0,33.330002,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-99.0,0.0,0.0,-99.0,-99.0,0.0,27.0,22.0,12.0,0.0,0.0,1000.0,700.0,318.399994,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,70.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
75%,2.0,2.0,5.0,1.5,0.0,3.0,2.0,1.0,1.0,32.0,15.0,0.0,0.0,275000.0,576000.0,54.0,80.0,5010.0,1076.25,0.0,0.0,2.0,1800.0,9350.0,44.0,33.330002,500.0,200.0,0.0,0.0,0.0,0.0,96000.0,44.0,23.647501,60.0,10.0,0.0,0.0,0.0,0.0,44.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,44.0,750.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,39.0,100.0,0.0,20.0,0.0,0.0,2.0,0.0,53.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,-99.0,0.0,0.0,-99.0,-99.0,0.0,48.0,39.0,39.0,26.0,0.0,3000.0,3000.0,1600.0,550.25,0.0,300.0,1.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,4.0,0.0,100.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,300.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,500.0,400.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,28.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1500.0,0.0,131.25,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
max,3.0,10.0,150.0,40.0,40.0,5.0,6.0,7.0,20.0,202.0,200.0,20000.0,210000.0,20000000.0,46800000.0,56.0,100.0,4200000.0,31258.0,4200000.0,187500.0,3.0,900000.0,1600000.0,56.0,100.0,2400000.0,10000.0,2400000.0,3125.0,3.0,62400.0,2600000.0,56.0,66.669998,1960000.0,8000.0,1960000.0,1000.0,3.0,70000.0,56.0,50.0,150000.0,5000.0,150000.0,1000.0,3.0,45000.0,144000.0,1200.0,10000.0,42.0,2.0,144000.0,144000.0,1800.0,0.0,0.0,2.0,144000.0,56.0,245000.0,20000.0,150000.0,1250.0,4.0,245000.0,110400.0,51050.0,54000.0,625.0,3.0,110400.0,50000.0,25000.0,10000.0,500.0,2.0,50000.0,600.0,1000.0,23000.0,23000.0,300.0,180.0,3.0,1740.0,400.0,500.0,16000.0,0.0,16000.0,0.0,2.0,1700.0,60.0,80.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,56.0,100.0,23000.0,15000.0,3300000.0,1000.0,4.0,20000.0,56.0,100.0,1800000.0,5500.0,1800000.0,700.0,3.0,300000.0,1400000.0,3500.0,1400000.0,100.0,3.0,1000000.0,48000.0,2100.0,12000.0,0.0,3.0,48000.0,26880.0,0.0,3500.0,0.0,2.0,26880.0,0.0,10.0,750.0,250.0,0.0,0.0,2.0,500.0,0.0,2.4,150000.0,4000.0,100000.0,0.0,3.0,50000.0,74000.0,6000.0,5250.0,0.0,3.0,68000.0,20000.0,500.0,1800.0,0.0,3.0,20000.0,0.5,10.0,500.0,50.0,500.0,0.0,3.0,473.0,0.5,0.0,1500.0,400.0,400.0,0.0,2.0,700.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1500000.0,2000.0,3.0,1500000.0,750000.0,1925.0,3.0,750000.0,3.0,22000.0,1176.0,2.0,14.67,0.0,0.0,3.0,3.0,4000.0,2.0,-99.0,0.0,0.0,-99.0,-99.0,0.0,56.0,600.0,800.0,200.0,58.0,420000.0,130000.0,495000.0,80000.0,170000.0,82720.0,4.0,4.0,3.0,4.0,60.0,1.0,2.0,0.0,4.0,0.0,15000.0,4.0,4.0,3.0,4.0,40.0,5.0,2.0,4.0,5.0,5.0,90000.0,4.0,2.0,3.0,5.0,80.0,3.0,2.0,0.0,4.0,0.0,13500.0,1.0,2.0,3.0,4.0,20.0,1.0,2.0,0.0,0.0,4.0,92500.0,1.0,4.0,3.0,4.0,50.0,1.0,2.0,1.0,4.0,5.0,4500.0,1.0,0.0,3.0,4.0,36.0,1.0,2.0,0.0,0.0,0.0,2.0,20.0,12.0,12.0,12.0,10.0,43.0,120000.0,30.0,30.0,300000.0,65.0,12.0,12.0,12.0,15.0,125.0,430000.0,20.0,18.0,150000.0,40.0,12.0,12.0,12.0,6.0,86.0,150000.0,50.0,50.0,260000.0,21.0,12.0,16.0,12.0,50.0,100.0,20000.0,1500.0,7000.0,150000.0,30.0,12.0,24.0,12.0,20.0,200.0,200000.0,8.0,150.0,250000.0,0.0,10.0,12.0,9.0,40000.0,18000.0,60000.0,5.0,1.0,25000.0,0.0,12.0,12.0,12.0,22.0,1000.0,250000.0,50000.0,4.0,300000.0,1000.0,12.0,12.0,12.0,120.0,300000.0,9000.0,300000.0,285000.0,12000.0,6000.0,12.0,12.0,12.0,100.0,1000.0,250000.0,150.0,100.0,100000.0,1200.0,1095000.0,7000.0,12000.0,25000.0,3650.0,500.0,1440.0,400.0,25.0,1000.0,750.0,1500.0,1000.0,2000.0,35.0,823200.0,3600.0,40.0,40.0,0.0,1250.0,700.0,3.0,100.0,262500.0,550.0,500000.0,100000.0,600000.0,96000.0,100000.0,236000.0,240000.0,7000.0,70000.0,2295000.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,1.0,1.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0


In [13]:
filtered_data.shape

(1800, 636)

So means have been made to reduce this to 636 columns, great I will be working with that then. below are the procedures I am following to preprocess and clean the dataset 
1. Create an empty dataframe to acquire all newly processed column
2. create a list for columns having homogeuity
3. Through documentation reading and research a means is devised to aggregrate the columns into one or two
4. The newly created column which has same information as those columns is added to the new dataframe

In [14]:
# Create an empty dataframe
df = pd.DataFrame()
df.shape

(0, 0)

I will be using the columns needed list as my base columns to work with

In [18]:
#checkig out the first 22 columns
first_22_columns = filtered_data.iloc[:, :22]

In [19]:
first_22_column_names = filtered_data.columns[:22]

In [20]:
first_22_column_names

Index(['farmtype', 'fplots', 'fplotarea1', 'fplotarea2', 'fplotarea3',
       'plotunits', 'fsystem1', 'fsystem2', 'tenure1', 'tenure2', 'yearsuse1',
       'yearsuse2', 'rentplot1', 'rentplot2', 'farmbuyv', 'farmsalev',
       'season1s', 'season1e', 'season2s', 'season2e', 'season3s', 'season3e'],
      dtype='object')

In [21]:
first_22_columns

Unnamed: 0,farmtype,fplots,fplotarea1,fplotarea2,fplotarea3,plotunits,fsystem1,fsystem2,tenure1,tenure2,yearsuse1,yearsuse2,rentplot1,rentplot2,farmbuyv,farmsalev,season1s,season1e,season2s,season2e,season3s,season3e
1087,3.0,1.0,2.5000,0.0000,0.0000,HA,3.0,0.0,1.0,0.0,16.0,0.0,0.0,0.0,0.0,150000.0,w1oct2001,w1may2002,w1may2002,w1oct2002,w1aug2002,w4dec2002
1088,2.0,3.0,0.5042,0.4500,0.4875,HA,2.0,2.0,1.0,1.0,33.0,33.0,0.0,0.0,0.0,175000.0,w1oct2001,w1may2002,w1may2002,w1oct2002,w1aug2002,w4dec2002
1089,2.0,3.0,0.4500,0.5208,0.5542,HA,3.0,3.0,1.0,1.0,33.0,33.0,0.0,0.0,0.0,210000.0,w1oct2001,w1may2002,w1may2002,w1oct2002,w1aug2002,w4dec2002
1090,2.0,3.0,0.5542,0.5542,0.5542,HA,3.0,3.0,1.0,1.0,33.0,33.0,0.0,0.0,0.0,240000.0,w1oct2001,w1may2002,w1may2002,w1oct2002,w1aug2002,w4dec2002
1091,1.0,2.0,0.4167,0.2083,0.0000,HA,2.0,2.0,1.0,1.0,25.0,25.0,0.0,0.0,0.0,30000.0,w1oct2001,w1may2002,w1may2002,w1oct2002,w1aug2002,w4dec2002
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,2.0,1.0,5.0000,0.0000,0.0000,HA,3.0,0.0,1.0,0.0,9.0,0.0,0.0,0.0,0.0,200000.0,1-Jun,30-Sep,1-Nov,31-Mar,1-Dec,1-May
5475,2.0,1.0,8.0000,0.0000,0.0000,HA,1.0,0.0,1.0,0.0,11.0,0.0,0.0,0.0,0.0,400000.0,1-Jun,30-Sep,1-Nov,31-Mar,1-Dec,1-May
5476,2.0,2.0,11.0000,6.0000,0.0000,HA,3.0,2.0,1.0,1.0,26.0,18.0,0.0,0.0,0.0,600000.0,1-Jun,30-Sep,1-Nov,31-Mar,1-Dec,1-May
5477,2.0,1.0,8.0000,0.0000,0.0000,HA,3.0,0.0,1.0,0.0,8.0,0.0,0.0,0.0,0.0,300000.0,1-Jun,30-Sep,1-Nov,31-Mar,1-Dec,1-May


1. for the farm type, this is an important key which is a labelled data that is of immense importance in the study
2. The classifcation of family plots is also a significant but not really needed feature in this study
3. The fplotareas represent the area of plot of land for the families, To represent the area of land for families more efficiently, we can combine the three columns into a single column. We create a new column called "TotalPlotArea" to store the sum of the individual plot areas for each family.
4. We combined related information into new columns, making it easier to understand and analyze the data.
 'LandSystem' now represents the land system information, combining fsystem1 and fsystem2.
 'TenureType' summarizes the tenure information from tenure1 and tenure2.
 'UsageYears' provides a concise description of years of usage.

In [23]:
df['farmtype'] = filtered_data['farmtype']
# Create a new column 'TotalPlotArea' that sums the individual plot areas
df['TotalPlotArea'] = filtered_data['fplotarea1'] + filtered_data['fplotarea2'] + filtered_data['fplotarea3']

# Combine fsystem1 and fsystem2 into a new column 'LandSystem'
df['LandSystem'] = filtered_data['fsystem1'].astype(str) + ' ' + filtered_data['fsystem2'].astype(str)

# Combine tenure1 and tenure2 into a new column 'TenureType'
df['TenureType'] = filtered_data['tenure1'].astype(str) + ' ' + filtered_data['tenure2'].astype(str)

# Combine yearsuse1 and yearsuse2 into a new column 'UsageYears'
df['UsageYears'] = filtered_data['yearsuse1'].astype(str) + ' ' + filtered_data['yearsuse2'].astype(str)

In [24]:
df

Unnamed: 0,farmtype,TotalPlotArea,LandSystem,TenureType,UsageYears
1087,3.0,2.5000,3.0 0.0,1.0 0.0,16.0 0.0
1088,2.0,1.4417,2.0 2.0,1.0 1.0,33.0 33.0
1089,2.0,1.5250,3.0 3.0,1.0 1.0,33.0 33.0
1090,2.0,1.6626,3.0 3.0,1.0 1.0,33.0 33.0
1091,1.0,0.6250,2.0 2.0,1.0 1.0,25.0 25.0
...,...,...,...,...,...
5474,2.0,5.0000,3.0 0.0,1.0 0.0,9.0 0.0
5475,2.0,8.0000,1.0 0.0,1.0 0.0,11.0 0.0
5476,2.0,17.0000,3.0 2.0,1.0 1.0,26.0 18.0
5477,2.0,8.0000,3.0 0.0,1.0 0.0,8.0 0.0


In [28]:
#checking out columns from index 23 to 501
second_23_200_columns = filtered_data.iloc[:, 23:200]
second_23_200_columns_names = filtered_data.columns[23:200]

In [29]:
second_23_200_columns_names

Index(['seas2nam', 'seas3nam', 's1p1c1', 's1p1c1plant', 's1p1c1harv',
       's1p1c1area', 's1p1c1qharv', 's1p1c1cons', 's1p1c1lives', 's1p1c1lost',
       ...
       's2p1c4plant', 's2p1c4harv', 's2p1c4qharv', 's2p1c4cons', 's2p1c4lives',
       's2p1c4lost', 's2p1c4mkt', 's2p1c4sold', 's2p1c4seed', 's2p1c4sval'],
      dtype='object', length=177)

In [30]:
second_23_200_columns

Unnamed: 0,seas2nam,seas3nam,s1p1c1,s1p1c1plant,s1p1c1harv,s1p1c1area,s1p1c1qharv,s1p1c1cons,s1p1c1lives,s1p1c1lost,s1p1c1mkt,s1p1c1sold,s1p1c1cval,s1p1c1seed,s1p1c1sval,s1p1c2,s1p1c2plant,s1p1c2harv,s1p1c2area,s1p1c2qharv,s1p1c2cons,s1p1c2lives,s1p1c2lost,s1p1c2mkt,s1p1c2sold,s1p1c2cval,s1p1c2seed,s1p1c2sval,s1p1c3,s1p1c3plant,s1p1c3harv,s1p1c3area,s1p1c3qharv,s1p1c3cons,s1p1c3lives,s1p1c3lost,s1p1c3mkt,s1p1c3sold,s1p1c3seed,s1p1c3sval,s1p1c4,s1p1c4plant,s1p1c4harv,s1p1c4area,s1p1c4qharv,s1p1c4cons,s1p1c4lives,s1p1c4lost,s1p1c4mkt,s1p1c4sold,s1p1c4seed,s1p1c4sval,s1p1c5plant,s1p1c5harv,s1p1c5qharv,s1p1c5cons,s1p1c5lives,s1p1c5lost,s1p1c5mkt,s1p1c5sold,s1p1c5seed,s1p1c5sval,s1p1c6plant,s1p1c6harv,s1p1c6qharv,s1p1c6cons,s1p1c6lives,s1p1c6lost,s1p1c6mkt,s1p1c6sold,s1p1c6seed,s1p1c6sval,s1p2c1,s1p2c1plant,s1p2c1harv,s1p2c1qharv,s1p2c1cons,s1p2c1lives,s1p2c1lost,s1p2c1mkt,s1p2c1sold,s1p2c1seed,s1p2c1sval,s1p2c2plant,s1p2c2harv,s1p2c2qharv,s1p2c2cons,s1p2c2lives,s1p2c2lost,s1p2c2mkt,s1p2c2sold,s1p2c2seed,s1p2c2sval,s1p2c3plant,s1p2c3harv,s1p2c3qharv,s1p2c3cons,s1p2c3lives,s1p2c3lost,s1p2c3mkt,s1p2c3sold,s1p2c3seed,s1p2c3sval,s1p2c4plant,s1p2c4harv,s1p2c4qharv,s1p2c4cons,s1p2c4lives,s1p2c4lost,s1p2c4mkt,s1p2c4sold,s1p2c4seed,s1p2c4sval,s1p2c5plant,s1p2c5harv,s1p2c5qharv,s1p2c5cons,s1p2c5lives,s1p2c5lost,s1p2c5mkt,s1p2c5sold,s1p2c5seed,s1p2c5sval,s1p2c6plant,s1p2c6harv,s1p2c6qharv,s1p2c6cons,s1p2c6lives,s1p2c6lost,s1p2c6mkt,s1p2c6sold,s1p2c6seed,s1p2c6sval,s2p1c1,s2p1c1plant,s2p1c1harv,s2p1c1area,s2p1c1qharv,s2p1c1cons,s2p1c1lives,s2p1c1lost,s2p1c1mkt,s2p1c1sold,s2p1c1seed,s2p1c1sval,s2p1c2,s2p1c2plant,s2p1c2harv,s2p1c2area,s2p1c2qharv,s2p1c2cons,s2p1c2lives,s2p1c2lost,s2p1c2mkt,s2p1c2sold,s2p1c2seed,s2p1c2sval,s2p1c3plant,s2p1c3harv,s2p1c3qharv,s2p1c3cons,s2p1c3lives,s2p1c3lost,s2p1c3mkt,s2p1c3sold,s2p1c3seed,s2p1c3sval,s2p1c4plant,s2p1c4harv,s2p1c4qharv,s2p1c4cons,s2p1c4lives,s2p1c4lost,s2p1c4mkt,s2p1c4sold,s2p1c4seed,s2p1c4sval
1087,2,3,54.0,15Nov2001,15May2002,33.330002,4800.0,24000.0,0.0,0.0,2.0,2400.0,1710.0,140,2,9.0,10Sep2001,08Apr2002,33.330002,60000.0,0.0,60000.0,0.0,0.0,0.0,,50,4,4.0,04Nov2001,06Apr2002,33.330002,2550.0,0.0,0.0,0.0,2.0,2550.0,50,3,,,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,26.0,03Jun2002,01Oct2002,33.330002,,0.0,6000.0,0.0,0.0,,24,10,53.0,08Apr2002,05Aug2002,33.330002,40000.0,200.0,0.0,0.0,2.0,39800.0,.3400000036,5294,13May2002,05Aug2002,10000.0,0.0,0.0,0.0,2.0,10000.0,.400000006,1200,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1088,2,3,54.0,15Nov2001,15May2002,34.970001,2480.0,1550.0,0.0,0.0,2.0,930.0,720.0,60,2.5,9.0,10Sep2001,01May2002,31.209999,35000.0,0.0,35000.0,0.0,0.0,0.0,,30,4,38.0,01Jan2002,08May2002,33.820000,13500.0,0.0,0.0,0.0,2.0,13500.0,700,2.700000048,,,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,56.0,20May2002,12Aug2002,34.970001,,200.0,0.0,0.0,2.0,,600,.8299999833,39.0,10Jun2002,07Oct2002,31.209999,3000.0,2500.0,0.0,0.0,2.0,500.0,100,2,08Jun2002,02Dec2002,1200.0,100.0,0.0,0.0,2.0,1100.0,5.25,124,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1089,2,3,54.0,15Nov2001,15May2002,29.510000,2700.0,2000.0,0.0,0.0,2.0,700.0,560.0,60,2.329999924,38.0,01Jan2002,30Apr2002,34.150002,15000.0,500.0,0.0,0.0,2.0,14500.0,9400.0,750,5.329999924,9.0,10Sep2001,10May2002,36.340000,50000.0,0.0,50000.0,0.0,0.0,0.0,30,4.329999924,,,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,39.0,03Jun2002,04Nov2002,29.510000,,3000.0,0.0,0.0,0.0,,100,1.799999952,56.0,01Jun2002,02Sep2002,34.150002,5500.0,100.0,0.0,0.0,2.0,5400.0,1,80,13May2002,02Sep2002,10000.0,200.0,0.0,0.0,2.0,9800.0,1000,.5,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1090,2,3,54.0,15Nov2001,15May2002,33.330002,2250.0,1250.0,0.0,0.0,2.0,1000.0,800.0,60,2.5,9.0,10Sep2001,01May2002,33.330002,38000.0,0.0,38000.0,0.0,0.0,0.0,,30,4.329999924,38.0,01Jan2002,01May2002,33.330002,17500.0,500.0,0.0,0.0,2.0,17000.0,750,2.329999924,,,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,56.0,13May2002,23Sep2002,33.330002,,100.0,0.0,0.0,2.0,,600,.6600000262,39.0,27May2002,01Oct2002,33.330002,2500.0,3000.0,0.0,0.0,2.0,500.0,100,1.5,02Jul2002,02Dec2002,10000.0,200.0,0.0,0.0,2.0,9800.0,4,163,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1091,2,3,54.0,15Nov2001,15May2002,66.669998,2250.0,1250.0,0.0,0.0,2.0,1000.0,1000.0,60,2,9.0,17Sep2001,08May2002,33.330002,14000.0,0.0,14000.0,0.0,0.0,0.0,,15,4.75,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,0.0,0.0,0.0,0.0,0.0,0.0,.,0,,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,39.0,10Jun2002,07Oct2002,66.669998,,2000.0,0.0,0.0,2.0,,100,2,56.0,10Jun2002,01Oct2002,33.330002,5500.0,200.0,0.0,0.0,2.0,5300.0,400,1.5,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,1,3,27.0,1-Jun,30-Sep,90.000000,2000.0,400.0,0.0,0.0,2.0,1600.0,112000.0,10,425,12.0,1-Jun,30-Sep,10.000000,600.0,200.0,0.0,100.0,2.0,300.0,27000.0,4,400,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5475,1,3,26.0,1-Jun,30-Sep,50.000000,2800.0,600.0,0.0,0.0,2.0,2200.0,110000.0,10,375,29.0,1-Jun,30-Sep,50.000000,3200.0,200.0,0.0,0.0,2.0,3000.0,210000.0,10,500,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5476,1,3,27.0,1-Jun,30-Sep,80.000000,3200.0,1200.0,0.0,0.0,2.0,2000.0,140000.0,20,425,12.0,1-Jun,30-Sep,20.000000,1000.0,300.0,0.0,200.0,2.0,500.0,45000.0,6,400,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,29.0,1-Jun,30-Sep,2100.0,200.0,0.0,0.0,2.0,1900.0,8,500,6-Jun,30-Sep,1800.0,300.0,0.0,0.0,2.0,1500.0,8,350,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5477,1,3,27.0,1-Jun,30-Sep,50.000000,2000.0,600.0,0.0,0.0,2.0,1400.0,98000.0,10,450,12.0,1-Jun,30-Sep,50.000000,1600.0,200.0,0.0,100.0,2.0,1300.0,117000.0,10,400,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,0,0,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0


In [37]:
#check for missing values in each columns
second_23_200_columns.isnull().any().sum()

# Check for missing values in each column
columns_with_missing_values = second_23_200_columns.columns[second_23_200_columns.isnull().any()]

# Drop columns with missing values
second_23_200_columns_dropped = second_23_200_columns.drop(columns=columns_with_missing_values, axis=1)

# second_23_200_columns_dropped now contains only columns without missing values

In [38]:
second_23_200_columns_dropped

Unnamed: 0,seas2nam,seas3nam,s1p1c1qharv,s1p1c1cons,s1p1c1lives,s1p1c1lost,s1p1c1mkt,s1p1c1sold,s1p1c1seed,s1p1c1sval,s1p1c2qharv,s1p1c2cons,s1p1c2lives,s1p1c2lost,s1p1c2mkt,s1p1c2sold,s1p1c2seed,s1p1c2sval,s1p1c3cons,s1p1c3lost,s1p1c3mkt,s1p1c3sold,s1p1c3seed,s1p1c3sval,s1p1c4qharv,s1p1c4cons,s1p1c4lives,s1p1c4lost,s1p1c4mkt,s1p1c4sold,s1p1c4seed,s1p1c4sval,s1p1c5cons,s1p1c5lives,s1p1c5lost,s1p1c5mkt,s1p1c5seed,s1p1c5sval,s1p1c6qharv,s1p1c6cons,s1p1c6lives,s1p1c6lost,s1p1c6mkt,s1p1c6sold,s1p1c6seed,s1p1c6sval,s1p2c1qharv,s1p2c1cons,s1p2c1lost,s1p2c1mkt,s1p2c1sold,s1p2c1seed,s1p2c1sval,s1p2c2cons,s1p2c2lives,s1p2c2lost,s1p2c2seed,s1p2c2sval,s1p2c3qharv,s1p2c3cons,s1p2c3lives,s1p2c3lost,s1p2c3mkt,s1p2c3sold,s1p2c3seed,s1p2c3sval,s1p2c4qharv,s1p2c4cons,s1p2c4lives,s1p2c4lost,s1p2c4mkt,s1p2c4sold,s1p2c5qharv,s1p2c5cons,s1p2c5lives,s1p2c5lost,s1p2c5mkt,s1p2c5sold,s1p2c6qharv,s1p2c6cons,s1p2c6lives,s1p2c6lost,s1p2c6mkt,s1p2c6sold,s2p1c1cons,s2p1c1lives,s2p1c1lost,s2p1c1mkt,s2p1c1seed,s2p1c1sval,s2p1c2qharv,s2p1c2cons,s2p1c2lives,s2p1c2lost,s2p1c2mkt,s2p1c2sold,s2p1c2seed,s2p1c2sval,s2p1c3qharv,s2p1c3cons,s2p1c3lives,s2p1c3lost,s2p1c3mkt,s2p1c3sold,s2p1c3seed,s2p1c3sval,s2p1c4qharv,s2p1c4cons,s2p1c4lives,s2p1c4lost,s2p1c4mkt,s2p1c4sold,s2p1c4seed,s2p1c4sval
1087,2,3,4800.0,24000.0,0.0,0.0,2.0,2400.0,140,2,60000.0,0.0,60000.0,0.0,0.0,0.0,50,4,0.0,0.0,2.0,2550.0,50,3,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6000.0,0.0,0.0,24,10,40000.0,200.0,0.0,0.0,2.0,39800.0,.3400000036,5294,10000.0,0.0,0.0,0.0,2.0,10000.0,.400000006,1200,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1088,2,3,2480.0,1550.0,0.0,0.0,2.0,930.0,60,2.5,35000.0,0.0,35000.0,0.0,0.0,0.0,30,4,0.0,0.0,2.0,13500.0,700,2.700000048,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,0.0,2.0,600,.8299999833,3000.0,2500.0,0.0,0.0,2.0,500.0,100,2,1200.0,100.0,0.0,0.0,2.0,1100.0,5.25,124,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1089,2,3,2700.0,2000.0,0.0,0.0,2.0,700.0,60,2.329999924,15000.0,500.0,0.0,0.0,2.0,14500.0,750,5.329999924,0.0,0.0,0.0,0.0,30,4.329999924,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3000.0,0.0,0.0,0.0,100,1.799999952,5500.0,100.0,0.0,0.0,2.0,5400.0,1,80,10000.0,200.0,0.0,0.0,2.0,9800.0,1000,.5,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1090,2,3,2250.0,1250.0,0.0,0.0,2.0,1000.0,60,2.5,38000.0,0.0,38000.0,0.0,0.0,0.0,30,4.329999924,500.0,0.0,2.0,17000.0,750,2.329999924,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,2.0,600,.6600000262,2500.0,3000.0,0.0,0.0,2.0,500.0,100,1.5,10000.0,200.0,0.0,0.0,2.0,9800.0,4,163,0.0,0.0,0.0,0.0,0.0,0.0,0,0
1091,2,3,2250.0,1250.0,0.0,0.0,2.0,1000.0,60,2,14000.0,0.0,14000.0,0.0,0.0,0.0,15,4.75,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0.0,.,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2000.0,0.0,0.0,2.0,100,2,5500.0,200.0,0.0,0.0,2.0,5300.0,400,1.5,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,1,3,2000.0,400.0,0.0,0.0,2.0,1600.0,10,425,600.0,200.0,0.0,100.0,2.0,300.0,4,400,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5475,1,3,2800.0,600.0,0.0,0.0,2.0,2200.0,10,375,3200.0,200.0,0.0,0.0,2.0,3000.0,10,500,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5476,1,3,3200.0,1200.0,0.0,0.0,2.0,2000.0,20,425,1000.0,300.0,0.0,200.0,2.0,500.0,6,400,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,2100.0,200.0,0.0,2.0,1900.0,8,500,300.0,0.0,0.0,8,350,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0
5477,1,3,2000.0,600.0,0.0,0.0,2.0,1400.0,10,450,1600.0,200.0,0.0,100.0,2.0,1300.0,10,400,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0


In [39]:
second_23_200_columns_dropped.columns

Index(['seas2nam', 'seas3nam', 's1p1c1qharv', 's1p1c1cons', 's1p1c1lives',
       's1p1c1lost', 's1p1c1mkt', 's1p1c1sold', 's1p1c1seed', 's1p1c1sval',
       ...
       's2p1c3seed', 's2p1c3sval', 's2p1c4qharv', 's2p1c4cons', 's2p1c4lives',
       's2p1c4lost', 's2p1c4mkt', 's2p1c4sold', 's2p1c4seed', 's2p1c4sval'],
      dtype='object', length=114)

In [40]:
selected_columns = filtered_data[
    ['seas2nam', 'seas3nam',
     's1p1c1qharv', 's1p1c1cons', 's1p1c1lives', 's1p1c1lost', 's1p1c1mkt', 's1p1c1sold', 's1p1c1seed', 's1p1c1sval',
     's1p1c2qharv', 's1p1c2cons', 's1p1c2lives', 's1p1c2lost', 's1p1c2mkt', 's1p1c2sold', 's1p1c2seed', 's1p1c2sval',
     's1p1c3cons', 's1p1c3lost', 's1p1c3mkt', 's1p1c3sold', 's1p1c3seed', 's1p1c3sval',
     's1p1c4qharv', 's1p1c4cons', 's1p1c4lives', 's1p1c4lost', 's1p1c4mkt', 's1p1c4sold', 's1p1c4seed', 's1p1c4sval',
     's1p1c5cons', 's1p1c5lives', 's1p1c5lost', 's1p1c5mkt', 's1p1c5seed', 's1p1c5sval',
     's1p1c6qharv', 's1p1c6cons', 's1p1c6lives', 's1p1c6lost', 's1p1c6mkt', 's1p1c6sold', 's1p1c6seed', 's1p1c6sval']
]

# Group similar columns and aggregate them
aggregated_columns = selected_columns.groupby(selected_columns.columns, axis=1).sum()

# Select the first 10 aggregated columns
selected_columns_10 = aggregated_columns.iloc[:, :10]

# dump the columns into df
df[['spcq1', 'spcq2', 'spcq3', 'spcq4', 'spcq5', 'spcq6', 'spcq7', 'spcq8', 'spcq9', 'spcq10']] = selected_columns_10

  aggregated_columns = selected_columns.groupby(selected_columns.columns, axis=1).sum()


In [41]:
df

Unnamed: 0,farmtype,TotalPlotArea,LandSystem,TenureType,UsageYears,spcq1,spcq2,spcq3,spcq4,spcq5,spcq6,spcq7,spcq8,spcq9,spcq10
1087,3.0,2.5000,3.0 0.0,1.0 0.0,16.0 0.0,24000.0,0.0,0.0,2.0,4800.0,140,2400.0,2,0.0,60000.0
1088,2.0,1.4417,2.0 2.0,1.0 1.0,33.0 33.0,1550.0,0.0,0.0,2.0,2480.0,60,930.0,2.5,0.0,35000.0
1089,2.0,1.5250,3.0 3.0,1.0 1.0,33.0 33.0,2000.0,0.0,0.0,2.0,2700.0,60,700.0,2.329999924,500.0,0.0
1090,2.0,1.6626,3.0 3.0,1.0 1.0,33.0 33.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2.5,0.0,38000.0
1091,1.0,0.6250,2.0 2.0,1.0 1.0,25.0 25.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2,0.0,14000.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,2.0,5.0000,3.0 0.0,1.0 0.0,9.0 0.0,400.0,0.0,0.0,2.0,2000.0,10,1600.0,425,200.0,0.0
5475,2.0,8.0000,1.0 0.0,1.0 0.0,11.0 0.0,600.0,0.0,0.0,2.0,2800.0,10,2200.0,375,200.0,0.0
5476,2.0,17.0000,3.0 2.0,1.0 1.0,26.0 18.0,1200.0,0.0,0.0,2.0,3200.0,20,2000.0,425,300.0,0.0
5477,2.0,8.0000,3.0 0.0,1.0 0.0,8.0 0.0,600.0,0.0,0.0,2.0,2000.0,10,1400.0,450,200.0,0.0


In [42]:
#checking out columns from index 23 to 501
third_201_400_columns = filtered_data.iloc[:, 201:400]
third_201_400_columns_names = filtered_data.columns[201:400]

In [43]:
third_201_400_columns

Unnamed: 0,s2p1c5harv,s2p1c5qharv,s2p1c5cons,s2p1c5lives,s2p1c5lost,s2p1c5mkt,s2p1c5sold,s2p1c5seed,s2p1c5sval,s2p1c6plant,s2p1c6harv,s2p1c6qharv,s2p1c6cons,s2p1c6lives,s2p1c6lost,s2p1c6mkt,s2p1c6sold,s2p1c6seed,s2p1c6sval,s2p2c1plant,s2p2c1harv,s2p2c1qharv,s2p2c1cons,s2p2c1lives,s2p2c1lost,s2p2c1mkt,s2p2c1sold,s2p2c1seed,s2p2c1sval,s2p2c2plant,s2p2c2harv,s2p2c2qharv,s2p2c2cons,s2p2c2lives,s2p2c2lost,s2p2c2mkt,s2p2c2sold,s2p2c2seed,s2p2c2sval,s2p2c3plant,s2p2c3harv,s2p2c3qharv,s2p2c3cons,s2p2c3lives,s2p2c3lost,s2p2c3mkt,s2p2c3sold,s2p2c3seed,s2p2c3sval,s2p2c4plant,s2p2c4harv,s2p2c4qharv,s2p2c4cons,s2p2c4lives,s2p2c4lost,s2p2c4mkt,s2p2c4sold,s2p2c4seed,s2p2c4sval,s2p2c5plant,s2p2c5harv,s2p2c5qharv,s2p2c5cons,s2p2c5lives,s2p2c5lost,s2p2c5mkt,s2p2c5sold,s2p2c5seed,s2p2c5sval,s2p2c6plant,s2p2c6harv,s2p2c6qharv,s2p2c6cons,s2p2c6lives,s2p2c6lost,s2p2c6mkt,s2p2c6sold,s2p2c6seed,s2p2c6sval,s3p1c1plant,s3p1c1harv,s3p1c1qharv,s3p1c1cons,s3p1c1mkt,s3p1c1sold,s3p1c1seed,s3p1c1sval,s3p1c2plant,s3p1c2harv,s3p1c2qharv,s3p1c2cons,s3p1c2mkt,s3p1c2sold,s3p1c2seed,s3p1c2sval,s3p1c3plant,s3p1c3harv,s3p1c3mkt,s3p1c3seed,s3p1c3sval,s3p1c4plant,s3p1c4harv,s3p1c4mkt,s3p1c4sval,s3p1c5plant,s3p1c5harv,s3p1c5mkt,s3p1c6plant,s3p1c6harv,s3p1c6mkt,s3p2c1plant,s3p2c1harv,s3p2c1mkt,s3p2c1sval,s3p2c2plant,s3p2c2harv,s3p2c2mkt,s3p2c2seed,s3p2c2sval,s3p2c3plant,s3p2c3harv,s3p2c3mkt,s3p2c4plant,s3p2c4harv,s3p2c4mkt,s3p2c5plant,s3p2c5harv,s3p2c5mkt,s3p2c6plant,s3p2c6harv,s3p2c6mkt,pc1,pc2,pc3,pc4,pc5,nyieldc1,nyieldc2,nyieldc3,nyieldc4,nyieldc5,s1p1fert,s1p1irrig1,s1p1irrig2,s1p1irrig3,s1p1irrig4,s1p1pest,s1p1wat1,s1p1wat2,s1p1wat3,s1p1wat4,s1p1wat5,s1p2fert,s1p2irrig1,s1p2irrig2,s1p2irrig3,s1p2irrig4,s1p2pest,s1p2wat1,s1p2wat2,s1p2wat3,s1p2wat4,s1p2wat5,s2p1fert,s2p1irrig1,s2p1irrig2,s2p1irrig3,s2p1irrig4,s2p1pest,s2p1wat1,s2p1wat2,s2p1wat3,s2p1wat4,s2p1wat5,s2p2fert,s2p2irrig1,s2p2irrig2,s2p2irrig3,s2p2irrig4,s2p2pest,s2p2wat1,s2p2wat2,s2p2wat3,s2p2wat4,s2p2wat5,s3p1fert,s3p1irrig1,s3p1irrig2,s3p1irrig3,s3p1irrig4,s3p1pest,s3p1wat1,s3p1wat2,s3p1wat3,s3p1wat4,s3p1wat5,s3p2fert,s3p2irrig1,s3p2irrig2
1087,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,,,0.0,0.0,.,.,0.0,.,.,0.0,,,0.0,0,,,0.0,0.0,0,,,0.0,,.,0.0,.,.,0.0,,,0.0,54.0,4.0,53.0,56.0,0.0,2400.0,1350.0,22000.0,8000.0,0.0,2750.0,1.0,0.0,0.0,0.0,6.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2800.0,1.0,0.0,0.0,0.0,14.00,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1088,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,19Aug2002,07Jan2003,30050.0,50.0,2.0,30000.0,.1480000019,75,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,,,0.0,0.0,.,.,0.0,.,.,0.0,,,0.0,0,,,0.0,0.0,0,,,0.0,,.,0.0,.,.,0.0,,,0.0,54.0,38.0,56.0,39.0,56.0,2700.0,16000.0,12000.0,4000.0,15000.0,2000.0,1.0,0.0,0.0,0.0,10.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1000.0,1.0,0.0,0.0,0.0,2.50,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,1.0,0.0,0.0,0.0,0.5,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1089,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,12Aug2002,04Nov2002,3000.0,100.0,2.0,2900.0,1,10,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,,,0.0,0.0,.,.,0.0,.,.,0.0,,,0.0,0,,,0.0,0.0,0,,,0.0,,.,0.0,.,.,0.0,,,0.0,54.0,38.0,39.0,56.0,47.0,3000.0,15000.0,3000.0,7000.0,3000.0,3100.0,1.0,0.0,0.0,0.0,6.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1350.0,1.0,0.0,0.0,0.0,5.00,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,1.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1090,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,,,0.0,0.0,.,.,0.0,.,.,0.0,,,0.0,0,,,0.0,0.0,0,,,0.0,,.,0.0,.,.,0.0,,,0.0,38.0,54.0,56.0,39.0,56.0,25000.0,2400.0,11000.0,3500.0,10000.0,3150.0,1.0,0.0,0.0,0.0,12.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400.0,1.0,0.0,0.0,0.0,5.25,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1091,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0.0,0.0,,,.,.,0.0,0.0,0.0,0.0,0.0,0.0,,,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,0.0,0,0,,,0.0,0.0,0.0,,,0.0,0.0,.,.,0.0,.,.,0.0,,,0.0,0,,,0.0,0.0,0,,,0.0,,.,0.0,.,.,0.0,,,0.0,54.0,39.0,56.0,0.0,0.0,2500.0,3000.0,16000.0,0.0,0.0,500.0,1.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,0.0,0.0,250.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,600.0,1.0,0.0,0.0,0.0,1.00,1.0,0.0,0.0,0.0,0.0,500.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,,,0.0,0.0,,,0.0,,,0.0,0,0,0.0,0,0,0,0.0,0.0,0,,,0.0,,,0.0,,,0.0,,,0.0,27.0,12.0,0.0,0.0,0.0,500.0,600.0,0.0,0.0,0.0,100.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5475,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,,,0.0,0.0,,,0.0,,,0.0,0,0,0.0,0,0,0,0.0,0.0,0,,,0.0,,,0.0,,,0.0,,,0.0,29.0,26.0,0.0,0.0,0.0,700.0,600.0,0.0,0.0,0.0,300.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5476,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,,,0.0,0.0,,,0.0,,,0.0,0,0,0.0,0,0,0,0.0,0.0,0,,,0.0,,,0.0,,,0.0,,,0.0,27.0,29.0,44.0,12.0,0.0,400.0,700.0,600.0,500.0,0.0,350.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,150.0,0.0,0.0,0.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5477,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,0.0,0,0,0,0,0.0,0.0,0.0,,,0.0,0.0,,,0.0,,,0.0,0,0,0.0,0,0,0,0.0,0.0,0,,,0.0,,,0.0,,,0.0,,,0.0,12.0,12.0,0.0,0.0,0.0,400.0,500.0,0.0,0.0,0.0,200.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [44]:
# Remove columns with missing values
third_201_400_columns_cleaned = third_201_400_columns.dropna(axis=1)

# Now, third_201_400_columns_cleaned contains the DataFrame with missing columns removed


In [45]:
third_201_400_columns_cleaned

Unnamed: 0,s2p1c5qharv,s2p1c5cons,s2p1c5lives,s2p1c5lost,s2p1c5mkt,s2p1c5sold,s2p1c5sval,s2p1c6qharv,s2p1c6cons,s2p1c6lives,s2p1c6lost,s2p1c6mkt,s2p1c6sold,s2p1c6sval,s2p2c1qharv,s2p2c1cons,s2p2c1lives,s2p2c1lost,s2p2c1mkt,s2p2c1sold,s2p2c1seed,s2p2c1sval,s2p2c2qharv,s2p2c2cons,s2p2c2lives,s2p2c2lost,s2p2c2mkt,s2p2c2sold,s2p2c2seed,s2p2c2sval,s2p2c3qharv,s2p2c3cons,s2p2c3lives,s2p2c3lost,s2p2c3mkt,s2p2c3sold,s2p2c3sval,s2p2c4qharv,s2p2c4cons,s2p2c4lives,s2p2c4lost,s2p2c4mkt,s2p2c4sold,s2p2c5qharv,s2p2c5cons,s2p2c5lives,s2p2c5lost,s2p2c5mkt,s2p2c5sold,s2p2c6qharv,s2p2c6cons,s2p2c6lives,s2p2c6lost,s2p2c6mkt,s2p2c6sold,s3p1c1qharv,s3p1c1cons,s3p1c1mkt,s3p1c1sold,s3p1c1seed,s3p1c1sval,s3p1c2qharv,s3p1c2cons,s3p1c2mkt,s3p1c2sold,s3p1c2seed,s3p1c2sval,s3p1c3seed,s3p1c4mkt,s3p1c4sval,s3p1c5mkt,s3p1c6mkt,s3p2c1mkt,s3p2c1sval,s3p2c2mkt,s3p2c2seed,s3p2c2sval,s3p2c3mkt,s3p2c4mkt,s3p2c5mkt,s3p2c6mkt,pc1,pc2,pc3,pc4,pc5,nyieldc1,nyieldc2,nyieldc3,nyieldc4,nyieldc5,s1p1fert,s1p1irrig1,s1p1irrig2,s1p1irrig3,s1p1irrig4,s1p1pest,s1p1wat2,s1p1wat3,s1p1wat4,s1p1wat5,s1p2fert,s1p2irrig1,s1p2pest,s1p2wat1,s1p2wat2,s1p2wat3,s1p2wat4,s1p2wat5,s2p1fert,s2p1irrig1,s2p1irrig2,s2p1irrig3,s2p1irrig4,s2p1pest,s2p1wat1,s2p1wat2,s2p1wat3,s2p1wat4,s2p1wat5,s2p2fert,s2p2irrig1,s2p2irrig2,s2p2irrig3,s2p2irrig4,s2p2pest,s2p2wat1,s2p2wat3,s2p2wat4,s2p2wat5,s3p1fert,s3p1irrig1,s3p1irrig2,s3p1irrig3,s3p1irrig4,s3p1pest,s3p1wat1,s3p1wat2,s3p1wat3,s3p1wat4,s3p1wat5,s3p2fert,s3p2irrig2
1087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,54.0,4.0,53.0,56.0,0.0,2400.0,1350.0,22000.0,8000.0,0.0,2750.0,1.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2800.0,1.0,0.0,0.0,0.0,14.00,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1088,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,30050.0,50.0,2.0,30000.0,.1480000019,75,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,54.0,38.0,56.0,39.0,56.0,2700.0,16000.0,12000.0,4000.0,15000.0,2000.0,1.0,0.0,0.0,0.0,10.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1000.0,1.0,0.0,0.0,0.0,2.50,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,1.0,0.0,0.0,0.0,0.5,1.0,0.0,0.0,0.0,0.0,0.0,0.0
1089,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3000.0,100.0,2.0,2900.0,1,10,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,54.0,38.0,39.0,56.0,47.0,3000.0,15000.0,3000.0,7000.0,3000.0,3100.0,1.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1350.0,1.0,0.0,0.0,0.0,5.00,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,1.0,0.0,0.0,0.0,2.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0
1090,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,38.0,54.0,56.0,39.0,56.0,25000.0,2400.0,11000.0,3500.0,10000.0,3150.0,1.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1400.0,1.0,0.0,0.0,0.0,5.25,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1091,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,54.0,39.0,56.0,0.0,0.0,2500.0,3000.0,16000.0,0.0,0.0,500.0,1.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,250.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,600.0,1.0,0.0,0.0,0.0,1.00,1.0,0.0,0.0,0.0,0.0,500.0,1.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,27.0,12.0,0.0,0.0,0.0,500.0,600.0,0.0,0.0,0.0,100.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5475,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,29.0,26.0,0.0,0.0,0.0,700.0,600.0,0.0,0.0,0.0,300.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5476,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,27.0,29.0,44.0,12.0,0.0,400.0,700.0,600.0,500.0,0.0,350.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,150.0,0.0,7.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5477,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0,0.0,0.0,0.0,0.0,12.0,12.0,0.0,0.0,0.0,400.0,500.0,0.0,0.0,0.0,200.0,4.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [51]:

# Select only numeric columns
numeric_columns = third_201_400_columns.select_dtypes(include=[float, int])

# Group and aggregate columns by similar names (you can adjust this as needed)
aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()

# Select only the first 10 columns
result = aggregated_data.iloc[:, :10]

# result now contains the DataFrame with reduced columns
result

  aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()


Unnamed: 0,nyieldc,pc,s
1087,6750.0,33.4,42.549618
1088,9940.0,48.6,483.366412
1089,6200.0,46.8,81.458015
1090,10380.0,48.6,34.895038
1091,4300.0,29.8,14.206107
...,...,...,...
5474,220.0,7.8,0.785714
5475,260.0,11.0,2.242857
5476,440.0,22.4,3.678571
5477,180.0,4.8,1.521429


In [52]:
df[['nyieldc', 'pc', 's']] = result

In [53]:
df

Unnamed: 0,farmtype,TotalPlotArea,LandSystem,TenureType,UsageYears,spcq1,spcq2,spcq3,spcq4,spcq5,spcq6,spcq7,spcq8,spcq9,spcq10,nyieldc,pc,s
1087,3.0,2.5000,3.0 0.0,1.0 0.0,16.0 0.0,24000.0,0.0,0.0,2.0,4800.0,140,2400.0,2,0.0,60000.0,6750.0,33.4,42.549618
1088,2.0,1.4417,2.0 2.0,1.0 1.0,33.0 33.0,1550.0,0.0,0.0,2.0,2480.0,60,930.0,2.5,0.0,35000.0,9940.0,48.6,483.366412
1089,2.0,1.5250,3.0 3.0,1.0 1.0,33.0 33.0,2000.0,0.0,0.0,2.0,2700.0,60,700.0,2.329999924,500.0,0.0,6200.0,46.8,81.458015
1090,2.0,1.6626,3.0 3.0,1.0 1.0,33.0 33.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2.5,0.0,38000.0,10380.0,48.6,34.895038
1091,1.0,0.6250,2.0 2.0,1.0 1.0,25.0 25.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2,0.0,14000.0,4300.0,29.8,14.206107
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,2.0,5.0000,3.0 0.0,1.0 0.0,9.0 0.0,400.0,0.0,0.0,2.0,2000.0,10,1600.0,425,200.0,0.0,220.0,7.8,0.785714
5475,2.0,8.0000,1.0 0.0,1.0 0.0,11.0 0.0,600.0,0.0,0.0,2.0,2800.0,10,2200.0,375,200.0,0.0,260.0,11.0,2.242857
5476,2.0,17.0000,3.0 2.0,1.0 1.0,26.0 18.0,1200.0,0.0,0.0,2.0,3200.0,20,2000.0,425,300.0,0.0,440.0,22.4,3.678571
5477,2.0,8.0000,3.0 0.0,1.0 0.0,8.0 0.0,600.0,0.0,0.0,2.0,2000.0,10,1400.0,450,200.0,0.0,180.0,4.8,1.521429


In [61]:
#checking out columns from index 401 to 600
fourth_401_600_columns = filtered_data.iloc[:, 401:600]
fourth_401_600_columns_names = filtered_data.columns[401:600]

In [62]:
fourth_401_600_columns

Unnamed: 0,s3p2irrig4,s3p2pest,s3p2wat1,s3p2wat2,s3p2wat3,s3p2wat4,s3p2wat5,lvsown,lvs1born,lvs1graze1,lvs1graze2,lvs1graze3,lvs1lost,lvs1num,lvs1pprice,lvs1purch,lvs1sold,lvs1sprice,lvs2born,lvs2graze1,lvs2graze2,lvs2graze3,lvs2lost,lvs2num,lvs2pprice,lvs2purch,lvs2sold,lvs2sprice,lvs3born,lvs3graze1,lvs3graze2,lvs3graze3,lvs3lost,lvs3num,lvs3pprice,lvs3purch,lvs3sold,lvs3sprice,lvs4born,lvs4graze1,lvs4graze2,lvs4graze3,lvs4lost,lvs4num,lvs4pprice,lvs4purch,lvs4sold,lvs4sprice,lvs5born,lvs5graze1,lvs5graze2,lvs5graze3,lvs5lost,lvs5num,lvs5pprice,lvs5purch,lvs5sold,lvs5sprice,lvs6born,lvs6graze1,lvs6graze2,lvs6graze3,lvs6lost,lvs6num,lvs6pprice,lvs6purch,lvs6sold,lvs6sprice,lvs7born,lvs7graze1,lvs7graze2,lvs7graze3,lvs7lost,lvs7num,lvs7pprice,lvs7purch,lvs7sold,lvs7sprice,lvs8born,lvs8graze1,lvs8graze2,lvs8graze3,lvs8lost,lvs8num,lvs8pprice,lvs8purch,lvs8sold,lvs8sprice,lvs9born,lvs9graze1,lvs9graze2,lvs9graze3,lvs9lost,lvs9num,lvs9pprice,lvs9purch,lvs9sold,lvs9sprice,lvsp1price,lvsp1sell,lvsp1use,lvsp2price,lvsp2sell,lvsp2use,lvsp3price,lvsp3sell,lvsp3use,lvsp4price,lvsp4sell,lvsp4use,lvsp5price,lvsp5sell,lvsp5use,lvsp6price,lvsp6sell,lvsp6use,lvsp7price,lvsp7sell,lvsp7use,lvsp8price,lvsp8sell,lvsp8use,lvsp9price,lvsp9sell,lvsp9use,cost1crop,cost1lvs,cost2crop,cost2lvs,cost3crop,cost3lvs,cost4crop,cost4lvs,cost5crop,cost5lvs,ad711,ad712,ad713,ad714,ad715,ad716,ad717,ad718,ad719,ad7110,ad7111,ad7112,ad7113,ad7114,ad7115,ad7116,ad7117,ad7118,ad7119,ad7120,ad7121,ad7122,ad7123,ad7124,ad7125,ad721,ad722,ad723,ad724,ad725,ad726,ad727,ad728,ad729,ad7210,ad7211,ad7212,ad731,ad732,ad733,ad734,ad735,ad736,ad741,ad742,ad743,ad744,ad745,ad746,ad747,ad751,ad752,ad753,ad754,ad755,ad756,ad757,ad758,ad759,ad7510,ad7511,ad7512,ad7513,ad7514
1087,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,5.0,3000.0,2.0,7.0,3500.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10.0,1.0,10.0,0.0,0.0,0.75,1500.0,450.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,500.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,0.0,0.0,300.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1088,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,2.0,3800.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,1000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,300.0,0.0,150.0,0.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0
1089,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,1.0,2000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,1200.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,100.0,0.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1090,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,2.0,2700.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,2000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,100.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1091,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,6.0,0.0,0.0,2.0,3600.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,14.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.00,0.0,800.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,50.0,0.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,2.0,6.0,0.0,0.0,1.0,8000.0,0.0,0.0,12.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7600.0,0.0,2850.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5475,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,3.0,7.0,0.0,9.0,0.0,0.0,0.0,0.0,3.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,7.0,16.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,2.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,3.0,0.0,0.0,1.0,95000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,320.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,150.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10000.0,0.0,3750.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5476,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,3000.0,0.0,6.0,0.0,8.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,3.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,8.0,4.0,13.0,0.0,0.0,2.0,7500.0,0.0,0.0,4.0,8.0,1.0,4.0,0.0,0.0,1.0,25000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,8.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,360.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23000.0,0.0,8250.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5477,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,51000.0,0.0,0.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,0.0,0.0,6.0,6.0,9.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6800.0,0.0,4050.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [63]:
fourth_401_600_columns_names

Index(['s3p2irrig4', 's3p2pest', 's3p2wat1', 's3p2wat2', 's3p2wat3',
       's3p2wat4', 's3p2wat5', 'lvsown', 'lvs1born', 'lvs1graze1',
       ...
       'ad755', 'ad756', 'ad757', 'ad758', 'ad759', 'ad7510', 'ad7511',
       'ad7512', 'ad7513', 'ad7514'],
      dtype='object', length=199)

In [64]:
# Remove columns with missing values
fourth_401_600_columns = fourth_401_600_columns.dropna(axis=1)

In [65]:
fourth_401_600_columns

Unnamed: 0,s3p2pest,s3p2wat1,s3p2wat2,s3p2wat3,s3p2wat4,s3p2wat5,lvsown,lvs1born,lvs1graze1,lvs1graze2,lvs1graze3,lvs1lost,lvs1num,lvs1pprice,lvs1purch,lvs1sold,lvs2born,lvs2graze3,lvs2lost,lvs2num,lvs2pprice,lvs2purch,lvs2sold,lvs2sprice,lvs3born,lvs3graze1,lvs3graze2,lvs3lost,lvs3num,lvs3pprice,lvs3purch,lvs3sprice,lvs4graze2,lvs4lost,lvs4num,lvs4pprice,lvs4purch,lvs4sprice,lvs5born,lvs5graze1,lvs5graze2,lvs5graze3,lvs5lost,lvs5num,lvs5pprice,lvs5purch,lvs5sold,lvs6born,lvs6graze2,lvs6graze3,lvs6lost,lvs6num,lvs6pprice,lvs6purch,lvs6sold,lvs7born,lvs7graze1,lvs7graze2,lvs7graze3,lvs7lost,lvs7num,lvs7pprice,lvs7purch,lvs7sold,lvs7sprice,lvs8born,lvs8graze1,lvs8graze2,lvs8graze3,lvs8lost,lvs8num,lvs8pprice,lvs8purch,lvs9born,lvs9graze1,lvs9graze2,lvs9graze3,lvs9lost,lvs9pprice,lvs9purch,lvs9sold,lvsp1price,lvsp1use,lvsp2price,lvsp2sell,lvsp2use,lvsp3price,lvsp3sell,lvsp3use,lvsp4price,lvsp4sell,lvsp4use,lvsp5price,lvsp5sell,lvsp5use,lvsp6price,lvsp6sell,lvsp6use,lvsp7price,lvsp7sell,lvsp7use,lvsp8sell,lvsp8use,lvsp9price,lvsp9sell,lvsp9use,cost1crop,cost1lvs,cost2crop,cost3crop,cost3lvs,cost4crop,cost4lvs,cost5crop,ad711,ad712,ad713,ad714,ad715,ad716,ad717,ad718,ad719,ad7110,ad7111,ad7112,ad7113,ad7114,ad7115,ad7116,ad7117,ad7118,ad7119,ad7120,ad7121,ad7122,ad7123,ad7124,ad7125,ad721,ad722,ad724,ad725,ad726,ad727,ad728,ad729,ad7210,ad7211,ad7212,ad731,ad732,ad733,ad734,ad735,ad736,ad741,ad744,ad745,ad747,ad751,ad753,ad754,ad755,ad756,ad757,ad758,ad759,ad7510,ad7511,ad7512,ad7513,ad7514
1087,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,5.0,3000.0,2.0,7.0,3500.0,0.0,0.0,0.0,0.0,2.0,0.0,0.0,0.0,0.0,0.0,5.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,15.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,10.0,0.0,0.75,450.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,500.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,0.0,300.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1088,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,2.0,3800.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,1000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,300.0,0.0,150.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,1.0
1089,0.0,0.0,0.0,0.0,0.0,0.0,1.0,2.0,0.0,0.0,0.0,0.0,4.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,1200.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,100.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1090,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,2.0,2700.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,2000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,100.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
1091,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,2.0,3600.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,14.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,800.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,200.0,0.0,50.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,9.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,12.0,2.0,6.0,0.0,0.0,8000.0,0.0,0.0,12.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7600.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5475,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,3.0,7.0,0.0,9.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,12.0,7.0,16.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,2.0,6.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,12.0,0.0,3.0,0.0,0.0,1.0,95000.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,320.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,150.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10000.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5476,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,7.0,0.0,8.0,0.0,0.0,6.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,0.0,4.0,4.0,13.0,0.0,0.0,7500.0,0.0,0.0,4.0,8.0,1.0,4.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,4.0,8.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,360.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,23000.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
5477,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3.0,0.0,0.0,0.0,0.0,6.0,0.0,3.0,0.0,0.0,6.0,6.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.00,0.0,0.0,0.0,0.0,0.0,0.0,100.0,0.0,0.0,100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,6800.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [66]:
# Select only numeric columns
numeric_columns = fourth_401_600_columns.select_dtypes(include=[float, int])

# Group and aggregate columns by similar names (you can adjust this as needed)
aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()

# Select only the first 10 columns
result = aggregated_data.iloc[:, :10]

# result now contains the DataFrame with reduced columns
result

  aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()


Unnamed: 0,ad,cost,lvs,lvsown,lvsp,s
1087,0.070175,62.50,88.500000,1.0,38.03,0.0
1088,0.122807,62.50,51.405405,1.0,40.00,0.0
1089,0.087719,43.75,0.094595,1.0,48.00,0.0
1090,0.087719,50.00,36.540541,1.0,80.00,0.0
1091,0.087719,37.50,48.891892,1.0,32.00,0.0
...,...,...,...,...,...,...
5474,0.070175,950.00,108.716216,1.0,4.48,0.0
5475,0.070175,1250.00,1285.202703,1.0,22.80,0.0
5476,0.087719,2875.00,102.378378,1.0,22.40,0.0
5477,0.070175,850.00,0.337838,1.0,8.00,0.0


In [67]:
df[['ad','cost','lvs', 'lvsown',	'lvsp',	's2']] = result

In [68]:
df

Unnamed: 0,farmtype,TotalPlotArea,LandSystem,TenureType,UsageYears,spcq1,spcq2,spcq3,spcq4,spcq5,spcq6,spcq7,spcq8,spcq9,spcq10,nyieldc,pc,s,ad,cost,lvs,lvsown,lvsp,s2
1087,3.0,2.5000,3.0 0.0,1.0 0.0,16.0 0.0,24000.0,0.0,0.0,2.0,4800.0,140,2400.0,2,0.0,60000.0,6750.0,33.4,42.549618,0.070175,62.50,88.500000,1.0,38.03,0.0
1088,2.0,1.4417,2.0 2.0,1.0 1.0,33.0 33.0,1550.0,0.0,0.0,2.0,2480.0,60,930.0,2.5,0.0,35000.0,9940.0,48.6,483.366412,0.122807,62.50,51.405405,1.0,40.00,0.0
1089,2.0,1.5250,3.0 3.0,1.0 1.0,33.0 33.0,2000.0,0.0,0.0,2.0,2700.0,60,700.0,2.329999924,500.0,0.0,6200.0,46.8,81.458015,0.087719,43.75,0.094595,1.0,48.00,0.0
1090,2.0,1.6626,3.0 3.0,1.0 1.0,33.0 33.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2.5,0.0,38000.0,10380.0,48.6,34.895038,0.087719,50.00,36.540541,1.0,80.00,0.0
1091,1.0,0.6250,2.0 2.0,1.0 1.0,25.0 25.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2,0.0,14000.0,4300.0,29.8,14.206107,0.087719,37.50,48.891892,1.0,32.00,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,2.0,5.0000,3.0 0.0,1.0 0.0,9.0 0.0,400.0,0.0,0.0,2.0,2000.0,10,1600.0,425,200.0,0.0,220.0,7.8,0.785714,0.070175,950.00,108.716216,1.0,4.48,0.0
5475,2.0,8.0000,1.0 0.0,1.0 0.0,11.0 0.0,600.0,0.0,0.0,2.0,2800.0,10,2200.0,375,200.0,0.0,260.0,11.0,2.242857,0.070175,1250.00,1285.202703,1.0,22.80,0.0
5476,2.0,17.0000,3.0 2.0,1.0 1.0,26.0 18.0,1200.0,0.0,0.0,2.0,3200.0,20,2000.0,425,300.0,0.0,440.0,22.4,3.678571,0.087719,2875.00,102.378378,1.0,22.40,0.0
5477,2.0,8.0000,3.0 0.0,1.0 0.0,8.0 0.0,600.0,0.0,0.0,2.0,2000.0,10,1400.0,450,200.0,0.0,180.0,4.8,1.521429,0.070175,850.00,0.337838,1.0,8.00,0.0


In [70]:
#checking out columns from index 401 to 600
last_601_823_columns = filtered_data.iloc[:, 601:823]
last_601_823_columns_names = filtered_data.columns[601:823]

In [71]:
last_601_823_columns

Unnamed: 0,ad7516,ad7517,ad7518,ad7519,ad7520,ad7521,ad7522,ad7523,ad7524,ad7525,ad761,ad762,ad763,ad764,ad765,ad766,ad767,ad768,ad769,ad7610,ad7611,ad7612,ad7613,ad7614,ad7615,ad7616,ad7617,ad7618,ad7619,ad7620,ad7621,ad7622,ad7623,ad7624,ad7625
1087,0.0,0.0,1.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0
1088,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0
1089,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0
1090,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0.0
1091,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0,0.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0.0
5475,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0.0
5476,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0.0
5477,0.0,0.0,0.0,0.0,0.0,0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0,0.0


In [72]:
# Select only numeric columns
numeric_columns = last_601_823_columns.select_dtypes(include=[float, int])

# Group and aggregate columns by similar names (you can adjust this as needed)
aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()

# Select only the first 10 columns
result = aggregated_data.iloc[:, :10]

# result now contains the DataFrame with reduced columns
result

  aggregated_data = numeric_columns.groupby(numeric_columns.columns.str.extract('([a-z]+)', expand=False), axis=1).mean()


Unnamed: 0,ad
1087,0.060606
1088,0.090909
1089,0.090909
1090,0.090909
1091,0.030303
...,...
5474,0.060606
5475,0.060606
5476,0.060606
5477,0.060606


In [73]:
df['ads'] = result

In [74]:
df

Unnamed: 0,farmtype,TotalPlotArea,LandSystem,TenureType,UsageYears,spcq1,spcq2,spcq3,spcq4,spcq5,spcq6,spcq7,spcq8,spcq9,spcq10,nyieldc,pc,s,ad,cost,lvs,lvsown,lvsp,s2,ads
1087,3.0,2.5000,3.0 0.0,1.0 0.0,16.0 0.0,24000.0,0.0,0.0,2.0,4800.0,140,2400.0,2,0.0,60000.0,6750.0,33.4,42.549618,0.070175,62.50,88.500000,1.0,38.03,0.0,0.060606
1088,2.0,1.4417,2.0 2.0,1.0 1.0,33.0 33.0,1550.0,0.0,0.0,2.0,2480.0,60,930.0,2.5,0.0,35000.0,9940.0,48.6,483.366412,0.122807,62.50,51.405405,1.0,40.00,0.0,0.090909
1089,2.0,1.5250,3.0 3.0,1.0 1.0,33.0 33.0,2000.0,0.0,0.0,2.0,2700.0,60,700.0,2.329999924,500.0,0.0,6200.0,46.8,81.458015,0.087719,43.75,0.094595,1.0,48.00,0.0,0.090909
1090,2.0,1.6626,3.0 3.0,1.0 1.0,33.0 33.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2.5,0.0,38000.0,10380.0,48.6,34.895038,0.087719,50.00,36.540541,1.0,80.00,0.0,0.090909
1091,1.0,0.6250,2.0 2.0,1.0 1.0,25.0 25.0,1250.0,0.0,0.0,2.0,2250.0,60,1000.0,2,0.0,14000.0,4300.0,29.8,14.206107,0.087719,37.50,48.891892,1.0,32.00,0.0,0.030303
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5474,2.0,5.0000,3.0 0.0,1.0 0.0,9.0 0.0,400.0,0.0,0.0,2.0,2000.0,10,1600.0,425,200.0,0.0,220.0,7.8,0.785714,0.070175,950.00,108.716216,1.0,4.48,0.0,0.060606
5475,2.0,8.0000,1.0 0.0,1.0 0.0,11.0 0.0,600.0,0.0,0.0,2.0,2800.0,10,2200.0,375,200.0,0.0,260.0,11.0,2.242857,0.070175,1250.00,1285.202703,1.0,22.80,0.0,0.060606
5476,2.0,17.0000,3.0 2.0,1.0 1.0,26.0 18.0,1200.0,0.0,0.0,2.0,3200.0,20,2000.0,425,300.0,0.0,440.0,22.4,3.678571,0.087719,2875.00,102.378378,1.0,22.40,0.0,0.060606
5477,2.0,8.0000,3.0 0.0,1.0 0.0,8.0 0.0,600.0,0.0,0.0,2.0,2000.0,10,1400.0,450,200.0,0.0,180.0,4.8,1.521429,0.070175,850.00,0.337838,1.0,8.00,0.0,0.060606


In [75]:
df.shape

(1800, 25)