In [None]:
import pandas as pd

# Read the raw NDVI sample export into a DataFrame.
file_path = r'1_Raichur_NDVI_SampledPoints_2010_2023.csv'
data = pd.read_csv(file_path)

# Show the schema and a preview of the first rows; sep="\n" puts each
# heading on its own line above the object it introduces.
print("Columns in the CSV:", data.columns, sep="\n")
print("\nFirst 5 rows in the CSV:", data.head(), sep="\n")


Columns in the CSV:
Index(['system:index', 'NDVI', 'date', 'latitude', 'longitude', '.geo'], dtype='object')

First 5 rows in the CSV:
     system:index    NDVI        date   latitude  longitude  \
0  2010_01_01_0_0  0.3633  2010-01-01  16.056737  76.506498   
1  2010_01_01_1_0  0.5937  2010-01-01  16.090461  76.748791   
2  2010_01_01_2_0  0.3168  2010-01-01  15.726236  76.754677   
3  2010_01_01_3_0  0.4591  2010-01-01  16.128682  76.574005   
4  2010_01_01_4_0  0.4924  2010-01-01  16.025261  77.313135   

                                                .geo  
0  {"geodesic":false,"type":"Point","coordinates"...  
1  {"geodesic":false,"type":"Point","coordinates"...  
2  {"geodesic":false,"type":"Point","coordinates"...  
3  {"geodesic":false,"type":"Point","coordinates"...  
4  {"geodesic":false,"type":"Point","coordinates"...  


In [None]:
# Remove the 'system:index' and '.geo' columns and save the remaining table.
# `data` is rebound to the result, so on a second execution of this cell the
# two columns are already absent; errors='ignore' makes that a no-op instead
# of a KeyError, keeping the cell safe to re-run.
data = data.drop(columns=['system:index', '.geo'], errors='ignore')

print("\nData after dropping 'system:index' and '.geo':")
print(data.head())

# Persist without the DataFrame index so the file holds only the data columns.
output_file_path = r'2_Processed_Raichur_NDVI_SampledPoints.csv'
data.to_csv(output_file_path, index=False)


Data after dropping 'system:index' and '.geo':
     NDVI        date   latitude  longitude
0  0.3633  2010-01-01  16.056737  76.506498
1  0.5937  2010-01-01  16.090461  76.748791
2  0.3168  2010-01-01  15.726236  76.754677
3  0.4591  2010-01-01  16.128682  76.574005
4  0.4924  2010-01-01  16.025261  77.313135


In [None]:
# Count how many rows share each exact (latitude, longitude) pair.
# Grouping is on the unrounded float values, so coordinates that print the
# same at display precision can still land in separate groups.
location_keys = ['latitude', 'longitude']
grouped_data = (
    data
    .groupby(location_keys)
    .size()
    .reset_index(name='count')
)

print("\nGrouped data by latitude and longitude with count of data points:")
print(grouped_data)

# Write the per-location counts to disk (no index column).
output_grouped_file = r'3_Grouped_Raichur_NDVI_SampledPoints.csv'
grouped_data.to_csv(output_grouped_file, index=False)


Grouped data by latitude and longitude with count of data points:
      latitude  longitude  count
0    15.650239  76.733093      5
1    15.650684  76.733260      1
2    15.652042  76.733769    215
3    15.652042  76.733769     62
4    15.652042  76.733769     18
..         ...        ...    ...
245  16.468176  77.016256    216
246  16.468176  77.016256     62
247  16.468176  77.016256     18
248  16.468621  77.016433      5
249  16.469066  77.016610      1

[250 rows x 3 columns]


In [None]:
import pandas as pd

# Input: per-location counts; output: counts re-aggregated on rounded coordinates.
csv_path = r"3_Grouped_Raichur_NDVI_SampledPoints.csv"
output_path = r"4_Grouped_Raichur_NDVI_SampledPoints_Summed.csv"

df = pd.read_csv(csv_path)

# Round both coordinates to two decimals so that near-identical positions
# collapse onto the same key before the counts are summed.
for coord in ('latitude', 'longitude'):
    df[coord] = df[coord].round(2)

# One row per rounded location, with the counts of all merged rows added up.
grouped_df = df.groupby(['latitude', 'longitude'], as_index=False)['count'].sum()

grouped_df.to_csv(output_path, index=False)
print("Processed CSV saved to:", output_path)


Processed CSV saved to: 4_Grouped_Raichur_NDVI_SampledPoints_Summed.csv


In [None]:
import pandas as pd

# Input: summed counts per rounded location; output: the well-sampled subset.
csv_path = r"4_Grouped_Raichur_NDVI_SampledPoints_Summed.csv"
output_path = r"5_Grouped_Raichur_NDVI_SampledPoints_Filtered.csv"

df = pd.read_csv(csv_path)

# Keep only locations whose total count is strictly greater than 250.
has_enough_points = df['count'].gt(250)
filtered_df = df.loc[has_enough_points]

filtered_df.to_csv(output_path, index=False)
print("Filtered CSV saved to:", output_path)


Filtered CSV saved to: 5_Grouped_Raichur_NDVI_SampledPoints_Filtered.csv


In [None]:
import os
import pandas as pd

# Split the NDVI table into one sub-folder per rounded (latitude, longitude)
# location under `raichur_folder`, and write a text file mapping each location
# to its folder name.

# Path to the input CSV file
# NOTE(review): no cell in this notebook writes this file. The preceding cell
# writes "5_Grouped_..._Filtered.csv", which holds only latitude/longitude/count,
# whereas this cell needs 'NDVI' and 'date' columns -- confirm how this
# per-observation file is produced so the notebook can run from a fresh kernel.
csv_path = r"5_Processed_Raichur_NDVI_SampledPoints_Filtered.csv"

df = pd.read_csv(csv_path)

# Round to two decimals so rows are grouped on the same rounded location keys.
df['latitude'] = df['latitude'].round(2)
df['longitude'] = df['longitude'].round(2)

raichur_folder = r"Raichur"
# exist_ok=True replaces the check-then-create pattern and is a no-op when the
# folder is already there.
os.makedirs(raichur_folder, exist_ok=True)

# Maps "lat,lon" -> "LocationN" for the mapping file written at the end.
lat_lon_to_folder = {}

# Folders are numbered from 1 in groupby iteration order.
location_counter = 1

for (lat, lon), group in df.groupby(['latitude', 'longitude']):
    location_folder = os.path.join(raichur_folder, f"Location{location_counter}")
    # Without exist_ok=True a second run of this cell raises FileExistsError
    # because the LocationN folders from the previous run are still present.
    os.makedirs(location_folder, exist_ok=True)

    # Keep only the analysis columns and store them in a file named after
    # the rounded coordinates of this location.
    location_data = group[['NDVI', 'date', 'latitude', 'longitude']]
    location_data.to_csv(os.path.join(location_folder, f"data_{lat}_{lon}.csv"), index=False)

    lat_lon_to_folder[f"{lat},{lon}"] = f"Location{location_counter}"

    location_counter += 1

# One "lat,lon -> LocationN" line per location.
with open(os.path.join(raichur_folder, "lat_lon_to_folder_mapping.txt"), 'w') as f:
    for lat_lon, folder_name in lat_lon_to_folder.items():
        f.write(f"{lat_lon} -> {folder_name}\n")

print(f"Data has been organized and saved in {raichur_folder}.")


Data has been organized and saved in C:\Users\anand\Code_basics\GDA\GDA_Project\GDA_Final\Raichur.
