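# Merge the split NDVI data sets and reshape them for further analysis
Before running this notebook, download both parts of the NDVI data set (`ndvi_CWP_2022_watering_p1.csv` and `ndvi_CWP_2022_watering_p2.csv`) into the `data/` directory.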

In [1]:
import pandas as pd


In [2]:
# Load each half of the split NDVI export into its own frame.
df_p1, df_p2 = (
    pd.read_csv(csv_path)
    for csv_path in (
        "data/ndvi_CWP_2022_watering_p1.csv",
        "data/ndvi_CWP_2022_watering_p2.csv",
    )
)

# Stack the two parts vertically and renumber the rows 0..n-1.
df = pd.concat((df_p1, df_p2), axis=0, ignore_index=True)

In [3]:

# Reshape long -> wide: one row per tree_id, one NDVI column per month.
df_wide = (
    df.pivot_table(
        index="tree_id",
        columns="month",
        values="NDVI",
        aggfunc="mean",  # average duplicate (tree_id, month) readings
    )
    # int() keeps the labels as "NDVI_m3" even when pandas parsed `month` as
    # float (e.g. 3.0 because the column contains missing values) or as a
    # numeric string; otherwise the reindex below would silently yield
    # all-NaN columns. A non-numeric month now fails loudly here instead.
    .rename(columns=lambda m: f"NDVI_m{int(m)}")
    # Drop the leftover "month" name on the columns axis so it does not show
    # up as a stray header label above the row index.
    .rename_axis(columns=None)
    .reset_index()
)

# Enforce a fixed column layout for months 3–9: a month missing from the data
# becomes an all-NaN column, and any month outside this range is dropped.
all_months = [f"NDVI_m{m}" for m in range(3, 10)]
df_wide = df_wide.reindex(columns=["tree_id"] + all_months)

print(df_wide.head())


month            tree_id   NDVI_m3   NDVI_m4   NDVI_m5   NDVI_m6   NDVI_m7  \
0      00008100:000c09d7  0.224754  0.268153  0.306351  0.276893  0.251684   
1      00008100:000c09e9  0.157686  0.199009  0.183150  0.220465  0.204459   
2      00008100:000c09ea  0.180522  0.211626  0.199039  0.230015  0.227425   
3      00008100:000c0a20  0.309235  0.346179  0.363654  0.332270  0.322522   
4      00008100:000c0a21  0.352739  0.492772  0.479558  0.477902  0.478470   

month   NDVI_m8   NDVI_m9  
0      0.203854  0.358751  
1      0.187151  0.210316  
2      0.216174  0.237977  
3      0.311283  0.398499  
4      0.457277  0.547352  
