In [None]:
import pandas as pd
import numpy as np

## Lectura dataset

In [None]:
df = pd.read_excel('inversion-minera-2000-2024.xlsx', engine='openpyxl', header=None)
df = df.iloc[5:]
df = df.iloc[:-7]

In [None]:
len(df)

156

In [None]:
df.head()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,316,317,318,319,320,321,322,323,324,325
5,DESARROLLO Y PREPARACIÓN,,,,,,,,,,...,,,,,,,,,,
6,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0.0,0.0,0.0,0.0,0.0,,,,,0.0
7,ÁNCASH,5764915.0,5764915.0,5764915.0,5839325.67,5839325.67,5839325.67,15745.0,15745.0,15745.0,...,1463499.0,1380163.0,804619.0,573803.0,720378.0,,,,,9640962.0
8,APURÍMAC,155972.67,155972.67,155972.67,334638.0,334638.0,334638.0,486312.0,486312.0,486312.0,...,1330984.0,1306917.0,2477511.0,2131464.0,1914097.0,,,,,11662147.0
9,AREQUIPA,18087.0,18087.0,18087.0,18750.0,18750.0,18750.0,9087.33,9087.33,9087.33,...,1851635.0,2646747.0,1264830.0,1166860.0,744518.0,,,,,10832705.0


## Procesamiento y reestructuración del datatset

In [None]:
def split_into_dfs(df, n):

    rows_per_df = 26
    total_rows_needed = n * rows_per_df

    if len(df) < total_rows_needed:
        raise ValueError(f"El DataFrame debe tener al menos {total_rows_needed} filas para dividirlo en {n} partes de 26 registros cada una.")

    # dfs = [df.iloc[i*rows_per_df : (i+1)*rows_per_df].copy() for i in range(n)]
    dfs = [df.iloc[i * rows_per_df : (i + 1) * rows_per_df].iloc[1:].copy() for i in range(n)]

    return dfs

In [None]:
df_desarrollo_preparacion, df_equipamento_minero, df_exploracion, df_infraestructura, df_planta_beneficio, df_otros = split_into_dfs(df, 6)

In [None]:
df_desarrollo_preparacion.head()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,316,317,318,319,320,321,322,323,324,325
6,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,0,0,0,0,0,,,,,0
7,ÁNCASH,5764915.0,5764915.0,5764915.0,5839325.67,5839325.67,5839325.67,15745.0,15745.0,15745.0,...,1463499,1380163,804619,573803,720378,,,,,9640962
8,APURÍMAC,155972.67,155972.67,155972.67,334638.0,334638.0,334638.0,486312.0,486312.0,486312.0,...,1330984,1306917,2477511,2131464,1914097,,,,,11662147
9,AREQUIPA,18087.0,18087.0,18087.0,18750.0,18750.0,18750.0,9087.33,9087.33,9087.33,...,1851635,2646747,1264830,1166860,744518,,,,,10832705
10,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,...,7376144,6747035,7317525,7669981,7372911,,,,,56806099


In [None]:
df_desarrollo_preparacion.shape

(25, 326)

In [None]:
def add_columns(df):

    if df.shape != (25, 326):
        raise ValueError("El DataFrame debe tener 25 filas y 326 columnas.")

    # Copia la columna 1 para utilizarla en las columnas nuevas
    col_to_copy = df.iloc[:, 0]

    # Inserta una columna nueva cada 14 columnas
    for i in range(14, df.shape[1] + 1, 14):
        df.insert(i, f"new_col_{i//14}", col_to_copy)

    return df

In [None]:
df_desarrollo_preparacion_nc = add_columns(df_desarrollo_preparacion)

In [None]:
def add_last_columns(df):
  col_to_copy = df.iloc[:, 0]

  df.insert(336, 'col_312', col_to_copy)

  return df

In [None]:
df_desarrollo_preparacion_nc = add_last_columns(df_desarrollo_preparacion_nc)

In [None]:
df_desarrollo_preparacion_nc.shape

(25, 350)

In [None]:
def reshape_dataframe(df):

    generated_dfs = []

    for start_col in range(0, df.shape[1], 14):
        end_col = start_col + 14
        generated_dfs.append(df.iloc[:, start_col:end_col])

    return generated_dfs

In [None]:
df_ncc_rsh_2000, df_ncc_rsh_2001, df_ncc_rsh_2002, df_ncc_rsh_2003, df_ncc_rsh_2004, df_ncc_rsh_2005, df_ncc_rsh_2006, df_ncc_rsh_2007, df_ncc_rsh_2008, df_ncc_rsh_2009, df_ncc_rsh_2010, df_ncc_rsh_2011, df_ncc_rsh_2012, df_ncc_rsh_2013, df_ncc_rsh_2014, df_ncc_rsh_2015, df_ncc_rsh_2016, df_ncc_rsh_2017, df_ncc_rsh_2018, df_ncc_rsh_2019, df_ncc_rsh_2020, df_ncc_rsh_2021, df_ncc_rsh_2022, df_ncc_rsh_2023, df_ncc_rsh_2024  = reshape_dataframe(df_desarrollo_preparacion_nc)

In [None]:

def add_column_from_df_name(df, df_name):

    new_column_value = df_name[-4:]

    df.insert(0, new_column_value, new_column_value)

    return df

## Procesamiento de inversion minera en desarrollo y preparacion

### Procesamiento del año 2000

In [None]:
df_desarrollo_preparacion_2000 = add_column_from_df_name(df_ncc_rsh_2000, 'df_ncc_rsh_2000')

In [None]:
df_desarrollo_preparacion_2000.head()

Unnamed: 0,2000,0,1,2,3,4,5,6,7,8,9,10,11,12,13
6,2000,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2000,ÁNCASH,5764915.0,5764915.0,5764915.0,5839325.67,5839325.67,5839325.67,15745.0,15745.0,15745.0,25800.33,25800.33,25800.33,34937358.0
8,2000,APURÍMAC,155972.67,155972.67,155972.67,334638.0,334638.0,334638.0,486312.0,486312.0,486312.0,235749.67,235749.67,235749.67,3638017.02
9,2000,AREQUIPA,18087.0,18087.0,18087.0,18750.0,18750.0,18750.0,9087.33,9087.33,9087.33,25311.66,25311.66,25311.66,213707.97
10,2000,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
df_desarrollo_preparacion_2000.shape

(25, 15)

In [None]:
def rename_columns(df):
  new_columns_name = ["año", "region", "enero", "febrero", "marzo", "abril", "mayo", "junio", "julio", "agosto", "setiembre", "octubre", "noviembre", "diciembre", "inversion_total"]

  df.columns = new_columns_name

  return df

In [None]:
df_desarrollo_preparacion_2000 = rename_columns(df_desarrollo_preparacion_2000)

In [None]:
df_desarrollo_preparacion_2000.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2000,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2000,ÁNCASH,5764915.0,5764915.0,5764915.0,5839325.67,5839325.67,5839325.67,15745.0,15745.0,15745.0,25800.33,25800.33,25800.33,34937358.0
8,2000,APURÍMAC,155972.67,155972.67,155972.67,334638.0,334638.0,334638.0,486312.0,486312.0,486312.0,235749.67,235749.67,235749.67,3638017.02
9,2000,AREQUIPA,18087.0,18087.0,18087.0,18750.0,18750.0,18750.0,9087.33,9087.33,9087.33,25311.66,25311.66,25311.66,213707.97
10,2000,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
def transformar_inversion_mensual(df):
    # Usamos melt para convertir las columnas de los meses en filas
    df_transformado = df.melt(
        id_vars=["año", "region"],  # Columnas que queremos mantener como identificadores
        var_name="mes",            # Nombre de la nueva columna que contendrá los meses
        value_name="inversion_mensual"  # Nombre de la nueva columna con los valores de inversión
    )

    # Renombramos las columnas y ordenamos los datos
    df_transformado = df_transformado.rename(columns={"region": "region", "año": "año", "mes": "mes", "inversion_mensual": "inversion_mensual"})

    # Ordenar los meses según su orden cronológico
    meses_ordenados = ["enero", "febrero", "marzo", "abril", "mayo", "junio", "julio", "agosto", "setiembre", "octubre", "noviembre", "diciembre"]
    df_transformado["mes"] = pd.Categorical(df_transformado["mes"], categories=meses_ordenados, ordered=True)
    df_transformado = df_transformado.sort_values(by=["region", "año", "mes"]).reset_index(drop=True)

    return df_transformado

In [None]:
df_desarrollo_preparacion_2000 = transformar_inversion_mensual(df_desarrollo_preparacion_2000)

In [None]:
df_desarrollo_preparacion_2000.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,febrero,0
2,2000,AMAZONAS,marzo,0
3,2000,AMAZONAS,abril,0
4,2000,AMAZONAS,mayo,0
...,...,...,...,...
320,2000,ÁNCASH,setiembre,15745
321,2000,ÁNCASH,octubre,25800.33
322,2000,ÁNCASH,noviembre,25800.33
323,2000,ÁNCASH,diciembre,25800.33


### procesamiento año 2001

In [None]:
df_desarrollo_preparacion_2001 = add_column_from_df_name(df_ncc_rsh_2001, 'df_ncc_rsh_2001')
df_desarrollo_preparacion_2001.head(5)

Unnamed: 0,2001,new_col_1,14,15,16,17,18,19,20,21,22,23,24,25,26
6,2001,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2001,ÁNCASH,64334.5,64334.5,64334.5,57807.83,57807.83,57807.83,32736.16,32736.16,32736.16,13098.5,13098.5,13098.5,503930.97
8,2001,APURÍMAC,159603.67,159603.67,159603.67,0.0,0.0,0.0,83260.33,83260.33,83260.33,0.0,0.0,0.0,728592.0
9,2001,AREQUIPA,238341.19,238341.19,238341.19,220895.54,220895.54,220895.54,156714.86,156714.86,156714.86,252180.93,252180.93,252180.93,2604397.56
10,2001,AYACUCHO,55263.83,55263.83,55263.83,54364.98,54364.98,54364.98,74336.04,74336.04,74336.04,353263.84,353263.84,353263.84,1611686.07


In [None]:
df_desarrollo_preparacion_2001.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2001 = rename_columns(df_desarrollo_preparacion_2001)

df_desarrollo_preparacion_2001.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2001,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2001,ÁNCASH,64334.5,64334.5,64334.5,57807.83,57807.83,57807.83,32736.16,32736.16,32736.16,13098.5,13098.5,13098.5,503930.97
8,2001,APURÍMAC,159603.67,159603.67,159603.67,0.0,0.0,0.0,83260.33,83260.33,83260.33,0.0,0.0,0.0,728592.0
9,2001,AREQUIPA,238341.19,238341.19,238341.19,220895.54,220895.54,220895.54,156714.86,156714.86,156714.86,252180.93,252180.93,252180.93,2604397.56
10,2001,AYACUCHO,55263.83,55263.83,55263.83,54364.98,54364.98,54364.98,74336.04,74336.04,74336.04,353263.84,353263.84,353263.84,1611686.07


In [None]:
df_desarrollo_preparacion_2001 = transformar_inversion_mensual(df_desarrollo_preparacion_2001)

df_desarrollo_preparacion_2001.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2001,AMAZONAS,enero,0
1,2001,AMAZONAS,febrero,0
2,2001,AMAZONAS,marzo,0
3,2001,AMAZONAS,abril,0
4,2001,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2001.shape

(325, 4)

### concatenado de df

In [None]:
df_desarrollo_preparacion_2000_2001 = pd.concat([df_desarrollo_preparacion_2000, df_desarrollo_preparacion_2001], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2001 = df_desarrollo_preparacion_2000_2001.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2001

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,PASCO,enero,205812
2,2000,MOQUEGUA,,0
3,2000,MOQUEGUA,diciembre,0
4,2000,MOQUEGUA,noviembre,0
...,...,...,...,...
645,2001,HUÁNUCO,enero,0
646,2001,HUANCAVELICA,,278931.0
647,2001,HUANCAVELICA,diciembre,47727.33
648,2001,ICA,abril,0


### procesamiento año 2002

In [None]:
df_desarrollo_preparacion_2002 = add_column_from_df_name(df_ncc_rsh_2002, 'df_ncc_rsh_2002')

df_desarrollo_preparacion_2002.head()

Unnamed: 0,2002,new_col_2,27,28,29,30,31,32,33,34,35,36,37,38,39
6,2002,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2002,ÁNCASH,29212.15,29212.15,29212.15,13442.12,13442.12,13442.12,31185.66,31185.66,31185.66,13050.0,13050.0,13050.0,260669.79
8,2002,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2002,AREQUIPA,389042.85,389042.85,389042.85,522251.88,522251.88,522251.88,510805.54,510805.54,510805.54,536425.4,536425.4,536425.4,5875577.01
10,2002,AYACUCHO,65475.35,65475.35,65475.35,41945.39,41945.39,41945.39,35891.75,35891.75,35891.75,27976.3,27976.3,27976.3,513866.37


In [None]:
df_desarrollo_preparacion_2002.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2002 = rename_columns(df_desarrollo_preparacion_2002)

df_desarrollo_preparacion_2002.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2002,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2002,ÁNCASH,29212.15,29212.15,29212.15,13442.12,13442.12,13442.12,31185.66,31185.66,31185.66,13050.0,13050.0,13050.0,260669.79
8,2002,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2002,AREQUIPA,389042.85,389042.85,389042.85,522251.88,522251.88,522251.88,510805.54,510805.54,510805.54,536425.4,536425.4,536425.4,5875577.01
10,2002,AYACUCHO,65475.35,65475.35,65475.35,41945.39,41945.39,41945.39,35891.75,35891.75,35891.75,27976.3,27976.3,27976.3,513866.37


In [None]:
df_desarrollo_preparacion_2002 = transformar_inversion_mensual(df_desarrollo_preparacion_2002)

df_desarrollo_preparacion_2002.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2002,AMAZONAS,enero,0
1,2002,AMAZONAS,febrero,0
2,2002,AMAZONAS,marzo,0
3,2002,AMAZONAS,abril,0
4,2002,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2002.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2002 = pd.concat([df_desarrollo_preparacion_2000_2001, df_desarrollo_preparacion_2002], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2002 = df_desarrollo_preparacion_2000_2002.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2002

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,agosto,0
2,2000,LAMBAYEQUE,julio,0
3,2000,AMAZONAS,febrero,0
4,2000,AMAZONAS,marzo,0
...,...,...,...,...
970,2002,HUÁNUCO,enero,0
971,2002,HUANCAVELICA,,35598.87
972,2002,HUANCAVELICA,diciembre,8248.33
973,2002,ICA,abril,0


In [None]:
df_desarrollo_preparacion_2000_2002.shape

(975, 4)

### Procesamiento año 2003

In [None]:
df_desarrollo_preparacion_2003 = add_column_from_df_name(df_ncc_rsh_2003, 'df_ncc_rsh_2003')

df_desarrollo_preparacion_2003.head()

Unnamed: 0,2003,new_col_3,40,41,42,43,44,45,46,47,48,49,50,51,52
6,2003,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2003,ÁNCASH,38039.0,38039.0,38039.0,71467.0,71467.0,71467.0,61235.67,61235.67,61235.67,53278.33,53278.33,53278.33,672060.0
8,2003,APURÍMAC,450774.33,450774.33,450774.33,707476.67,707476.67,707476.67,1256508.33,1256508.33,1256508.33,154194.33,154194.33,154194.33,7706860.98
9,2003,AREQUIPA,461224.33,461224.33,461224.33,425405.64,425405.64,425405.64,315270.67,315270.67,315270.67,141508.68,141508.68,141508.68,4030227.96
10,2003,AYACUCHO,20637.64,20637.64,20637.64,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,61912.92


In [None]:
df_desarrollo_preparacion_2003.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2003 = rename_columns(df_desarrollo_preparacion_2003)

df_desarrollo_preparacion_2003.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2003,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2003,ÁNCASH,38039.0,38039.0,38039.0,71467.0,71467.0,71467.0,61235.67,61235.67,61235.67,53278.33,53278.33,53278.33,672060.0
8,2003,APURÍMAC,450774.33,450774.33,450774.33,707476.67,707476.67,707476.67,1256508.33,1256508.33,1256508.33,154194.33,154194.33,154194.33,7706860.98
9,2003,AREQUIPA,461224.33,461224.33,461224.33,425405.64,425405.64,425405.64,315270.67,315270.67,315270.67,141508.68,141508.68,141508.68,4030227.96
10,2003,AYACUCHO,20637.64,20637.64,20637.64,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,61912.92


In [None]:
df_desarrollo_preparacion_2003 = transformar_inversion_mensual(df_desarrollo_preparacion_2003)

df_desarrollo_preparacion_2003.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2003,AMAZONAS,enero,0
1,2003,AMAZONAS,febrero,0
2,2003,AMAZONAS,marzo,0
3,2003,AMAZONAS,abril,0
4,2003,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2003.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2003 = pd.concat([df_desarrollo_preparacion_2000_2002, df_desarrollo_preparacion_2003], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2003 = df_desarrollo_preparacion_2000_2003.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2003

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,PASCO,febrero,205812
2,2000,ÁNCASH,,34937358
3,2000,MOQUEGUA,,0
4,2000,MOQUEGUA,diciembre,0
...,...,...,...,...
1295,2003,HUÁNUCO,enero,2115.54
1296,2003,HUANCAVELICA,,262144.02
1297,2003,HUANCAVELICA,diciembre,22045.1
1298,2003,ICA,abril,0


### procesamiento 2004

In [None]:
df_desarrollo_preparacion_2004 = add_column_from_df_name(df_ncc_rsh_2004, 'df_ncc_rsh_2004')

df_desarrollo_preparacion_2004.head()

Unnamed: 0,2004,new_col_4,53,54,55,56,57,58,59,60,61,62,63,64,65
6,2004,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2004,ÁNCASH,71168.67,71168.67,71168.67,74220.33,74220.33,74220.33,49073.33,49073.33,49073.33,46815.34,46815.34,46815.34,723833.01
8,2004,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2004,AREQUIPA,149978.34,149978.34,149978.34,110770.34,110770.34,110770.34,874793.99,874793.99,874793.99,871443.09,871443.09,871443.09,6020957.28
10,2004,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
df_desarrollo_preparacion_2004.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2004 = rename_columns(df_desarrollo_preparacion_2004)

df_desarrollo_preparacion_2004.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2004,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2004,ÁNCASH,71168.67,71168.67,71168.67,74220.33,74220.33,74220.33,49073.33,49073.33,49073.33,46815.34,46815.34,46815.34,723833.01
8,2004,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2004,AREQUIPA,149978.34,149978.34,149978.34,110770.34,110770.34,110770.34,874793.99,874793.99,874793.99,871443.09,871443.09,871443.09,6020957.28
10,2004,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
df_desarrollo_preparacion_2004 = transformar_inversion_mensual(df_desarrollo_preparacion_2004)

df_desarrollo_preparacion_2004.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2004,AMAZONAS,enero,0
1,2004,AMAZONAS,febrero,0
2,2004,AMAZONAS,marzo,0
3,2004,AMAZONAS,abril,0
4,2004,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2004.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2004 = pd.concat([df_desarrollo_preparacion_2000_2003, df_desarrollo_preparacion_2004], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2004 = df_desarrollo_preparacion_2000_2004.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2004

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,APURÍMAC,mayo,334638
2,2000,CUSCO,marzo,0
3,2000,LAMBAYEQUE,julio,0
4,2000,AMAZONAS,febrero,0
...,...,...,...,...
1620,2004,HUÁNUCO,enero,0
1621,2004,HUANCAVELICA,,932901.99
1622,2004,HUANCAVELICA,diciembre,149941.67
1623,2004,ICA,abril,0


### procesamiento año 2005

In [None]:
df_desarrollo_preparacion_2005 = add_column_from_df_name(df_ncc_rsh_2005, 'df_ncc_rsh_2005')

df_desarrollo_preparacion_2005.head()

Unnamed: 0,2005,new_col_5,66,67,68,69,70,71,72,73,74,75,76,77,78
6,2005,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,96810.03,96810.03,96810.03,290430.09
7,2005,ÁNCASH,50335.0,50335.0,50335.0,12857.66,12857.66,12857.66,9747.34,9747.34,9747.34,12604.67,12604.67,12604.67,256634.01
8,2005,APURÍMAC,0.0,0.0,0.0,25713.0,25713.0,25713.0,2145.67,2145.67,2145.67,3330.33,3330.33,3330.33,93567.0
9,2005,AREQUIPA,978648.17,978648.17,978648.17,1073995.08,1073995.08,1073995.08,1284211.77,1284211.77,1284211.77,863672.66,863672.66,863672.66,12601583.04
10,2005,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10756.67,10756.67,10756.67,32270.01


In [None]:
df_desarrollo_preparacion_2005 = rename_columns(df_desarrollo_preparacion_2005)

df_desarrollo_preparacion_2005.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2005,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,96810.03,96810.03,96810.03,290430.09
7,2005,ÁNCASH,50335.0,50335.0,50335.0,12857.66,12857.66,12857.66,9747.34,9747.34,9747.34,12604.67,12604.67,12604.67,256634.01
8,2005,APURÍMAC,0.0,0.0,0.0,25713.0,25713.0,25713.0,2145.67,2145.67,2145.67,3330.33,3330.33,3330.33,93567.0
9,2005,AREQUIPA,978648.17,978648.17,978648.17,1073995.08,1073995.08,1073995.08,1284211.77,1284211.77,1284211.77,863672.66,863672.66,863672.66,12601583.04
10,2005,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,10756.67,10756.67,10756.67,32270.01


In [None]:
df_desarrollo_preparacion_2005 = transformar_inversion_mensual(df_desarrollo_preparacion_2005)

df_desarrollo_preparacion_2005.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2005,AMAZONAS,enero,0
1,2005,AMAZONAS,febrero,0
2,2005,AMAZONAS,marzo,0
3,2005,AMAZONAS,abril,0
4,2005,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2005.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2005 = pd.concat([df_desarrollo_preparacion_2000_2004, df_desarrollo_preparacion_2005], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2005 = df_desarrollo_preparacion_2000_2005.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2005

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MADRE DE DIOS,noviembre,0
2,2000,PIURA,noviembre,0
3,2000,ÁNCASH,,34937358
4,2000,MOQUEGUA,,0
...,...,...,...,...
1945,2005,HUÁNUCO,enero,0
1946,2005,HUANCAVELICA,,2624111.13
1947,2005,HUANCAVELICA,diciembre,137952
1948,2005,ICA,abril,0


### procesamiento año 2006

In [None]:
df_desarrollo_preparacion_2006 = add_column_from_df_name(df_ncc_rsh_2006, 'df_ncc_rsh_2006')

df_desarrollo_preparacion_2006.head()

Unnamed: 0,2006,new_col_6,79,80,81,82,83,84,85,86,87,88,89,90,91
6,2006,AMAZONAS,103873.3,103873.3,103873.3,170256.64,170256.64,170256.64,184340.97,184340.97,184340.97,252495.0,252495.0,252495.0,2132897.73
7,2006,ÁNCASH,15880.34,15880.34,15880.34,19362.33,19362.33,19362.33,14651.33,14651.33,14651.33,916.67,916.67,916.67,152432.01
8,2006,APURÍMAC,39063.33,39063.33,39063.33,3910.33,3910.33,3910.33,50063.13,50063.13,50063.13,1335.0,1335.0,1335.0,283115.37
9,2006,AREQUIPA,931796.64,931796.64,931796.64,1628559.75,1628559.75,1628559.75,1871640.67,1871640.67,1871640.67,2000803.18,2000803.18,2000803.18,19298400.72
10,2006,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,20482.33,20482.33,20482.33,28055.0,28055.0,28055.0,145611.99


In [None]:
df_desarrollo_preparacion_2006.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2006 = rename_columns(df_desarrollo_preparacion_2006)

df_desarrollo_preparacion_2006.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2006,AMAZONAS,103873.3,103873.3,103873.3,170256.64,170256.64,170256.64,184340.97,184340.97,184340.97,252495.0,252495.0,252495.0,2132897.73
7,2006,ÁNCASH,15880.34,15880.34,15880.34,19362.33,19362.33,19362.33,14651.33,14651.33,14651.33,916.67,916.67,916.67,152432.01
8,2006,APURÍMAC,39063.33,39063.33,39063.33,3910.33,3910.33,3910.33,50063.13,50063.13,50063.13,1335.0,1335.0,1335.0,283115.37
9,2006,AREQUIPA,931796.64,931796.64,931796.64,1628559.75,1628559.75,1628559.75,1871640.67,1871640.67,1871640.67,2000803.18,2000803.18,2000803.18,19298400.72
10,2006,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,20482.33,20482.33,20482.33,28055.0,28055.0,28055.0,145611.99


In [None]:
df_desarrollo_preparacion_2006 = transformar_inversion_mensual(df_desarrollo_preparacion_2006)

df_desarrollo_preparacion_2006.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2006,AMAZONAS,enero,103873.3
1,2006,AMAZONAS,febrero,103873.3
2,2006,AMAZONAS,marzo,103873.3
3,2006,AMAZONAS,abril,170256.64
4,2006,AMAZONAS,mayo,170256.64


In [None]:
df_desarrollo_preparacion_2006.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2006.drop(df_desarrollo_preparacion_2000_2006.index, inplace=True)
df_desarrollo_preparacion_2000_2006

Unnamed: 0,año,region,mes,inversion_mensual


In [None]:
df_desarrollo_preparacion_2000_2006 = pd.concat([df_desarrollo_preparacion_2000_2005, df_desarrollo_preparacion_2006], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2006 = df_desarrollo_preparacion_2000_2006.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2006

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,APURÍMAC,marzo,155972.67
2,2000,CUSCO,mayo,0
3,2000,CUSCO,marzo,0
4,2000,LAMBAYEQUE,julio,0
...,...,...,...,...
2270,2006,HUÁNUCO,enero,0
2271,2006,HUANCAVELICA,,3455261.73
2272,2006,HUANCAVELICA,diciembre,184970.33
2273,2006,ICA,abril,0


### procesamiento año 2007

In [None]:
df_desarrollo_preparacion_2007 = add_column_from_df_name(df_ncc_rsh_2007, 'df_ncc_rsh_2007')

df_desarrollo_preparacion_2007.head()

Unnamed: 0,2007,new_col_7,92,93,94,95,96,97,98,99,100,101,102,103,104
6,2007,AMAZONAS,61323.03,61323.03,61323.03,20976.7,20976.7,20976.7,16175.0,16175.0,16175.0,76732.0,76732.0,76732.0,525620.19
7,2007,ÁNCASH,4627.0,4627.0,4627.0,8816.33,8816.33,8816.33,22525.0,22525.0,22525.0,23996.67,23996.67,23996.67,179895.0
8,2007,APURÍMAC,162282.0,162282.0,162282.0,468955.0,468955.0,468955.0,0.0,0.0,0.0,0.0,0.0,0.0,1893711.0
9,2007,AREQUIPA,1181409.67,1181409.67,1181409.67,919765.33,919765.33,919765.33,259868.46,259868.46,259868.46,805376.86,805376.86,805376.86,9499260.96
10,2007,AYACUCHO,6813.67,6813.67,6813.67,500380.67,500380.67,500380.67,0.0,0.0,0.0,0.0,0.0,0.0,1521583.02


In [None]:
df_desarrollo_preparacion_2007.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2007 = rename_columns(df_desarrollo_preparacion_2007)

df_desarrollo_preparacion_2007.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2007,AMAZONAS,61323.03,61323.03,61323.03,20976.7,20976.7,20976.7,16175.0,16175.0,16175.0,76732.0,76732.0,76732.0,525620.19
7,2007,ÁNCASH,4627.0,4627.0,4627.0,8816.33,8816.33,8816.33,22525.0,22525.0,22525.0,23996.67,23996.67,23996.67,179895.0
8,2007,APURÍMAC,162282.0,162282.0,162282.0,468955.0,468955.0,468955.0,0.0,0.0,0.0,0.0,0.0,0.0,1893711.0
9,2007,AREQUIPA,1181409.67,1181409.67,1181409.67,919765.33,919765.33,919765.33,259868.46,259868.46,259868.46,805376.86,805376.86,805376.86,9499260.96
10,2007,AYACUCHO,6813.67,6813.67,6813.67,500380.67,500380.67,500380.67,0.0,0.0,0.0,0.0,0.0,0.0,1521583.02


In [None]:
df_desarrollo_preparacion_2007 = transformar_inversion_mensual(df_desarrollo_preparacion_2007)

df_desarrollo_preparacion_2007.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2007,AMAZONAS,enero,61323.03
1,2007,AMAZONAS,febrero,61323.03
2,2007,AMAZONAS,marzo,61323.03
3,2007,AMAZONAS,abril,20976.7
4,2007,AMAZONAS,mayo,20976.7


In [None]:
df_desarrollo_preparacion_2007.shape

(325, 4)

In [None]:
df_desarrollo_preparacion_2000_2007 = pd.concat([df_desarrollo_preparacion_2000_2006, df_desarrollo_preparacion_2007], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2007 = df_desarrollo_preparacion_2000_2007.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2007

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MADRE DE DIOS,diciembre,0
2,2000,TACNA,diciembre,0
3,2000,PIURA,noviembre,0
4,2000,ÁNCASH,,34937358
...,...,...,...,...
2595,2007,HUÁNUCO,enero,0
2596,2007,HUANCAVELICA,,3230374.02
2597,2007,HUANCAVELICA,diciembre,317083.67
2598,2007,ICA,abril,0


### procesamiento año 2008

In [None]:
df_desarrollo_preparacion_2008 = add_column_from_df_name(df_ncc_rsh_2008, 'df_ncc_rsh_2008')

df_desarrollo_preparacion_2008.head()

Unnamed: 0,2008,new_col_8,105,106,107,108,109,110,111,112,113,114,115,116,117
6,2008,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2008,ÁNCASH,27548.67,27548.67,27548.67,41934.67,41934.67,41934.67,32216.67,32216.67,32216.67,15745.67,15745.67,15745.67,352337.04
8,2008,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2008,AREQUIPA,663415.21,663415.21,663415.21,884949.07,884949.07,884949.07,750126.66,750126.66,750126.66,983757.07,983757.07,983757.07,9846744.03
10,2008,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
df_desarrollo_preparacion_2008.shape

(25, 15)

In [None]:
df_desarrollo_preparacion_2008 = rename_columns(df_desarrollo_preparacion_2008)

df_desarrollo_preparacion_2008.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2008,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2008,ÁNCASH,27548.67,27548.67,27548.67,41934.67,41934.67,41934.67,32216.67,32216.67,32216.67,15745.67,15745.67,15745.67,352337.04
8,2008,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2008,AREQUIPA,663415.21,663415.21,663415.21,884949.07,884949.07,884949.07,750126.66,750126.66,750126.66,983757.07,983757.07,983757.07,9846744.03
10,2008,AYACUCHO,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [None]:
df_desarrollo_preparacion_2008 = transformar_inversion_mensual(df_desarrollo_preparacion_2008)

df_desarrollo_preparacion_2008.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2008,AMAZONAS,enero,0
1,2008,AMAZONAS,febrero,0
2,2008,AMAZONAS,marzo,0
3,2008,AMAZONAS,abril,0
4,2008,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2008 = pd.concat([df_desarrollo_preparacion_2000_2007, df_desarrollo_preparacion_2008], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2008 = df_desarrollo_preparacion_2000_2008.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2008

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,APURÍMAC,febrero,155972.67
2,2000,JUNÍN,octubre,0
3,2000,CUSCO,mayo,0
4,2000,CUSCO,marzo,0
...,...,...,...,...
2920,2008,HUÁNUCO,enero,0
2921,2008,HUANCAVELICA,,3961737.96
2922,2008,HUANCAVELICA,diciembre,314241.66
2923,2008,ICA,abril,0


### procesamiento año 2009

In [None]:
df_desarrollo_preparacion_2009 = add_column_from_df_name(df_ncc_rsh_2009, 'df_ncc_rsh_2009')

df_desarrollo_preparacion_2009.head()

Unnamed: 0,2009,new_col_9,118,119,120,121,122,123,124,125,126,127,128,129,130
6,2009,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2009,ÁNCASH,25886.33,25886.33,25886.33,63118.25,29422.0,37050.0,38303.0,77784.0,176638.0,374726.0,183180.0,178827.5,1236707.74
8,2009,APURÍMAC,0.0,0.0,0.0,148644.0,102100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,250744.0
9,2009,AREQUIPA,732894.54,732894.54,732894.54,1326369.61,1753377.71,1895644.45,2278016.02,3026241.99,3411297.54,2666724.7,2969843.15,1455698.8,22981897.59
10,2009,AYACUCHO,0.0,0.0,0.0,1132259.0,1483831.0,1491869.0,1439120.0,756462.0,1232660.0,1563295.0,1387877.0,1483743.0,11971116.0


In [None]:
df_desarrollo_preparacion_2009 = rename_columns(df_desarrollo_preparacion_2009)

df_desarrollo_preparacion_2009.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2009,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2009,ÁNCASH,25886.33,25886.33,25886.33,63118.25,29422.0,37050.0,38303.0,77784.0,176638.0,374726.0,183180.0,178827.5,1236707.74
8,2009,APURÍMAC,0.0,0.0,0.0,148644.0,102100.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,250744.0
9,2009,AREQUIPA,732894.54,732894.54,732894.54,1326369.61,1753377.71,1895644.45,2278016.02,3026241.99,3411297.54,2666724.7,2969843.15,1455698.8,22981897.59
10,2009,AYACUCHO,0.0,0.0,0.0,1132259.0,1483831.0,1491869.0,1439120.0,756462.0,1232660.0,1563295.0,1387877.0,1483743.0,11971116.0


In [None]:
df_desarrollo_preparacion_2009 = transformar_inversion_mensual(df_desarrollo_preparacion_2009)

df_desarrollo_preparacion_2009.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2009,AMAZONAS,enero,0
1,2009,AMAZONAS,febrero,0
2,2009,AMAZONAS,marzo,0
3,2009,AMAZONAS,abril,0
4,2009,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2009 = pd.concat([df_desarrollo_preparacion_2000_2008, df_desarrollo_preparacion_2009], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2009 = df_desarrollo_preparacion_2000_2009.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2009

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MADRE DE DIOS,,0
2,2000,PUNO,julio,0
3,2000,TACNA,diciembre,0
4,2000,PIURA,noviembre,0
...,...,...,...,...
3245,2009,HUÁNUCO,enero,0
3246,2009,HUANCAVELICA,,5951311.64
3247,2009,HUANCAVELICA,diciembre,807220.64
3248,2009,ICA,abril,3200


### procesamiento año 2010

In [None]:
df_desarrollo_preparacion_2010 = add_column_from_df_name(df_ncc_rsh_2010, 'df_ncc_rsh_2010')

df_desarrollo_preparacion_2010.head()

Unnamed: 0,2010,new_col_10,131,132,133,134,135,136,137,138,139,140,141,142,143
6,2010,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2010,ÁNCASH,239407.0,606553.0,219328.0,239721.0,325238.0,375610.0,354090.0,392618.98,278748.0,297400.0,283494.0,318021.0,3930228.98
8,2010,APURÍMAC,0.0,0.0,0.0,0.0,0.0,11615.48,0.0,0.0,0.0,0.0,0.0,0.0,11615.48
9,2010,AREQUIPA,2568054.46,2648516.61,2637573.95,2569669.66,2329849.55,2553364.9,1621105.79,786736.37,1088376.04,1912756.52,1885350.67,1999805.87,24601160.39
10,2010,AYACUCHO,980374.0,1060815.0,1176272.0,1072515.0,1116671.0,1587174.0,1694616.0,2068237.0,1985154.0,2088299.0,2286406.0,2743115.0,19859648.0


In [None]:
df_desarrollo_preparacion_2010 = rename_columns(df_desarrollo_preparacion_2010)

df_desarrollo_preparacion_2010.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2010,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2010,ÁNCASH,239407.0,606553.0,219328.0,239721.0,325238.0,375610.0,354090.0,392618.98,278748.0,297400.0,283494.0,318021.0,3930228.98
8,2010,APURÍMAC,0.0,0.0,0.0,0.0,0.0,11615.48,0.0,0.0,0.0,0.0,0.0,0.0,11615.48
9,2010,AREQUIPA,2568054.46,2648516.61,2637573.95,2569669.66,2329849.55,2553364.9,1621105.79,786736.37,1088376.04,1912756.52,1885350.67,1999805.87,24601160.39
10,2010,AYACUCHO,980374.0,1060815.0,1176272.0,1072515.0,1116671.0,1587174.0,1694616.0,2068237.0,1985154.0,2088299.0,2286406.0,2743115.0,19859648.0


In [None]:
df_desarrollo_preparacion_2010 = transformar_inversion_mensual(df_desarrollo_preparacion_2010)

df_desarrollo_preparacion_2010.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2010,AMAZONAS,enero,0
1,2010,AMAZONAS,febrero,0
2,2010,AMAZONAS,marzo,0
3,2010,AMAZONAS,abril,0
4,2010,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2010 = pd.concat([df_desarrollo_preparacion_2000_2009, df_desarrollo_preparacion_2010], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2010 = df_desarrollo_preparacion_2000_2010.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2010

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,APURÍMAC,enero,155972.67
2,2000,JUNÍN,febrero,0
3,2000,JUNÍN,octubre,0
4,2000,CUSCO,mayo,0
...,...,...,...,...
3570,2010,HUÁNUCO,enero,0
3571,2010,HUANCAVELICA,,7147448.21
3572,2010,HUANCAVELICA,diciembre,174345
3573,2010,ICA,abril,316411


### procesamiento año 2011

In [None]:
df_desarrollo_preparacion_2011 = add_column_from_df_name(df_ncc_rsh_2011, 'df_ncc_rsh_2011')

df_desarrollo_preparacion_2011.head()

Unnamed: 0,2011,new_col_11,144,145,146,147,148,149,150,151,152,153,154,155,156
6,2011,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2011,ÁNCASH,350489.0,347138.0,305743.0,445660.7,573454.0,333253.3,555714.0,656523.79,676212.0,819896.42,827771.72,1484908.09,7376764.02
8,2011,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2011,AREQUIPA,1782217.79,2741544.81,3831088.54,3449929.31,3797716.36,4293906.82,3914181.18,3750073.78,4868828.9,5387094.1,4925240.11,4715960.2,47457781.9
10,2011,AYACUCHO,213513.0,1767110.0,1509422.0,1511340.0,2309110.0,2446034.0,2614986.0,2592787.0,2688948.0,2619356.0,2396727.0,1408766.0,24078099.0


In [None]:
df_desarrollo_preparacion_2011 = rename_columns(df_desarrollo_preparacion_2011)

df_desarrollo_preparacion_2011.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2011,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2011,ÁNCASH,350489.0,347138.0,305743.0,445660.7,573454.0,333253.3,555714.0,656523.79,676212.0,819896.42,827771.72,1484908.09,7376764.02
8,2011,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2011,AREQUIPA,1782217.79,2741544.81,3831088.54,3449929.31,3797716.36,4293906.82,3914181.18,3750073.78,4868828.9,5387094.1,4925240.11,4715960.2,47457781.9
10,2011,AYACUCHO,213513.0,1767110.0,1509422.0,1511340.0,2309110.0,2446034.0,2614986.0,2592787.0,2688948.0,2619356.0,2396727.0,1408766.0,24078099.0


In [None]:
df_desarrollo_preparacion_2011 = transformar_inversion_mensual(df_desarrollo_preparacion_2011)

df_desarrollo_preparacion_2011.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2011,AMAZONAS,enero,0
1,2011,AMAZONAS,febrero,0
2,2011,AMAZONAS,marzo,0
3,2011,AMAZONAS,abril,0
4,2011,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2011 = pd.concat([df_desarrollo_preparacion_2000_2010, df_desarrollo_preparacion_2011], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2011 = df_desarrollo_preparacion_2000_2011.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2011

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,enero,0
2,2000,PUNO,agosto,0
3,2000,PUNO,julio,0
4,2000,TACNA,diciembre,0
...,...,...,...,...
3895,2011,HUÁNUCO,enero,0
3896,2011,HUANCAVELICA,,16276040.5
3897,2011,HUANCAVELICA,diciembre,1788179.47
3898,2011,ICA,abril,521167


### procesamiento año 2012

In [None]:
df_desarrollo_preparacion_2012 = add_column_from_df_name(df_ncc_rsh_2012, 'df_ncc_rsh_2012')

df_desarrollo_preparacion_2012.head()

Unnamed: 0,2012,new_col_12,157,158,159,160,161,162,163,164,165,166,167,168,169
6,2012,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2012,ÁNCASH,813618.99,892386.16,671495.33,751767.48,960362.31,789719.34,726925.59,704255.64,875322.09,777149.54,1029217.04,750094.86,9742314.37
8,2012,APURÍMAC,11400.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11400.0
9,2012,AREQUIPA,2756528.17,4426512.44,4802172.62,4614017.63,4557101.8,3920826.12,4580137.95,6462142.49,3814076.49,4230613.66,3873766.53,5825683.98,53863579.88
10,2012,AYACUCHO,1852554.0,1860615.0,2260501.0,2525002.94,2100005.0,3409026.2,4063959.58,4185393.75,5045043.69,5488150.37,2728292.0,2965480.0,38484023.53


In [None]:
df_desarrollo_preparacion_2012 = rename_columns(df_desarrollo_preparacion_2012)

df_desarrollo_preparacion_2012.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2012,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2012,ÁNCASH,813618.99,892386.16,671495.33,751767.48,960362.31,789719.34,726925.59,704255.64,875322.09,777149.54,1029217.04,750094.86,9742314.37
8,2012,APURÍMAC,11400.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,11400.0
9,2012,AREQUIPA,2756528.17,4426512.44,4802172.62,4614017.63,4557101.8,3920826.12,4580137.95,6462142.49,3814076.49,4230613.66,3873766.53,5825683.98,53863579.88
10,2012,AYACUCHO,1852554.0,1860615.0,2260501.0,2525002.94,2100005.0,3409026.2,4063959.58,4185393.75,5045043.69,5488150.37,2728292.0,2965480.0,38484023.53


In [None]:
df_desarrollo_preparacion_2012 = transformar_inversion_mensual(df_desarrollo_preparacion_2012)

df_desarrollo_preparacion_2012.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2012,AMAZONAS,enero,0
1,2012,AMAZONAS,febrero,0
2,2012,AMAZONAS,marzo,0
3,2012,AMAZONAS,abril,0
4,2012,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2012 = pd.concat([df_desarrollo_preparacion_2000_2011, df_desarrollo_preparacion_2012], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2012 = df_desarrollo_preparacion_2000_2012.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2012

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,,0
2,2000,ICA,,0
3,2000,JUNÍN,febrero,0
4,2000,JUNÍN,octubre,0
...,...,...,...,...
4220,2012,HUÁNUCO,enero,218896.57
4221,2012,HUANCAVELICA,,27446552.02
4222,2012,HUANCAVELICA,diciembre,2847269.66
4223,2012,ICA,abril,3100


### procesamiento año 2013

In [None]:
df_desarrollo_preparacion_2013 = add_column_from_df_name(df_ncc_rsh_2013, 'df_ncc_rsh_2013')

df_desarrollo_preparacion_2013.head()

Unnamed: 0,2013,new_col_13,170,171,172,173,174,175,176,177,178,179,180,181,182
6,2013,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2013,ÁNCASH,704044.99,1226362.42,1222932.85,1025080.72,990188.48,1005386.0,1103604.95,788062.0,476978.0,512997.65,554224.66,563421.49,10173284.21
8,2013,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2013,AREQUIPA,3899024.58,6653141.45,5111755.51,5491924.04,5521741.4,5049621.32,5697296.83,4468544.02,6651661.41,4793331.75,4272898.31,3822501.68,61433442.3
10,2013,AYACUCHO,1756134.0,2642733.0,2915116.0,3018902.0,2997439.55,1689455.51,2717457.0,1557250.0,1425472.0,1456350.0,1444641.0,1669112.0,25290062.06


In [None]:
df_desarrollo_preparacion_2013 = rename_columns(df_desarrollo_preparacion_2013)

df_desarrollo_preparacion_2013.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2013,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
7,2013,ÁNCASH,704044.99,1226362.42,1222932.85,1025080.72,990188.48,1005386.0,1103604.95,788062.0,476978.0,512997.65,554224.66,563421.49,10173284.21
8,2013,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2013,AREQUIPA,3899024.58,6653141.45,5111755.51,5491924.04,5521741.4,5049621.32,5697296.83,4468544.02,6651661.41,4793331.75,4272898.31,3822501.68,61433442.3
10,2013,AYACUCHO,1756134.0,2642733.0,2915116.0,3018902.0,2997439.55,1689455.51,2717457.0,1557250.0,1425472.0,1456350.0,1444641.0,1669112.0,25290062.06


In [None]:
df_desarrollo_preparacion_2013 = transformar_inversion_mensual(df_desarrollo_preparacion_2013)

df_desarrollo_preparacion_2013.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2013,AMAZONAS,enero,0
1,2013,AMAZONAS,febrero,0
2,2013,AMAZONAS,marzo,0
3,2013,AMAZONAS,abril,0
4,2013,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2013 = pd.concat([df_desarrollo_preparacion_2000_2012, df_desarrollo_preparacion_2013], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2013 = df_desarrollo_preparacion_2000_2013.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2013

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,febrero,0
2,2000,PUNO,setiembre,0
3,2000,PUNO,agosto,0
4,2000,PUNO,julio,0
...,...,...,...,...
4545,2013,HUÁNUCO,enero,0
4546,2013,HUANCAVELICA,,22919278.36
4547,2013,HUANCAVELICA,diciembre,1260630.18
4548,2013,ICA,abril,3237623


### procesamiento año 2014

In [None]:
df_desarrollo_preparacion_2014 = add_column_from_df_name(df_ncc_rsh_2014, 'df_ncc_rsh_2014')

df_desarrollo_preparacion_2014.head()

Unnamed: 0,2014,new_col_14,183,184,185,186,187,188,189,190,191,192,193,194,195
6,2014,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,35.0,0.0,35.0
7,2014,ÁNCASH,704858.26,850226.3,693267.01,699468.58,770063.36,844897.01,1040342.22,1062071.51,1185764.81,1369682.24,1484846.66,3073027.58,13778515.54
8,2014,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2000.0,24361.0,16000.0,42361.0
9,2014,AREQUIPA,3288667.99,3785893.2,3958680.98,4257484.11,11949519.85,6700858.03,6241671.13,5483252.08,5936900.6,5915199.28,4525028.63,3753558.13,65796714.01
10,2014,AYACUCHO,1346319.0,2043866.0,1397916.0,1516888.0,1245633.0,1599513.0,1620814.0,2664544.0,1826615.0,1748966.0,1670082.0,1704994.29,20386150.29


In [None]:
df_desarrollo_preparacion_2014 = rename_columns(df_desarrollo_preparacion_2014)

df_desarrollo_preparacion_2014.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2014,AMAZONAS,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,35.0,0.0,35.0
7,2014,ÁNCASH,704858.26,850226.3,693267.01,699468.58,770063.36,844897.01,1040342.22,1062071.51,1185764.81,1369682.24,1484846.66,3073027.58,13778515.54
8,2014,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2000.0,24361.0,16000.0,42361.0
9,2014,AREQUIPA,3288667.99,3785893.2,3958680.98,4257484.11,11949519.85,6700858.03,6241671.13,5483252.08,5936900.6,5915199.28,4525028.63,3753558.13,65796714.01
10,2014,AYACUCHO,1346319.0,2043866.0,1397916.0,1516888.0,1245633.0,1599513.0,1620814.0,2664544.0,1826615.0,1748966.0,1670082.0,1704994.29,20386150.29


In [None]:
df_desarrollo_preparacion_2014 = transformar_inversion_mensual(df_desarrollo_preparacion_2014)

df_desarrollo_preparacion_2014.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2014,AMAZONAS,enero,0
1,2014,AMAZONAS,febrero,0
2,2014,AMAZONAS,marzo,0
3,2014,AMAZONAS,abril,0
4,2014,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2014 = pd.concat([df_desarrollo_preparacion_2000_2013, df_desarrollo_preparacion_2014], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2014 = df_desarrollo_preparacion_2000_2014.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2014

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,diciembre,0
2,2000,ICA,diciembre,0
3,2000,ICA,,0
4,2000,JUNÍN,febrero,0
...,...,...,...,...
4870,2014,HUÁNUCO,enero,0
4871,2014,HUANCAVELICA,,9639808.35
4872,2014,HUANCAVELICA,diciembre,488981.57
4873,2014,ICA,abril,4202184


### procesamiento año 2015

In [None]:
df_desarrollo_preparacion_2015 = add_column_from_df_name(df_ncc_rsh_2015, 'df_ncc_rsh_2015')

df_desarrollo_preparacion_2015.head()

Unnamed: 0,2015,new_col_15,196,197,198,199,200,201,202,203,204,205,206,207,208
6,2015,AMAZONAS,1.0,1.0,18589.0,0.0,10519.0,12957.0,29098.0,16999.0,31920.0,28983.0,30411.0,44579.0,224057.0
7,2015,ÁNCASH,853946.23,850193.0,25360341.22,599857.16,744018.53,802364.22,816807.0,832836.27,821730.58,801064.41,1028948.09,831313.12,34343419.83
8,2015,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,515482.31,0.0,148230.52,206950.59,263292.36,249596.82,1383552.6
9,2015,AREQUIPA,4346580.76,5673593.41,5109386.95,5186600.49,4094931.6,4944901.81,4168225.23,4804510.99,5911167.42,4307260.29,4863300.82,5213480.45,58623940.22
10,2015,AYACUCHO,1088781.0,1299512.0,1195206.0,942142.0,1118435.0,323027.5,546524.0,657334.0,2973887.0,1576437.0,2746281.0,3157807.0,17625373.5


In [None]:
df_desarrollo_preparacion_2015 = rename_columns(df_desarrollo_preparacion_2015)

df_desarrollo_preparacion_2015.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2015,AMAZONAS,1.0,1.0,18589.0,0.0,10519.0,12957.0,29098.0,16999.0,31920.0,28983.0,30411.0,44579.0,224057.0
7,2015,ÁNCASH,853946.23,850193.0,25360341.22,599857.16,744018.53,802364.22,816807.0,832836.27,821730.58,801064.41,1028948.09,831313.12,34343419.83
8,2015,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,515482.31,0.0,148230.52,206950.59,263292.36,249596.82,1383552.6
9,2015,AREQUIPA,4346580.76,5673593.41,5109386.95,5186600.49,4094931.6,4944901.81,4168225.23,4804510.99,5911167.42,4307260.29,4863300.82,5213480.45,58623940.22
10,2015,AYACUCHO,1088781.0,1299512.0,1195206.0,942142.0,1118435.0,323027.5,546524.0,657334.0,2973887.0,1576437.0,2746281.0,3157807.0,17625373.5


In [None]:
df_desarrollo_preparacion_2015 = transformar_inversion_mensual(df_desarrollo_preparacion_2015)

df_desarrollo_preparacion_2015.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2015,AMAZONAS,enero,1
1,2015,AMAZONAS,febrero,1
2,2015,AMAZONAS,marzo,18589
3,2015,AMAZONAS,abril,0
4,2015,AMAZONAS,mayo,10519


In [None]:
df_desarrollo_preparacion_2000_2015 = pd.concat([df_desarrollo_preparacion_2000_2014, df_desarrollo_preparacion_2015], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2015 = df_desarrollo_preparacion_2000_2015.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2015

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,marzo,0
2,2000,PUNO,octubre,0
3,2000,PUNO,setiembre,0
4,2000,PUNO,agosto,0
...,...,...,...,...
5195,2015,HUÁNUCO,enero,0
5196,2015,HUANCAVELICA,,6000492.73
5197,2015,HUANCAVELICA,diciembre,549122.12
5198,2015,ICA,abril,816900


### procesamiento año 2016

In [None]:
df_desarrollo_preparacion_2016 = add_column_from_df_name(df_ncc_rsh_2016, 'df_ncc_rsh_2016')

df_desarrollo_preparacion_2016.head()

Unnamed: 0,2016,new_col_16,209,210,211,212,213,214,215,216,217,218,219,220,221
6,2016,AMAZONAS,29075.0,70413.0,64375.0,50.0,57159.0,500.0,3500.0,4000.0,270.0,20.0,2500.0,8104.0,239966.0
7,2016,ÁNCASH,739115.69,653032.76,659355.92,773662.21,615716.95,647879.62,729778.3,929457.34,835398.22,722782.23,507246.73,1109321.0,8922746.97
8,2016,APURÍMAC,0.0,87277.74,131909.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,219186.77
9,2016,AREQUIPA,3949190.46,4787931.74,4494559.27,6220525.35,6002570.1,6140217.31,2912250.76,5989161.63,8742589.06,2903302.48,6384083.58,5522129.02,64048510.76
10,2016,AYACUCHO,2235529.0,2491353.0,2638622.0,2674989.0,2619054.6,2687472.0,2706396.35,2898480.72,3280726.0,3051363.0,2876495.97,1708009.0,31868490.64


In [None]:
df_desarrollo_preparacion_2016 = rename_columns(df_desarrollo_preparacion_2016)

df_desarrollo_preparacion_2016.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2016,AMAZONAS,29075.0,70413.0,64375.0,50.0,57159.0,500.0,3500.0,4000.0,270.0,20.0,2500.0,8104.0,239966.0
7,2016,ÁNCASH,739115.69,653032.76,659355.92,773662.21,615716.95,647879.62,729778.3,929457.34,835398.22,722782.23,507246.73,1109321.0,8922746.97
8,2016,APURÍMAC,0.0,87277.74,131909.03,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,219186.77
9,2016,AREQUIPA,3949190.46,4787931.74,4494559.27,6220525.35,6002570.1,6140217.31,2912250.76,5989161.63,8742589.06,2903302.48,6384083.58,5522129.02,64048510.76
10,2016,AYACUCHO,2235529.0,2491353.0,2638622.0,2674989.0,2619054.6,2687472.0,2706396.35,2898480.72,3280726.0,3051363.0,2876495.97,1708009.0,31868490.64


In [None]:
df_desarrollo_preparacion_2016 = transformar_inversion_mensual(df_desarrollo_preparacion_2016)

df_desarrollo_preparacion_2016.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2016,AMAZONAS,enero,29075
1,2016,AMAZONAS,febrero,70413
2,2016,AMAZONAS,marzo,64375
3,2016,AMAZONAS,abril,50
4,2016,AMAZONAS,mayo,57159


In [None]:
df_desarrollo_preparacion_2000_2016 = pd.concat([df_desarrollo_preparacion_2000_2015, df_desarrollo_preparacion_2016], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2016 = df_desarrollo_preparacion_2000_2016.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2016

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,noviembre,0
2,2000,ICA,noviembre,0
3,2000,ICA,diciembre,0
4,2000,ICA,,0
...,...,...,...,...
5520,2016,HUÁNUCO,enero,687463.34
5521,2016,HUANCAVELICA,,6518156.96
5522,2016,HUANCAVELICA,diciembre,2356960.06
5523,2016,ICA,abril,4225000


### procesamiento año 2017

In [None]:
df_desarrollo_preparacion_2017 = add_column_from_df_name(df_ncc_rsh_2017, 'df_ncc_rsh_2017')

df_desarrollo_preparacion_2017.head()

Unnamed: 0,2017,new_col_17,222,223,224,225,226,227,228,229,230,231,232,233,234
6,2017,AMAZONAS,0.0,6051.0,6000.0,3500.0,3000.0,567.0,0.0,5800.0,7100.0,6500.0,7500.0,0.0,46018.0
7,2017,ÁNCASH,526566.0,355243.0,406858.0,308835.0,458781.0,487430.0,392877.0,465520.0,433038.0,451164.0,406408.07,385750.0,5078470.07
8,2017,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2017,AREQUIPA,7751125.99,8232619.75,21595540.77,16323892.35,16041094.11,8799932.45,8589861.52,4787434.49,4686132.06,4823201.99,4590667.43,4187083.43,110408586.34
10,2017,AYACUCHO,2002371.75,2319528.38,2394517.1,2255041.92,3335784.74,3236475.86,3398270.45,3165169.33,3287351.12,3505340.35,3559094.37,3427867.49,35886812.86


In [None]:
df_desarrollo_preparacion_2017 = rename_columns(df_desarrollo_preparacion_2017)

df_desarrollo_preparacion_2017.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2017,AMAZONAS,0.0,6051.0,6000.0,3500.0,3000.0,567.0,0.0,5800.0,7100.0,6500.0,7500.0,0.0,46018.0
7,2017,ÁNCASH,526566.0,355243.0,406858.0,308835.0,458781.0,487430.0,392877.0,465520.0,433038.0,451164.0,406408.07,385750.0,5078470.07
8,2017,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
9,2017,AREQUIPA,7751125.99,8232619.75,21595540.77,16323892.35,16041094.11,8799932.45,8589861.52,4787434.49,4686132.06,4823201.99,4590667.43,4187083.43,110408586.34
10,2017,AYACUCHO,2002371.75,2319528.38,2394517.1,2255041.92,3335784.74,3236475.86,3398270.45,3165169.33,3287351.12,3505340.35,3559094.37,3427867.49,35886812.86


In [None]:
df_desarrollo_preparacion_2017 = transformar_inversion_mensual(df_desarrollo_preparacion_2017)

df_desarrollo_preparacion_2017.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2017,AMAZONAS,enero,0
1,2017,AMAZONAS,febrero,6051
2,2017,AMAZONAS,marzo,6000
3,2017,AMAZONAS,abril,3500
4,2017,AMAZONAS,mayo,3000


In [None]:
df_desarrollo_preparacion_2000_2017 = pd.concat([df_desarrollo_preparacion_2000_2016, df_desarrollo_preparacion_2017], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2017 = df_desarrollo_preparacion_2000_2017.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2017

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,abril,0
2,2000,PUNO,noviembre,0
3,2000,PUNO,octubre,0
4,2000,PUNO,setiembre,0
...,...,...,...,...
5845,2017,HUÁNUCO,enero,0
5846,2017,HUANCAVELICA,,5821765.67
5847,2017,HUANCAVELICA,diciembre,754390.88
5848,2017,ICA,abril,1555088


### procesamiento año 2018

In [None]:
df_desarrollo_preparacion_2018 = add_column_from_df_name(df_ncc_rsh_2018, 'df_ncc_rsh_2018')

df_desarrollo_preparacion_2018.head()

Unnamed: 0,2018,new_col_18,235,236,237,238,239,240,241,242,243,244,245,246,247
6,2018,AMAZONAS,6700.0,0.0,0.0,0.0,8000.0,7200.0,5000.0,5000,5000,6000,6000,6000,54900.0
7,2018,ÁNCASH,500444.0,817094.0,1047120.83,645792.06,894211.23,1112216.16,1055064.23,1180748,1147798,1108130,1232431,1009316,11750365.51
8,2018,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
9,2018,AREQUIPA,2427648.28,3701736.1,3375128.04,3463181.8,3047165.87,2562038.02,3077131.41,2647751,3091491,2801881,3209424,2812036,36216612.52
10,2018,AYACUCHO,3674763.08,4029043.5,4270696.0,6541658.0,4597685.55,4271936.3,5064881.5,5212326,5735257,5143210,5483763,7546879,61572098.93


In [None]:
df_desarrollo_preparacion_2018 = rename_columns(df_desarrollo_preparacion_2018)

df_desarrollo_preparacion_2018.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2018,AMAZONAS,6700.0,0.0,0.0,0.0,8000.0,7200.0,5000.0,5000,5000,6000,6000,6000,54900.0
7,2018,ÁNCASH,500444.0,817094.0,1047120.83,645792.06,894211.23,1112216.16,1055064.23,1180748,1147798,1108130,1232431,1009316,11750365.51
8,2018,APURÍMAC,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0,0,0,0.0
9,2018,AREQUIPA,2427648.28,3701736.1,3375128.04,3463181.8,3047165.87,2562038.02,3077131.41,2647751,3091491,2801881,3209424,2812036,36216612.52
10,2018,AYACUCHO,3674763.08,4029043.5,4270696.0,6541658.0,4597685.55,4271936.3,5064881.5,5212326,5735257,5143210,5483763,7546879,61572098.93


In [None]:
df_desarrollo_preparacion_2018 = transformar_inversion_mensual(df_desarrollo_preparacion_2018)

df_desarrollo_preparacion_2018.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2018,AMAZONAS,enero,6700
1,2018,AMAZONAS,febrero,0
2,2018,AMAZONAS,marzo,0
3,2018,AMAZONAS,abril,0
4,2018,AMAZONAS,mayo,8000


In [None]:
df_desarrollo_preparacion_2000_2018 = pd.concat([df_desarrollo_preparacion_2000_2017, df_desarrollo_preparacion_2018], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2018 = df_desarrollo_preparacion_2000_2018.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2018

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,octubre,0
2,2000,ICA,octubre,0
3,2000,ICA,noviembre,0
4,2000,ICA,diciembre,0
...,...,...,...,...
6170,2018,HUÁNUCO,enero,996258.23
6171,2018,HUANCAVELICA,,3200877.88
6172,2018,HUANCAVELICA,diciembre,230484
6173,2018,ICA,abril,16477349.87


### procesamiento año 2019

In [None]:
df_desarrollo_preparacion_2019 = add_column_from_df_name(df_ncc_rsh_2019, 'df_ncc_rsh_2019')

df_desarrollo_preparacion_2019.head()

Unnamed: 0,2019,new_col_19,248,249,250,251,252,253,254,255,256,257,258,259,260
6,2019,AMAZONAS,6000,6500,6000,6000,5500,0,0,0,0,0,0,0,30000
7,2019,ÁNCASH,644381,1258927,1222900,1192722,1424709,1377920,804505,1495318,1231828,1181349,947338,729908,13511805
8,2019,APURÍMAC,709464,279351,229725,665037,542112,1418951,2031553,1465958,829123,2243078,1898353,1771494,14084199
9,2019,AREQUIPA,2259025,3169862,3124624,3195742,2940283,3304309,3071190,3040571,2736805,3056259,2522812,1328056,33749538
10,2019,AYACUCHO,5966284,5474741,5824193,5637030,4785287,5226769,5381205,4862771,4163116,4563648,3908357,4702422,60495823


In [None]:
df_desarrollo_preparacion_2019 = rename_columns(df_desarrollo_preparacion_2019)

df_desarrollo_preparacion_2019.head(5)


Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2019,AMAZONAS,6000,6500,6000,6000,5500,0,0,0,0,0,0,0,30000
7,2019,ÁNCASH,644381,1258927,1222900,1192722,1424709,1377920,804505,1495318,1231828,1181349,947338,729908,13511805
8,2019,APURÍMAC,709464,279351,229725,665037,542112,1418951,2031553,1465958,829123,2243078,1898353,1771494,14084199
9,2019,AREQUIPA,2259025,3169862,3124624,3195742,2940283,3304309,3071190,3040571,2736805,3056259,2522812,1328056,33749538
10,2019,AYACUCHO,5966284,5474741,5824193,5637030,4785287,5226769,5381205,4862771,4163116,4563648,3908357,4702422,60495823


In [None]:
df_desarrollo_preparacion_2019 = transformar_inversion_mensual(df_desarrollo_preparacion_2019)

df_desarrollo_preparacion_2019.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2019,AMAZONAS,enero,6000
1,2019,AMAZONAS,febrero,6500
2,2019,AMAZONAS,marzo,6000
3,2019,AMAZONAS,abril,6000
4,2019,AMAZONAS,mayo,5500


In [None]:
df_desarrollo_preparacion_2000_2019 = pd.concat([df_desarrollo_preparacion_2000_2018, df_desarrollo_preparacion_2019], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2019 = df_desarrollo_preparacion_2000_2019.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2019

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,mayo,0
2,2000,PUNO,diciembre,0
3,2000,PUNO,noviembre,0
4,2000,PUNO,octubre,0
...,...,...,...,...
6495,2019,HUÁNUCO,enero,1303197
6496,2019,HUANCAVELICA,,2825427
6497,2019,HUANCAVELICA,diciembre,158279
6498,2019,ICA,abril,59203819


### procesamiento año 2020

In [None]:
df_desarrollo_preparacion_2020 = add_column_from_df_name(df_ncc_rsh_2020, 'df_ncc_rsh_2020')

df_desarrollo_preparacion_2020.head()

Unnamed: 0,2020,new_col_20,261,262,263,264,265,266,267,268,269,270,271,272,273
6,2020,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2020,ÁNCASH,767384,718469,417830,270575,178169,272951,442398,325047,329087,437141,432127,490422,5081600
8,2020,APURÍMAC,1078614,2190008,2081844,1334220,1643816,542850,968868,716693,699376,808983,477531,495328,13038131
9,2020,AREQUIPA,1135026,1310036,1201516,1002203,1134758,1402516,1282817,943255,856757,929516,842664,776124,12817188
10,2020,AYACUCHO,4144597,4651299,2729131,3000,2500,2976011,1241527,905924,3166488,3494083,2597550,3120964,29033074


In [None]:
df_desarrollo_preparacion_2020 = rename_columns(df_desarrollo_preparacion_2020)

df_desarrollo_preparacion_2020.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2020,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2020,ÁNCASH,767384,718469,417830,270575,178169,272951,442398,325047,329087,437141,432127,490422,5081600
8,2020,APURÍMAC,1078614,2190008,2081844,1334220,1643816,542850,968868,716693,699376,808983,477531,495328,13038131
9,2020,AREQUIPA,1135026,1310036,1201516,1002203,1134758,1402516,1282817,943255,856757,929516,842664,776124,12817188
10,2020,AYACUCHO,4144597,4651299,2729131,3000,2500,2976011,1241527,905924,3166488,3494083,2597550,3120964,29033074


In [None]:
df_desarrollo_preparacion_2020 = transformar_inversion_mensual(df_desarrollo_preparacion_2020)

df_desarrollo_preparacion_2020.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2020,AMAZONAS,enero,0
1,2020,AMAZONAS,febrero,0
2,2020,AMAZONAS,marzo,0
3,2020,AMAZONAS,abril,0
4,2020,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2020 = pd.concat([df_desarrollo_preparacion_2000_2019, df_desarrollo_preparacion_2020], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2020 = df_desarrollo_preparacion_2000_2020.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2020

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,APURÍMAC,abril,334638
2,2000,ICA,setiembre,0
3,2000,ICA,octubre,0
4,2000,ICA,noviembre,0
...,...,...,...,...
6820,2020,HUÁNUCO,enero,83814
6821,2020,HUANCAVELICA,,2216275
6822,2020,HUANCAVELICA,diciembre,178315
6823,2020,ICA,abril,4751275


### procesamiento año 2021

In [None]:
df_desarrollo_preparacion_2021 = add_column_from_df_name(df_ncc_rsh_2021, 'df_ncc_rsh_2021')

df_desarrollo_preparacion_2021.head()

Unnamed: 0,2021,new_col_21,274,275,276,277,278,279,280,281,282,283,284,285,286
6,2021,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2021,ÁNCASH,414586,419263,422769,599074,498947,559112,556447,616213,754454,986997,846080,704889,7378831
8,2021,APURÍMAC,215885,552735,424099,546183,1002634,479264,926926,787113,714354,503989,643384,249715,7046281
9,2021,AREQUIPA,1231610,831675,865838,905136,1053137,894591,1082053,1094709,1260180,1086140,907859,859499,12072427
10,2021,AYACUCHO,3150477,3491808,3074549,3257864,3291849,3775261,4039956,4499700,4125818,4334912,4251332,4238160,45531686


In [None]:
df_desarrollo_preparacion_2021 = rename_columns(df_desarrollo_preparacion_2021)

df_desarrollo_preparacion_2021.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2021,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2021,ÁNCASH,414586,419263,422769,599074,498947,559112,556447,616213,754454,986997,846080,704889,7378831
8,2021,APURÍMAC,215885,552735,424099,546183,1002634,479264,926926,787113,714354,503989,643384,249715,7046281
9,2021,AREQUIPA,1231610,831675,865838,905136,1053137,894591,1082053,1094709,1260180,1086140,907859,859499,12072427
10,2021,AYACUCHO,3150477,3491808,3074549,3257864,3291849,3775261,4039956,4499700,4125818,4334912,4251332,4238160,45531686


In [None]:
df_desarrollo_preparacion_2021 = transformar_inversion_mensual(df_desarrollo_preparacion_2021)

df_desarrollo_preparacion_2021.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2021,AMAZONAS,enero,0
1,2021,AMAZONAS,febrero,0
2,2021,AMAZONAS,marzo,0
3,2021,AMAZONAS,abril,0
4,2021,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2021 = pd.concat([df_desarrollo_preparacion_2000_2020, df_desarrollo_preparacion_2021], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2021 = df_desarrollo_preparacion_2000_2021.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2021

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,junio,0
2,2000,PUNO,,0
3,2000,PUNO,diciembre,0
4,2000,PUNO,noviembre,0
...,...,...,...,...
7145,2021,HUÁNUCO,enero,1703
7146,2021,HUANCAVELICA,,835765
7147,2021,HUANCAVELICA,diciembre,154416
7148,2021,ICA,abril,15900285


### procesamiento año 2022

In [None]:
df_desarrollo_preparacion_2022 = add_column_from_df_name(df_ncc_rsh_2022, 'df_ncc_rsh_2022')

df_desarrollo_preparacion_2022.head()

Unnamed: 0,2022,new_col_22,287,288,289,290,291,292,293,294,295,296,297,298,299
6,2022,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2022,ÁNCASH,678756,478048,538399,545233,675558,603423,824513,1050495,835863,973432,881243,1014861,9099824
8,2022,APURÍMAC,398396,513447,1301580,721953,529482,533472,1177632,636795,1358424,1176504,1931642,1827311,12106638
9,2022,AREQUIPA,907561,1388005,2044958,1666078,1902755,1759003,2151858,1227682,1822580,1146826,10070927,1626484,27714717
10,2022,AYACUCHO,3540650,3775656,4258422,4596675,6475320,5142905,5361639,5466941,5696063,5418746,5972537,5008371,60713925


In [None]:
df_desarrollo_preparacion_2022 = rename_columns(df_desarrollo_preparacion_2022)

df_desarrollo_preparacion_2022.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2022,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2022,ÁNCASH,678756,478048,538399,545233,675558,603423,824513,1050495,835863,973432,881243,1014861,9099824
8,2022,APURÍMAC,398396,513447,1301580,721953,529482,533472,1177632,636795,1358424,1176504,1931642,1827311,12106638
9,2022,AREQUIPA,907561,1388005,2044958,1666078,1902755,1759003,2151858,1227682,1822580,1146826,10070927,1626484,27714717
10,2022,AYACUCHO,3540650,3775656,4258422,4596675,6475320,5142905,5361639,5466941,5696063,5418746,5972537,5008371,60713925


In [None]:
df_desarrollo_preparacion_2022 = transformar_inversion_mensual(df_desarrollo_preparacion_2022)

df_desarrollo_preparacion_2022.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2022,AMAZONAS,enero,0
1,2022,AMAZONAS,febrero,0
2,2022,AMAZONAS,marzo,0
3,2022,AMAZONAS,abril,0
4,2022,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2022 = pd.concat([df_desarrollo_preparacion_2000_2021, df_desarrollo_preparacion_2022], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2022 = df_desarrollo_preparacion_2000_2022.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2022

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,setiembre,0
2,2000,ICA,agosto,0
3,2000,ICA,setiembre,0
4,2000,ICA,octubre,0
...,...,...,...,...
7470,2022,HUÁNUCO,enero,210020
7471,2022,HUANCAVELICA,,1956640
7472,2022,HUANCAVELICA,diciembre,338971
7473,2022,ICA,abril,11159999


### procesamiento año 2023

In [None]:
df_desarrollo_preparacion_2023 = add_column_from_df_name(df_ncc_rsh_2023, 'df_ncc_rsh_2023')

df_desarrollo_preparacion_2023.head()

Unnamed: 0,2023,new_col_23,300,301,302,303,304,305,306,307,308,309,310,311,312
6,2023,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2023,ÁNCASH,1019169,1042392,1456465,3195508,1257680,1251717,1282351,1268139,1534434,1546849,1615487,1240134,17710325
8,2023,APURÍMAC,925184,1074607,1293793,1069707,1387174,1051839,1781305,1342144,1604163,3310354,2261518,3186498,20288286
9,2023,AREQUIPA,1661859,1912870,1581081,1916813,1753752,1743398,1719315,2128919,1920192,1632677,1896610,2160563,22028049
10,2023,AYACUCHO,5867736,4843444,5908701,5669610,5590510,5554484,5729355,6240227,5605253,5600667,6404392,6872629,69887008


In [None]:
df_desarrollo_preparacion_2023 = rename_columns(df_desarrollo_preparacion_2023)

df_desarrollo_preparacion_2023.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2023,AMAZONAS,0,0,0,0,0,0,0,0,0,0,0,0,0
7,2023,ÁNCASH,1019169,1042392,1456465,3195508,1257680,1251717,1282351,1268139,1534434,1546849,1615487,1240134,17710325
8,2023,APURÍMAC,925184,1074607,1293793,1069707,1387174,1051839,1781305,1342144,1604163,3310354,2261518,3186498,20288286
9,2023,AREQUIPA,1661859,1912870,1581081,1916813,1753752,1743398,1719315,2128919,1920192,1632677,1896610,2160563,22028049
10,2023,AYACUCHO,5867736,4843444,5908701,5669610,5590510,5554484,5729355,6240227,5605253,5600667,6404392,6872629,69887008


In [None]:
df_desarrollo_preparacion_2023 = transformar_inversion_mensual(df_desarrollo_preparacion_2023)

df_desarrollo_preparacion_2023.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2023,AMAZONAS,enero,0
1,2023,AMAZONAS,febrero,0
2,2023,AMAZONAS,marzo,0
3,2023,AMAZONAS,abril,0
4,2023,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2023 = pd.concat([df_desarrollo_preparacion_2000_2022, df_desarrollo_preparacion_2023], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2023 = df_desarrollo_preparacion_2000_2023.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2023

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,MOQUEGUA,julio,0
2,2000,SAN MARTÍN,enero,0
3,2000,PUNO,,0
4,2000,PUNO,diciembre,0
...,...,...,...,...
7795,2023,HUÁNUCO,enero,40020
7796,2023,HUANCAVELICA,,2599290
7797,2023,HUANCAVELICA,diciembre,457289
7798,2023,ICA,abril,10859185


### procesamiento año 2024

In [None]:
df_desarrollo_preparacion_2024 = add_column_from_df_name(df_ncc_rsh_2024, 'df_ncc_rsh_2024')

df_desarrollo_preparacion_2024.head()

Unnamed: 0,2024,col_312,313,314,315,316,317,318,319,320,321,322,323,324,325
6,2024,AMAZONAS,0,0,0,0,0,0,0,0,,,,,0
7,2024,ÁNCASH,1628139,1518038,1552323,1463499,1380163,804619,573803,720378,,,,,9640962
8,2024,APURÍMAC,509742,825800,1165632,1330984,1306917,2477511,2131464,1914097,,,,,11662147
9,2024,AREQUIPA,1220706,1156590,780819,1851635,2646747,1264830,1166860,744518,,,,,10832705
10,2024,AYACUCHO,7013815,6622059,6686629,7376144,6747035,7317525,7669981,7372911,,,,,56806099


In [None]:
df_desarrollo_preparacion_2024 = rename_columns(df_desarrollo_preparacion_2024)

df_desarrollo_preparacion_2024.head(5)

Unnamed: 0,año,region,enero,febrero,marzo,abril,mayo,junio,julio,agosto,setiembre,octubre,noviembre,diciembre,inversion_total
6,2024,AMAZONAS,0,0,0,0,0,0,0,0,,,,,0
7,2024,ÁNCASH,1628139,1518038,1552323,1463499,1380163,804619,573803,720378,,,,,9640962
8,2024,APURÍMAC,509742,825800,1165632,1330984,1306917,2477511,2131464,1914097,,,,,11662147
9,2024,AREQUIPA,1220706,1156590,780819,1851635,2646747,1264830,1166860,744518,,,,,10832705
10,2024,AYACUCHO,7013815,6622059,6686629,7376144,6747035,7317525,7669981,7372911,,,,,56806099


In [None]:
df_desarrollo_preparacion_2024 = transformar_inversion_mensual(df_desarrollo_preparacion_2024)

df_desarrollo_preparacion_2024.head(5)

Unnamed: 0,año,region,mes,inversion_mensual
0,2024,AMAZONAS,enero,0
1,2024,AMAZONAS,febrero,0
2,2024,AMAZONAS,marzo,0
3,2024,AMAZONAS,abril,0
4,2024,AMAZONAS,mayo,0


In [None]:
df_desarrollo_preparacion_2000_2024 = pd.concat([df_desarrollo_preparacion_2000_2023, df_desarrollo_preparacion_2024], ignore_index=True)

# Ordenamos de menor a mayor por la columna "año"
df_desarrollo_preparacion_2000_2024 = df_desarrollo_preparacion_2000_2024.sort_values(by="año", ascending=True).reset_index(drop=True)
df_desarrollo_preparacion_2000_2024

Unnamed: 0,año,region,mes,inversion_mensual
0,2000,AMAZONAS,enero,0
1,2000,AMAZONAS,julio,0
2,2000,ICA,julio,0
3,2000,ICA,agosto,0
4,2000,ICA,setiembre,0
...,...,...,...,...
8120,2024,HUÁNUCO,enero,20
8121,2024,HUANCAVELICA,,6066593
8122,2024,HUANCAVELICA,diciembre,
8123,2024,ICA,abril,11114833


In [None]:
df_desarrollo_preparacion_2000_2024['id'] = range(1, len(df_desarrollo_preparacion_2000_2024) + 1)

In [None]:
df_desarrollo_preparacion_2000_2024 = df_desarrollo_preparacion_2000_2024[['id'] + [col for col in df_desarrollo_preparacion_2000_2024.columns if col != 'id']]

In [None]:
df_desarrollo_preparacion_2000_2024

Unnamed: 0,id,año,region,mes,inversion_mensual
0,1,2000,AMAZONAS,enero,0
1,2,2000,AMAZONAS,julio,0
2,3,2000,ICA,julio,0
3,4,2000,ICA,agosto,0
4,5,2000,ICA,setiembre,0
...,...,...,...,...,...
8120,8121,2024,HUÁNUCO,enero,20
8121,8122,2024,HUANCAVELICA,,6066593
8122,8123,2024,HUANCAVELICA,diciembre,
8123,8124,2024,ICA,abril,11114833


In [None]:
df_desarrollo_preparacion_2000_2024.to_csv('process_data/df_inversion_minera_desarrollo_preparacion_2000_2024.csv', index=False)