In [1]:
import pandas as pd

# Name of the CSV file to load (change it if yours was saved under another name).
csv_filename = 'house_data_classificacao.csv'

# Mapping {'old_name': 'new_name'} from the coded column names to readable ones.
# Columns that are not listed here (e.g. 'binaryClass') keep their name.
column_mapping = {
    'P1': 'Population',
    'P5p1': 'HouseholdSize',
    'P6p2': 'RacePctWhite',
    'P11p4': 'RentQrange',
    'P14p9': 'PctPopUnder18',
    'P15p1': 'PctPopOver65',
    'P15p3': 'PctRecentImmig',
    'P16p2': 'PctUnemployed',
    'P18p2': 'PctOccupMgmt',
    'P27p4': 'PctSameHouse1985',
    'H2p2': 'Households',
    'H8p2': 'MedianHouseAge',
    'H10p1': 'MedianIncome',
    'H13p1': 'PctVacant',
    'H18pA': 'OwnRentRatio',
    'H40p4': 'PctLargHouseLiv',
}


def rename_known_columns(frame, mapping):
    """Apply ``mapping`` to the columns of ``frame`` without mutating it.

    Args:
        frame: DataFrame whose columns should be renamed.
        mapping: dict of ``{old_name: new_name}``.

    Returns:
        A ``(renamed, missing)`` tuple. ``renamed`` is a new DataFrame with the
        mapping applied; ``missing`` lists, in mapping order, the keys of
        ``mapping`` that are not columns of ``frame`` and therefore could not
        be renamed.
    """
    missing = [old_name for old_name in mapping if old_name not in frame.columns]
    return frame.rename(columns=mapping), missing


try:
    # Read the CSV file into a DataFrame.
    raw_df = pd.read_csv(csv_filename)
    print("Arquivo CSV original carregado com sucesso.")
    print("Colunas originais:", raw_df.columns.tolist())

    # DataFrame.rename silently skips mapping keys that are not present, so the
    # unmatched keys are collected and reported instead of always claiming
    # success. This matters when the file on disk already carries the readable
    # names (a later cell writes the renamed frame back to this same path).
    df, missing_columns = rename_known_columns(raw_df, column_mapping)
    if missing_columns:
        print(
            f"\nAVISO: {len(missing_columns)} coluna(s) do mapeamento não foram "
            f"encontradas no arquivo e não foram renomeadas: {missing_columns}"
        )
    else:
        print("\nColunas renomeadas com sucesso!")

    # --- Verification ---
    print("\n--- Visualizando as 5 primeiras linhas com as colunas legíveis: ---")
    print(df.head())

    print("\nNovas colunas:", df.columns.tolist())

except FileNotFoundError:
    # Friendly hint for the most likely mistake (wrong file name / location).
    print(f"ERRO: Arquivo '{csv_filename}' não encontrado. Verifique o nome do arquivo.")
except Exception as e:
    # Keep the short message, but re-raise so the traceback is not lost and
    # execution stops here rather than at a later cell with an unrelated error.
    print(f"Ocorreu um erro: {e}")
    raise

Arquivo CSV original carregado com sucesso.
Colunas originais: ['P1', 'P5p1', 'P6p2', 'P11p4', 'P14p9', 'P15p1', 'P15p3', 'P16p2', 'P18p2', 'P27p4', 'H2p2', 'H8p2', 'H10p1', 'H13p1', 'H18pA', 'H40p4', 'binaryClass']

Colunas renomeadas com sucesso!

--- Visualizando as 5 primeiras linhas com as colunas legíveis: ---
   Population  HouseholdSize  RacePctWhite  RentQrange  PctPopUnder18  \
0     15512.0       0.460869      0.049252    0.226470       0.149827   
1      1550.0       0.470968      0.002581    0.137419       0.096342   
2      4741.0       0.485341      0.000211    0.189412       0.135656   
3       467.0       0.498929      0.000000    0.100642       0.085470   
4       310.0       0.474194      0.680645    0.225807       0.128834   

   PctPopOver65  PctRecentImmig  PctUnemployed  PctOccupMgmt  \
0      0.752837        0.010057       0.579729      0.003251   
1      0.862581        0.000000       0.695142      0.005025   
2      0.856992        0.000000       0.683584     

In [2]:
# Show the first 20 rows of the DataFrame as this cell's output.
df.head(n=20)

Unnamed: 0,Population,HouseholdSize,RacePctWhite,RentQrange,PctPopUnder18,PctPopOver65,PctRecentImmig,PctUnemployed,PctOccupMgmt,PctSameHouse1985,Households,MedianHouseAge,MedianIncome,PctVacant,OwnRentRatio,PctLargHouseLiv,binaryClass
0,15512.0,0.460869,0.049252,0.22647,0.149827,0.752837,0.010057,0.579729,0.003251,0.075912,0.625318,0.036613,0.991377,0.260116,0.052246,0.774059,b'N'
1,1550.0,0.470968,0.002581,0.137419,0.096342,0.862581,0.0,0.695142,0.005025,0.043551,0.064263,0.00335,0.994975,0.285267,0.060606,0.142857,b'P'
2,4741.0,0.485341,0.000211,0.189412,0.135656,0.856992,0.0,0.683584,0.004143,0.027965,0.065796,0.0,0.997411,0.315433,0.065116,0.6875,b'P'
3,467.0,0.498929,0.0,0.100642,0.08547,0.907923,0.0,0.780488,0.006098,0.018293,0.057471,0.0,1.0,0.149425,0.139535,1.0,b'P'
4,310.0,0.474194,0.680645,0.225807,0.128834,0.896774,0.0,0.756303,0.008403,0.016807,0.077519,0.672269,0.991597,0.147287,0.0,0.0,b'P'
5,461.0,0.475054,0.086768,0.130152,0.095041,0.924078,0.0,0.792683,0.0,0.006098,0.088889,0.054878,0.993902,0.272222,0.294118,0.5,b'P'
6,723.0,0.506224,0.0,0.121715,0.109244,0.865837,0.0,0.724138,0.011494,0.072797,0.1,0.0,1.0,0.189655,0.146342,0.0,b'P'
7,75728.0,0.468334,0.291213,0.169686,0.123913,0.795254,0.009719,0.614848,0.002398,0.062126,0.083928,0.263982,0.987077,0.381526,0.024669,0.248781,b'N'
8,2949.0,0.467955,0.004408,0.1804,0.135755,0.828416,0.012886,0.674938,0.002481,0.047974,0.197211,0.004136,0.995037,0.23506,0.042857,0.571429,b'N'
9,4490.0,0.5098,0.00735,0.051893,0.035438,0.95078,0.003118,0.885986,0.001584,0.037213,0.026965,0.009501,0.777514,0.190293,0.24537,0.0,b'N'


In [3]:
# Destination path for the CSV export.
# NOTE: this is the same path that cell In [1] passes to pd.read_csv, so the
# file that was loaded there is overwritten by this write.
csv_filename = 'house_data_classificacao.csv'

# Write the current DataFrame to that path, leaving the row index out of the file.
df.to_csv(path_or_buf=csv_filename, index=False)