# Convert Excel to csv files with format
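This notebook converts every Excel (.xlsx) file in the `xlsx_files` directory into a CSV file in the `output` directory. Columns that contain no data are dropped, the auto-generated 'Unnamed' column headers are blanked out, and spaces and hyphens in the remaining headers are replaced with underscores.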

In [1]:
import os
import pandas as pd

In [2]:
# Working directory of the running kernel; the cells below build the
# 'output' and 'xlsx_files' paths relative to it.
current_directory = os.getcwd()
# Bare expression so the notebook displays the resolved path
current_directory

'c:\\Users\\PLLOBET.DISTFORM\\Desktop\\UdL\\TFM\\csv-parser'

Create 'output' directory if it does not exist

In [3]:
# Folder that receives the generated CSV files
output_directory = os.path.join(current_directory, 'output')
# exist_ok=True makes re-running this cell safe when the folder already exists
os.makedirs(output_directory, exist_ok=True)
# Displays the entries of the working directory (now including 'output')
os.listdir(current_directory)

['format_csv.ipynb', 'output', 'venv', 'xlsx_files']

Initializes a list to store the names of the converted files, then iterates through all the .xlsx files in the `xlsx_files` directory and writes each one as a CSV file to the `output` directory.

In [4]:
# Names of the CSV files written by this cell, in conversion order.
# Re-created on every run so re-executing the cell does not accumulate duplicates.
converted_files = []

# Defines the directory where the .xlsx files are located
xlsx_directory = os.path.join(current_directory, 'xlsx_files')

# Iterates through all the files in the /xlsx_files directory.
# os.listdir() returns entries in arbitrary order; sorted() makes the
# conversion order (and therefore converted_files) deterministic.
for filename in sorted(os.listdir(xlsx_directory)):
    # Matches the extension case-insensitively and skips the '~$...' lock
    # files that Excel creates next to a workbook while it is open: they end
    # in .xlsx but are not valid workbooks, so pd.read_excel would fail on them.
    if not filename.lower().endswith('.xlsx') or filename.startswith('~$'):
        continue

    file_path = os.path.join(xlsx_directory, filename)
    # No sheet_name is passed, so pandas reads its default sheet (the first one)
    xlsx_data = pd.read_excel(file_path)

    # Drops the columns that contain no data at all
    xlsx_data = xlsx_data.dropna(axis=1, how='all')

    # Replaces 'Unnamed' columns with ' '.
    # Headers are not guaranteed to be strings (numeric or date header cells
    # are returned as numbers/timestamps), so the check runs on str(col)
    # instead of raising TypeError on a non-string header.
    xlsx_data.columns = [' ' if 'Unnamed' in str(col) else col for col in xlsx_data.columns]

    print(f"Table after replacing 'Unnamed' columns with spaces for {filename}:")
    print(xlsx_data)

    # Normalizes the headers: trims surrounding whitespace and replaces
    # spaces and hyphens with underscores. The ' ' placeholder set above
    # becomes an empty header. str() keeps non-string headers from failing
    # on .strip().
    xlsx_data.columns = [
        str(col).strip().replace(' ', '_').replace('-', '_')
        for col in xlsx_data.columns
    ]

    # Same base name as the workbook, with a .csv extension, inside 'output'
    csv_filename = f"{os.path.splitext(filename)[0]}.csv"
    csv_file_path = os.path.join(output_directory, csv_filename)

    xlsx_data.to_csv(csv_file_path, index=False, encoding='utf-8')

    converted_files.append(csv_filename)

    print(f"Converted: {filename} to {csv_filename} in the 'output' folder")

Table after replacing 'Unnamed' columns with spaces for Abatidores.xlsx:
       ItemCode                                           ItemName  \
0      0CHAT001                                  Chatarra INOX 304   
1      0CHAT002                                           Chatarra   
2      0CHAT003                            Chatarra INOX FERRITICO   
3      0CHAT005                               Carton para reciclar   
4      0CHAT006                             Plástico para reciclar   
...         ...                                                ...   
23623  VMRA64GN  Vitrina Buffet refrigerada recta mural  con pu...   
23624  VMRT03GN  Vitrina Buffet refrigerada recta mural con ter...   
23625  VMRT04GN  Vitrina Buffet refrigerada recta mural  con te...   
23626  VRE00016  Termómetro analógico redondo, escala 0-120º  M...   
23627  ZUMFERIA                       Zumos ecologicos para ferias   

                                                 English  \
0                         

In [5]:
# Show all converted files (the CSV file names collected by the conversion loop above)
converted_files

['Abatidores.csv',
 'Envasadoras.csv',
 'Hornos.csv',
 'Hornos_coccion_acelerada.csv',
 'Regeneradores.csv',
 'Tabla valores iSeal.csv',
 'Video tutoriales Youtube.csv']