In [11]:
import requests
from bs4 import BeautifulSoup
import os
import re
import pandas as pd

# URL de la página
url = "https://www.nyc.gov/site/tlc/about/tlc-trip-record-data.page"

# Realizar la solicitud GET a la página
response = requests.get(url)
soup = BeautifulSoup(response.content, 'html.parser')

# Crear una carpeta para almacenar los archivos descargados
os.makedirs('parquet_files', exist_ok=True)
os.makedirs('transformed_files', exist_ok=True)

# Función para verificar si el archivo está dentro del rango de años
def is_within_year_range(file_name, start_year, end_year):
    match = re.search(r'(\d{4})', file_name)
    if match:
        year = int(match.group(1))
        return start_year >= year >= end_year
    return False

# Rango de años
start_year = 2023
end_year = 2017

# Función para transformar los datos
def transform_data(df):
    if('green_tripdata' in file_name):
        columns_to_keep = ['lpep_pickup_datetime', 'lpep_dropoff_datetime', 'trip_distance', 'fare_amount', 'PULocationID', 'DOLocationID']
        df = df[columns_to_keep]
        df['es_verde'] = 1
    if('yellow_tripdata' in file_name):
        columns_to_keep = ['tpep_pickup_datetime', 'tpep_dropoff_datetime', 'trip_distance', 'fare_amount', 'PULocationID', 'DOLocationID']
        df = df[columns_to_keep]
        df['es_verde'] = 0
    return df

# Buscar todos los enlaces de archivos Parquet
for link in soup.find_all('a', href=True):
    href = link['href']
    if href.endswith('.parquet'):
        file_name = href.split('/')[-1]
        # Filtrar solo archivos que contengan 'green_tripdata' o 'yellow_tripdata' y estén en el rango de años
        if ('green_tripdata' in file_name or 'yellow_tripdata' in file_name) and is_within_year_range(file_name, start_year, end_year):
            # Descargar el archivo
            file_url = href
            file_response = requests.get(file_url)
            parquet_path = os.path.join('parquet_files', file_name)
            with open(parquet_path, 'wb') as file:
                file.write(file_response.content)
            
            print(f"Descargado: {file_name}")
            
            # Leer el archivo .parquet
            df = pd.read_parquet(parquet_path)
        
            # Transformar los datos
            transformed_df = transform_data(df)
            
            # Guardar el archivo transformado
            transformed_file_name = f"transformed_{file_name.replace('.parquet', '.csv')}"
            transformed_path = os.path.join('transformed_files', transformed_file_name)
            transformed_df.to_parquet(transformed_path, index=False)
            
            print(f"Transformado y guardado: {transformed_file_name}")

print("Descarga y transformación completadas.")


Descargado: yellow_tripdata_2023-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-01.csv
Descargado: green_tripdata_2023-01.parquet
Transformado y guardado: transformed_green_tripdata_2023-01.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2023-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-02.csv
Descargado: green_tripdata_2023-02.parquet
Transformado y guardado: transformed_green_tripdata_2023-02.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2023-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-03.csv
Descargado: yellow_tripdata_2023-04.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-04.csv
Descargado: green_tripdata_2023-04.parquet
Transformado y guardado: transformed_green_tripdata_2023-04.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2023-06.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-06.csv
Descargado: green_tripdata_2023-06.parquet
Transformado y guardado: transformed_green_tripdata_2023-06.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2023-12.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2023-12.csv
Descargado: green_tripdata_2023-12.parquet
Transformado y guardado: transformed_green_tripdata_2023-12.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-01.csv
Descargado: green_tripdata_2022-01.parquet
Transformado y guardado: transformed_green_tripdata_2022-01.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-02.csv
Descargado: green_tripdata_2022-02.parquet
Transformado y guardado: transformed_green_tripdata_2022-02.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-03.csv
Descargado: green_tripdata_2022-03.parquet
Transformado y guardado: transformed_green_tripdata_2022-03.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-04.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-04.csv
Descargado: green_tripdata_2022-04.parquet
Transformado y guardado: transformed_green_tripdata_2022-04.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-05.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-05.csv
Descargado: green_tripdata_2022-05.parquet
Transformado y guardado: transformed_green_tripdata_2022-05.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-06.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-06.csv
Descargado: green_tripdata_2022-06.parquet
Transformado y guardado: transformed_green_tripdata_2022-06.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-07.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-07.csv
Descargado: green_tripdata_2022-07.parquet
Transformado y guardado: transformed_green_tripdata_2022-07.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-08.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-08.csv
Descargado: green_tripdata_2022-08.parquet
Transformado y guardado: transformed_green_tripdata_2022-08.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-09.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-09.csv
Descargado: green_tripdata_2022-09.parquet
Transformado y guardado: transformed_green_tripdata_2022-09.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-10.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-10.csv
Descargado: green_tripdata_2022-10.parquet
Transformado y guardado: transformed_green_tripdata_2022-10.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-11.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-11.csv
Descargado: green_tripdata_2022-11.parquet
Transformado y guardado: transformed_green_tripdata_2022-11.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2022-12.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2022-12.csv
Descargado: green_tripdata_2022-12.parquet
Transformado y guardado: transformed_green_tripdata_2022-12.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-01.csv
Descargado: green_tripdata_2021-01.parquet
Transformado y guardado: transformed_green_tripdata_2021-01.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-02.csv
Descargado: green_tripdata_2021-02.parquet
Transformado y guardado: transformed_green_tripdata_2021-02.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-03.csv
Descargado: green_tripdata_2021-03.parquet
Transformado y guardado: transformed_green_tripdata_2021-03.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-04.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-04.csv
Descargado: green_tripdata_2021-04.parquet
Transformado y guardado: transformed_green_tripdata_2021-04.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-05.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-05.csv
Descargado: green_tripdata_2021-05.parquet
Transformado y guardado: transformed_green_tripdata_2021-05.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-06.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-06.csv
Descargado: green_tripdata_2021-06.parquet
Transformado y guardado: transformed_green_tripdata_2021-06.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-07.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-07.csv
Descargado: green_tripdata_2021-07.parquet
Transformado y guardado: transformed_green_tripdata_2021-07.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-08.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-08.csv
Descargado: green_tripdata_2021-08.parquet
Transformado y guardado: transformed_green_tripdata_2021-08.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-09.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-09.csv
Descargado: green_tripdata_2021-09.parquet
Transformado y guardado: transformed_green_tripdata_2021-09.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-10.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-10.csv
Descargado: green_tripdata_2021-10.parquet
Transformado y guardado: transformed_green_tripdata_2021-10.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-11.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-11.csv
Descargado: green_tripdata_2021-11.parquet
Transformado y guardado: transformed_green_tripdata_2021-11.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2021-12.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2021-12.csv
Descargado: green_tripdata_2021-12.parquet
Transformado y guardado: transformed_green_tripdata_2021-12.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-01.csv
Descargado: green_tripdata_2020-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2020-01.csv
Descargado: yellow_tripdata_2020-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-02.csv
Descargado: green_tripdata_2020-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2020-02.csv
Descargado: yellow_tripdata_2020-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-03.csv
Descargado: green_tripdata_2020-03.parquet
Transformado y guardado: transformed_green_tripdata_2020-03.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-04.parquet
Transformado y guardado: transformed_yellow_tripdata_2020-04.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Descargado: green_tripdata_2020-04.parquet
Transformado y guardado: transformed_green_tripdata_2020-04.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-05.parquet
Transformado y guardado: transformed_yellow_tripdata_2020-05.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Descargado: green_tripdata_2020-05.parquet
Transformado y guardado: transformed_green_tripdata_2020-05.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-06.parquet
Transformado y guardado: transformed_yellow_tripdata_2020-06.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Descargado: green_tripdata_2020-06.parquet
Transformado y guardado: transformed_green_tripdata_2020-06.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-07.parquet
Transformado y guardado: transformed_yellow_tripdata_2020-07.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Descargado: green_tripdata_2020-07.parquet
Transformado y guardado: transformed_green_tripdata_2020-07.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-08.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-08.csv
Descargado: green_tripdata_2020-08.parquet
Transformado y guardado: transformed_green_tripdata_2020-08.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-09.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-09.csv
Descargado: green_tripdata_2020-09.parquet
Transformado y guardado: transformed_green_tripdata_2020-09.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-10.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-10.csv
Descargado: green_tripdata_2020-10.parquet
Transformado y guardado: transformed_green_tripdata_2020-10.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-11.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-11.csv
Descargado: green_tripdata_2020-11.parquet
Transformado y guardado: transformed_green_tripdata_2020-11.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2020-12.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2020-12.csv
Descargado: green_tripdata_2020-12.parquet
Transformado y guardado: transformed_green_tripdata_2020-12.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2019-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-01.csv
Descargado: green_tripdata_2019-01.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-01.csv
Descargado: yellow_tripdata_2019-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-02.csv
Descargado: green_tripdata_2019-02.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-02.csv
Descargado: yellow_tripdata_2019-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-03.csv
Descargado: green_tripdata_2019-03.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-03.csv
Descargado: yellow_tripdata_2019-04.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-04.csv
Descargado: green_tripdata_2019-04.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-04.csv
Descargado: yellow_tripdata_2019-05.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-05.csv
Descargado: green_tripdata_2019-05.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-05.csv
Descargado: yellow_tripdata_2019-06.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-06.csv
Descargado: green_tripdata_2019-06.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-06.csv
Descargado: yellow_tripdata_2019-07.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-07.csv
Descargado: green_tripdata_2019-07.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-07.csv
Descargado: yellow_tripdata_2019-08.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-08.csv
Descargado: green_tripdata_2019-08.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-08.csv
Descargado: yellow_tripdata_2019-09.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-09.csv
Descargado: green_tripdata_2019-09.parquet
Transformado y guardado: transformed_green_tripdata_2019-09.csv


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Descargado: yellow_tripdata_2019-10.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-10.csv
Descargado: green_tripdata_2019-10.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-10.csv
Descargado: yellow_tripdata_2019-11.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-11.csv
Descargado: green_tripdata_2019-11.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 1


Transformado y guardado: transformed_green_tripdata_2019-11.csv
Descargado: yellow_tripdata_2019-12.parquet


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df['es_verde'] = 0


Transformado y guardado: transformed_yellow_tripdata_2019-12.csv
Descargado: green_tripdata_2019-12.parquet


ArrowInvalid: Could not open Parquet input source '<Buffer>': Parquet magic bytes not found in footer. Either the file is corrupted or this is not a parquet file.

In [17]:
data = pd.read_parquet('transformed_files/transformed_green_tripdata_2019-01.csv')

In [None]:
data