### [User Input Required] Read CSV Source with Autoloader.

__Common data loading patterns__: https://docs.databricks.com/en/ingestion/auto-loader/patterns.html

__Autoloader Options for CSV__: https://docs.databricks.com/en/ingestion/auto-loader/options.html#csv-options

__Common Autoloader Options__: https://docs.databricks.com/en/ingestion/auto-loader/options.html#common-auto-loader-options

__Schema Evolution Modes__: https://docs.databricks.com/en/ingestion/auto-loader/schema.html#how-does-auto-loader-schema-evolution-work

In [0]:
import dlt

# [User Input Required] Set the input/output locations, metadata
input_location = "dbfs:/databricks-datasets/nyctaxi/tripdata/green"
output_table = "bronze_nyctaxi_tripdata_green"
output_table_comments = "Bronze data for green NYC taxi trips"

# [User Input Required] Configure schema evolution and rescue data.
schema_evolution_mode = "addNewColumns"
rescue_data_column_name = "_rescued_data"


@dlt.view(name=f"{output_table}_autoloader")
def tmp():
  # [User Input Required] Configure Autoloader settings 
  df = (
    spark.readStream.format("cloudFiles")
    .option("cloudFiles.format", "csv")
    .option("cloudFiles.schemaEvolutionMode", schema_evolution_mode)
    .option("cloudFiles.rescuedDataColumn", rescue_data_column_name)
    # Add additional autoloader settings below
    # Add csv autoloader settings below
    .option("header", "true")
    .option("inferSchema","true")
    .load(input_location)
  )
  return df

[0;31m---------------------------------------------------------------------------[0m
[0;31mModuleNotFoundError[0m                       Traceback (most recent call last)
File [0;32m<command-4246314222309621>, line 1[0m
[0;32m----> 1[0m [38;5;28;01mimport[39;00m [38;5;21;01mdlt[39;00m
[1;32m      3[0m [38;5;66;03m# [User Input Required] Set the input/output locations, metadata[39;00m
[1;32m      4[0m input_location [38;5;241m=[39m [38;5;124m"[39m[38;5;124mdbfs:/databricks-datasets/nyctaxi/tripdata/green[39m[38;5;124m"[39m

[0;31mModuleNotFoundError[0m: No module named 'dlt'

### [Optional User Input Required] Transformations + Write Data to Unity Catalog

In [0]:
@dlt.table(name=output_table, comment=output_table_comments)
def t():
    # Read data from temporary autoloader table
    df = spark.readStream.table(f"live.{output_table}_autoloader")

    # [User Input Required] Optional Transformations
    ## Rename Trip_type column to remove trailing space
    df = df.withColumnRenamed("Trip_type ", "trip_type").drop("trip_type")
    return df

The column name(s) 'Trip_type', 'trip_type' are duplicated in dataset 'bronze_nyctaxi_tripdata_green'.
