In [5]:
import pandas as pd
import re
 
# Input and output file paths
input_file = "nyc_taxi_data.csv"
output_file = "nyc_taxi_data_cleaned.csv"
chunk_size = 100_000  # Process 100,000 rows at a time
 
# Function to clean timestamp format
def clean_timestamp(value):
    try:
        # Check if the value contains AM/PM notation
        if re.search(r"\bAM\b|\bPM\b", str(value), re.IGNORECASE):
            return pd.to_datetime(value, format="%m/%d/%Y %I:%M:%S %p", errors="coerce")
        else:
            return pd.to_datetime(value, format="%m/%d/%Y %H:%M:%S", errors="coerce")
    except Exception:
        return pd.NaT  # Return NaT (Not a Time) for invalid values
 
# Process the file in chunks
with pd.read_csv(input_file, chunksize=chunk_size) as reader:
    for i, chunk in enumerate(reader):
        print(f"Processing chunk {i+1}...")
 
        # Apply the timestamp cleaning function
        chunk["tpep_pickup_datetime"] = chunk["tpep_pickup_datetime"].apply(clean_timestamp)
        chunk["tpep_dropoff_datetime"] = chunk["tpep_dropoff_datetime"].apply(clean_timestamp)
 
        # Drop rows with NaT values (optional)
        chunk = chunk.dropna(subset=["tpep_pickup_datetime", "tpep_dropoff_datetime"])
 
        # Append to the output file (write header only for the first chunk)
        mode = "w" if i == 0 else "a"
        header = i == 0
        chunk.to_csv(output_file, mode=mode, index=False, header=header)
 
        print(f"Chunk {i+1} processed and saved.")
 
print("Data cleaning complete! Cleaned file saved as 'nyc_taxi_data_cleaned.csv'.")

Processing chunk 1...
Chunk 1 processed and saved.
Processing chunk 2...
Chunk 2 processed and saved.
Processing chunk 3...
Chunk 3 processed and saved.
Processing chunk 4...
Chunk 4 processed and saved.
Processing chunk 5...
Chunk 5 processed and saved.
Processing chunk 6...
Chunk 6 processed and saved.
Processing chunk 7...
Chunk 7 processed and saved.
Processing chunk 8...
Chunk 8 processed and saved.
Processing chunk 9...
Chunk 9 processed and saved.
Processing chunk 10...
Chunk 10 processed and saved.
Processing chunk 11...
Chunk 11 processed and saved.
Processing chunk 12...
Chunk 12 processed and saved.
Processing chunk 13...
Chunk 13 processed and saved.
Processing chunk 14...
Chunk 14 processed and saved.
Processing chunk 15...
Chunk 15 processed and saved.
Processing chunk 16...
Chunk 16 processed and saved.
Processing chunk 17...
Chunk 17 processed and saved.
Processing chunk 18...
Chunk 18 processed and saved.
Processing chunk 19...
Chunk 19 processed and saved.
Processing 

  for i, chunk in enumerate(reader):


Chunk 30 processed and saved.
Processing chunk 31...


  for i, chunk in enumerate(reader):


Chunk 31 processed and saved.
Processing chunk 32...
Chunk 32 processed and saved.
Processing chunk 33...
Chunk 33 processed and saved.
Processing chunk 34...
Chunk 34 processed and saved.
Processing chunk 35...
Chunk 35 processed and saved.
Processing chunk 36...
Chunk 36 processed and saved.
Processing chunk 37...
Chunk 37 processed and saved.
Processing chunk 38...
Chunk 38 processed and saved.
Processing chunk 39...
Chunk 39 processed and saved.
Processing chunk 40...
Chunk 40 processed and saved.
Processing chunk 41...
Chunk 41 processed and saved.
Processing chunk 42...
Chunk 42 processed and saved.
Processing chunk 43...
Chunk 43 processed and saved.
Processing chunk 44...
Chunk 44 processed and saved.
Processing chunk 45...
Chunk 45 processed and saved.
Processing chunk 46...
Chunk 46 processed and saved.
Processing chunk 47...
Chunk 47 processed and saved.
Processing chunk 48...
Chunk 48 processed and saved.
Processing chunk 49...
Chunk 49 processed and saved.
Processing chunk

  for i, chunk in enumerate(reader):


Chunk 60 processed and saved.
Processing chunk 61...
Chunk 61 processed and saved.
Processing chunk 62...
Chunk 62 processed and saved.
Processing chunk 63...
Chunk 63 processed and saved.
Processing chunk 64...
Chunk 64 processed and saved.
Processing chunk 65...
Chunk 65 processed and saved.
Processing chunk 66...
Chunk 66 processed and saved.
Processing chunk 67...
Chunk 67 processed and saved.
Processing chunk 68...
Chunk 68 processed and saved.
Processing chunk 69...
Chunk 69 processed and saved.
Processing chunk 70...
Chunk 70 processed and saved.
Processing chunk 71...
Chunk 71 processed and saved.
Processing chunk 72...
Chunk 72 processed and saved.
Processing chunk 73...
Chunk 73 processed and saved.
Processing chunk 74...
Chunk 74 processed and saved.
Processing chunk 75...
Chunk 75 processed and saved.
Processing chunk 76...
Chunk 76 processed and saved.
Processing chunk 77...
Chunk 77 processed and saved.
Processing chunk 78...
Chunk 78 processed and saved.
Processing chunk

  for i, chunk in enumerate(reader):


Chunk 93 processed and saved.
Processing chunk 94...


  for i, chunk in enumerate(reader):


Chunk 94 processed and saved.
Processing chunk 95...
Chunk 95 processed and saved.
Processing chunk 96...
Chunk 96 processed and saved.
Processing chunk 97...
Chunk 97 processed and saved.
Processing chunk 98...
Chunk 98 processed and saved.
Processing chunk 99...
Chunk 99 processed and saved.
Processing chunk 100...
Chunk 100 processed and saved.
Processing chunk 101...
Chunk 101 processed and saved.
Processing chunk 102...
Chunk 102 processed and saved.
Processing chunk 103...
Chunk 103 processed and saved.
Processing chunk 104...
Chunk 104 processed and saved.
Processing chunk 105...
Chunk 105 processed and saved.
Processing chunk 106...
Chunk 106 processed and saved.
Processing chunk 107...
Chunk 107 processed and saved.
Processing chunk 108...
Chunk 108 processed and saved.
Processing chunk 109...
Chunk 109 processed and saved.
Processing chunk 110...
Chunk 110 processed and saved.
Processing chunk 111...
Chunk 111 processed and saved.
Processing chunk 112...
Chunk 112 processed a

  for i, chunk in enumerate(reader):


Chunk 126 processed and saved.
Processing chunk 127...


  for i, chunk in enumerate(reader):


Chunk 127 processed and saved.
Processing chunk 128...
Chunk 128 processed and saved.
Processing chunk 129...
Chunk 129 processed and saved.
Processing chunk 130...
Chunk 130 processed and saved.
Processing chunk 131...
Chunk 131 processed and saved.
Processing chunk 132...
Chunk 132 processed and saved.
Processing chunk 133...
Chunk 133 processed and saved.
Processing chunk 134...
Chunk 134 processed and saved.
Processing chunk 135...
Chunk 135 processed and saved.
Processing chunk 136...
Chunk 136 processed and saved.
Processing chunk 137...
Chunk 137 processed and saved.
Processing chunk 138...
Chunk 138 processed and saved.
Processing chunk 139...
Chunk 139 processed and saved.
Processing chunk 140...
Chunk 140 processed and saved.
Processing chunk 141...
Chunk 141 processed and saved.
Processing chunk 142...
Chunk 142 processed and saved.
Processing chunk 143...
Chunk 143 processed and saved.
Processing chunk 144...
Chunk 144 processed and saved.
Processing chunk 145...
Chunk 145 

  for i, chunk in enumerate(reader):


Chunk 161 processed and saved.
Processing chunk 162...


  for i, chunk in enumerate(reader):


Chunk 162 processed and saved.
Processing chunk 163...
Chunk 163 processed and saved.
Processing chunk 164...
Chunk 164 processed and saved.
Processing chunk 165...
Chunk 165 processed and saved.
Processing chunk 166...
Chunk 166 processed and saved.
Processing chunk 167...
Chunk 167 processed and saved.
Processing chunk 168...
Chunk 168 processed and saved.
Processing chunk 169...
Chunk 169 processed and saved.
Processing chunk 170...
Chunk 170 processed and saved.
Processing chunk 171...
Chunk 171 processed and saved.
Processing chunk 172...
Chunk 172 processed and saved.
Processing chunk 173...
Chunk 173 processed and saved.
Processing chunk 174...
Chunk 174 processed and saved.
Processing chunk 175...
Chunk 175 processed and saved.
Processing chunk 176...
Chunk 176 processed and saved.
Processing chunk 177...
Chunk 177 processed and saved.
Processing chunk 178...
Chunk 178 processed and saved.
Processing chunk 179...
Chunk 179 processed and saved.
Processing chunk 180...
Chunk 180 

  for i, chunk in enumerate(reader):


Chunk 194 processed and saved.
Processing chunk 195...


  for i, chunk in enumerate(reader):


Chunk 195 processed and saved.
Processing chunk 196...
Chunk 196 processed and saved.
Processing chunk 197...
Chunk 197 processed and saved.
Processing chunk 198...
Chunk 198 processed and saved.
Processing chunk 199...
Chunk 199 processed and saved.
Processing chunk 200...
Chunk 200 processed and saved.
Processing chunk 201...
Chunk 201 processed and saved.
Processing chunk 202...
Chunk 202 processed and saved.
Processing chunk 203...
Chunk 203 processed and saved.
Processing chunk 204...
Chunk 204 processed and saved.
Processing chunk 205...
Chunk 205 processed and saved.
Processing chunk 206...
Chunk 206 processed and saved.
Processing chunk 207...
Chunk 207 processed and saved.
Processing chunk 208...
Chunk 208 processed and saved.
Processing chunk 209...
Chunk 209 processed and saved.
Processing chunk 210...
Chunk 210 processed and saved.
Processing chunk 211...
Chunk 211 processed and saved.
Processing chunk 212...
Chunk 212 processed and saved.
Processing chunk 213...
Chunk 213 

  for i, chunk in enumerate(reader):


Chunk 224 processed and saved.
Processing chunk 225...
Chunk 225 processed and saved.
Processing chunk 226...
Chunk 226 processed and saved.
Processing chunk 227...
Chunk 227 processed and saved.
Processing chunk 228...
Chunk 228 processed and saved.
Processing chunk 229...
Chunk 229 processed and saved.
Processing chunk 230...
Chunk 230 processed and saved.
Processing chunk 231...
Chunk 231 processed and saved.
Processing chunk 232...
Chunk 232 processed and saved.
Processing chunk 233...
Chunk 233 processed and saved.
Processing chunk 234...
Chunk 234 processed and saved.
Processing chunk 235...
Chunk 235 processed and saved.
Processing chunk 236...
Chunk 236 processed and saved.
Processing chunk 237...
Chunk 237 processed and saved.
Processing chunk 238...
Chunk 238 processed and saved.
Processing chunk 239...
Chunk 239 processed and saved.
Processing chunk 240...
Chunk 240 processed and saved.
Processing chunk 241...
Chunk 241 processed and saved.
Processing chunk 242...
Chunk 242 

  for i, chunk in enumerate(reader):


Chunk 252 processed and saved.
Processing chunk 253...
Chunk 253 processed and saved.
Processing chunk 254...
Chunk 254 processed and saved.
Processing chunk 255...
Chunk 255 processed and saved.
Processing chunk 256...
Chunk 256 processed and saved.
Processing chunk 257...
Chunk 257 processed and saved.
Processing chunk 258...
Chunk 258 processed and saved.
Processing chunk 259...
Chunk 259 processed and saved.
Processing chunk 260...
Chunk 260 processed and saved.
Processing chunk 261...
Chunk 261 processed and saved.
Processing chunk 262...
Chunk 262 processed and saved.
Processing chunk 263...
Chunk 263 processed and saved.
Processing chunk 264...
Chunk 264 processed and saved.
Processing chunk 265...
Chunk 265 processed and saved.
Processing chunk 266...
Chunk 266 processed and saved.
Processing chunk 267...
Chunk 267 processed and saved.
Processing chunk 268...
Chunk 268 processed and saved.
Processing chunk 269...
Chunk 269 processed and saved.
Processing chunk 270...
Chunk 270 

  for i, chunk in enumerate(reader):


Chunk 280 processed and saved.
Processing chunk 281...


  for i, chunk in enumerate(reader):


Chunk 281 processed and saved.
Processing chunk 282...
Chunk 282 processed and saved.
Processing chunk 283...
Chunk 283 processed and saved.
Processing chunk 284...
Chunk 284 processed and saved.
Processing chunk 285...
Chunk 285 processed and saved.
Processing chunk 286...
Chunk 286 processed and saved.
Processing chunk 287...
Chunk 287 processed and saved.
Processing chunk 288...
Chunk 288 processed and saved.
Processing chunk 289...
Chunk 289 processed and saved.
Processing chunk 290...
Chunk 290 processed and saved.
Processing chunk 291...
Chunk 291 processed and saved.
Processing chunk 292...
Chunk 292 processed and saved.
Processing chunk 293...
Chunk 293 processed and saved.
Processing chunk 294...
Chunk 294 processed and saved.
Processing chunk 295...
Chunk 295 processed and saved.
Processing chunk 296...
Chunk 296 processed and saved.
Processing chunk 297...
Chunk 297 processed and saved.
Processing chunk 298...
Chunk 298 processed and saved.
Processing chunk 299...
Chunk 299 

  for i, chunk in enumerate(reader):


Chunk 315 processed and saved.
Processing chunk 316...


  for i, chunk in enumerate(reader):


Chunk 316 processed and saved.
Processing chunk 317...
Chunk 317 processed and saved.
Processing chunk 318...
Chunk 318 processed and saved.
Processing chunk 319...
Chunk 319 processed and saved.
Processing chunk 320...
Chunk 320 processed and saved.
Processing chunk 321...
Chunk 321 processed and saved.
Processing chunk 322...
Chunk 322 processed and saved.
Processing chunk 323...
Chunk 323 processed and saved.
Processing chunk 324...
Chunk 324 processed and saved.
Processing chunk 325...
Chunk 325 processed and saved.
Processing chunk 326...
Chunk 326 processed and saved.
Processing chunk 327...
Chunk 327 processed and saved.
Processing chunk 328...
Chunk 328 processed and saved.
Processing chunk 329...
Chunk 329 processed and saved.
Processing chunk 330...
Chunk 330 processed and saved.
Processing chunk 331...
Chunk 331 processed and saved.
Processing chunk 332...
Chunk 332 processed and saved.
Processing chunk 333...
Chunk 333 processed and saved.
Processing chunk 334...
Chunk 334 

  for i, chunk in enumerate(reader):


Chunk 349 processed and saved.
Processing chunk 350...


  for i, chunk in enumerate(reader):


Chunk 350 processed and saved.
Processing chunk 351...
Chunk 351 processed and saved.
Processing chunk 352...
Chunk 352 processed and saved.
Processing chunk 353...
Chunk 353 processed and saved.
Processing chunk 354...
Chunk 354 processed and saved.
Processing chunk 355...
Chunk 355 processed and saved.
Processing chunk 356...
Chunk 356 processed and saved.
Processing chunk 357...
Chunk 357 processed and saved.
Processing chunk 358...
Chunk 358 processed and saved.
Processing chunk 359...
Chunk 359 processed and saved.
Processing chunk 360...
Chunk 360 processed and saved.
Processing chunk 361...
Chunk 361 processed and saved.
Processing chunk 362...
Chunk 362 processed and saved.
Processing chunk 363...
Chunk 363 processed and saved.
Processing chunk 364...
Chunk 364 processed and saved.
Processing chunk 365...
Chunk 365 processed and saved.
Processing chunk 366...
Chunk 366 processed and saved.
Processing chunk 367...
Chunk 367 processed and saved.
Processing chunk 368...
Chunk 368 

  for i, chunk in enumerate(reader):


Chunk 382 processed and saved.
Processing chunk 383...
Chunk 383 processed and saved.
Processing chunk 384...
Chunk 384 processed and saved.
Data cleaning complete! Cleaned file saved as 'nyc_taxi_data_cleaned.csv'.


In [6]:
import pandas as pd
 
# Define the specific columns that should be integers
integer_columns = ["passenger_count", "PULocationID", "DOLocationID", "payment_type", "improvement_surcharge"]
 
def convert_specified_columns_to_int(chunk):
    """ Convert specified columns to integer type if possible. """
    for col in integer_columns:
        if col in chunk.columns:
            chunk[col] = pd.to_numeric(chunk[col], errors='coerce').fillna(0).astype(int)
    return chunk
 
# Define file paths
input_file = "nyc_taxi_data_cleaned.csv"
output_file = "nyc_taxi_data_cleaned_final.csv"
chunk_size = 10000  
 
# Process the file in chunks
with pd.read_csv(input_file, chunksize=chunk_size) as reader:
    for i, chunk in enumerate(reader):
        print(f"Processing chunk {i+1}...")
 
        # Convert only the specified columns to integers
        chunk = convert_specified_columns_to_int(chunk)
 
        # Append to the output file (write header only for the first chunk)
        mode = "w" if i == 0 else "a"
        header = i == 0
        chunk.to_csv(output_file, mode=mode, index=False, header=header)
 
        print(f"Chunk {i+1} processed and saved.")
 
print(f"Data cleaning complete! Cleaned file saved as '{output_file}'.")

Processing chunk 1...
Chunk 1 processed and saved.
Processing chunk 2...
Chunk 2 processed and saved.
Processing chunk 3...
Chunk 3 processed and saved.
Processing chunk 4...
Chunk 4 processed and saved.
Processing chunk 5...
Chunk 5 processed and saved.
Processing chunk 6...
Chunk 6 processed and saved.
Processing chunk 7...
Chunk 7 processed and saved.
Processing chunk 8...
Chunk 8 processed and saved.
Processing chunk 9...
Chunk 9 processed and saved.
Processing chunk 10...
Chunk 10 processed and saved.
Processing chunk 11...
Chunk 11 processed and saved.
Processing chunk 12...
Chunk 12 processed and saved.
Processing chunk 13...
Chunk 13 processed and saved.
Processing chunk 14...
Chunk 14 processed and saved.
Processing chunk 15...
Chunk 15 processed and saved.
Processing chunk 16...
Chunk 16 processed and saved.
Processing chunk 17...
Chunk 17 processed and saved.
Processing chunk 18...
Chunk 18 processed and saved.
Processing chunk 19...
Chunk 19 processed and saved.
Processing 

Chunk 155 processed and saved.
Processing chunk 156...
Chunk 156 processed and saved.
Processing chunk 157...
Chunk 157 processed and saved.
Processing chunk 158...
Chunk 158 processed and saved.
Processing chunk 159...
Chunk 159 processed and saved.
Processing chunk 160...
Chunk 160 processed and saved.
Processing chunk 161...
Chunk 161 processed and saved.
Processing chunk 162...
Chunk 162 processed and saved.
Processing chunk 163...
Chunk 163 processed and saved.
Processing chunk 164...
Chunk 164 processed and saved.
Processing chunk 165...
Chunk 165 processed and saved.
Processing chunk 166...
Chunk 166 processed and saved.
Processing chunk 167...
Chunk 167 processed and saved.
Processing chunk 168...
Chunk 168 processed and saved.
Processing chunk 169...
Chunk 169 processed and saved.
Processing chunk 170...
Chunk 170 processed and saved.
Processing chunk 171...
Chunk 171 processed and saved.
Processing chunk 172...
Chunk 172 processed and saved.
Processing chunk 173...
Chunk 173 

Chunk 304 processed and saved.
Processing chunk 305...
Chunk 305 processed and saved.
Processing chunk 306...
Chunk 306 processed and saved.
Processing chunk 307...
Chunk 307 processed and saved.
Processing chunk 308...
Chunk 308 processed and saved.
Processing chunk 309...
Chunk 309 processed and saved.
Processing chunk 310...
Chunk 310 processed and saved.
Processing chunk 311...
Chunk 311 processed and saved.
Processing chunk 312...
Chunk 312 processed and saved.
Processing chunk 313...
Chunk 313 processed and saved.
Processing chunk 314...
Chunk 314 processed and saved.
Processing chunk 315...
Chunk 315 processed and saved.
Processing chunk 316...
Chunk 316 processed and saved.
Processing chunk 317...
Chunk 317 processed and saved.
Processing chunk 318...
Chunk 318 processed and saved.
Processing chunk 319...
Chunk 319 processed and saved.
Processing chunk 320...
Chunk 320 processed and saved.
Processing chunk 321...
Chunk 321 processed and saved.
Processing chunk 322...
Chunk 322 

Chunk 454 processed and saved.
Processing chunk 455...
Chunk 455 processed and saved.
Processing chunk 456...
Chunk 456 processed and saved.
Processing chunk 457...
Chunk 457 processed and saved.
Processing chunk 458...
Chunk 458 processed and saved.
Processing chunk 459...
Chunk 459 processed and saved.
Processing chunk 460...
Chunk 460 processed and saved.
Processing chunk 461...
Chunk 461 processed and saved.
Processing chunk 462...
Chunk 462 processed and saved.
Processing chunk 463...
Chunk 463 processed and saved.
Processing chunk 464...
Chunk 464 processed and saved.
Processing chunk 465...
Chunk 465 processed and saved.
Processing chunk 466...
Chunk 466 processed and saved.
Processing chunk 467...
Chunk 467 processed and saved.
Processing chunk 468...
Chunk 468 processed and saved.
Processing chunk 469...
Chunk 469 processed and saved.
Processing chunk 470...
Chunk 470 processed and saved.
Processing chunk 471...
Chunk 471 processed and saved.
Processing chunk 472...
Chunk 472 

Processing chunk 605...
Chunk 605 processed and saved.
Processing chunk 606...
Chunk 606 processed and saved.
Processing chunk 607...
Chunk 607 processed and saved.
Processing chunk 608...
Chunk 608 processed and saved.
Processing chunk 609...
Chunk 609 processed and saved.
Processing chunk 610...
Chunk 610 processed and saved.
Processing chunk 611...
Chunk 611 processed and saved.
Processing chunk 612...
Chunk 612 processed and saved.
Processing chunk 613...
Chunk 613 processed and saved.
Processing chunk 614...
Chunk 614 processed and saved.
Processing chunk 615...
Chunk 615 processed and saved.
Processing chunk 616...
Chunk 616 processed and saved.
Processing chunk 617...
Chunk 617 processed and saved.
Processing chunk 618...
Chunk 618 processed and saved.
Processing chunk 619...
Chunk 619 processed and saved.
Processing chunk 620...
Chunk 620 processed and saved.
Processing chunk 621...
Chunk 621 processed and saved.
Processing chunk 622...
Chunk 622 processed and saved.
Processing

Chunk 755 processed and saved.
Processing chunk 756...
Chunk 756 processed and saved.
Processing chunk 757...
Chunk 757 processed and saved.
Processing chunk 758...
Chunk 758 processed and saved.
Processing chunk 759...
Chunk 759 processed and saved.
Processing chunk 760...
Chunk 760 processed and saved.
Processing chunk 761...
Chunk 761 processed and saved.
Processing chunk 762...
Chunk 762 processed and saved.
Processing chunk 763...
Chunk 763 processed and saved.
Processing chunk 764...
Chunk 764 processed and saved.
Processing chunk 765...
Chunk 765 processed and saved.
Processing chunk 766...
Chunk 766 processed and saved.
Processing chunk 767...
Chunk 767 processed and saved.
Processing chunk 768...
Chunk 768 processed and saved.
Processing chunk 769...
Chunk 769 processed and saved.
Processing chunk 770...
Chunk 770 processed and saved.
Processing chunk 771...
Chunk 771 processed and saved.
Processing chunk 772...
Chunk 772 processed and saved.
Processing chunk 773...
Chunk 773 

Chunk 904 processed and saved.
Processing chunk 905...
Chunk 905 processed and saved.
Processing chunk 906...
Chunk 906 processed and saved.
Processing chunk 907...
Chunk 907 processed and saved.
Processing chunk 908...
Chunk 908 processed and saved.
Processing chunk 909...
Chunk 909 processed and saved.
Processing chunk 910...
Chunk 910 processed and saved.
Processing chunk 911...
Chunk 911 processed and saved.
Processing chunk 912...
Chunk 912 processed and saved.
Processing chunk 913...
Chunk 913 processed and saved.
Processing chunk 914...
Chunk 914 processed and saved.
Processing chunk 915...
Chunk 915 processed and saved.
Processing chunk 916...
Chunk 916 processed and saved.
Processing chunk 917...
Chunk 917 processed and saved.
Processing chunk 918...
Chunk 918 processed and saved.
Processing chunk 919...
Chunk 919 processed and saved.
Processing chunk 920...
Chunk 920 processed and saved.
Processing chunk 921...
Chunk 921 processed and saved.
Processing chunk 922...
Chunk 922 

Chunk 1052 processed and saved.
Processing chunk 1053...
Chunk 1053 processed and saved.
Processing chunk 1054...
Chunk 1054 processed and saved.
Processing chunk 1055...
Chunk 1055 processed and saved.
Processing chunk 1056...
Chunk 1056 processed and saved.
Processing chunk 1057...
Chunk 1057 processed and saved.
Processing chunk 1058...
Chunk 1058 processed and saved.
Processing chunk 1059...
Chunk 1059 processed and saved.
Processing chunk 1060...
Chunk 1060 processed and saved.
Processing chunk 1061...
Chunk 1061 processed and saved.
Processing chunk 1062...
Chunk 1062 processed and saved.
Processing chunk 1063...
Chunk 1063 processed and saved.
Processing chunk 1064...
Chunk 1064 processed and saved.
Processing chunk 1065...
Chunk 1065 processed and saved.
Processing chunk 1066...
Chunk 1066 processed and saved.
Processing chunk 1067...
Chunk 1067 processed and saved.
Processing chunk 1068...
Chunk 1068 processed and saved.
Processing chunk 1069...
Chunk 1069 processed and saved.

Chunk 1196 processed and saved.
Processing chunk 1197...
Chunk 1197 processed and saved.
Processing chunk 1198...
Chunk 1198 processed and saved.
Processing chunk 1199...
Chunk 1199 processed and saved.
Processing chunk 1200...
Chunk 1200 processed and saved.
Processing chunk 1201...
Chunk 1201 processed and saved.
Processing chunk 1202...
Chunk 1202 processed and saved.
Processing chunk 1203...
Chunk 1203 processed and saved.
Processing chunk 1204...
Chunk 1204 processed and saved.
Processing chunk 1205...
Chunk 1205 processed and saved.
Processing chunk 1206...
Chunk 1206 processed and saved.
Processing chunk 1207...
Chunk 1207 processed and saved.
Processing chunk 1208...
Chunk 1208 processed and saved.
Processing chunk 1209...
Chunk 1209 processed and saved.
Processing chunk 1210...
Chunk 1210 processed and saved.
Processing chunk 1211...
Chunk 1211 processed and saved.
Processing chunk 1212...
Chunk 1212 processed and saved.
Processing chunk 1213...
Chunk 1213 processed and saved.

Chunk 1341 processed and saved.
Processing chunk 1342...
Chunk 1342 processed and saved.
Processing chunk 1343...
Chunk 1343 processed and saved.
Processing chunk 1344...
Chunk 1344 processed and saved.
Processing chunk 1345...
Chunk 1345 processed and saved.
Processing chunk 1346...
Chunk 1346 processed and saved.
Processing chunk 1347...
Chunk 1347 processed and saved.
Processing chunk 1348...
Chunk 1348 processed and saved.
Processing chunk 1349...
Chunk 1349 processed and saved.
Processing chunk 1350...
Chunk 1350 processed and saved.
Processing chunk 1351...
Chunk 1351 processed and saved.
Processing chunk 1352...
Chunk 1352 processed and saved.
Processing chunk 1353...
Chunk 1353 processed and saved.
Processing chunk 1354...
Chunk 1354 processed and saved.
Processing chunk 1355...
Chunk 1355 processed and saved.
Processing chunk 1356...
Chunk 1356 processed and saved.
Processing chunk 1357...
Chunk 1357 processed and saved.
Processing chunk 1358...
Chunk 1358 processed and saved.

Chunk 1485 processed and saved.
Processing chunk 1486...
Chunk 1486 processed and saved.
Processing chunk 1487...
Chunk 1487 processed and saved.
Processing chunk 1488...
Chunk 1488 processed and saved.
Processing chunk 1489...
Chunk 1489 processed and saved.
Processing chunk 1490...
Chunk 1490 processed and saved.
Processing chunk 1491...
Chunk 1491 processed and saved.
Processing chunk 1492...
Chunk 1492 processed and saved.
Processing chunk 1493...
Chunk 1493 processed and saved.
Processing chunk 1494...
Chunk 1494 processed and saved.
Processing chunk 1495...
Chunk 1495 processed and saved.
Processing chunk 1496...
Chunk 1496 processed and saved.
Processing chunk 1497...
Chunk 1497 processed and saved.
Processing chunk 1498...
Chunk 1498 processed and saved.
Processing chunk 1499...
Chunk 1499 processed and saved.
Processing chunk 1500...
Chunk 1500 processed and saved.
Processing chunk 1501...
Chunk 1501 processed and saved.
Processing chunk 1502...
Chunk 1502 processed and saved.

Chunk 1629 processed and saved.
Processing chunk 1630...
Chunk 1630 processed and saved.
Processing chunk 1631...
Chunk 1631 processed and saved.
Processing chunk 1632...
Chunk 1632 processed and saved.
Processing chunk 1633...
Chunk 1633 processed and saved.
Processing chunk 1634...
Chunk 1634 processed and saved.
Processing chunk 1635...
Chunk 1635 processed and saved.
Processing chunk 1636...
Chunk 1636 processed and saved.
Processing chunk 1637...
Chunk 1637 processed and saved.
Processing chunk 1638...
Chunk 1638 processed and saved.
Processing chunk 1639...
Chunk 1639 processed and saved.
Processing chunk 1640...
Chunk 1640 processed and saved.
Processing chunk 1641...
Chunk 1641 processed and saved.
Processing chunk 1642...
Chunk 1642 processed and saved.
Processing chunk 1643...
Chunk 1643 processed and saved.
Processing chunk 1644...
Chunk 1644 processed and saved.
Processing chunk 1645...
Chunk 1645 processed and saved.
Processing chunk 1646...
Chunk 1646 processed and saved.

Chunk 1775 processed and saved.
Processing chunk 1776...
Chunk 1776 processed and saved.
Processing chunk 1777...
Chunk 1777 processed and saved.
Processing chunk 1778...
Chunk 1778 processed and saved.
Processing chunk 1779...
Chunk 1779 processed and saved.
Processing chunk 1780...
Chunk 1780 processed and saved.
Processing chunk 1781...
Chunk 1781 processed and saved.
Processing chunk 1782...
Chunk 1782 processed and saved.
Processing chunk 1783...
Chunk 1783 processed and saved.
Processing chunk 1784...
Chunk 1784 processed and saved.
Processing chunk 1785...
Chunk 1785 processed and saved.
Processing chunk 1786...
Chunk 1786 processed and saved.
Processing chunk 1787...
Chunk 1787 processed and saved.
Processing chunk 1788...
Chunk 1788 processed and saved.
Processing chunk 1789...
Chunk 1789 processed and saved.
Processing chunk 1790...
Chunk 1790 processed and saved.
Processing chunk 1791...
Chunk 1791 processed and saved.
Processing chunk 1792...
Chunk 1792 processed and saved.

Chunk 1919 processed and saved.
Processing chunk 1920...
Chunk 1920 processed and saved.
Processing chunk 1921...
Chunk 1921 processed and saved.
Processing chunk 1922...
Chunk 1922 processed and saved.
Processing chunk 1923...
Chunk 1923 processed and saved.
Processing chunk 1924...
Chunk 1924 processed and saved.
Processing chunk 1925...
Chunk 1925 processed and saved.
Processing chunk 1926...
Chunk 1926 processed and saved.
Processing chunk 1927...
Chunk 1927 processed and saved.
Processing chunk 1928...
Chunk 1928 processed and saved.
Processing chunk 1929...
Chunk 1929 processed and saved.
Processing chunk 1930...
Chunk 1930 processed and saved.
Processing chunk 1931...
Chunk 1931 processed and saved.
Processing chunk 1932...
Chunk 1932 processed and saved.
Processing chunk 1933...
Chunk 1933 processed and saved.
Processing chunk 1934...
Chunk 1934 processed and saved.
Processing chunk 1935...
Chunk 1935 processed and saved.
Processing chunk 1936...
Chunk 1936 processed and saved.

Chunk 2063 processed and saved.
Processing chunk 2064...
Chunk 2064 processed and saved.
Processing chunk 2065...
Chunk 2065 processed and saved.
Processing chunk 2066...
Chunk 2066 processed and saved.
Processing chunk 2067...
Chunk 2067 processed and saved.
Processing chunk 2068...
Chunk 2068 processed and saved.
Processing chunk 2069...
Chunk 2069 processed and saved.
Processing chunk 2070...
Chunk 2070 processed and saved.
Processing chunk 2071...
Chunk 2071 processed and saved.
Processing chunk 2072...
Chunk 2072 processed and saved.
Processing chunk 2073...
Chunk 2073 processed and saved.
Processing chunk 2074...
Chunk 2074 processed and saved.
Processing chunk 2075...
Chunk 2075 processed and saved.
Processing chunk 2076...
Chunk 2076 processed and saved.
Processing chunk 2077...
Chunk 2077 processed and saved.
Processing chunk 2078...
Chunk 2078 processed and saved.
Processing chunk 2079...
Chunk 2079 processed and saved.
Processing chunk 2080...
Chunk 2080 processed and saved.

Chunk 2209 processed and saved.
Processing chunk 2210...
Chunk 2210 processed and saved.
Processing chunk 2211...
Chunk 2211 processed and saved.
Processing chunk 2212...
Chunk 2212 processed and saved.
Processing chunk 2213...
Chunk 2213 processed and saved.
Processing chunk 2214...
Chunk 2214 processed and saved.
Processing chunk 2215...
Chunk 2215 processed and saved.
Processing chunk 2216...
Chunk 2216 processed and saved.
Processing chunk 2217...
Chunk 2217 processed and saved.
Processing chunk 2218...
Chunk 2218 processed and saved.
Processing chunk 2219...
Chunk 2219 processed and saved.
Processing chunk 2220...
Chunk 2220 processed and saved.
Processing chunk 2221...
Chunk 2221 processed and saved.
Processing chunk 2222...
Chunk 2222 processed and saved.
Processing chunk 2223...
Chunk 2223 processed and saved.
Processing chunk 2224...
Chunk 2224 processed and saved.
Processing chunk 2225...
Chunk 2225 processed and saved.
Processing chunk 2226...
Chunk 2226 processed and saved.

Chunk 2354 processed and saved.
Processing chunk 2355...
Chunk 2355 processed and saved.
Processing chunk 2356...
Chunk 2356 processed and saved.
Processing chunk 2357...
Chunk 2357 processed and saved.
Processing chunk 2358...
Chunk 2358 processed and saved.
Processing chunk 2359...
Chunk 2359 processed and saved.
Processing chunk 2360...
Chunk 2360 processed and saved.
Processing chunk 2361...
Chunk 2361 processed and saved.
Processing chunk 2362...
Chunk 2362 processed and saved.
Processing chunk 2363...
Chunk 2363 processed and saved.
Processing chunk 2364...
Chunk 2364 processed and saved.
Processing chunk 2365...
Chunk 2365 processed and saved.
Processing chunk 2366...
Chunk 2366 processed and saved.
Processing chunk 2367...
Chunk 2367 processed and saved.
Processing chunk 2368...
Chunk 2368 processed and saved.
Processing chunk 2369...
Chunk 2369 processed and saved.
Processing chunk 2370...
Chunk 2370 processed and saved.
Processing chunk 2371...
Chunk 2371 processed and saved.

Chunk 2500 processed and saved.
Processing chunk 2501...
Chunk 2501 processed and saved.
Processing chunk 2502...
Chunk 2502 processed and saved.
Processing chunk 2503...
Chunk 2503 processed and saved.
Processing chunk 2504...
Chunk 2504 processed and saved.
Processing chunk 2505...
Chunk 2505 processed and saved.
Processing chunk 2506...
Chunk 2506 processed and saved.
Processing chunk 2507...
Chunk 2507 processed and saved.
Processing chunk 2508...
Chunk 2508 processed and saved.
Processing chunk 2509...
Chunk 2509 processed and saved.
Processing chunk 2510...
Chunk 2510 processed and saved.
Processing chunk 2511...
Chunk 2511 processed and saved.
Processing chunk 2512...
Chunk 2512 processed and saved.
Processing chunk 2513...
Chunk 2513 processed and saved.
Processing chunk 2514...
Chunk 2514 processed and saved.
Processing chunk 2515...
Chunk 2515 processed and saved.
Processing chunk 2516...
Chunk 2516 processed and saved.
Processing chunk 2517...
Chunk 2517 processed and saved.

Chunk 2646 processed and saved.
Processing chunk 2647...
Chunk 2647 processed and saved.
Processing chunk 2648...
Chunk 2648 processed and saved.
Processing chunk 2649...
Chunk 2649 processed and saved.
Processing chunk 2650...
Chunk 2650 processed and saved.
Processing chunk 2651...
Chunk 2651 processed and saved.
Processing chunk 2652...
Chunk 2652 processed and saved.
Processing chunk 2653...
Chunk 2653 processed and saved.
Processing chunk 2654...
Chunk 2654 processed and saved.
Processing chunk 2655...
Chunk 2655 processed and saved.
Processing chunk 2656...
Chunk 2656 processed and saved.
Processing chunk 2657...
Chunk 2657 processed and saved.
Processing chunk 2658...
Chunk 2658 processed and saved.
Processing chunk 2659...
Chunk 2659 processed and saved.
Processing chunk 2660...
Chunk 2660 processed and saved.
Processing chunk 2661...
Chunk 2661 processed and saved.
Processing chunk 2662...
Chunk 2662 processed and saved.
Processing chunk 2663...
Chunk 2663 processed and saved.

Chunk 2790 processed and saved.
Processing chunk 2791...
Chunk 2791 processed and saved.
Processing chunk 2792...
Chunk 2792 processed and saved.
Processing chunk 2793...
Chunk 2793 processed and saved.
Processing chunk 2794...
Chunk 2794 processed and saved.
Processing chunk 2795...
Chunk 2795 processed and saved.
Processing chunk 2796...
Chunk 2796 processed and saved.
Processing chunk 2797...
Chunk 2797 processed and saved.
Processing chunk 2798...
Chunk 2798 processed and saved.
Processing chunk 2799...
Chunk 2799 processed and saved.
Processing chunk 2800...
Chunk 2800 processed and saved.
Processing chunk 2801...
Chunk 2801 processed and saved.
Processing chunk 2802...
Chunk 2802 processed and saved.
Processing chunk 2803...
Chunk 2803 processed and saved.
Processing chunk 2804...
Chunk 2804 processed and saved.
Processing chunk 2805...
Chunk 2805 processed and saved.
Processing chunk 2806...
Chunk 2806 processed and saved.
Processing chunk 2807...
Chunk 2807 processed and saved.

Chunk 2936 processed and saved.
Processing chunk 2937...
Chunk 2937 processed and saved.
Processing chunk 2938...
Chunk 2938 processed and saved.
Processing chunk 2939...
Chunk 2939 processed and saved.
Processing chunk 2940...
Chunk 2940 processed and saved.
Processing chunk 2941...
Chunk 2941 processed and saved.
Processing chunk 2942...
Chunk 2942 processed and saved.
Processing chunk 2943...
Chunk 2943 processed and saved.
Processing chunk 2944...
Chunk 2944 processed and saved.
Processing chunk 2945...
Chunk 2945 processed and saved.
Processing chunk 2946...
Chunk 2946 processed and saved.
Processing chunk 2947...
Chunk 2947 processed and saved.
Processing chunk 2948...
Chunk 2948 processed and saved.
Processing chunk 2949...
Chunk 2949 processed and saved.
Processing chunk 2950...
Chunk 2950 processed and saved.
Processing chunk 2951...
Chunk 2951 processed and saved.
Processing chunk 2952...
Chunk 2952 processed and saved.
Processing chunk 2953...
Chunk 2953 processed and saved.

Chunk 3080 processed and saved.
Processing chunk 3081...
Chunk 3081 processed and saved.
Processing chunk 3082...
Chunk 3082 processed and saved.
Processing chunk 3083...
Chunk 3083 processed and saved.
Processing chunk 3084...
Chunk 3084 processed and saved.
Processing chunk 3085...
Chunk 3085 processed and saved.
Processing chunk 3086...
Chunk 3086 processed and saved.
Processing chunk 3087...
Chunk 3087 processed and saved.
Processing chunk 3088...
Chunk 3088 processed and saved.
Processing chunk 3089...
Chunk 3089 processed and saved.
Processing chunk 3090...
Chunk 3090 processed and saved.
Processing chunk 3091...
Chunk 3091 processed and saved.
Processing chunk 3092...
Chunk 3092 processed and saved.
Processing chunk 3093...
Chunk 3093 processed and saved.
Processing chunk 3094...
Chunk 3094 processed and saved.
Processing chunk 3095...
Chunk 3095 processed and saved.
Processing chunk 3096...
Chunk 3096 processed and saved.
Processing chunk 3097...
Chunk 3097 processed and saved.

Chunk 3226 processed and saved.
Processing chunk 3227...
Chunk 3227 processed and saved.
Processing chunk 3228...
Chunk 3228 processed and saved.
Processing chunk 3229...
Chunk 3229 processed and saved.
Processing chunk 3230...
Chunk 3230 processed and saved.
Processing chunk 3231...
Chunk 3231 processed and saved.
Processing chunk 3232...
Chunk 3232 processed and saved.
Processing chunk 3233...
Chunk 3233 processed and saved.
Processing chunk 3234...
Chunk 3234 processed and saved.
Processing chunk 3235...
Chunk 3235 processed and saved.
Processing chunk 3236...
Chunk 3236 processed and saved.
Processing chunk 3237...
Chunk 3237 processed and saved.
Processing chunk 3238...
Chunk 3238 processed and saved.
Processing chunk 3239...
Chunk 3239 processed and saved.
Processing chunk 3240...
Chunk 3240 processed and saved.
Processing chunk 3241...
Chunk 3241 processed and saved.
Processing chunk 3242...
Chunk 3242 processed and saved.
Processing chunk 3243...
Chunk 3243 processed and saved.

Chunk 3372 processed and saved.
Processing chunk 3373...
Chunk 3373 processed and saved.
Processing chunk 3374...
Chunk 3374 processed and saved.
Processing chunk 3375...
Chunk 3375 processed and saved.
Processing chunk 3376...
Chunk 3376 processed and saved.
Processing chunk 3377...
Chunk 3377 processed and saved.
Processing chunk 3378...
Chunk 3378 processed and saved.
Processing chunk 3379...
Chunk 3379 processed and saved.
Processing chunk 3380...
Chunk 3380 processed and saved.
Processing chunk 3381...
Chunk 3381 processed and saved.
Processing chunk 3382...
Chunk 3382 processed and saved.
Processing chunk 3383...
Chunk 3383 processed and saved.
Processing chunk 3384...
Chunk 3384 processed and saved.
Processing chunk 3385...
Chunk 3385 processed and saved.
Processing chunk 3386...
Chunk 3386 processed and saved.
Processing chunk 3387...
Chunk 3387 processed and saved.
Processing chunk 3388...
Chunk 3388 processed and saved.
Processing chunk 3389...
Chunk 3389 processed and saved.

Chunk 3517 processed and saved.
Processing chunk 3518...
Chunk 3518 processed and saved.
Processing chunk 3519...
Chunk 3519 processed and saved.
Processing chunk 3520...
Chunk 3520 processed and saved.
Processing chunk 3521...
Chunk 3521 processed and saved.
Processing chunk 3522...
Chunk 3522 processed and saved.
Processing chunk 3523...
Chunk 3523 processed and saved.
Processing chunk 3524...
Chunk 3524 processed and saved.
Processing chunk 3525...
Chunk 3525 processed and saved.
Processing chunk 3526...
Chunk 3526 processed and saved.
Processing chunk 3527...
Chunk 3527 processed and saved.
Processing chunk 3528...
Chunk 3528 processed and saved.
Processing chunk 3529...
Chunk 3529 processed and saved.
Processing chunk 3530...
Chunk 3530 processed and saved.
Processing chunk 3531...
Chunk 3531 processed and saved.
Processing chunk 3532...
Chunk 3532 processed and saved.
Processing chunk 3533...
Chunk 3533 processed and saved.
Processing chunk 3534...
Chunk 3534 processed and saved.

Chunk 3661 processed and saved.
Processing chunk 3662...
Chunk 3662 processed and saved.
Processing chunk 3663...
Chunk 3663 processed and saved.
Processing chunk 3664...
Chunk 3664 processed and saved.
Processing chunk 3665...
Chunk 3665 processed and saved.
Processing chunk 3666...
Chunk 3666 processed and saved.
Processing chunk 3667...
Chunk 3667 processed and saved.
Processing chunk 3668...
Chunk 3668 processed and saved.
Processing chunk 3669...
Chunk 3669 processed and saved.
Processing chunk 3670...
Chunk 3670 processed and saved.
Processing chunk 3671...
Chunk 3671 processed and saved.
Processing chunk 3672...
Chunk 3672 processed and saved.
Processing chunk 3673...
Chunk 3673 processed and saved.
Processing chunk 3674...
Chunk 3674 processed and saved.
Processing chunk 3675...
Chunk 3675 processed and saved.
Processing chunk 3676...
Chunk 3676 processed and saved.
Processing chunk 3677...
Chunk 3677 processed and saved.
Processing chunk 3678...
Chunk 3678 processed and saved.

Chunk 3805 processed and saved.
Processing chunk 3806...
Chunk 3806 processed and saved.
Processing chunk 3807...
Chunk 3807 processed and saved.
Processing chunk 3808...
Chunk 3808 processed and saved.
Processing chunk 3809...
Chunk 3809 processed and saved.
Processing chunk 3810...
Chunk 3810 processed and saved.
Processing chunk 3811...
Chunk 3811 processed and saved.
Processing chunk 3812...
Chunk 3812 processed and saved.
Processing chunk 3813...
Chunk 3813 processed and saved.
Processing chunk 3814...
Chunk 3814 processed and saved.
Processing chunk 3815...
Chunk 3815 processed and saved.
Processing chunk 3816...
Chunk 3816 processed and saved.
Processing chunk 3817...
Chunk 3817 processed and saved.
Processing chunk 3818...
Chunk 3818 processed and saved.
Processing chunk 3819...
Chunk 3819 processed and saved.
Processing chunk 3820...
Chunk 3820 processed and saved.
Processing chunk 3821...
Chunk 3821 processed and saved.
Processing chunk 3822...
Chunk 3822 processed and saved.

In [7]:
import pandas as pd
 
# Define file paths
input_file = "nyc_taxi_data_cleaned_final.csv"
output_file = "nyc_taxi_data_cleaned_final1.csv"
chunk_size = 100000  # Adjust based on your system's memory
 
# Define the specific columns that should be integers
integer_columns = ["RatecodeID"]
 
def convert_specified_columns_to_int(chunk):
    """ Convert specified columns to integer type if possible. """
    for col in integer_columns:
        if col in chunk.columns:
            chunk[col] = pd.to_numeric(chunk[col], errors='coerce').fillna(0).astype(int)
    return chunk
 
 
# Process the file in chunks
with pd.read_csv(input_file, chunksize=chunk_size) as reader:
    for i, chunk in enumerate(reader):
        print(f"Processing chunk {i+1}...")
 
        # Convert only the specified columns to integers
        chunk = convert_specified_columns_to_int(chunk)
 
        # Append to the output file (write header only for the first chunk)
        mode = "w" if i == 0 else "a"
        header = i == 0
        chunk.to_csv(output_file, mode=mode, index=False, header=header)
 
        print(f"Chunk {i+1} processed and saved.")
 
print(f"Data cleaning complete! Cleaned file saved as '{output_file}'.")

Processing chunk 1...
Chunk 1 processed and saved.
Processing chunk 2...
Chunk 2 processed and saved.
Processing chunk 3...
Chunk 3 processed and saved.
Processing chunk 4...
Chunk 4 processed and saved.
Processing chunk 5...
Chunk 5 processed and saved.
Processing chunk 6...
Chunk 6 processed and saved.
Processing chunk 7...
Chunk 7 processed and saved.
Processing chunk 8...
Chunk 8 processed and saved.
Processing chunk 9...
Chunk 9 processed and saved.
Processing chunk 10...
Chunk 10 processed and saved.
Processing chunk 11...
Chunk 11 processed and saved.
Processing chunk 12...
Chunk 12 processed and saved.
Processing chunk 13...
Chunk 13 processed and saved.
Processing chunk 14...
Chunk 14 processed and saved.
Processing chunk 15...
Chunk 15 processed and saved.
Processing chunk 16...
Chunk 16 processed and saved.
Processing chunk 17...
Chunk 17 processed and saved.
Processing chunk 18...
Chunk 18 processed and saved.
Processing chunk 19...
Chunk 19 processed and saved.
Processing 

  for i, chunk in enumerate(reader):


Processing chunk 30...
Chunk 30 processed and saved.
Processing chunk 31...


  for i, chunk in enumerate(reader):


Chunk 31 processed and saved.
Processing chunk 32...
Chunk 32 processed and saved.
Processing chunk 33...
Chunk 33 processed and saved.
Processing chunk 34...
Chunk 34 processed and saved.
Processing chunk 35...
Chunk 35 processed and saved.
Processing chunk 36...
Chunk 36 processed and saved.
Processing chunk 37...
Chunk 37 processed and saved.
Processing chunk 38...
Chunk 38 processed and saved.
Processing chunk 39...
Chunk 39 processed and saved.
Processing chunk 40...
Chunk 40 processed and saved.
Processing chunk 41...
Chunk 41 processed and saved.
Processing chunk 42...
Chunk 42 processed and saved.
Processing chunk 43...
Chunk 43 processed and saved.
Processing chunk 44...
Chunk 44 processed and saved.
Processing chunk 45...
Chunk 45 processed and saved.
Processing chunk 46...
Chunk 46 processed and saved.
Processing chunk 47...
Chunk 47 processed and saved.
Processing chunk 48...
Chunk 48 processed and saved.
Processing chunk 49...
Chunk 49 processed and saved.
Processing chunk

  for i, chunk in enumerate(reader):


Chunk 60 processed and saved.
Processing chunk 61...
Chunk 61 processed and saved.
Processing chunk 62...
Chunk 62 processed and saved.
Processing chunk 63...
Chunk 63 processed and saved.
Processing chunk 64...
Chunk 64 processed and saved.
Processing chunk 65...
Chunk 65 processed and saved.
Processing chunk 66...
Chunk 66 processed and saved.
Processing chunk 67...
Chunk 67 processed and saved.
Processing chunk 68...
Chunk 68 processed and saved.
Processing chunk 69...
Chunk 69 processed and saved.
Processing chunk 70...
Chunk 70 processed and saved.
Processing chunk 71...
Chunk 71 processed and saved.
Processing chunk 72...
Chunk 72 processed and saved.
Processing chunk 73...
Chunk 73 processed and saved.
Processing chunk 74...
Chunk 74 processed and saved.
Processing chunk 75...
Chunk 75 processed and saved.
Processing chunk 76...
Chunk 76 processed and saved.
Processing chunk 77...
Chunk 77 processed and saved.
Processing chunk 78...
Chunk 78 processed and saved.
Processing chunk

  for i, chunk in enumerate(reader):


Chunk 93 processed and saved.


  for i, chunk in enumerate(reader):


Processing chunk 94...
Chunk 94 processed and saved.
Processing chunk 95...
Chunk 95 processed and saved.
Processing chunk 96...
Chunk 96 processed and saved.
Processing chunk 97...
Chunk 97 processed and saved.
Processing chunk 98...
Chunk 98 processed and saved.
Processing chunk 99...
Chunk 99 processed and saved.
Processing chunk 100...
Chunk 100 processed and saved.
Processing chunk 101...
Chunk 101 processed and saved.
Processing chunk 102...
Chunk 102 processed and saved.
Processing chunk 103...
Chunk 103 processed and saved.
Processing chunk 104...
Chunk 104 processed and saved.
Processing chunk 105...
Chunk 105 processed and saved.
Processing chunk 106...
Chunk 106 processed and saved.
Processing chunk 107...
Chunk 107 processed and saved.
Processing chunk 108...
Chunk 108 processed and saved.
Processing chunk 109...
Chunk 109 processed and saved.
Processing chunk 110...
Chunk 110 processed and saved.
Processing chunk 111...
Chunk 111 processed and saved.
Processing chunk 112..

  for i, chunk in enumerate(reader):


Chunk 126 processed and saved.


  for i, chunk in enumerate(reader):


Processing chunk 127...
Chunk 127 processed and saved.
Processing chunk 128...
Chunk 128 processed and saved.
Processing chunk 129...
Chunk 129 processed and saved.
Processing chunk 130...
Chunk 130 processed and saved.
Processing chunk 131...
Chunk 131 processed and saved.
Processing chunk 132...
Chunk 132 processed and saved.
Processing chunk 133...
Chunk 133 processed and saved.
Processing chunk 134...
Chunk 134 processed and saved.
Processing chunk 135...
Chunk 135 processed and saved.
Processing chunk 136...
Chunk 136 processed and saved.
Processing chunk 137...
Chunk 137 processed and saved.
Processing chunk 138...
Chunk 138 processed and saved.
Processing chunk 139...
Chunk 139 processed and saved.
Processing chunk 140...
Chunk 140 processed and saved.
Processing chunk 141...
Chunk 141 processed and saved.
Processing chunk 142...
Chunk 142 processed and saved.
Processing chunk 143...
Chunk 143 processed and saved.
Processing chunk 144...
Chunk 144 processed and saved.
Processing

  for i, chunk in enumerate(reader):


Processing chunk 161...
Chunk 161 processed and saved.
Processing chunk 162...


  for i, chunk in enumerate(reader):


Chunk 162 processed and saved.
Processing chunk 163...
Chunk 163 processed and saved.
Processing chunk 164...
Chunk 164 processed and saved.
Processing chunk 165...
Chunk 165 processed and saved.
Processing chunk 166...
Chunk 166 processed and saved.
Processing chunk 167...
Chunk 167 processed and saved.
Processing chunk 168...
Chunk 168 processed and saved.
Processing chunk 169...
Chunk 169 processed and saved.
Processing chunk 170...
Chunk 170 processed and saved.
Processing chunk 171...
Chunk 171 processed and saved.
Processing chunk 172...
Chunk 172 processed and saved.
Processing chunk 173...
Chunk 173 processed and saved.
Processing chunk 174...
Chunk 174 processed and saved.
Processing chunk 175...
Chunk 175 processed and saved.
Processing chunk 176...
Chunk 176 processed and saved.
Processing chunk 177...
Chunk 177 processed and saved.
Processing chunk 178...
Chunk 178 processed and saved.
Processing chunk 179...
Chunk 179 processed and saved.
Processing chunk 180...
Chunk 180 

  for i, chunk in enumerate(reader):


Chunk 194 processed and saved.
Processing chunk 195...


  for i, chunk in enumerate(reader):


Chunk 195 processed and saved.
Processing chunk 196...
Chunk 196 processed and saved.
Processing chunk 197...
Chunk 197 processed and saved.
Processing chunk 198...
Chunk 198 processed and saved.
Processing chunk 199...
Chunk 199 processed and saved.
Processing chunk 200...
Chunk 200 processed and saved.
Processing chunk 201...
Chunk 201 processed and saved.
Processing chunk 202...
Chunk 202 processed and saved.
Processing chunk 203...
Chunk 203 processed and saved.
Processing chunk 204...
Chunk 204 processed and saved.
Processing chunk 205...
Chunk 205 processed and saved.
Processing chunk 206...
Chunk 206 processed and saved.
Processing chunk 207...
Chunk 207 processed and saved.
Processing chunk 208...
Chunk 208 processed and saved.
Processing chunk 209...
Chunk 209 processed and saved.
Processing chunk 210...
Chunk 210 processed and saved.
Processing chunk 211...
Chunk 211 processed and saved.
Processing chunk 212...
Chunk 212 processed and saved.
Processing chunk 213...
Chunk 213 

  for i, chunk in enumerate(reader):


Chunk 224 processed and saved.
Processing chunk 225...
Chunk 225 processed and saved.
Processing chunk 226...
Chunk 226 processed and saved.
Processing chunk 227...
Chunk 227 processed and saved.
Processing chunk 228...
Chunk 228 processed and saved.
Processing chunk 229...
Chunk 229 processed and saved.
Processing chunk 230...
Chunk 230 processed and saved.
Processing chunk 231...
Chunk 231 processed and saved.
Processing chunk 232...
Chunk 232 processed and saved.
Processing chunk 233...
Chunk 233 processed and saved.
Processing chunk 234...
Chunk 234 processed and saved.
Processing chunk 235...
Chunk 235 processed and saved.
Processing chunk 236...
Chunk 236 processed and saved.
Processing chunk 237...
Chunk 237 processed and saved.
Processing chunk 238...
Chunk 238 processed and saved.
Processing chunk 239...
Chunk 239 processed and saved.
Processing chunk 240...
Chunk 240 processed and saved.
Processing chunk 241...
Chunk 241 processed and saved.
Processing chunk 242...
Chunk 242 

  for i, chunk in enumerate(reader):


Chunk 252 processed and saved.
Processing chunk 253...
Chunk 253 processed and saved.
Processing chunk 254...
Chunk 254 processed and saved.
Processing chunk 255...
Chunk 255 processed and saved.
Processing chunk 256...
Chunk 256 processed and saved.
Processing chunk 257...
Chunk 257 processed and saved.
Processing chunk 258...
Chunk 258 processed and saved.
Processing chunk 259...
Chunk 259 processed and saved.
Processing chunk 260...
Chunk 260 processed and saved.
Processing chunk 261...
Chunk 261 processed and saved.
Processing chunk 262...
Chunk 262 processed and saved.
Processing chunk 263...
Chunk 263 processed and saved.
Processing chunk 264...
Chunk 264 processed and saved.
Processing chunk 265...
Chunk 265 processed and saved.
Processing chunk 266...
Chunk 266 processed and saved.
Processing chunk 267...
Chunk 267 processed and saved.
Processing chunk 268...
Chunk 268 processed and saved.
Processing chunk 269...
Chunk 269 processed and saved.
Processing chunk 270...
Chunk 270 

  for i, chunk in enumerate(reader):


Chunk 280 processed and saved.
Processing chunk 281...


  for i, chunk in enumerate(reader):


Chunk 281 processed and saved.
Processing chunk 282...
Chunk 282 processed and saved.
Processing chunk 283...
Chunk 283 processed and saved.
Processing chunk 284...
Chunk 284 processed and saved.
Processing chunk 285...
Chunk 285 processed and saved.
Processing chunk 286...
Chunk 286 processed and saved.
Processing chunk 287...
Chunk 287 processed and saved.
Processing chunk 288...
Chunk 288 processed and saved.
Processing chunk 289...
Chunk 289 processed and saved.
Processing chunk 290...
Chunk 290 processed and saved.
Processing chunk 291...
Chunk 291 processed and saved.
Processing chunk 292...
Chunk 292 processed and saved.
Processing chunk 293...
Chunk 293 processed and saved.
Processing chunk 294...
Chunk 294 processed and saved.
Processing chunk 295...
Chunk 295 processed and saved.
Processing chunk 296...
Chunk 296 processed and saved.
Processing chunk 297...
Chunk 297 processed and saved.
Processing chunk 298...
Chunk 298 processed and saved.
Processing chunk 299...
Chunk 299 

  for i, chunk in enumerate(reader):


Chunk 315 processed and saved.
Processing chunk 316...


  for i, chunk in enumerate(reader):


Chunk 316 processed and saved.
Processing chunk 317...
Chunk 317 processed and saved.
Processing chunk 318...
Chunk 318 processed and saved.
Processing chunk 319...
Chunk 319 processed and saved.
Processing chunk 320...
Chunk 320 processed and saved.
Processing chunk 321...
Chunk 321 processed and saved.
Processing chunk 322...
Chunk 322 processed and saved.
Processing chunk 323...
Chunk 323 processed and saved.
Processing chunk 324...
Chunk 324 processed and saved.
Processing chunk 325...
Chunk 325 processed and saved.
Processing chunk 326...
Chunk 326 processed and saved.
Processing chunk 327...
Chunk 327 processed and saved.
Processing chunk 328...
Chunk 328 processed and saved.
Processing chunk 329...
Chunk 329 processed and saved.
Processing chunk 330...
Chunk 330 processed and saved.
Processing chunk 331...
Chunk 331 processed and saved.
Processing chunk 332...
Chunk 332 processed and saved.
Processing chunk 333...
Chunk 333 processed and saved.
Processing chunk 334...
Chunk 334 

  for i, chunk in enumerate(reader):


Chunk 349 processed and saved.
Processing chunk 350...


  for i, chunk in enumerate(reader):


Chunk 350 processed and saved.
Processing chunk 351...
Chunk 351 processed and saved.
Processing chunk 352...
Chunk 352 processed and saved.
Processing chunk 353...
Chunk 353 processed and saved.
Processing chunk 354...
Chunk 354 processed and saved.
Processing chunk 355...
Chunk 355 processed and saved.
Processing chunk 356...
Chunk 356 processed and saved.
Processing chunk 357...
Chunk 357 processed and saved.
Processing chunk 358...
Chunk 358 processed and saved.
Processing chunk 359...
Chunk 359 processed and saved.
Processing chunk 360...
Chunk 360 processed and saved.
Processing chunk 361...
Chunk 361 processed and saved.
Processing chunk 362...
Chunk 362 processed and saved.
Processing chunk 363...
Chunk 363 processed and saved.
Processing chunk 364...
Chunk 364 processed and saved.
Processing chunk 365...
Chunk 365 processed and saved.
Processing chunk 366...
Chunk 366 processed and saved.
Processing chunk 367...
Chunk 367 processed and saved.
Processing chunk 368...
Chunk 368 

  for i, chunk in enumerate(reader):


Chunk 382 processed and saved.
Processing chunk 383...
Chunk 383 processed and saved.
Processing chunk 384...
Chunk 384 processed and saved.
Data cleaning complete! Cleaned file saved as 'nyc_taxi_data_cleaned_final1.csv'.
