In [1]:
import pandas as pd

In [7]:
import pandas as pd
import os
import glob
import json
from tqdm import tqdm

# Combine every JSON file under data/ into a single CSV.
#
# Each file may hold one record (a top-level JSON object) or several records
# (a top-level JSON array). Files that cannot be read or parsed are reported
# and skipped so that one bad file does not abort the whole run.

# Find all JSON files in data/ directory and subdirectories.
# glob yields paths in filesystem-dependent order; sorting keeps the row
# order of the combined CSV reproducible from run to run.
all_json_files = sorted(glob.glob("data/**/*.json", recursive=True))
print(f"Found {len(all_json_files)} JSON files")

# Read and combine all JSON files into a single list of records
data_list = []
failed_files = []       # files that could not be opened, decoded or parsed
unsupported_files = []  # files whose top-level JSON value is neither object nor array
for json_file in tqdm(all_json_files, desc="Processing JSON files", unit="file"):
    try:
        with open(json_file, 'r', encoding='utf-8') as f:
            data = json.load(f)
    except (OSError, ValueError, RecursionError) as e:
        # OSError: file cannot be opened/read.
        # ValueError: parent of json.JSONDecodeError and UnicodeDecodeError.
        # RecursionError: pathologically deep nesting in the JSON document.
        failed_files.append(json_file)
        print(f"Error reading {json_file}: {e}")
        continue

    # The file is already closed here; only in-memory work remains.
    if isinstance(data, dict):
        # A single record
        data_list.append(data)
    elif isinstance(data, list):
        # A list of records
        data_list.extend(data)
    else:
        # Scalars / null cannot become rows; report them instead of
        # dropping them silently.
        unsupported_files.append(json_file)
        print(f"Skipping {json_file}: unsupported top-level JSON type {type(data).__name__}")

if failed_files or unsupported_files:
    print(
        f"Skipped {len(failed_files)} unreadable and "
        f"{len(unsupported_files)} unsupported files"
    )

# Convert to DataFrame and save as CSV.
# Note: `df` and `output_file` are only defined when at least one record was loaded.
if data_list:
    print("Converting to DataFrame and saving...")
    df = pd.DataFrame(data_list)
    output_file = "data/combined_vessels.csv"
    df.to_csv(output_file, index=False)
    print(f"Combined {len(data_list)} records into {output_file}")
    print(f"DataFrame shape: {df.shape}")
else:
    print("No data found to combine")

Found 71041 JSON files


Processing JSON files: 100%|██████████| 71041/71041 [22:24<00:00, 52.85file/s]  


Converting to DataFrame and saving...
Combined 71041 records into data/combined_vessels.csv
DataFrame shape: (71041, 23)


In [8]:
# Show the combined DataFrame as the cell result; the notebook renders a
# truncated preview (first/last rows, middle columns elided) rather than
# every row. `df` exists only if the combining cell loaded at least one record.
df

Unnamed: 0,IMO number,Vessel type,Operating status,Flag,Year of build,Builder,Description,Vessel name,Gross tonnage (tons),source_url,...,Deadweight (tons),MMSI,Former names,Home port,Owner,Manager,Engine type,Engine model,Engine power,Draft
0,5388134,Fishing vessel,Decommissioned or lost,Canada,1943,"QUINCY ADAMS YACHT YARD - QUINCY MA, U.S.A.",WESTERN DISPATCHER is a Fishing vessel built i...,WESTERN DISPATCHER,133tons,https://www.balticshipping.com/vessel/imo/5388134,...,,,,,,,,,,
1,6855304,Tug boat,Decommissioned or lost,,1936,,KIM is a Tug boat built in 1936. Current statu...,KIM,376tons,https://www.balticshipping.com/vessel/imo/6855304,...,,,,,,,,,,
2,7329534,Lash/Barge carrier,Decommissioned or lost,India,1974,"DANYARD - FREDERIKSHAVN, DENMARK",BACAT I is a Lash/Barge carrier built in 1974 ...,BACAT I,1339tons,https://www.balticshipping.com/vessel/imo/7329534,...,1840tons,,,,,,,,,
3,8925218,General cargo vessel,Active,Japan,1996,"YANO SHIPBUILDING - IMABARI, JAPAN",SUNNY KISSHO is a General cargo vessel built i...,SUNNY KISSHO,199tons,https://www.balticshipping.com/vessel/imo/8925218,...,699tons,,,,,,,,,
4,9104902,Container ship,Decommissioned or lost,Palau,1995,"HYUNDAI HEAVY INDUSTRIES CO. LTD. - ULSAN, SOU...",OEL EMIRATES is a Container ship built in 1995...,OEL EMIRATES,36606tons,https://www.balticshipping.com/vessel/imo/9104902,...,45240tons,511966000,"OEL EMIRATES(2019, Panama)NORFOLK EXPRESS(2015...",HAMILTON,"HAPAG LLOYD - HAMBURG, GERMANY","ANGLO EASTERN SHIPMANAGEMENT - HONG KONG, CHINA",,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
71036,9451240,Bulk carrier,Active,Bahamas,2011,"STX DALIAN SHIPBUILDING - DALIAN, CHINA",SERENE JESSICA is a Bulk carrier built in 2011...,SERENE JESSICA,33226tons,https://www.balticshipping.com/vessel/imo/9451240,...,57275tons,311047600,MARIA V.LIVANOS(2013),NASSAU,"TROJAN MARITIME ATHENS, GREECE","TROJAN MARITIME ATHENS, GREECE",MAN-B&W,6S60MC,9480 KW,
71037,5163819,Chemical/Oil tanker,Decommissioned or lost,Bahamas,1944,CONSOLIDATED WESTERN STEEL SAN PEDRO - SAN PED...,IRVING HICKORY is a Chemical/Oil tanker built ...,IRVING HICKORY,614tons,https://www.balticshipping.com/vessel/imo/5163819,...,1006tons,,MELENGER(1962)YW 93,,,,,,,
71038,7205192,Bulk carrier,Decommissioned or lost,North Korea,1972,"SHIN YAMAMOTO SHIPBUILDING - KOCHI, JAPAN",JODIE is a Bulk carrier built in 1972 by SHIN ...,JODIE,10478tons,https://www.balticshipping.com/vessel/imo/7205192,...,16999tons,,EUROBULKER VII(2003)JODIE D(1997)CHIOS DESTINY...,,,,,,,
71039,7202657,Fishing vessel,Decommissioned or lost,,1914,"KING & WINGE - SEATTLE WA, U.S.A.",KING & WINGE is a Fishing vessel built in 1914...,KING & WINGE,143tons,https://www.balticshipping.com/vessel/imo/7202657,...,,,COLUMBIA(1914),,,,,,,
