In [None]:
import os
import pyarrow.parquet as pq
import report

In [None]:
# Dataset variant suffix: index 0 picks "_trg", index 1 picks "_lev".
label_options = ["_trg", "_lev"]
label = label_options[0]

# Read the parquet file for the chosen variant (memory-mapped) and list its columns.
parquet_path = f"../../data/fsq_osm_filtered_5{label}.parquet"
data = pq.read_table(parquet_path, memory_map=True)
print(data.column_names)

In [None]:
# Write the two coordinate columns to a CSV once; an existing file is left untouched.
map_csv_path = f"../../data/fsq_osm_filtered_5_map{label}.csv"
if not os.path.exists(map_csv_path):
    coord_table = data.select(["fsq_latitude", "fsq_longitude"])
    map_data = coord_table.to_pandas()
    map_data.to_csv(map_csv_path, index=False)

In [None]:
# Every figure is saved under save_dir as "<stem><label>.png".
save_dir = "../../visualization/report"

# The per-year counts share one plotting function and differ only in the date column.
for date_col, stem in (
    ("fsq_date_created", "place_created_per_year"),
    ("fsq_date_refreshed", "place_refreshed_per_year"),
):
    report.plot_count_per_year(data, col=date_col, save_path=f"{save_dir}/{stem}{label}.png")

# The remaining plots take only the table and a destination path.
for plot_fn, stem in (
    (report.plot_distance_hist, "place_distance_hist"),
    (report.plot_name_similarity_hist, "place_name_similarity_hist"),
    (report.plot_country_distribution, "place_country_distribution"),
    (report.plot_region_distribution, "place_region_distribution"),
    (report.plot_locality_distribution, "place_locality_distribution"),
    (report.plot_category_by_country, "place_category_by_country"),
    (report.plot_osm_class_distribution, "place_osm_class_distribution"),
):
    plot_fn(data, save_path=f"{save_dir}/{stem}{label}.png")


In [None]:
# File-name stems of the report figures, one per line, in the order they are emitted.
plot_names = """
place_created_per_year
place_refreshed_per_year
place_distance_hist
place_name_similarity_hist
place_country_distribution
place_region_distribution
place_locality_distribution
place_category_by_country
place_osm_class_distribution
""".split()


def get_latex_fig(fig_name, left_label, right_label):
    """Return LaTeX source for one figure holding two half-width subfigures.

    Args:
        fig_name: Base name shared by both panels. It is used verbatim in the
            image paths and label keys; in captions its underscores are
            replaced (by hyphens in the panel captions, by spaces in the
            overall caption, which is also capitalized).
        left_label: Suffix appended to ``fig_name`` for the first panel.
        right_label: Suffix appended to ``fig_name`` for the second panel.

    Returns:
        The figure environment as a string that begins and ends with a
        newline. Images are referenced as ``figs/<fig_name><label>.png``.
    """
    hyphenated_name = fig_name.replace("_", "-")

    def _panel(side_label):
        # One subfigure block for the image named fig_name + side_label.
        hyphenated_side = side_label.replace("_", "-")
        return [
            r"    \begin{subfigure}[b]{0.49\linewidth}",
            r"        \centering",
            rf"        \includegraphics[width=\linewidth]{{figs/{fig_name}{side_label}.png}}",
            rf"        \caption{{{hyphenated_name}{hyphenated_side}}}",
            rf"        \label{{fig:{fig_name}{side_label}}}",
            r"    \end{subfigure}",
        ]

    overall_caption = fig_name.replace("_", " ").capitalize()

    # Empty first/last entries reproduce the leading and trailing newline.
    lines = [
        "",
        r"\begin{figure}[htbp]",
        r"    \centering",
        *_panel(left_label),
        r"    \hfill",
        *_panel(right_label),
        rf"    \caption{{{overall_caption}}}",
        rf"    \label{{fig:{fig_name}}}",
        r"\end{figure}",
        "",
    ]
    return "\n".join(lines)

# Print one two-panel figure snippet per plot: "_lev" image on the left, "_trg" on the right.
for plot_name in plot_names:
    latex_snippet = get_latex_fig(plot_name, left_label="_lev", right_label="_trg")
    print(latex_snippet)

    