# Baseline - klasyfikacja



In [171]:
import srai
import pandas as pd
import geopandas as gpd
from srai.regionalizers import H3Regionalizer, geocode_to_region_gdf
from srai.embedders import CountEmbedder
from srai.joiners import IntersectionJoiner
from srai.loaders import OSMOnlineLoader
from srai.plotting import plot_regions
import overpy
import time
import pickle
from srai.constants import WGS84_CRS, FEATURES_INDEX

## Tworzenie zbioru danych

Wykorzystane tagi: highway, amenity, building

Dane o wypadkach (liczba zdarzeń) za rok 2023

In [17]:
# Geocode the study area; the result is a GeoDataFrame with a single 'geometry' column.
area = geocode_to_region_gdf("Wrocław, Poland")

In [31]:
area.columns

Index(['geometry'], dtype='object')

In [117]:
def get_all_values_for_tag(tag, area_name="Wrocław", verbose=False):
    """
    Get all unique values of a given OSM key inside a named area.

    Sends one Overpass query that selects every node, way and relation in
    the area carrying ``tag`` and collects the distinct values of that tag.

    Args:
        tag: OSM key to look up (e.g. "highway").
        area_name: Value of the ``name`` tag identifying the Overpass area.
        verbose: When True, print every matching element with its value.

    Returns:
        Sorted list of the unique values found for ``tag``. Sorting makes
        the result (and any chunking done on it) reproducible between runs.
    """
    api = overpy.Overpass()
    query = f"""
    area[name="{area_name}"];
    (nwr[{tag}](area););
    out tags;
    """
    result = api.query(query)

    # Same traversal order as before: ways, then nodes, then relations.
    element_groups = (
        ("Way", result.ways),
        ("Node", result.nodes),
        ("Relation", result.relations),
    )
    unique_values = set()
    for label, elements in element_groups:
        for element in elements:
            # Direct lookup instead of scanning every tag of the element.
            value = element.tags.get(tag)
            if value is None:
                continue
            if verbose:
                print(f"{label} {element.id}: {tag} = {value}")
            unique_values.add(value)
    return sorted(unique_values)

In [70]:
def slice_list(input_list, max_elements_per_slice=20):
    """
    Split a sequence into consecutive chunks.

    Every chunk holds at most ``max_elements_per_slice`` items; only the
    last chunk may be shorter. An empty input yields an empty list.
    """
    chunk_starts = range(0, len(input_list), max_elements_per_slice)
    return [
        input_list[start:start + max_elements_per_slice]
        for start in chunk_starts
    ]

In [132]:
def get_list_of_features_gdf(tag_key_names, region=None, chunk_size=10, pause_seconds=30):
    """
    Download OSM features for every value of the given tag keys.

    For each key, all values present in the area are looked up with
    ``get_all_values_for_tag`` and split into chunks of ``chunk_size``;
    each chunk is then downloaded with a separate ``OSMOnlineLoader.load``
    call.

    Args:
        tag_key_names: Iterable of OSM keys (e.g. ["highway", "amenity"]).
        region: Area GeoDataFrame to download features for. Defaults to the
            notebook-level ``area`` variable.
        chunk_size: Maximum number of tag values sent in one loader query.
        pause_seconds: Seconds to sleep after every download request
            (presumably to stay within the OSM service rate limits).

    Returns:
        List with one features GeoDataFrame per downloaded chunk, in the
        order of ``tag_key_names`` and of the chunks within each key.
    """
    if region is None:
        # Fall back to the notebook-level region, as the original code did.
        region = area

    # Resolve all tag values first, then download, keeping the request order.
    chunks_by_key = {
        tag_key: slice_list(
            get_all_values_for_tag(tag_key),
            max_elements_per_slice=chunk_size,
        )
        for tag_key in tag_key_names
    }

    # One loader is enough; it is reused for every query.
    loader = OSMOnlineLoader()
    features_list = []
    for tag_key, value_chunks in chunks_by_key.items():
        for value_chunk in value_chunks:
            features_list.append(loader.load(region, {tag_key: value_chunk}))
            time.sleep(pause_seconds)

    return features_list
        


In [163]:
# Set to True to re-download the features from OSM; otherwise the pickle
# written by a previous run is used by the loading cell.
download_features = False
if download_features:
    # The keys are downloaded in two separate batches and merged afterwards.
    feature_key_names = ["highway", "amenity"]
    features_list1 = get_list_of_features_gdf(feature_key_names)
    feature_key_names2 = ["building"]
    features_list2 = get_list_of_features_gdf(feature_key_names2)
    features_list1.extend(features_list2)
    # Stack all chunks into one GeoDataFrame; the original index is kept
    # (ignore_index=False) and the CRS is taken from the first chunk.
    concat_gdf = gpd.GeoDataFrame(pd.concat(features_list1, ignore_index=False), crs=features_list1[0].crs)
    # Cache the result on disk so the download does not have to be repeated.
    concat_gdf.to_pickle("data/features_gdf_highway_amenity_building.pkl")

In [139]:
# Load the cached features written by the download cell.
# NOTE(review): unpickling can execute arbitrary code - only load pickle files you created yourself.
all_features_gdf = pd.read_pickle("data/features_gdf_highway_amenity_building.pkl")

In [142]:
all_features_gdf.head()

Unnamed: 0_level_0,geometry,highway,amenity,building
feature_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
node/150597406,POINT (16.97786 51.09238),crossing,,
node/151334674,POINT (16.97939 51.09485),traffic_signals,,
node/153568043,POINT (16.96694 51.07828),crossing,,
node/158719856,POINT (17.03100 51.09441),crossing,,
node/158719876,POINT (17.04118 51.09612),traffic_signals,,


In [153]:
# Flag every repeated occurrence of a feature id (the first one is kept),
# then keep only the unflagged rows so the index becomes unique.
duplicates = all_features_gdf.index.duplicated(keep="first")
features_no_duplicates = all_features_gdf.loc[~duplicates]

In [182]:
# Read the 2023 accident records and reproject them to EPSG:4326 in one step.
wypadki = gpd.read_file("./data/wypadki/2023_szczegoly_zdarzen_dr.shx").to_crs('EPSG:4326')

In [183]:
def make_count_embeddings(def_area, features, regionalizer):
    """
    Build count embeddings of ``features`` for the regions of ``def_area``.

    Args:
        def_area: Area passed to ``regionalizer.transform`` to obtain regions.
        features: Features GeoDataFrame; its index must be unique.
        regionalizer: Object with a ``transform(area)`` method returning the
            regions (an ``H3Regionalizer`` in this notebook).

    Returns:
        The output of ``CountEmbedder().transform`` for the regions, the
        features and their intersection join.

    Raises:
        ValueError: If the index of ``features`` contains duplicates.
    """
    # The indexes should be unique for the count embedder. Raise explicitly
    # instead of asserting: asserts are stripped when Python runs with -O.
    if not features.index.is_unique:
        raise ValueError(
            "features index must be unique; drop duplicated feature ids first"
        )

    regions = regionalizer.transform(def_area)
    joint = IntersectionJoiner().transform(regions, features)
    return CountEmbedder().transform(regions, features, joint)

def make_count_embeddings_wypadki(def_area, wypadki_df, regionalizer):
    """
    Build count embeddings of accident records for the regions of ``def_area``.

    The accidents are converted to a features GeoDataFrame with a ``rok``
    column (taken from ``ROK``), the original geometry and a fresh integer
    index named ``FEATURES_INDEX``, and are then counted per region.

    Args:
        def_area: Area passed to ``regionalizer.transform`` to obtain regions.
        wypadki_df: GeoDataFrame with ``ROK`` and ``geometry`` columns.
        regionalizer: Object with a ``transform(area)`` method returning the
            regions (an ``H3Regionalizer`` in this notebook).

    Returns:
        The output of ``CountEmbedder().transform`` for the regions, the
        accident features and their intersection join.
    """
    # pandas aligns Series passed in a dict on the ``index`` argument, so the
    # source index is dropped first; otherwise a frame whose index is not
    # exactly 0..n-1 (e.g. after filtering) would produce NaN rows.
    features_y = gpd.GeoDataFrame(
        {
            'rok': wypadki_df['ROK'].reset_index(drop=True),
            'geometry': wypadki_df['geometry'].reset_index(drop=True),
        },
        crs=WGS84_CRS,
        index=pd.RangeIndex(len(wypadki_df), name=FEATURES_INDEX),
    )
    regions = regionalizer.transform(def_area)
    joint = IntersectionJoiner().transform(regions, features_y, return_geom=True)
    return CountEmbedder().transform(regions, features_y, joint)
   

In [184]:
# Split the area into H3 cells at resolution 9; the same regionalizer is
# passed to both helpers so the two results share region ids.
regionalizer = H3Regionalizer(resolution=9)
# Per-region counts of the de-duplicated OSM features.
embeddings_features = make_count_embeddings(area, features_no_duplicates, regionalizer)
# Per-region counts of the accident records.
embeddings_y = make_count_embeddings_wypadki(area, wypadki, regionalizer )


  return vector.wkb_to_cells(
  return vector.wkb_to_cells(


In [187]:
embeddings_y.index[0]

'891e204046bffff'

In [188]:
embeddings_features.index[0]

'891e204046bffff'

In [201]:
# Attach the accident counts to the feature counts, matching rows on the
# shared region_id index (DataFrame.join performs a left join by default).
all_data = embeddings_features.join(embeddings_y)
all_data.head()

Unnamed: 0_level_0,highway_bridleway,highway_bus_stop,highway_construction,highway_corridor,highway_crossing,highway_cycleway,highway_elevator,highway_footway,highway_give_way,highway_living_street,highway_milestone,highway_mini_roundabout,highway_motorway,highway_motorway_junction,highway_motorway_link,highway_passing_place,highway_path,highway_pedestrian,highway_platform,highway_primary,highway_primary_link,highway_proposed,highway_raceway,highway_residential,highway_secondary,highway_secondary_link,highway_service,highway_steps,highway_stop,highway_street_lamp,highway_tertiary,highway_tertiary_link,highway_track,highway_traffic_mirror,highway_traffic_signals,highway_trunk,highway_trunk_link,highway_turning_circle,highway_turning_loop,highway_unclassified,amenity_animal_boarding,amenity_animal_shelter,amenity_animal_training,amenity_arts_centre,amenity_atm,amenity_baby_hatch,amenity_bank,amenity_bar,amenity_bbq,amenity_bench,amenity_bicycle_parking,amenity_bicycle_rental,amenity_bicycle_repair_station,amenity_biergarten,amenity_boat_rental,amenity_bts,amenity_bureau_de_change,amenity_bus_station,amenity_cafe,amenity_car_rental,amenity_car_wash,amenity_casino,amenity_charging_station,amenity_childcare,amenity_cinema,amenity_clinic,amenity_clock,amenity_college,amenity_community_centre,amenity_compressed_air,amenity_conference_centre,amenity_courthouse,amenity_coworking_space,amenity_crematorium,amenity_dancing_school,amenity_dentist,amenity_doctors,amenity_dog_toilet,amenity_dog_toilets,amenity_dormitory,amenity_dressing_room,amenity_drinking_water,amenity_driver_training,amenity_driving_school,amenity_events_venue,amenity_fast_food,amenity_feeding_place,amenity_fire_station,amenity_fixme,amenity_food_court,amenity_food_sharing,amenity_fountain,amenity_fridge,amenity_fuel,amenity_give_box,amenity_grave_yard,amenity_grit_bin,amenity_guitar_lessons,amenity_hookah_lounge,amenity_hospital,amenity_hunting_stand,amenity_ice_cream,amenity_internet_cafe,amenity_kindergarte
n,amenity_language_school,amenity_letter_box,amenity_library,amenity_loading_dock,amenity_lounger,amenity_luggage_locker,amenity_marketplace,amenity_mist_spraying_cooler,amenity_monastery,amenity_money_transfer,amenity_motorcycle_parking,amenity_music_school,amenity_music_venue,amenity_nightclub,amenity_nursing_home,amenity_parcel_locker,amenity_parking,amenity_parking_entrance,amenity_parking_locker,amenity_parking_space,amenity_payment_centre,amenity_payment_terminal,amenity_pharmacy,amenity_photo_booth,amenity_place_of_worship,amenity_police,amenity_post_box,amenity_post_depot,amenity_post_office,amenity_printer,amenity_prison,amenity_pub,amenity_public_bath,amenity_public_bookcase,amenity_reception_desk,amenity_recycling,amenity_research_institute,amenity_restaurant,amenity_safe_deposit,amenity_school,amenity_shelter,amenity_shower,amenity_singing_lessons,amenity_smoking_area,amenity_social_centre,amenity_social_facility,amenity_stage,amenity_stripclub,amenity_studio,amenity_table,amenity_taxi,amenity_theatre,amenity_toilets,amenity_townhall,amenity_traffic_park,amenity_training,amenity_trolley_bay,amenity_university,amenity_vacuum_cleaner,amenity_vehicle_inspection,amenity_vending_machine,amenity_veterinary,amenity_waste_basket,amenity_waste_disposal,amenity_watering_place,amenity_weighbridge,building_allotment_house,building_apartments,building_barn,building_being_demolished,building_boathouse,building_bridge,building_bungalow,building_bunker,building_buttress,building_carport,building_castle,building_chapel,building_chimney,building_church,building_civic,building_collapsed,building_college,building_commercial,building_construction,building_container,building_convent,building_corridor,building_cover,building_data_center,building_detached,building_dormitory,building_elevator_housing,building_entrance,building_farm,building_farm_auxiliary,building_fire_station,building_fountain,building_garage,building_garages,building_gate,building_gazebo,building_government,bu
ilding_grandstand,building_greenhouse,building_guard_shed,building_guardhouse,building_gymnasium,building_hangar,building_healthcare,building_hospital,building_hostel,building_hotel,building_house,building_houseboat,building_hut,building_industrial,building_kindergarten,building_kiosk,building_manufacture,building_mini_castle,building_monastery,building_office,building_outbuilding,building_palace,building_parking,building_parking_entrance,building_pavilion,building_pedestal,building_porch,building_postument,building_presbytery,building_prison,building_public,building_railway,building_ramp,building_residential,building_retail,building_riding_hall,building_roof,building_ruins,building_school,building_semi,building_semidetached_house,building_service,building_shed,building_ship,building_silo,building_skywalk,building_sports_centre,building_sports_hall,building_stable,building_stadium,building_staircase,building_stairs,building_static_caravan,building_storage_tank,building_supermarket,building_tent,building_terrace,building_toilets,building_tower,building_train_station,building_transformer_tower,building_transportation,building_university,building_wall,building_warehouse,building_waste,building_water_tower,building_wayside_shrine,building_yes,rok_2023
region_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 
100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 
195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1
891e204046bffff,0,2,0,0,6,0,0,55,0,0,0,0,0,0,0,0,7,0,0,0,0,0,0,9,0,0,21,1,0,0,4,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,156,3
891e204304bffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0
891e20406c3ffff,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,2,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,0
891e2044647ffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0
891e205526fffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


## Czyszczenie danych
W pierwszej kolejności usunięto **amenity: waste_basket** jako tag, dla którego na pewno występuje niekonsekwencja tagowania ([ref](https://arxiv.org/pdf/2111.00970.pdf)). 
W kolejnym kroku usunięto rekordy, które nie posiadały żadnych cech (wszystkie cechy poza liczbą wypadków równe 0).

In [202]:
# Remove the amenity=waste_basket counts; the notes above cite this tag as inconsistently mapped.
all_data = all_data.drop("amenity_waste_basket", axis=1)

In [203]:
# Give the accident-count column (named 'rok_2023' by the embedder output) a descriptive name.
all_data = all_data.rename(columns={'rok_2023': 'wypadki_count'})

In [204]:
all_data.isna().sum()

highway_bridleway          0
highway_bus_stop           0
highway_construction       0
highway_corridor           0
highway_crossing           0
                          ..
building_waste             0
building_water_tower       0
building_wayside_shrine    0
building_yes               0
wypadki_count              0
Length: 276, dtype: int64

In [205]:
all_data['wypadki_count'].describe()

count    2965.000000
mean        1.537943
std         3.986947
min         0.000000
25%         0.000000
50%         0.000000
75%         1.000000
max        40.000000
Name: wypadki_count, dtype: float64

In [216]:
# Bin edges of the accident-count classes: [0, 10], (10, 20], (20, 30], (30, inf).
# The last edge is open-ended so that counts above 40 (the maximum observed
# in this dataset) still fall into class 3 instead of becoming NaN.
bins = [0, 10, 20, 30, float("inf")]

# Integer class label assigned to each bin, in order.
categories = [0, 1, 2, 3]
# include_lowest=True closes the first interval on the left, so a count of 0 gets class 0.
all_data['wypadki_category'] = pd.cut(all_data['wypadki_count'], bins, labels=categories, include_lowest=True)


In [220]:
all_data.head()

Unnamed: 0_level_0,highway_bridleway,highway_bus_stop,highway_construction,highway_corridor,highway_crossing,highway_cycleway,highway_elevator,highway_footway,highway_give_way,highway_living_street,highway_milestone,highway_mini_roundabout,highway_motorway,highway_motorway_junction,highway_motorway_link,highway_passing_place,highway_path,highway_pedestrian,highway_platform,highway_primary,highway_primary_link,highway_proposed,highway_raceway,highway_residential,highway_secondary,highway_secondary_link,highway_service,highway_steps,highway_stop,highway_street_lamp,highway_tertiary,highway_tertiary_link,highway_track,highway_traffic_mirror,highway_traffic_signals,highway_trunk,highway_trunk_link,highway_turning_circle,highway_turning_loop,highway_unclassified,amenity_animal_boarding,amenity_animal_shelter,amenity_animal_training,amenity_arts_centre,amenity_atm,amenity_baby_hatch,amenity_bank,amenity_bar,amenity_bbq,amenity_bench,amenity_bicycle_parking,amenity_bicycle_rental,amenity_bicycle_repair_station,amenity_biergarten,amenity_boat_rental,amenity_bts,amenity_bureau_de_change,amenity_bus_station,amenity_cafe,amenity_car_rental,amenity_car_wash,amenity_casino,amenity_charging_station,amenity_childcare,amenity_cinema,amenity_clinic,amenity_clock,amenity_college,amenity_community_centre,amenity_compressed_air,amenity_conference_centre,amenity_courthouse,amenity_coworking_space,amenity_crematorium,amenity_dancing_school,amenity_dentist,amenity_doctors,amenity_dog_toilet,amenity_dog_toilets,amenity_dormitory,amenity_dressing_room,amenity_drinking_water,amenity_driver_training,amenity_driving_school,amenity_events_venue,amenity_fast_food,amenity_feeding_place,amenity_fire_station,amenity_fixme,amenity_food_court,amenity_food_sharing,amenity_fountain,amenity_fridge,amenity_fuel,amenity_give_box,amenity_grave_yard,amenity_grit_bin,amenity_guitar_lessons,amenity_hookah_lounge,amenity_hospital,amenity_hunting_stand,amenity_ice_cream,amenity_internet_cafe,amenity_kindergarte
n,amenity_language_school,amenity_letter_box,amenity_library,amenity_loading_dock,amenity_lounger,amenity_luggage_locker,amenity_marketplace,amenity_mist_spraying_cooler,amenity_monastery,amenity_money_transfer,amenity_motorcycle_parking,amenity_music_school,amenity_music_venue,amenity_nightclub,amenity_nursing_home,amenity_parcel_locker,amenity_parking,amenity_parking_entrance,amenity_parking_locker,amenity_parking_space,amenity_payment_centre,amenity_payment_terminal,amenity_pharmacy,amenity_photo_booth,amenity_place_of_worship,amenity_police,amenity_post_box,amenity_post_depot,amenity_post_office,amenity_printer,amenity_prison,amenity_pub,amenity_public_bath,amenity_public_bookcase,amenity_reception_desk,amenity_recycling,amenity_research_institute,amenity_restaurant,amenity_safe_deposit,amenity_school,amenity_shelter,amenity_shower,amenity_singing_lessons,amenity_smoking_area,amenity_social_centre,amenity_social_facility,amenity_stage,amenity_stripclub,amenity_studio,amenity_table,amenity_taxi,amenity_theatre,amenity_toilets,amenity_townhall,amenity_traffic_park,amenity_training,amenity_trolley_bay,amenity_university,amenity_vacuum_cleaner,amenity_vehicle_inspection,amenity_vending_machine,amenity_veterinary,amenity_waste_disposal,amenity_watering_place,amenity_weighbridge,building_allotment_house,building_apartments,building_barn,building_being_demolished,building_boathouse,building_bridge,building_bungalow,building_bunker,building_buttress,building_carport,building_castle,building_chapel,building_chimney,building_church,building_civic,building_collapsed,building_college,building_commercial,building_construction,building_container,building_convent,building_corridor,building_cover,building_data_center,building_detached,building_dormitory,building_elevator_housing,building_entrance,building_farm,building_farm_auxiliary,building_fire_station,building_fountain,building_garage,building_garages,building_gate,building_gazebo,building_government,building_grandstand,bui
lding_greenhouse,building_guard_shed,building_guardhouse,building_gymnasium,building_hangar,building_healthcare,building_hospital,building_hostel,building_hotel,building_house,building_houseboat,building_hut,building_industrial,building_kindergarten,building_kiosk,building_manufacture,building_mini_castle,building_monastery,building_office,building_outbuilding,building_palace,building_parking,building_parking_entrance,building_pavilion,building_pedestal,building_porch,building_postument,building_presbytery,building_prison,building_public,building_railway,building_ramp,building_residential,building_retail,building_riding_hall,building_roof,building_ruins,building_school,building_semi,building_semidetached_house,building_service,building_shed,building_ship,building_silo,building_skywalk,building_sports_centre,building_sports_hall,building_stable,building_stadium,building_staircase,building_stairs,building_static_caravan,building_storage_tank,building_supermarket,building_tent,building_terrace,building_toilets,building_tower,building_train_station,building_transformer_tower,building_transportation,building_university,building_wall,building_warehouse,building_waste,building_water_tower,building_wayside_shrine,building_yes,wypadki_category
region_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 
100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 
195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1
891e204046bffff,0,2,0,0,6,0,0,55,0,0,0,0,0,0,0,0,7,0,0,0,0,0,0,9,0,0,21,1,0,0,4,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,156,0
891e204304bffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0
891e20406c3ffff,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,2,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,0
891e2044647ffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0
891e205526fffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [219]:
# Remove the 'wypadki_count' column from the table; the 'wypadki_category'
# column is kept and is used as the label further down.
all_data = all_data.drop(columns=['wypadki_count'])

In [221]:
# Feature columns: every column except the 'wypadki_category' label.
x_columns = all_data.drop(columns=['wypadki_category']).columns
# Keep only rows whose feature values sum to something other than zero
# (presumably this removes regions with no OSM features at all - confirm).
all_data_filtered = all_data.loc[all_data[x_columns].sum(axis=1).ne(0)]
# Last expression of the cell: preview the first rows of the filtered table.
all_data_filtered.head()

Unnamed: 0_level_0,highway_bridleway,highway_bus_stop,highway_construction,highway_corridor,highway_crossing,highway_cycleway,highway_elevator,highway_footway,highway_give_way,highway_living_street,highway_milestone,highway_mini_roundabout,highway_motorway,highway_motorway_junction,highway_motorway_link,highway_passing_place,highway_path,highway_pedestrian,highway_platform,highway_primary,highway_primary_link,highway_proposed,highway_raceway,highway_residential,highway_secondary,highway_secondary_link,highway_service,highway_steps,highway_stop,highway_street_lamp,highway_tertiary,highway_tertiary_link,highway_track,highway_traffic_mirror,highway_traffic_signals,highway_trunk,highway_trunk_link,highway_turning_circle,highway_turning_loop,highway_unclassified,amenity_animal_boarding,amenity_animal_shelter,amenity_animal_training,amenity_arts_centre,amenity_atm,amenity_baby_hatch,amenity_bank,amenity_bar,amenity_bbq,amenity_bench,amenity_bicycle_parking,amenity_bicycle_rental,amenity_bicycle_repair_station,amenity_biergarten,amenity_boat_rental,amenity_bts,amenity_bureau_de_change,amenity_bus_station,amenity_cafe,amenity_car_rental,amenity_car_wash,amenity_casino,amenity_charging_station,amenity_childcare,amenity_cinema,amenity_clinic,amenity_clock,amenity_college,amenity_community_centre,amenity_compressed_air,amenity_conference_centre,amenity_courthouse,amenity_coworking_space,amenity_crematorium,amenity_dancing_school,amenity_dentist,amenity_doctors,amenity_dog_toilet,amenity_dog_toilets,amenity_dormitory,amenity_dressing_room,amenity_drinking_water,amenity_driver_training,amenity_driving_school,amenity_events_venue,amenity_fast_food,amenity_feeding_place,amenity_fire_station,amenity_fixme,amenity_food_court,amenity_food_sharing,amenity_fountain,amenity_fridge,amenity_fuel,amenity_give_box,amenity_grave_yard,amenity_grit_bin,amenity_guitar_lessons,amenity_hookah_lounge,amenity_hospital,amenity_hunting_stand,amenity_ice_cream,amenity_internet_cafe,amenity_kindergarte
n,amenity_language_school,amenity_letter_box,amenity_library,amenity_loading_dock,amenity_lounger,amenity_luggage_locker,amenity_marketplace,amenity_mist_spraying_cooler,amenity_monastery,amenity_money_transfer,amenity_motorcycle_parking,amenity_music_school,amenity_music_venue,amenity_nightclub,amenity_nursing_home,amenity_parcel_locker,amenity_parking,amenity_parking_entrance,amenity_parking_locker,amenity_parking_space,amenity_payment_centre,amenity_payment_terminal,amenity_pharmacy,amenity_photo_booth,amenity_place_of_worship,amenity_police,amenity_post_box,amenity_post_depot,amenity_post_office,amenity_printer,amenity_prison,amenity_pub,amenity_public_bath,amenity_public_bookcase,amenity_reception_desk,amenity_recycling,amenity_research_institute,amenity_restaurant,amenity_safe_deposit,amenity_school,amenity_shelter,amenity_shower,amenity_singing_lessons,amenity_smoking_area,amenity_social_centre,amenity_social_facility,amenity_stage,amenity_stripclub,amenity_studio,amenity_table,amenity_taxi,amenity_theatre,amenity_toilets,amenity_townhall,amenity_traffic_park,amenity_training,amenity_trolley_bay,amenity_university,amenity_vacuum_cleaner,amenity_vehicle_inspection,amenity_vending_machine,amenity_veterinary,amenity_waste_disposal,amenity_watering_place,amenity_weighbridge,building_allotment_house,building_apartments,building_barn,building_being_demolished,building_boathouse,building_bridge,building_bungalow,building_bunker,building_buttress,building_carport,building_castle,building_chapel,building_chimney,building_church,building_civic,building_collapsed,building_college,building_commercial,building_construction,building_container,building_convent,building_corridor,building_cover,building_data_center,building_detached,building_dormitory,building_elevator_housing,building_entrance,building_farm,building_farm_auxiliary,building_fire_station,building_fountain,building_garage,building_garages,building_gate,building_gazebo,building_government,building_grandstand,bui
lding_greenhouse,building_guard_shed,building_guardhouse,building_gymnasium,building_hangar,building_healthcare,building_hospital,building_hostel,building_hotel,building_house,building_houseboat,building_hut,building_industrial,building_kindergarten,building_kiosk,building_manufacture,building_mini_castle,building_monastery,building_office,building_outbuilding,building_palace,building_parking,building_parking_entrance,building_pavilion,building_pedestal,building_porch,building_postument,building_presbytery,building_prison,building_public,building_railway,building_ramp,building_residential,building_retail,building_riding_hall,building_roof,building_ruins,building_school,building_semi,building_semidetached_house,building_service,building_shed,building_ship,building_silo,building_skywalk,building_sports_centre,building_sports_hall,building_stable,building_stadium,building_staircase,building_stairs,building_static_caravan,building_storage_tank,building_supermarket,building_tent,building_terrace,building_toilets,building_tower,building_train_station,building_transformer_tower,building_transportation,building_university,building_wall,building_warehouse,building_waste,building_water_tower,building_wayside_shrine,building_yes,wypadki_category
region_id,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 
100_level_1,Unnamed: 101_level_1,Unnamed: 102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 
195_level_1,Unnamed: 196_level_1,Unnamed: 197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1
891e204046bffff,0,2,0,0,6,0,0,55,0,0,0,0,0,0,0,0,7,0,0,0,0,0,0,9,0,0,21,1,0,0,4,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,5,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,156,0
891e204304bffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0
891e20406c3ffff,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,2,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,15,0
891e2044647ffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0
891e205526fffff,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [222]:
# Number of rows in the unfiltered table.
all_data.shape[0]

2965

In [223]:
# Number of rows left after dropping rows whose features sum to zero.
all_data_filtered.shape[0]

2883

## Przygotowanie modelu

In [224]:
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.svm import SVC

In [225]:
# Separate the label column from the feature columns of the filtered table.
y = all_data_filtered['wypadki_category']
X = all_data_filtered.drop(columns=['wypadki_category'])
# Hold out 33% of the rows as the test set; the fixed random_state keeps
# the split reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.33,
    random_state=42,
)