In [1]:
import polars as pl
# Negative limits lift polars' truncation of printed tables, so every column
# and every row of a displayed frame is rendered. Keep previews small
# (.head()) because wide frames are printed in full.
pl.Config.set_tbl_cols(-1)
pl.Config.set_tbl_rows(-1)

import seaborn as sns
import matplotlib.pyplot as plt

import os
import sys
# Extend the module search path with the parent directory (relative to the
# kernel's working directory) — presumably where the local `exp` package
# imported below lives; confirm against the repository layout.
sys.path.append('../')

from exp.features import Features
from exp.features import FeatureSelecter
from exp.models.cat import CatBoostModel
from exp.models._lgbm import LGBMModel
from exp.models.rf import RandomForestModel
from exp.models.rgf import RGFModel
from exp.models.xgb import XGBModel

import warnings
# Blanket filter: hides every warning raised from this point on. It is
# installed after the imports above, so warnings emitted while those modules
# were being imported are still shown.
warnings.filterwarnings("ignore")

import gc
# Turns automatic garbage collection on. The interpreter starts with it
# enabled, so this only matters if something disabled it earlier.
gc.enable()

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Read the raw train and test tables from the input directory
# (paths are relative to the notebook's working directory).
train, test = (
    pl.read_csv("../input/train.csv"),
    pl.read_csv("../input/test.csv"),
)

In [3]:
# Run feature engineering over both tables.
# NOTE: `train` / `test` are rebound to the frames returned by
# create_features(), so re-running this cell on its own passes the already
# processed frames back into Features. Re-run the data-loading cell first.
features = Features(train, test)
train, test = features.create_features()

# Selector that serves the per-model feature views requested later via
# selecter.get_dataframe(<model name>).
selecter = FeatureSelecter(train, test)



In [4]:
# Preview the first 10 rows of the second object returned for the "lgbm"
# feature view (index 1). NOTE(review): presumably this is the test-side
# feature frame — confirm against FeatureSelecter.get_dataframe's return order.
selecter.get_dataframe("lgbm")[1].head(10)

year,cylinders,odometer,odometer_f,age,odometer/age,odometer/cylinders,lat,lng,lat_scaled,lng_scaled,lat_lng_cluster,manufacturer_rank,condition_rank,fuel_rank,title_status_rank,transmission_rank,drive_rank,size_rank,type_rank,paint_color_rank,state_rank,manufacturer_count,condition_count,fuel_count,title_status_count,transmission_count,drive_count,size_count,type_count,paint_color_count,state_count,type_base_price,type_base_year,type_base_odometer_f,manufacturer_base_price,manufacturer_base_year,manufacturer_base_odometer_f,type_manufacturer_base_price,type_manufacturer_base_year,type_manufacturer_base_odometer,type_manufacturer_year_diff,type_manufacturer_odometer_diff,type_manufacturer_odometer/age_base,type_manufacturer_odometer/age_diff,manufacturer_price_mean,fuel_price_mean,title_status_price_mean,transmission_price_mean,drive_price_mean,type_price_mean,paint_color_price_mean,state_price_mean,lat_lng_cluster_price_mean,title_status_type_manufacturer_price_ratio_mean,state_type_manufacturer_price_ratio_mean,region_type_manufacturer_price_ratio_mean,paint_color_type_manufacturer_price_ratio_mean,lat_lng_cluster_type_manufacturer_price_ratio_mean,condition_l,size_l,manufacturer_age_mean,manufacturer_age_std,manufacturer_age_max,manufacturer_age_min,manufacturer_age_diff,manufacturer_odometer_mean,manufacturer_odometer_std,manufacturer_odometer_max,manufacturer_odometer_min,manufacturer_odometer_diff,condition_age_mean,condition_age_std,condition_age_max,condition_age_min,condition_age_diff,condition_odometer_mean,condition_odometer_std,condition_odometer_max,condition_odometer_min,condition_odometer_diff,cylinders_age_mean,cylinders_age_std,cylinders_age_max,cylinders_age_min,cylinders_age_diff,cylinders_odometer_mean,cylinders_odometer_std,cylinders_odometer_max,cylinders_odometer_min,cylinders_odometer_diff,fuel_age_mean,fuel_age_std,fuel_age_max,fuel_age_min,fuel_age_diff,fuel_odometer_mean,fuel_odometer_std,fuel_odometer_max,fuel_odometer_min,fuel_odometer_d
iff,drive_age_mean,drive_age_std,drive_age_max,drive_age_min,drive_age_diff,drive_odometer_mean,drive_odometer_std,drive_odometer_max,drive_odometer_min,drive_odometer_diff,type_age_mean,type_age_std,type_age_max,type_age_min,type_age_diff,type_odometer_mean,type_odometer_std,type_odometer_max,type_odometer_min,type_odometer_diff,car_string_vec_norm2,car_string_vec_mean,car_string_vec_0,car_string_vec_1,car_string_vec_2,car_string_vec_3,car_string_vec_4,car_string_vec_5,car_string_vec_6,car_string_vec_7,car_string_vec_8,car_string_vec_9,car_string_vec_10,car_string_vec_11,car_string_vec_12,car_string_vec_13,car_string_vec_14,car_string_vec_15,car_string_vec_16,car_string_vec_17,car_string_vec_18,car_string_vec_19,car_string_vec_20,car_string_vec_21,car_string_vec_22,car_string_vec_23,car_string_vec_24,car_string_vec_25,car_string_vec_26,car_string_vec_27,car_string_vec_28,car_string_vec_29,car_string_vec_30,car_string_vec_31,car_string_vec_32,car_string_vec_33,car_string_vec_34,car_string_vec_35,car_string_vec_36,car_string_vec_37,car_string_vec_38,car_string_vec_39,car_string_vec_40,car_string_vec_41,car_string_vec_42,car_string_vec_43,car_string_vec_44,car_string_vec_45,car_string_vec_46,car_string_vec_47,car_string_vec_48,car_string_vec_49,manufacturer_acura,manufacturer_alfa_romeo,manufacturer_aston_martin,manufacturer_audi,manufacturer_buick,manufacturer_cadillac,manufacturer_chevrolet,manufacturer_chrysler,manufacturer_dodge,manufacturer_fiat,manufacturer_ford,manufacturer_gmc,manufacturer_honda,manufacturer_hyundai,manufacturer_infiniti,manufacturer_jaguar,manufacturer_jeep,manufacturer_kia,manufacturer_land_rover,manufacturer_lexus,manufacturer_lincoln,manufacturer_mazda,manufacturer_mercedes_benz,manufacturer_mercury,manufacturer_mini,manufacturer_mitsubishi,manufacturer_nissan,manufacturer_pontiac,manufacturer_porsche,manufacturer_ram,manufacturer_rover,manufacturer_saturn,manufacturer_subaru,manufacturer_toyota,manufacturer_volkswagen,manufacturer_volvo,f
uel_diesel,fuel_electric,fuel_hybrid,fuel_other,title_status_lien,title_status_missing,title_status_parts only,title_status_rebuilt,title_status_salvage,transmission_automatic,transmission_other,drive_4wd,drive_fwd,type_SUV,type_bus,type_coupe,type_hatchback,type_mini-van,type_nan,type_offroad,type_other,type_pickup,type_sedan,type_truck,type_van,type_wagon,paint_color_black,paint_color_blue,paint_color_brown,paint_color_custom,paint_color_green,paint_color_grey,paint_color_purple,paint_color_red,paint_color_silver,paint_color_white,paint_color_yellow,state_ak,state_al,state_ar,state_az,state_ca,state_co,state_ct,state_dc,state_de,state_fl,state_ga,state_hi,state_ia,state_id,state_il,state_in,state_ks,state_ky,state_la,state_ma,state_md,state_me,state_mi,state_mn,state_mo,state_ms,state_mt,state_nc,state_nd,state_ne,state_nh,state_nj,state_nm,state_null,state_nv,state_ny,state_oh,state_ok,state_or,state_pa,state_ri,state_sc,state_sd,state_tx,state_ut,state_va,state_vt,state_wa,state_wi,state_wv,state_wy
i64,i8,f64,f64,i64,f64,f64,f64,f64,f64,f64,i8,f32,f32,f32,f32,f32,f32,f32,f32,f32,f32,u32,u32,u32,u32,u32,u32,u32,u32,u32,u32,f32,f32,f32,f32,f32,f32,f32,f32,f32,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,i64,i64,f64,f64,i64,i64,f64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64,f64,f64,f64,f64,f64,f64,f64,i64,i64,i64,f64,f64,f64,f64,f64,f64,f64,i64,i64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,f64,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8,u8
2015,4,92553.0,92553.0,8,11569.125,23138.25,39.0,-108.0,0.105995,-0.852625,13,36.0,6.0,5.0,6.0,3.0,3.0,4.0,13.0,7.0,43.0,3807,15219,24785,22821,20497,14602,14636,7311,1419,804,13821.114258,2009.394653,122670.5,14994.541016,2006.456299,106025.976562,14407.828125,2007.925537,114348.234375,7.074463,-21795.234375,7585.559446,3983.565554,14994.540583,12270.566996,13298.318128,13944.440064,9810.263663,13821.113801,11811.757576,12165.701493,12736.677094,0.954906,0.896019,0.887426,0.846305,0.927814,3,3,16.543735,12.018252,93,1,-1.273699,105960.952204,56874.563704,371297.0,120.0,11159.228185,13.90479,9.017663,102,1,101,111303.293102,55306.095717,396512.0,22.0,396490.0,12.261245,7.081156,95,1,94,117244.387609,58720.507136,396512.0,73.0,396439.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,13.605389,7.198899,77,1,1.664648,122776.648907,59081.487533,392519.0,110.0,-5656.468518,0.63937,-0.026509,-0.053422,-0.262332,0.0561,-0.029649,-0.110279,-0.210174,0.005696,0.033133,0.026766,-0.090514,-0.150434,-0.04756,-0.104572,0.052855,0.086445,0.087509,0.005271,-0.043431,0.030947,-0.024945,-0.094175,0.118563,-0.078773,-0.003865,0.036288,-0.090038,-0.085885,-0.081438,-0.031565,0.102988,0.054625,-0.002251,-0.036128,-0.090586,0.022774,-0.112328,0.037149,0.006995,-0.007258,-0.045719,-0.153026,-0.079475,-0.07224,0.196354,-0.15015,0.033945,0.112669,0.01728,-0.060876,-0.046733,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2013,4,134385.0,134385.0,10,13438.5,33596.25,43.216505,-123.341738,0.914012,-1.723605,7,30.0,4.0,5.0,4.0,3.0,3.0,3.0,14.0,12.0,37.0,1003,3810,24785,985,20497,14602,9411,9259,10143,645,9939.633789,2009.920288,115423.164062,10004.209961,2010.975098,122180.71875,9971.921875,2010.447754,118801.9375,2.552246,15583.0625,9464.595947,3973.904053,10004.210369,12270.566996,12351.056853,13944.440064,9810.263663,9939.633654,14798.718624,13653.979845,14139.177122,1.006917,0.955869,0.867631,1.070961,0.973221,4,2,12.024925,6.30752,95,1,3.245111,122262.582915,58456.216704,396512.0,491.0,-5142.402526,12.281627,9.051714,95,1,94,96607.548515,57656.409651,353896.0,73.0,353823.0,12.261245,7.081156,95,1,94,117244.387609,58720.507136,396512.0,73.0,396439.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,13.079706,7.103995,101,1,2.19033,115453.008422,55905.119734,396512.0,22.0,1667.171966,0.677599,-0.022331,-0.083137,-0.279436,0.053701,0.010422,-0.0903,-0.198562,0.047606,0.029799,0.064738,-0.059055,-0.109906,-0.055759,-0.151525,0.069319,0.127604,0.11272,-0.020854,-0.043077,0.016347,-0.028263,-0.032115,0.102439,-0.031133,0.039679,0.070629,-0.118567,-0.079499,-0.134956,-0.040677,0.113335,0.104623,0.072519,-0.072929,-0.078792,-0.02288,-0.08757,0.03396,-0.019675,-0.044283,-0.101145,-0.148642,-0.101709,-0.077746,0.176039,-0.160826,0.062919,0.109124,0.009816,-0.065628,-0.005227,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0
2011,4,102489.0,102489.0,12,8540.75,25622.25,41.083064,-81.518485,0.505177,0.65078,0,29.0,5.0,5.0,6.0,3.0,3.0,4.0,14.0,12.0,46.0,773,6009,24785,22821,20497,14602,14636,9259,10143,961,9939.633789,2009.920288,115423.164062,8000.623535,2010.654541,109916.398438,8970.128906,2010.287354,112669.78125,0.712646,-10180.78125,8862.810854,-322.060854,8000.623545,12270.566996,13298.318128,13944.440064,9810.263663,9939.633654,14798.718624,11751.83871,12681.925935,0.954906,0.872312,0.884552,1.070961,0.939412,2,3,12.345408,7.297595,66,2,2.924629,109897.374021,50800.374703,321350.0,1127.5,7222.806368,17.675487,10.603284,88,2,86,128569.68959,59559.074223,392834.0,34.0,392800.0,12.261245,7.081156,95,1,94,117244.387609,58720.507136,396512.0,73.0,396439.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,13.079706,7.103995,101,1,2.19033,115453.008422,55905.119734,396512.0,22.0,1667.171966,0.664905,-0.024488,-0.062365,-0.282244,0.042361,-0.029665,-0.097922,-0.211495,-0.002908,0.055334,0.067252,-0.069639,-0.150651,-0.029769,-0.122243,0.093562,0.096566,0.115777,0.003042,-0.042378,-0.006231,-0.004543,-0.063007,0.127325,-0.059739,-0.015672,0.013656,-0.100544,-0.094796,-0.141384,-0.02351,0.123812,0.064053,0.030814,-0.04001,-0.059275,0.017856,-0.08817,0.021825,-0.008503,-0.044351,-0.07663,-0.133873,-0.099616,-0.061989,0.180667,-0.151084,0.050914,0.13009,0.004706,-0.063826,-0.02599,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2016,6,64310.0,64310.0,7,9187.142857,10718.333333,39.739236,-104.984862,0.247657,-0.68145,13,31.0,6.0,4.0,6.0,3.0,2.0,3.0,13.0,7.0,43.0,1297,15219,2639,22821,20497,8096,9411,7311,1419,804,13821.114258,2009.394653,122670.5,15062.223633,2008.171143,124062.085938,14441.668945,2008.782959,123366.296875,7.217041,-59056.296875,8677.35394,509.788917,15062.223593,24804.856006,13298.318128,13944.440064,18647.268281,13821.113801,11811.757576,12165.701493,12736.677094,0.954906,0.896019,0.927786,0.846305,0.927814,3,2,14.828836,8.094923,81,2,0.441201,124203.237129,55275.381309,377569.0,1437.0,-7083.056741,13.90479,9.017663,102,1,101,111303.293102,55306.095717,396512.0,22.0,396490.0,15.482006,9.184283,102,2,100,117330.21341,58572.410377,392834.0,22.0,392812.0,15.82607,11.559536,102,2,100,110227.572028,62742.850081,392834.0,309.0,392525.0,14.457633,8.521437,92,1,91,120662.229529,60970.779193,396512.0,110.0,396402.0,13.605389,7.198899,77,1,1.664648,122776.648907,59081.487533,392519.0,110.0,-5656.468518,0.660938,-0.027703,-0.081553,-0.253706,0.040567,-0.034021,-0.077717,-0.233488,0.025457,0.006892,0.029538,-0.069713,-0.132072,-0.104035,-0.142151,-0.00445,0.117654,0.164131,-0.092695,-0.063095,-0.000651,-0.072191,-0.056555,0.04599,-0.046051,0.048872,0.070512,-0.103178,-0.107772,-0.056452,0.000803,0.05136,0.095086,-0.002238,-0.053151,-0.052522,0.087363,-0.083762,0.041063,-0.006759,-0.017938,-0.061358,-0.161382,-0.05752,-0.0793,0.201297,-0.136362,0.021916,0.105807,-0.012149,-0.063348,-0.020103,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
1999,8,180839.0,180839.0,24,7534.958333,22604.875,37.959055,-93.333475,-0.093483,-0.019979,4,33.0,6.0,5.0,5.0,3.0,2.0,3.0,13.0,11.0,41.0,1742,15219,24785,3004,20497,8096,9411,7311,4300,725,13821.114258,2009.394653,122670.5,8994.714844,2010.687744,122266.398438,11407.914062,2010.04126,122468.453125,-11.04126,58370.546875,9450.644963,-1915.68663,8994.71527,12270.566996,14823.253329,13944.440064,18647.268281,13821.113801,11324.39814,13136.195862,12457.56645,1.16087,0.958956,0.937104,0.872173,0.916414,3,2,12.312285,6.248543,61,2,2.957752,122391.687391,55903.320967,346965.0,2267.0,-5271.507002,13.90479,9.017663,102,1,101,111303.293102,55306.095717,396512.0,22.0,396490.0,20.173389,13.610512,98,2,96,115145.227637,60781.634084,379120.0,34.0,379086.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,14.457633,8.521437,92,1,91,120662.229529,60970.779193,396512.0,110.0,396402.0,13.605389,7.198899,77,1,1.664648,122776.648907,59081.487533,392519.0,110.0,-5656.468518,0.682447,-0.022547,-0.122347,-0.278095,0.068906,-0.010241,-0.080442,-0.222705,0.04545,0.010597,0.020686,-0.063984,-0.13373,-0.069831,-0.161975,0.041723,0.138926,0.144582,-0.058634,-0.071746,0.00794,-0.044157,0.004453,0.084837,0.004698,0.049974,0.097726,-0.122273,-0.092663,-0.080046,-0.043877,0.098696,0.096014,-0.01672,-0.100007,-0.035444,0.052995,-0.058996,0.044786,-0.053956,-0.021061,-0.084484,-0.138997,-0.040157,-0.086888,0.192366,-0.126913,0.055484,0.112913,-0.013658,-0.078085,0.011008,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2006,8,75166.0,75166.0,17,4421.529412,9395.75,44.050505,-123.095051,1.073833,-1.7096,7,36.0,4.0,5.0,5.0,3.0,1.0,3.0,12.0,8.0,37.0,3807,3810,24785,3004,20497,4834,9411,3837,2385,645,20267.474609,2005.376099,116080.78125,14994.541016,2006.456299,106025.976562,17631.007812,2005.91626,111053.375,0.08374,-35887.375,6500.530532,-2079.001121,14994.540583,12270.566996,14823.253329,13944.440064,15846.747621,20267.473808,8627.553878,13653.979845,14139.177122,1.16087,0.955869,0.900964,0.627944,0.973221,4,2,16.543735,12.018252,93,1,-1.273699,105960.952204,56874.563704,371297.0,120.0,11159.228185,12.281627,9.051714,95,1,94,96607.548515,57656.409651,353896.0,73.0,353823.0,20.173389,13.610512,98,2,96,115145.227637,60781.634084,379120.0,34.0,379086.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,21.912702,15.21553,102,2,100,97688.928301,55907.032427,360763.0,34.0,360729.0,17.623925,12.08443,102,1,-2.353888,116121.61433,62563.550082,392834.0,126.0,998.566059,0.671731,-0.02755,-0.075606,-0.304401,0.038772,-0.001267,-0.068213,-0.233489,0.04001,-0.019613,0.004698,-0.053456,-0.112367,-0.069243,-0.142635,0.071647,0.122803,0.087755,-0.044548,-0.101107,0.046298,-0.069821,0.012159,0.06477,-0.081939,0.049634,0.061841,-0.106917,-0.047391,-0.116487,0.015809,0.097174,0.055138,0.006447,-0.126798,-0.093245,0.015133,-0.092778,0.017072,0.010209,0.011758,-0.059714,-0.164421,-0.067923,-0.069006,0.177932,-0.15215,0.04931,0.107709,-0.018346,-0.040958,-0.00776,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0
2005,6,178611.0,178611.0,18,9922.833333,29768.5,40.712728,-74.006015,0.434209,1.077278,0,14.0,5.0,5.0,5.0,2.0,3.0,2.0,13.0,2.0,51.0,155,6009,24785,3004,6156,14602,3352,7311,30,2112,13821.114258,2009.394653,122670.5,5715.122559,2003.264526,152665.4375,9768.118164,2006.32959,137667.96875,-1.32959,40943.03125,8258.223251,1664.610083,5715.122581,12270.566996,14823.253329,12058.838856,9810.263663,13821.113801,14246.4,14700.314867,12681.925935,1.16087,1.059864,1.055377,1.085927,0.939412,2,1,19.735484,9.369803,62,3,-4.465447,152929.506494,57798.384142,340441.0,23314.0,-35809.326105,17.675487,10.603284,88,2,86,128569.68959,59559.074223,392834.0,34.0,392800.0,15.482006,9.184283,102,2,100,117330.21341,58572.410377,392834.0,22.0,392812.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,13.605389,7.198899,77,1,1.664648,122776.648907,59081.487533,392519.0,110.0,-5656.468518,0.582649,-0.019648,-0.037035,-0.250306,0.063658,-0.000492,-0.073161,-0.246116,-0.0168,0.116994,-0.028184,-0.035515,-0.058673,-0.043104,-0.091075,0.018227,0.019913,0.086536,0.033536,-0.073999,-0.035633,0.00253,-0.091591,0.097559,-0.040203,0.001327,0.057112,-0.062739,-0.077711,-0.0584,-0.012805,0.038889,0.075849,-0.024948,-0.079141,-0.066267,0.013438,-0.080706,0.088624,-0.019095,0.01068,-0.06338,-0.07012,-0.008432,-0.080453,0.201453,-0.113345,0.042786,0.096619,0.025592,-0.059602,-0.074669,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2002,6,216708.0,216708.0,21,10319.428571,36118.0,40.75962,-111.886797,0.443194,-1.073286,13,32.0,5.0,4.0,4.0,2.0,2.0,4.0,12.0,8.0,12.5,1639,6009,2639,985,6156,8096,14636,3837,2385,125,20267.474609,2005.376099,116080.78125,24430.691406,2007.360596,112458.054688,22349.082031,2006.368408,114269.421875,-4.368408,102438.578125,6870.624488,3448.804083,24430.690665,24804.856006,12351.056853,12058.838856,18647.268281,20267.473808,8627.553878,15833.92,12736.677094,1.006917,1.0433,1.150211,0.627944,0.927814,2,3,15.639414,10.528347,102,2,-0.369378,112463.158717,61946.234842,377872.0,438.0,4657.021672,17.675487,10.603284,88,2,86,128569.68959,59559.074223,392834.0,34.0,392800.0,15.482006,9.184283,102,2,100,117330.21341,58572.410377,392834.0,22.0,392812.0,15.82607,11.559536,102,2,100,110227.572028,62742.850081,392834.0,309.0,392525.0,14.457633,8.521437,92,1,91,120662.229529,60970.779193,396512.0,110.0,396402.0,17.623925,12.08443,102,1,-2.353888,116121.61433,62563.550082,392834.0,126.0,998.566059,0.637867,-0.02234,-0.043051,-0.240041,0.051827,-0.053985,-0.083545,-0.293033,-0.004294,0.034733,-0.013232,-0.060332,-0.13296,-0.11292,-0.094892,0.105913,0.011782,0.158664,-0.082195,-0.112025,0.00898,-0.081507,-0.033544,0.025444,-0.038093,0.033407,0.103027,-0.026143,-0.045641,-0.071073,0.07702,0.017348,0.02941,-0.053922,-0.061592,-0.005049,0.113875,-0.059518,0.025278,0.048438,-0.02133,-0.077421,-0.102783,-0.035447,-0.079699,0.179091,-0.120872,0.045258,0.096234,0.016149,-0.004631,-0.054128,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0
2013,4,185626.0,185626.0,10,18562.6,46406.5,30.36742,-89.092816,-1.548282,0.220771,8,9.0,3.0,5.0,3.0,2.0,3.0,2.0,11.0,10.0,2.0,43,2404,24785,465,6156,14602,3352,2255,3765,21,11654.478516,2000.894043,100402.414062,8673.953125,2011.767456,113910.921875,10164.21582,2006.330811,107156.671875,6.669189,78469.328125,6428.42726,12134.17274,8673.953488,12270.566996,17082.87957,12058.838856,9810.263663,11654.478936,13542.542629,12071.714286,12571.168205,1.229948,0.873254,0.518067,1.034805,0.961623,0,1,11.232558,5.635082,34,1,4.037479,113956.452381,47282.575923,264479.0,33815.0,3163.728008,23.037022,11.773379,93,4,89,154892.925693,61282.60534,392519.0,2013.0,390506.0,12.261245,7.081156,95,1,94,117244.387609,58720.507136,396512.0,73.0,396439.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,22.105987,15.358907,101,2,-6.83595,100272.413453,53956.470129,360763.0,59.0,16847.766936,0.652955,-0.019767,-0.012213,-0.2632,0.048975,0.000535,-0.10106,-0.188952,-0.040387,0.136089,0.065207,-0.071903,-0.059024,-0.054604,-0.130763,0.145607,0.035699,0.088812,0.043316,-0.090174,0.032368,0.005044,-0.040884,0.173315,-0.050171,-0.04549,0.063149,-0.097107,-0.076247,-0.094886,-0.029348,0.029011,0.10435,0.019265,-0.105912,-0.086815,0.028779,-0.030378,0.033471,-0.007678,-0.077416,-0.110236,-0.087173,-0.124586,-0.074917,0.177213,-0.122972,0.053417,0.087917,0.036175,-0.027845,-0.093706,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0
2015,6,230620.0,230620.0,8,28827.5,38436.666667,45.561608,-94.1642,1.363408,-0.067141,3,33.0,6.0,5.0,6.0,3.0,3.0,4.0,14.0,5.0,36.0,1742,15219,24785,22821,20497,14602,14636,9259,365,602,9939.633789,2009.920288,115423.164062,8994.714844,2010.687744,122266.398438,9467.173828,2010.303955,118844.78125,4.696045,111775.21875,9360.771955,19466.728045,8994.71527,12270.566996,13298.318128,13944.440064,9810.263663,9939.633654,10138.452055,15748.237542,14927.707038,0.954906,1.100115,1.000198,0.729809,1.044707,3,3,12.312285,6.248543,61,2,2.957752,122391.687391,55903.320967,346965.0,2267.0,-5271.507002,13.90479,9.017663,102,1,101,111303.293102,55306.095717,396512.0,22.0,396490.0,15.482006,9.184283,102,2,100,117330.21341,58572.410377,392834.0,22.0,392812.0,15.265281,9.940321,101,1,100,117500.260147,58684.114027,396512.0,22.0,396490.0,13.601151,7.653625,101,1,100,120973.966183,57934.27407,392519.0,22.0,392497.0,13.079706,7.103995,101,1,2.19033,115453.008422,55905.119734,396512.0,22.0,1667.171966,0.647433,-0.026189,-0.091452,-0.264556,0.047532,-0.034677,-0.138056,-0.228196,0.001683,0.06453,0.023997,-0.081182,-0.11199,-0.031808,-0.113443,0.078229,0.073237,0.111402,-0.012003,-0.024828,0.000149,0.000635,-0.056153,0.127549,-0.090539,0.016204,0.066525,-0.088857,-0.075312,-0.092981,-0.038009,0.078232,0.085667,-0.001545,-0.050781,-0.060351,0.025844,-0.07929,0.018093,-0.010271,-0.036637,-0.101229,-0.141224,-0.121236,-0.073023,0.182814,-0.124433,0.061327,0.101733,0.007109,-0.066697,-0.041201,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0


In [5]:
# Single-column "price" frame spanning train + test rows: the known training
# prices first, followed by one null per test row (presumably filled in with
# model predictions later — confirm against downstream cells).
# The placeholder takes its dtype from train["price"] instead of hard-coding
# Int64, so the vertical concat keeps working whatever numeric type read_csv
# inferred for the column.
predictions = pl.concat(
    [
        train["price"].to_frame(),
        pl.Series(
            "price", [None] * test.height, dtype=train["price"].dtype
        ).to_frame(),
    ]
)

In [7]:
# Hyperparameter search for the LightGBM wrapper on the "lgbm" feature view.
LGBM_SEED = 0    # seed handed to the model wrapper
N_TRIALS = 100   # number of tuning trials objective() is asked to run

lgbm = LGBMModel(
    *selecter.get_dataframe("lgbm"),
    seed=LGBM_SEED,
)
lgbm.objective(N_TRIALS)

[I 2023-08-18 06:00:33,558] A new study created in memory with name: no-name-3c8908db-a36a-4491-9224-738b2b1ff4dd
  0%|          | 0/100 [00:00<?, ?it/s]

Best trial: 0. Best value: 0.64751:   1%|          | 1/100 [00:02<04:40,  2.83s/it]

[I 2023-08-18 06:00:36,386] Trial 0 finished with value: 0.6475100620616894 and parameters: {'num_leaves': 36, 'max_depth': 18, 'min_child_samples': 78, 'subsample': 0.5903948646972071, 'colsample_bytree': 0.4812893194050143, 'reg_alpha': 0.0014694435419424668, 'reg_lambda': 3.167361913032263e-05, 'feature_fraction': 0.9350638004692479, 'bagging_fraction': 0.9781976563006176, 'bagging_freq': 5}. Best is trial 0 with value: 0.6475100620616894.


Best trial: 1. Best value: 0.64653:   2%|▏         | 2/100 [00:05<04:00,  2.46s/it]

[I 2023-08-18 06:00:38,580] Trial 1 finished with value: 0.6465300007336806 and parameters: {'num_leaves': 35, 'max_depth': 15, 'min_child_samples': 119, 'subsample': 0.16393245237809825, 'colsample_bytree': 0.17841636973138664, 'reg_alpha': 1.4512665303724043e-08, 'reg_lambda': 0.04580983888874032, 'feature_fraction': 0.8668940505699103, 'bagging_fraction': 0.9220072889480915, 'bagging_freq': 1}. Best is trial 1 with value: 0.6465300007336806.


Best trial: 1. Best value: 0.64653:   3%|▎         | 3/100 [00:06<03:13,  1.99s/it]

[I 2023-08-18 06:00:40,016] Trial 2 finished with value: 0.6507271906201563 and parameters: {'num_leaves': 31, 'max_depth': 19, 'min_child_samples': 16, 'subsample': 0.6759289191947714, 'colsample_bytree': 0.22901795866814179, 'reg_alpha': 0.36087046265775286, 'reg_lambda': 0.00014955005393691516, 'feature_fraction': 0.6487971639943142, 'bagging_fraction': 0.5587333672627762, 'bagging_freq': 1}. Best is trial 1 with value: 0.6465300007336806.


Best trial: 3. Best value: 0.646213:   4%|▍         | 4/100 [00:07<02:44,  1.72s/it]

[I 2023-08-18 06:00:41,316] Trial 3 finished with value: 0.6462133444223787 and parameters: {'num_leaves': 37, 'max_depth': 2, 'min_child_samples': 80, 'subsample': 0.6508861504501793, 'colsample_bytree': 0.6552405971872812, 'reg_alpha': 0.35480083081155517, 'reg_lambda': 0.0028481469492314926, 'feature_fraction': 0.6157047403442716, 'bagging_fraction': 0.6622191722796049, 'bagging_freq': 1}. Best is trial 3 with value: 0.6462133444223787.


Best trial: 3. Best value: 0.646213:   5%|▌         | 5/100 [00:09<02:56,  1.86s/it]

[I 2023-08-18 06:00:43,436] Trial 4 finished with value: 0.6500255413264022 and parameters: {'num_leaves': 44, 'max_depth': 17, 'min_child_samples': 27, 'subsample': 0.21603366788936798, 'colsample_bytree': 0.38388551583176544, 'reg_alpha': 8.122433559209657e-06, 'reg_lambda': 0.0003643964717966421, 'feature_fraction': 0.6631609080773921, 'bagging_fraction': 0.9930243028355357, 'bagging_freq': 5}. Best is trial 3 with value: 0.6462133444223787.


Best trial: 5. Best value: 0.645852:   6%|▌         | 6/100 [00:11<02:40,  1.71s/it]

[I 2023-08-18 06:00:44,852] Trial 5 finished with value: 0.6458515748728587 and parameters: {'num_leaves': 12, 'max_depth': 17, 'min_child_samples': 33, 'subsample': 0.5196796955706757, 'colsample_bytree': 0.31998303280144247, 'reg_alpha': 1.8696343095249954e-07, 'reg_lambda': 7.638377698149978e-08, 'feature_fraction': 0.793797753679164, 'bagging_fraction': 0.4829097708091683, 'bagging_freq': 5}. Best is trial 5 with value: 0.6458515748728587.


Best trial: 6. Best value: 0.644106:   7%|▋         | 7/100 [00:12<02:30,  1.61s/it]

[I 2023-08-18 06:00:46,267] Trial 6 finished with value: 0.6441055496028988 and parameters: {'num_leaves': 53, 'max_depth': 4, 'min_child_samples': 108, 'subsample': 0.18648856710456677, 'colsample_bytree': 0.9788135185120562, 'reg_alpha': 5.613188324247261e-05, 'reg_lambda': 0.6517615040663892, 'feature_fraction': 0.7629073118470275, 'bagging_fraction': 0.8435581476389811, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:   8%|▊         | 8/100 [00:14<02:21,  1.54s/it]

[I 2023-08-18 06:00:47,648] Trial 7 finished with value: 0.6459254152869218 and parameters: {'num_leaves': 9, 'max_depth': 8, 'min_child_samples': 16, 'subsample': 0.3861848614545784, 'colsample_bytree': 0.472836695063203, 'reg_alpha': 3.259717550795507e-08, 'reg_lambda': 0.003465588189977713, 'feature_fraction': 0.739960872523945, 'bagging_fraction': 0.5592336945636672, 'bagging_freq': 1}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:   9%|▉         | 9/100 [00:15<02:24,  1.58s/it]

[I 2023-08-18 06:00:49,326] Trial 8 finished with value: 0.6492209968837489 and parameters: {'num_leaves': 38, 'max_depth': 23, 'min_child_samples': 41, 'subsample': 0.7006693419673136, 'colsample_bytree': 0.21861807616395296, 'reg_alpha': 0.005377960807748353, 'reg_lambda': 2.0665634478498945e-06, 'feature_fraction': 0.5099148172042701, 'bagging_fraction': 0.7519077608860498, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  10%|█         | 10/100 [00:17<02:17,  1.53s/it]

[I 2023-08-18 06:00:50,725] Trial 9 finished with value: 0.6550446927768635 and parameters: {'num_leaves': 2, 'max_depth': 17, 'min_child_samples': 35, 'subsample': 0.7616746199103354, 'colsample_bytree': 0.9659696906056944, 'reg_alpha': 9.77293810275356e-07, 'reg_lambda': 0.0004066854878593079, 'feature_fraction': 0.7552251587631034, 'bagging_fraction': 0.743351143474524, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  11%|█         | 11/100 [00:19<02:33,  1.73s/it]

[I 2023-08-18 06:00:52,905] Trial 10 finished with value: 0.6507505085087458 and parameters: {'num_leaves': 62, 'max_depth': 9, 'min_child_samples': 122, 'subsample': 0.9366763195250474, 'colsample_bytree': 0.9717347835605356, 'reg_alpha': 5.593843834941959e-05, 'reg_lambda': 0.09643804891502325, 'feature_fraction': 0.9736355868102851, 'bagging_fraction': 0.8551925594141547, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  12%|█▏        | 12/100 [00:20<02:08,  1.46s/it]

[I 2023-08-18 06:00:53,763] Trial 11 finished with value: 0.6484452218010871 and parameters: {'num_leaves': 18, 'max_depth': 2, 'min_child_samples': 95, 'subsample': 0.3507775064219657, 'colsample_bytree': 0.7340365887670226, 'reg_alpha': 9.460977194705953e-07, 'reg_lambda': 9.857740475606069e-08, 'feature_fraction': 0.8378544805830852, 'bagging_fraction': 0.4365776267460467, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  13%|█▎        | 13/100 [00:21<02:15,  1.55s/it]

[I 2023-08-18 06:00:55,522] Trial 12 finished with value: 0.652705767731717 and parameters: {'num_leaves': 58, 'max_depth': 11, 'min_child_samples': 54, 'subsample': 0.10106087519011635, 'colsample_bytree': 0.8181816636142784, 'reg_alpha': 4.611301859818868e-07, 'reg_lambda': 0.7123036879153268, 'feature_fraction': 0.7985685929330968, 'bagging_fraction': 0.4237149014756329, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  14%|█▍        | 14/100 [00:23<02:19,  1.62s/it]

[I 2023-08-18 06:00:57,292] Trial 13 finished with value: 0.6489084593177968 and parameters: {'num_leaves': 22, 'max_depth': 7, 'min_child_samples': 3, 'subsample': 0.4487720442744564, 'colsample_bytree': 0.6332088050085889, 'reg_alpha': 2.259021673762932e-05, 'reg_lambda': 5.444076147966956e-08, 'feature_fraction': 0.8806231667495892, 'bagging_fraction': 0.8331420066092983, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  15%|█▌        | 15/100 [00:25<02:32,  1.79s/it]

[I 2023-08-18 06:00:59,481] Trial 14 finished with value: 0.6509276226295124 and parameters: {'num_leaves': 49, 'max_depth': 13, 'min_child_samples': 103, 'subsample': 0.284085486552939, 'colsample_bytree': 0.35121962006540414, 'reg_alpha': 0.0006284216778870082, 'reg_lambda': 1.1161964357990123e-08, 'feature_fraction': 0.749069849875959, 'bagging_fraction': 0.6292843543185052, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 6. Best value: 0.644106:  16%|█▌        | 16/100 [00:28<02:43,  1.95s/it]

[I 2023-08-18 06:01:01,787] Trial 15 finished with value: 0.649487511667584 and parameters: {'num_leaves': 52, 'max_depth': 22, 'min_child_samples': 60, 'subsample': 0.4847257157296235, 'colsample_bytree': 0.11060218229755633, 'reg_alpha': 8.463681058370916e-08, 'reg_lambda': 7.314163614018206e-06, 'feature_fraction': 0.8108826453936372, 'bagging_fraction': 0.8179122593954121, 'bagging_freq': 5}. Best is trial 6 with value: 0.6441055496028988.


Best trial: 16. Best value: 0.644073:  17%|█▋        | 17/100 [00:29<02:21,  1.71s/it]

[I 2023-08-18 06:01:02,945] Trial 16 finished with value: 0.6440732739425292 and parameters: {'num_leaves': 24, 'max_depth': 5, 'min_child_samples': 48, 'subsample': 0.28127280012832134, 'colsample_bytree': 0.835728117656237, 'reg_alpha': 5.495900368769805e-06, 'reg_lambda': 1.1670377056574256e-06, 'feature_fraction': 0.4060195645059174, 'bagging_fraction': 0.7375185032398109, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  18%|█▊        | 18/100 [00:30<02:03,  1.51s/it]

[I 2023-08-18 06:01:03,999] Trial 17 finished with value: 0.645033776307842 and parameters: {'num_leaves': 25, 'max_depth': 5, 'min_child_samples': 76, 'subsample': 0.2528920290119911, 'colsample_bytree': 0.8638752787005917, 'reg_alpha': 5.1470321855453615e-06, 'reg_lambda': 2.0738703859889235e-06, 'feature_fraction': 0.401866639435603, 'bagging_fraction': 0.7305146914692642, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  19%|█▉        | 19/100 [00:31<01:54,  1.41s/it]

[I 2023-08-18 06:01:05,177] Trial 18 finished with value: 0.6447634744544753 and parameters: {'num_leaves': 28, 'max_depth': 4, 'min_child_samples': 98, 'subsample': 0.31358126029980954, 'colsample_bytree': 0.8643091698659897, 'reg_alpha': 0.00013379769846551414, 'reg_lambda': 1.3205575341955847e-05, 'feature_fraction': 0.5657020607745311, 'bagging_fraction': 0.79300929846598, 'bagging_freq': 1}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  20%|██        | 20/100 [00:32<01:50,  1.38s/it]

[I 2023-08-18 06:01:06,480] Trial 19 finished with value: 0.6441002313577718 and parameters: {'num_leaves': 43, 'max_depth': 5, 'min_child_samples': 48, 'subsample': 0.10220956197782005, 'colsample_bytree': 0.9675257224129697, 'reg_alpha': 2.5154381046293703e-06, 'reg_lambda': 0.00434258510115324, 'feature_fraction': 0.4230201570220323, 'bagging_fraction': 0.879534713331549, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  21%|██        | 21/100 [00:34<01:52,  1.42s/it]

[I 2023-08-18 06:01:08,007] Trial 20 finished with value: 0.6483315320656907 and parameters: {'num_leaves': 46, 'max_depth': 11, 'min_child_samples': 52, 'subsample': 0.10481984095068603, 'colsample_bytree': 0.7533043154993494, 'reg_alpha': 2.8054511832667922e-06, 'reg_lambda': 6.680339109117003e-07, 'feature_fraction': 0.4051113158305669, 'bagging_fraction': 0.8937974333983907, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  22%|██▏       | 22/100 [00:35<01:51,  1.43s/it]

[I 2023-08-18 06:01:09,441] Trial 21 finished with value: 0.6455923056681689 and parameters: {'num_leaves': 56, 'max_depth': 5, 'min_child_samples': 46, 'subsample': 0.1945777658760045, 'colsample_bytree': 0.9736570024276053, 'reg_alpha': 1.7129695916143388e-05, 'reg_lambda': 0.6588480831633784, 'feature_fraction': 0.4679557629907205, 'bagging_fraction': 0.8827399689151345, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  23%|██▎       | 23/100 [00:37<01:51,  1.44s/it]

[I 2023-08-18 06:01:10,922] Trial 22 finished with value: 0.6483039698878317 and parameters: {'num_leaves': 44, 'max_depth': 7, 'min_child_samples': 65, 'subsample': 0.1830365338810447, 'colsample_bytree': 0.9056036717113698, 'reg_alpha': 2.760867710410667e-06, 'reg_lambda': 0.01489287519994871, 'feature_fraction': 0.48844474500598517, 'bagging_fraction': 0.7918624077015508, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  24%|██▍       | 24/100 [00:38<01:41,  1.34s/it]

[I 2023-08-18 06:01:12,022] Trial 23 finished with value: 0.6460223657519764 and parameters: {'num_leaves': 63, 'max_depth': 4, 'min_child_samples': 68, 'subsample': 0.29037144153384137, 'colsample_bytree': 0.9927657488859083, 'reg_alpha': 9.903419042659953e-05, 'reg_lambda': 0.1253351853256299, 'feature_fraction': 0.5316330491720599, 'bagging_fraction': 0.9399856314378807, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  25%|██▌       | 25/100 [00:40<01:48,  1.45s/it]

[I 2023-08-18 06:01:13,736] Trial 24 finished with value: 0.6473545931873073 and parameters: {'num_leaves': 40, 'max_depth': 10, 'min_child_samples': 88, 'subsample': 0.4023639601584622, 'colsample_bytree': 0.9227415309726585, 'reg_alpha': 3.3250613359073714e-07, 'reg_lambda': 0.0023682673869429727, 'feature_fraction': 0.44834291154178835, 'bagging_fraction': 0.8625165055493407, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 16. Best value: 0.644073:  26%|██▌       | 26/100 [00:41<01:51,  1.51s/it]

[I 2023-08-18 06:01:15,370] Trial 25 finished with value: 0.6470406949809197 and parameters: {'num_leaves': 51, 'max_depth': 6, 'min_child_samples': 22, 'subsample': 0.2643098067828139, 'colsample_bytree': 0.8124582057132604, 'reg_alpha': 1.8003672499527027e-06, 'reg_lambda': 0.020569713668690228, 'feature_fraction': 0.5653132998873008, 'bagging_fraction': 0.7983639982536488, 'bagging_freq': 5}. Best is trial 16 with value: 0.6440732739425292.


Best trial: 26. Best value: 0.642658:  27%|██▋       | 27/100 [00:43<01:43,  1.42s/it]

[I 2023-08-18 06:01:16,593] Trial 26 finished with value: 0.6426576527159088 and parameters: {'num_leaves': 20, 'max_depth': 3, 'min_child_samples': 50, 'subsample': 0.14430351359678228, 'colsample_bytree': 0.9049321289913492, 'reg_alpha': 8.046759511407816e-06, 'reg_lambda': 0.31397840626496987, 'feature_fraction': 0.6927464757543285, 'bagging_fraction': 0.6996859900207485, 'bagging_freq': 5}. Best is trial 26 with value: 0.6426576527159088.


Best trial: 27. Best value: 0.642376:  28%|██▊       | 28/100 [00:44<01:38,  1.37s/it]

[I 2023-08-18 06:01:17,832] Trial 27 finished with value: 0.6423764099788104 and parameters: {'num_leaves': 17, 'max_depth': 3, 'min_child_samples': 46, 'subsample': 0.10060474003048595, 'colsample_bytree': 0.8976159836981201, 'reg_alpha': 1.0702544722380703e-07, 'reg_lambda': 7.66863944919939e-05, 'feature_fraction': 0.44493616646388356, 'bagging_fraction': 0.6674404385408661, 'bagging_freq': 1}. Best is trial 27 with value: 0.6423764099788104.


Best trial: 27. Best value: 0.642376:  29%|██▉       | 29/100 [00:45<01:30,  1.28s/it]

[I 2023-08-18 06:01:18,903] Trial 28 finished with value: 0.646361842908707 and parameters: {'num_leaves': 18, 'max_depth': 2, 'min_child_samples': 40, 'subsample': 0.34341588205651385, 'colsample_bytree': 0.7822374909593068, 'reg_alpha': 9.459001540966004e-08, 'reg_lambda': 6.414807978609194e-05, 'feature_fraction': 0.45659948619970536, 'bagging_fraction': 0.6831580198884699, 'bagging_freq': 1}. Best is trial 27 with value: 0.6423764099788104.


Best trial: 27. Best value: 0.642376:  30%|███       | 30/100 [00:46<01:31,  1.31s/it]

[I 2023-08-18 06:01:20,275] Trial 29 finished with value: 0.6434534442070255 and parameters: {'num_leaves': 11, 'max_depth': 3, 'min_child_samples': 69, 'subsample': 0.2331976434960968, 'colsample_bytree': 0.7049378634764227, 'reg_alpha': 3.8957103688960174e-08, 'reg_lambda': 3.4666354891494694e-05, 'feature_fraction': 0.6965694581725653, 'bagging_fraction': 0.70718618488193, 'bagging_freq': 1}. Best is trial 27 with value: 0.6423764099788104.


Best trial: 27. Best value: 0.642376:  31%|███       | 31/100 [00:47<01:46,  1.55s/it]


[I 2023-08-18 06:01:21,388] Trial 30 finished with value: 0.6465508010498588 and parameters: {'num_leaves': 9, 'max_depth': 3, 'min_child_samples': 74, 'subsample': 0.1489697230847907, 'colsample_bytree': 0.7064178025212421, 'reg_alpha': 2.1301505323589564e-08, 'reg_lambda': 3.2582926425767894e-05, 'feature_fraction': 0.7087178040194724, 'bagging_fraction': 0.6475235009554737, 'bagging_freq': 1}. Best is trial 27 with value: 0.6423764099788104.
[W 2023-08-18 06:01:21,468] Trial 31 failed with parameters: {'num_leaves': 15, 'max_depth': 3, 'min_child_samples': 58, 'subsample': 0.24779587428901512, 'colsample_bytree': 0.831293670609765, 'reg_alpha': 4.631729013919431e-08, 'reg_lambda': 0.0001273730203552704, 'feature_fraction': 0.6009588399600144, 'bagging_fraction': 0.6841434658641048, 'bagging_freq': 1} because of the following error: KeyboardInterrupt().
Traceback (most recent call last):
  File "/home/education/signate_scup2023/.venv/lib/python3.11/site-packages/optuna/study/_optimiz

KeyboardInterrupt: 

In [8]:
# Train LightGBM with hand-pinned hyperparameters and attach its predictions to the shared
# `predictions` frame.
#
# NOTE(review): these values do not match the best trial reported by the interrupted Optuna
# study logged above (trial 27); presumably they come from an earlier, completed search.
# Confirm before relying on them.

# Argument passed to `lgbm.predict`; presumably the number of CV folds, since the cell output
# lists Fold_lgbm 0-4. TODO confirm against exp/models/_lgbm.py.
N_FOLDS = 5

lgbm.best_params = {
    'num_leaves': 41,
    'max_depth': 4,
    'min_child_samples': 65,
    'subsample': 0.1813266686908916,
    'colsample_bytree': 0.9997207808739403,
    'reg_alpha': 3.8163343968470076e-06,
    'reg_lambda': 9.185674902594394e-05,
    'feature_fraction': 0.5180973927754882,
    'bagging_fraction': 0.8804646505719466,
    'bagging_freq': 1
}
lgbm_predictions = lgbm.predict(N_FOLDS)

# Keep the cell idempotent: a horizontal concat cannot contain the same column name twice, so
# re-running this cell used to fail once `predictions` already held the LightGBM columns.
# Drop any columns left over from a previous run before attaching the fresh ones.
stale_columns = set(lgbm_predictions.columns)
predictions = pl.concat(
    [
        predictions.select([name for name in predictions.columns if name not in stale_columns]),
        lgbm_predictions,
    ],
    how="horizontal",
)

Fold_lgbm 0: 0.636015510527037
Fold_lgbm 1: 0.6569602826793614
Fold_lgbm 2: 0.6639626734725691
Fold_lgbm 3: 0.6492586335734132
Fold_lgbm 4: 0.6537258793302255


In [None]:
# Rank features by their mean LightGBM importance. The sort is ascending, so the horizontal
# bar chart below ends up with the most important feature at the top.
importance = lgbm.feature_importance().sort(by='lgbm_importance_mean')

# Draw the chart (tall figure, presumably so every feature label stays readable).
fig, ax = plt.subplots(figsize=(12, 40))
ax.barh(importance["feature"], importance["lgbm_importance_mean"])
ax.set_xlabel('Feature importance')
ax.set_ylabel('Features')
ax.grid()
plt.show()

In [None]:
# Disabled XGBoost stage (kept for reference; nothing in this cell executes).
# If re-enabled it would build an XGBModel from `train`/`test`, pin `best_params`, and append
# the model's predictions to `predictions` column-wise, the same flow as the LightGBM cell.
# NOTE(review): `xgb.objective(20)` presumably launches a hyperparameter search; confirm in
# exp/models/xgb.py before uncommenting.
#xgb = XGBModel(train, test)
#xgb.objective(20)
#xgb.best_params = {'n_estimators': 767, 'max_depth': 8, 'lambda': 1.2306916748991704e-06, 'alpha': 0.018078104089246788, 'colsample_bytree': 0.42319770953022684, 'subsample': 0.2810517802368746, 'min_child_weight': 218, 'gamma': 6.031109467976734e-08, 'eta': 0.018889170085640027}
#xgb_predictions = xgb.predict()
#predictions = pl.concat([predictions, xgb_predictions], how="horizontal")

In [None]:
# Disabled RandomForest stage (kept for reference; nothing in this cell executes).
# NOTE(review): this cell looks stale. It references `df` and `pd.concat(..., axis=1)`, but
# the visible cells import only polars (`pl`) and build `predictions` as a polars frame.
# `df` and `pd` may be defined in cells not shown here; confirm, and port to the
# `train`/`test` + `pl.concat(..., how="horizontal")` flow before re-enabling.
#rf = RandomForestModel(df)
##rf.objective(5)
#rf.best_params = {'max_depth': 9, 'min_samples_split': 11, 'min_samples_leaf': 14, 'max_features': 0.6306125661502896, 'max_leaf_nodes': 18, 'n_estimators': 8762, 'bootstrap': True}
#rf_predictions = rf.predict()
#predictions = pd.concat([predictions, rf_predictions], axis=1)

In [None]:
# Disabled RGF stage (kept for reference; nothing in this cell executes).
# NOTE(review): this cell looks stale. It references `df` and `pd.concat(..., axis=1)`, but
# the visible cells import only polars (`pl`) and build `predictions` as a polars frame.
# `df` and `pd` may be defined in cells not shown here; confirm, and port to the
# `train`/`test` + `pl.concat(..., how="horizontal")` flow before re-enabling.
#rgf = RGFModel(df)
##rgf.objective(5)
#rgf.best_params = {'max_leaf': 8072, 'algorithm': 'RGF_Opt', 'test_interval': 142, 'min_samples_leaf': 11, 'reg_depth': 9, 'l2': 0.0002082492344277923, 'sl2': 4.2919223241162815e-07, 'normalize': False}
#rgf_predictions = rgf.predict()
#predictions = pd.concat([predictions, rgf_predictions], axis=1)

In [None]:
# Disabled CatBoost stage (kept for reference; nothing in this cell executes).
# NOTE(review): this cell looks stale. It references `df` and `pd.concat(..., axis=1)`, but
# the visible cells import only polars (`pl`) and build `predictions` as a polars frame.
# `df` and `pd` may be defined in cells not shown here; confirm, and port to the
# `train`/`test` + `pl.concat(..., how="horizontal")` flow before re-enabling.
#cat = CatBoostModel(df)
##cat.objective(5)
#cat.best_params = {"depth": 6}
#cat_predictions = cat.predict()
#predictions = pd.concat([predictions, cat_predictions], axis=1)

In [None]:
# Preview the first rows of the combined target + model-prediction frame.
predictions.head(n=5)

In [None]:
# Disabled stacking stage (kept for reference; nothing in this cell executes).
# The commented code fits a Ridge model on the rows of `predictions` that have a price and
# predicts the rows that do not.
# NOTE(review): before re-enabling, confirm the following:
#   - `Ridge` is not imported in the notebook's import cell.
#   - The frame operations (`df[mask]`, `.notnull()`, `.drop(..., axis=1)`) are pandas-style,
#     while `predictions` is built with polars.
#   - It rebinds `train` and `test`, which the following cell still reads via `train.height`.
#model = Ridge(random_state=0)
#train = predictions[predictions["price"].notnull()]
#test = predictions[predictions["price"].isnull()]
#X_train = train.drop(["price"], axis=1)
#y_train = train["price"]
#X_test = test.drop(["price"], axis=1)
#model.fit(X_train, y_train)
#y_pred = model.predict(X_test)

In [None]:
# Average the LightGBM prediction columns row by row, then keep only the rows from
# `train.height` onward. Presumably those are the test rows, since `predictions` was built
# as train rows followed by test rows; verify that `lgbm.predict` uses the same layout.
lgbm_row_mean = lgbm_predictions.mean(axis=1)
y_pred = lgbm_row_mean[train.height:].to_list()

In [None]:
# Disabled submission writer (kept for reference; nothing in this cell executes).
# The commented code reads the header-less sample submission, replaces its `price` column
# with `y_pred`, and writes the result to ../output/.
# NOTE(review): the paths are built from `__file__`, which is not defined inside a notebook
# kernel. Use notebook-relative paths (as the `../input/train.csv` read at the top does)
# before re-enabling.
#sub = pl.read_csv(os.path.join(os.path.dirname(__file__), "../input/submit_sample.csv"), has_header=False, new_columns=["id", "price"])
#sub = sub.with_columns(pl.Series("", y_pred).alias("price"))
#sub.write_csv(os.path.join(os.path.dirname(__file__), "../output/submission_te0810_3.csv"), has_header=False)