# ライブラリのインポート / データの読み込み

In [1]:
!pip install transformers

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [22]:
import numpy as np
import pandas as pd

pd.set_option('max_colwidth', 500)
pd.set_option('max_columns', 500)
pd.set_option('max_rows', 500)

%matplotlib inline

from matplotlib import pyplot as plt
import matplotlib.ticker as mtick # For specifying the axes tick format 

import seaborn as sns
import re

import json, os, gc, math, time
import datetime
import collections
from tqdm import tqdm
import glob

from statistics import mean
from sklearn.preprocessing import MultiLabelBinarizer
from sklearn.preprocessing import LabelEncoder

from sklearn.model_selection import KFold, GroupKFold, StratifiedKFold

from sklearn import metrics
import time

import lightgbm as lgb

import warnings
warnings.filterwarnings("ignore")

In [3]:
#ドライブへのアクセス
from google.colab import drive
drive.mount('/content/drive')
%cd "/content/drive/My Drive/00_datascience/19_ufj_bank"

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).
/content/drive/My Drive/00_datascience/19_ufj_bank


In [4]:
train = pd.read_csv('input/train.csv')
test = pd.read_csv('input/test.csv')
sub = pd.read_csv('input/sample_submit.csv')

# bertによる特徴抽出

In [5]:
def remove_html(text):
    html_pattern = re.compile('<.*?>')
    return html_pattern.sub(r'', text)

In [6]:
for i in range(len(train)):
  train.loc[i, 'cleaned_text'] = remove_html(train.loc[i, 'html_content'])

for i in range(len(test)):
  test.loc[i, 'cleaned_text'] = remove_html(test.loc[i, 'html_content'])

In [7]:
#すでに抽出済みの特徴量を使用
text_train_df = pd.read_csv('input/05_seq_train_df.csv')
text_train_df.drop(['Unnamed: 0'], axis=1, inplace=True)
text_test_df = pd.read_csv('input/05_seq_test_df.csv')
text_test_df.drop(['Unnamed: 0'], axis=1, inplace=True)

In [8]:
merge_text = pd.concat([text_train_df, text_test_df], ignore_index=True)

# ラベルデータの前処理

In [9]:
#学習しやすいようにtrain, testをマージ
merge_df = pd.concat([train, test], ignore_index=True)

In [10]:
#goalカラムの数値化
for i in range(len(merge_df)):
  price_list = re.findall(r"\d+", merge_df.loc[i, 'goal'])
  merge_df.loc[i, 'goal_min'] = price_list[0]
  if len(price_list) == 1:
    merge_df.loc[i, 'goal_max'] = price_list[0]
  else:
    merge_df.loc[i, 'goal_max'] = price_list[1]

In [11]:
#int型に変換
merge_df['goal_max'] = merge_df['goal_max'].astype(int)
merge_df['goal_min'] = merge_df['goal_min'].astype(int)

#1日あたりの目標金額の算出
merge_df['goal_per_day_max'] = merge_df['goal_max'] / merge_df['duration']
merge_df['goal_per_day_min'] = merge_df['goal_min'] / merge_df['duration']
#merge_df.head()

In [12]:
# ワンホットエンコーディング

dummy_cols = ['goal',	'country', 'category1',	'category2']
from sklearn.preprocessing import OneHotEncoder

dummy_df = pd.get_dummies(merge_df[dummy_cols])

In [13]:
merge_df_new = pd.merge(merge_df, dummy_df, left_index=True, right_index=True)

In [14]:
#ラベルエンコーディング
from sklearn.preprocessing import LabelEncoder

le_cols = ['goal', 'country', 'category1', 'category2']

#カテゴリ変数をループしてlabel encoding
for c in le_cols:
  le = LabelEncoder()
  le.fit(merge_df_new[c])
  merge_df_new[c] = le.transform(merge_df_new[c])

# tfidfによる特徴抽出

In [15]:
#tfidfによる特徴抽出
from sklearn.feature_extraction.text import TfidfVectorizer
tv = TfidfVectorizer()
features = tv.fit_transform(merge_df_new["cleaned_text"].fillna(""))

In [16]:
from sklearn.decomposition import TruncatedSVD, NMF, LatentDirichletAllocation
from sklearn.pipeline import Pipeline



tfidf_svd = Pipeline(steps=[
    ("TfidfVectorizer", TfidfVectorizer()),
    ("TruncatedSVD", TruncatedSVD(n_components=1000, random_state=42))
])

features_svd = tfidf_svd.fit_transform(merge_df_new["cleaned_text"].fillna(""))

In [17]:
svd_df_merge = pd.DataFrame(features_svd)
svd_df_merge.head()

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,236,237,238,239,240,241,242,243,244,245,246,247,248,249,...,750,751,752,753,754,755,756,757,758,759,760,761,762,763,764,765,766,767,768,769,770,771,772,773,774,775,776,777,778,779,780,781,782,783,784,785,786,787,788,789,790,791,792,793,794,795,796,797,798,799,800,801,802,803,804,805,806,807,808,809,810,811,812,813,814,815,816,817,818,819,820,821,822,823,824,825,826,827,828,829,830,831,832,833,834,835,836,837,838,839,840,841,842,843,844,845,846,847,848,849,850,851,852,853,854,855,856,857,858,859,860,861,862,863,864,865,866,867,868,869,870,871,872,873,874,875,876,877,878,879,880,881,882,883,884,885,886,887,888,889,890,891,892,893,894,895,896,897,898,899,900,901,902,903,904,905,906,907,908,909,910,911,912,913,914,915,916,917,918,919,920,921,922,923,924,925,926,927,928,929,930,931,932,933,934,935,936,937,938,939,940,941,942,943,944,945,946,947,948,949,950,951,952,953,954,955,956,957,958,959,960,961,962,963,964,965,966,967,968,969,970,971,972,973,974,975,976,977,978,979,980,981,982,983,984,985,986,987,988,989,990,991,992,993,994,995,996,997,998,999
0,0.294975,0.000612,0.023093,-0.043301,-0.00465,0.020541,-0.045337,0.023749,-0.013548,0.034168,-0.013013,0.0068,-0.034913,0.006792,-0.015054,0.005607,-0.006633,0.028449,0.020395,-0.021418,0.013802,0.013191,-0.021499,0.007818,-0.03327,0.021218,-0.02872,0.018364,0.040835,0.015443,-0.009399,-0.024765,-0.008274,0.021418,-0.004099,-0.0018,0.006569,-0.017899,-0.0227,-0.039155,0.027662,-0.042093,-0.018316,0.007389,-0.015836,0.025763,0.019476,-0.021724,-0.004165,-0.040945,-0.011895,-0.005414,0.044285,0.000752,-0.02562,-0.012126,-0.016218,-0.032687,0.000541,0.013212,0.02316,0.008573,0.01985,0.001818,0.028804,0.006221,-0.017187,-0.031764,-0.003156,-0.015492,-0.02632,0.001645,-0.009675,-0.020839,0.005702,-0.031384,-0.014141,0.006166,-0.016562,0.021373,-0.019713,-0.013808,-0.013545,0.004556,0.024441,0.002668,0.007806,0.010765,-0.034016,-0.008416,-0.018521,-0.010729,-0.01425,-0.011515,0.015059,0.008557,0.014118,0.006811,-0.011104,-0.010446,-0.004324,-0.017287,-0.010474,-0.004138,-0.010734,-0.004927,0.010384,-0.017388,-0.008818,0.014501,0.016185,-0.012236,-0.001071,-0.003736,-0.004962,-0.001863,0.00549,-0.005913,0.011078,-0.000654,0.015868,-0.015941,-0.010237,-0.028429,0.00232,-0.006602,-0.037504,-0.015901,-0.001221,0.005836,-0.002604,0.033665,0.016386,0.011442,0.009914,-0.007815,-0.002609,-0.007079,0.006088,-0.030331,-0.013934,-0.017419,0.000299,-0.021974,0.014502,-0.016659,0.015314,-0.012596,-0.014667,-0.034675,-0.010979,-0.020586,-0.019136,-0.012399,-0.005613,0.00258,0.00575,-0.008406,-0.008458,-0.013055,-0.027402,-0.003059,0.002124,0.010547,-0.012725,-0.003126,0.016835,0.004937,-0.005492,-0.016231,0.017594,-0.005843,0.005354,-0.001336,0.014849,-0.014394,0.005559,-0.000798,0.019274,-0.007828,-0.013374,0.000941,-0.006692,-0.015561,-0.009937,0.028827,-0.003553,-0.008625,0.015199,-0.004971,0.01167,0.001208,0.014611,-0.005897,-0.014305,-0.000319,-0.002148,0.023332,0.001524,-0.009723,-0.013181,0.004239,0.002568,0.00901,-0.015208,-0.002074,0.03143,-0.028039,0.012889,-0.000447,0.03445,-0.047279,0.012189,-0.000357,-0.016639,-0.040275,-8.2e-05,-0.018842,-0.00257,0.010655,-0.014037,0.002502,-0.022144,-0.010554,-0.009705,0.002513,0.015605,-0.016693,0.011624,0.026751,-0.007696,-0.006099,0.013947,0.032808,-0.032835,0.002261,-0.000137,0.007278,0.001538,0.002026,0.008423,0.005439,-0.000653,-0.0132,0.000347,-0.000774,0.001934,-0.001673,-0.003433,0.01807,...,-0.016099,0.012883,-0.012841,0.007548,-0.002943,0.012171,-0.006604,-0.005415,-0.007829,0.007166,-0.003168,-0.001466,0.008689,-0.018905,-0.011179,-0.008115,0.022747,-0.00931,0.004477,-0.006221,-0.006181,0.029164,0.012193,-0.006215,-0.008985,-0.011839,-0.000163,-0.000881,0.026042,-0.009521,-0.00824,0.006103,0.009046,0.029958,-0.001803,-0.011523,0.002099,0.012144,-0.013081,-0.023165,-0.00018,0.006197,-0.009419,0.01424,0.003808,0.009915,-0.015102,0.022243,0.016207,0.010521,-0.014451,-0.00739,0.00176,-0.006443,0.013258,0.003821,-0.018041,0.006343,-0.008321,-0.017759,0.037882,0.007056,0.006074,0.00841,-0.00243,0.004689,0.013723,0.001751,-0.005835,0.00829,-0.007839,-0.002283,0.020922,0.030412,0.017098,-0.002124,-0.012072,0.012636,-0.004065,0.012042,-0.016107,-0.003588,0.006715,-0.000571,-0.014769,-0.000543,0.01913,0.026,-0.011347,0.009438,0.006729,-0.018298,0.009277,0.004362,-0.036778,-0.011224,0.005278,-0.025055,-0.005119,0.005691,0.024141,-0.01107,-0.013339,0.002221,0.010723,0.002505,-0.016674,-0.007536,0.001639,-0.011075,0.008626,-0.007707,0.034665,-0.002003,-0.003024,-0.012765,0.020067,-0.029421,-0.02669,-0.006795,-0.016024,-0.02877,-0.023783,0.004518,0.016675,0.013916,0.002384,-0.011357,-0.003361,-0.001323,0.005599,0.017254,0.003251,-0.029765,0.017826,0.019395,0.012429,-0.013652,-0.005969,0.001635,-0.003851,0.007266,0.007584,0.024149,-0.016264,0.016645,0.007142,-0.001446,0.011135,0.00882,0.010148,-0.01518,-0.008931,0.001281,0.022528,0.006061,0.010228,0.021073,0.013032,0.009872,-0.002013,-0.010935,-0.022775,0.016848,0.00115,-0.009085,0.011367,0.014402,0.014905,0.010605,0.013383,0.017596,-0.00983,0.012473,0.01669,0.021795,0.020104,-0.002639,0.007445,-0.00202,0.03592,-0.008698,0.000678,0.010546,0.017188,0.007885,0.012775,0.003499,-0.001949,-0.008935,-0.018692,0.004765,0.002306,-0.035943,0.004474,-0.003377,-0.009865,-0.00065,-0.00639,0.006445,-0.015233,0.016457,0.000989,0.007472,0.008095,0.000736,0.007946,0.002536,-0.003446,0.007217,0.008118,-0.002294,0.008856,-0.002071,-0.005032,-0.005876,0.01849,-0.015047,-0.012355,-0.006415,-0.028527,0.012203,0.002919,0.008932,-0.007454,0.018613,-0.008403,0.001163,-0.01645,-0.011396,-0.003107,0.014947,0.01684,-0.026257,-0.008401,-0.012782,-0.010434,0.010039,0.011844,0.02103,0.000124,0.000489,-0.009038,-0.000686,0.007243,-0.002014,0.008054,-0.018337,-0.023733,-0.020279
1,0.163203,-0.003916,0.027252,0.018163,-0.00254,-0.027746,0.007868,0.058626,-0.076373,0.005528,0.001529,0.063075,0.065003,-0.036947,0.008215,-0.003938,0.08456,-0.047096,-0.007873,-0.02466,-0.022861,0.038011,0.000873,-0.016922,0.020855,-0.002865,0.014032,-0.020272,-0.01099,-0.01371,0.02368,0.002178,-0.000967,-0.031042,-0.004752,-0.018551,0.003876,-0.013606,-0.001061,0.018526,-0.004301,0.007273,0.003778,0.014811,-0.016286,0.008544,0.024332,0.020833,0.004556,0.000324,-0.032635,-0.005675,0.023483,0.00302,-0.02912,0.024354,-0.002268,-0.00464,0.009902,0.008106,0.024882,0.008621,-0.002636,0.013224,0.019978,-0.012846,0.007939,0.000698,-0.000215,0.016903,-0.000474,-0.014555,0.012662,0.01251,-0.021633,-0.008538,-0.003125,-0.008088,0.013117,-0.009557,0.000851,-0.017528,0.001191,0.007709,-0.001766,0.020381,-0.005863,-0.02302,0.024056,-0.00791,0.005164,-0.011834,0.001697,-0.016363,-0.008947,-0.011359,0.003416,0.02878,-0.028298,0.029897,0.010942,-0.013545,-0.002524,-0.006774,-0.011273,-0.019111,-0.005488,-0.0174,-0.002447,0.000306,0.009233,0.045651,-0.019731,-0.005575,-0.015095,0.000524,-0.040278,-0.005891,0.010361,0.025173,-0.016652,-0.011704,0.002611,0.011888,0.003131,0.010718,0.003442,0.020717,0.014597,0.005664,-0.014143,0.031922,-0.01108,-0.030853,-0.025534,-0.031084,0.028729,-0.021383,-0.00704,0.013895,0.011523,0.039635,0.016981,0.01985,0.002501,0.01681,-0.004223,-0.018938,0.023907,-0.023487,0.002042,0.013993,0.00224,-0.002838,-0.009567,0.018288,-0.016401,-0.027892,0.010301,0.001655,-0.016686,0.016793,0.020765,-0.005369,-0.005755,-0.003286,0.053517,-0.001225,-0.013528,0.000271,0.008128,-0.022293,0.005077,-0.010455,-0.004157,-0.001229,0.037806,-0.009819,0.004569,0.012237,-0.020589,0.010069,0.039595,0.016693,-0.043044,-0.018939,0.003175,-0.009108,-0.034252,-0.004267,-0.012908,0.022416,-0.018378,-0.026124,-0.008873,0.051107,0.003554,-0.011948,-0.009944,-0.037975,0.002671,0.035799,0.023041,0.020862,0.045357,-0.020641,0.012063,-0.050603,-0.02814,0.014709,0.031799,-0.023259,0.002922,-0.033369,0.020316,0.015812,-0.021273,-0.007365,-0.014972,0.018593,0.005183,-0.011201,-3e-05,0.025178,-0.028153,-0.006706,0.008234,-0.017415,0.02312,0.024656,0.035186,0.036811,0.033137,-0.033257,-0.001973,0.01518,0.002734,0.02386,0.026429,-0.019863,-0.044924,0.019595,-0.02486,-0.008751,0.03552,0.011556,0.015276,-0.030822,0.016943,0.025531,...,-0.014491,0.021563,-0.00191,-0.027161,-0.012628,-0.005645,-0.019387,0.009913,-0.000309,0.010775,-0.00722,-0.004204,-0.003175,0.000653,-0.002736,5.4e-05,-0.020718,0.004102,0.022705,0.013215,-0.000467,0.010435,-0.019733,-0.016565,0.02263,0.004184,0.015468,-0.003021,-0.007257,0.007486,0.022607,0.008557,-0.001968,-0.004975,-0.006968,-0.001328,-0.016286,-0.027568,-0.004201,0.000924,0.004066,-0.001837,0.015101,-0.00818,0.006889,-0.007366,0.012027,-0.019927,0.017396,0.001098,0.008229,-0.006866,-0.005379,0.009148,0.001501,-0.003874,0.001819,-0.012747,-0.017725,0.006927,-0.010464,-0.005854,-0.001681,-0.007335,-0.009632,0.008367,-0.018594,-0.002657,0.002032,0.017999,0.032068,-0.004056,0.02175,0.013154,0.009671,0.014351,0.00351,0.01613,0.014172,0.025033,0.002877,-0.010961,-0.016607,-0.010237,-0.021819,-0.011139,0.01957,0.007313,-0.005829,0.002248,0.014776,-0.02375,-0.007566,0.0181,0.022587,-0.01401,0.006129,-0.000616,-0.026692,0.024902,-0.029891,0.012419,-0.01117,0.006421,0.004966,0.015502,-0.016539,-0.000376,-0.004348,0.020437,0.009455,-0.00836,-0.000999,-0.0387,0.005629,0.015564,0.002159,0.001678,0.002856,-0.01193,0.000469,-0.003209,-0.018165,-0.016314,-0.001649,-0.008824,-0.00777,0.003651,-0.005602,-0.001789,-0.024382,-0.014518,0.007571,0.008288,-0.00601,0.006855,-0.015831,-0.012372,-0.0153,-0.006085,0.006057,0.004746,-0.013825,-0.003538,0.009069,-0.008544,-0.001935,-0.004956,-0.004616,-0.025658,-0.020609,0.000116,0.006831,0.014914,0.012233,-0.003559,-0.012581,-0.02491,0.003656,-0.005802,0.007581,0.008013,-0.008877,-0.020485,-7e-06,0.02812,-0.022953,0.000516,0.021637,-0.014669,-0.008374,-0.002591,0.000908,0.018143,-0.017998,-0.018524,-0.001669,-0.00564,-0.01516,-0.00566,-0.006,-0.002963,-0.009491,0.001823,-0.002844,0.003992,-0.017427,0.009456,0.003433,0.007122,-0.004276,-0.018932,0.001612,-0.037727,-0.006228,0.033435,-0.026799,-0.018439,-0.002599,0.001306,-0.007357,-0.004787,-0.00831,-0.024953,0.020005,0.002315,-0.00773,0.003005,-0.021059,-0.008973,-0.01052,0.018879,-0.017572,0.001697,0.017083,-0.015465,-0.010573,0.008283,-0.003409,0.000338,-0.013632,0.010031,0.002132,0.011786,-0.004094,-0.002239,-0.028196,0.002179,0.002188,0.002522,0.016844,-0.013167,0.007012,-0.001568,-0.026436,0.010996,0.011933,0.029659,0.00392,-0.004853,-0.004148,-0.008931,-0.000211,-0.00533,0.000174,0.008596,0.006749,-0.010743,-0.001232,0.001835
2,0.416711,0.004678,-0.052108,-0.079082,-0.010637,0.082928,-0.018374,0.036624,-0.071621,-0.046461,-0.014937,0.041353,-0.02023,-0.010954,-0.087217,-0.007253,-0.03034,0.014084,-0.012513,-0.046767,-0.023714,0.035796,0.028166,-0.034383,-0.00715,-0.004731,0.04632,-0.009199,0.025744,-0.041982,0.013379,0.020957,0.029541,0.004967,-0.000513,-0.047433,-0.016302,-0.025886,-0.005006,0.002927,0.008941,-0.000856,-0.043802,0.011403,0.037981,-0.043098,-0.028671,-0.0116,0.021919,0.053433,-0.013155,0.027544,0.046684,-0.003121,-0.026851,0.043691,0.032545,-0.001155,-0.045344,-0.050752,-0.007366,0.016945,0.045481,-0.009139,-0.000754,0.007511,0.015721,0.010016,0.010388,-0.009383,0.017408,-0.006617,-0.015586,-0.005069,0.021774,0.019472,0.001169,0.019556,0.013257,0.016152,-0.00386,-0.000786,-0.049568,0.011025,0.066205,-0.001984,0.01615,-0.012385,-0.015478,0.014282,-0.032462,0.014437,0.005782,0.024554,-0.002222,-0.025342,0.021117,-0.02482,0.064364,0.055525,0.006127,0.018422,-0.026213,0.033217,0.008746,0.020138,-0.027226,0.040503,-0.044763,-0.018296,0.026648,-0.016892,-0.03163,-0.01276,0.047104,-0.027456,-0.035023,-0.019202,-0.029166,-0.03371,-0.014051,-0.016597,0.001666,-0.037552,-0.022097,0.007841,-0.011892,-0.044172,0.019255,-0.003818,0.011183,-0.032117,-0.005148,0.015417,0.003596,0.015057,0.006639,-0.045651,-0.012154,-0.01804,0.018817,0.005831,-0.009101,-0.017881,-0.005815,0.031115,-0.009515,-0.027579,-0.020108,-0.009779,-0.001768,-0.018058,0.001469,-0.011637,0.000498,-0.000336,-0.01798,-0.023657,0.012333,0.011513,-0.054273,-0.004851,0.005643,-0.005956,0.017713,0.019298,-0.008307,0.006968,0.022609,-0.043011,0.008947,-0.011541,0.00771,-0.000788,-0.036268,-0.006473,0.021165,0.001536,0.010151,-0.005417,0.008128,-0.037581,0.028168,0.033521,0.007275,-0.014207,-0.00441,-0.037092,0.007924,-0.030522,-0.006879,-0.012487,-0.01403,-0.000711,-0.015325,-0.02017,0.010217,0.014397,-0.00385,-0.006103,0.002713,-0.037777,-0.0081,-0.016956,-0.025564,0.01436,0.031717,-0.007588,0.004932,-0.010349,0.031142,-0.001216,-0.001228,0.011576,-0.029862,-0.04081,-0.014916,-0.013363,-0.003375,0.002491,0.027492,0.026274,0.012392,-0.036279,0.012096,-0.016733,-0.031237,0.006643,0.020541,0.02526,0.00863,-0.042927,0.020364,0.008361,0.015502,0.013699,-0.006739,-0.024219,0.024582,-0.017702,0.003237,0.015193,-0.008769,-0.011097,-0.00643,0.025075,0.007788,-0.012706,-0.027435,-0.023457,...,-0.014857,-0.00216,-0.011976,0.020542,-0.006018,-0.027447,0.013445,-0.01198,0.01235,0.009707,0.013402,0.005683,0.000625,0.026848,-0.010496,0.008083,-0.010812,-0.001824,-0.028365,-0.02889,0.008116,0.008144,-0.002608,0.004059,0.003763,0.011824,-0.03439,0.008332,-0.010611,0.011242,-0.003349,-0.006388,0.017141,-0.002094,0.021249,-0.010146,-0.008463,0.006551,-0.013283,0.009914,-0.005801,0.029222,-0.015934,-0.000666,-0.002653,-0.011533,0.010184,-0.003417,0.006184,0.027988,0.00926,-0.008196,0.015286,0.007804,0.007631,0.020264,0.013792,0.00459,-0.012086,-0.025707,0.001059,-0.008521,0.010453,0.006803,0.007349,-0.01384,0.015168,-0.019589,0.00084,0.003193,-0.003203,0.005045,0.017933,0.000784,-0.012789,0.00148,0.018621,-0.017031,0.002626,0.003433,-0.004536,0.002009,-0.013262,0.007675,0.000336,-0.01075,-0.012059,-0.022031,0.000461,0.013457,-0.016934,-0.012933,0.003099,0.026767,0.013726,-0.017949,-0.011543,0.020636,-0.000441,0.011238,-0.011171,-0.00765,0.015625,0.003788,-0.020689,0.019662,-0.008173,0.014061,-0.000284,-0.026717,0.008861,-0.009344,-0.007306,-0.018563,0.019679,0.003151,-0.013251,-0.005034,0.014641,-0.005812,0.011181,-0.002103,0.003715,-0.015333,-0.010421,0.010473,-0.00678,-0.016673,-0.009246,0.007189,0.020128,0.004302,-0.012103,-0.005518,-0.001214,0.001717,0.021088,0.008352,-0.000897,-0.016625,0.00088,-0.017332,0.01251,0.008588,0.008806,0.007567,0.018045,0.003331,0.010538,-0.008543,-0.004654,0.000713,-0.014124,-0.010727,0.006192,0.0016,-0.008668,0.004956,-0.004512,-0.014023,-0.012967,-0.000638,0.017548,-0.00768,-0.007315,-0.001778,-0.000527,0.030791,0.002955,-6.9e-05,0.004696,0.009216,-0.002777,-0.006202,-0.00383,0.004999,0.01092,-0.0008,0.002981,0.013403,-0.006788,0.009266,-0.00161,0.006845,-0.001608,-0.006379,-0.004918,0.006208,-0.019745,-0.001083,0.01084,-0.018603,0.021087,-0.013267,0.013273,0.000572,0.012304,0.015473,-0.001938,-0.016747,-0.011603,0.00049,0.006754,-0.015257,-0.004887,0.012116,0.022651,-0.007946,0.000725,-0.012088,-0.008467,0.005077,0.001769,-0.011165,-0.006992,0.009142,-0.004191,-0.012172,-0.006984,0.014484,-0.022477,-0.005632,0.018116,0.003595,-0.004487,-0.016404,-0.008032,-0.005169,-0.005786,-0.010108,0.011953,0.006167,0.006354,0.011018,-0.000981,-0.001572,-0.005907,0.00932,0.013183,-0.007182,0.012934,0.014778,0.017162,-0.000349,0.000987,0.015633,0.008954,-0.010348,0.006575,-0.014112
3,0.354831,0.040357,-0.074435,-0.139759,-0.016493,0.005695,-0.074026,-0.054699,-0.033434,0.03026,0.012646,-0.062608,0.00824,-0.000222,-0.032508,-0.007403,-0.049114,0.0356,-0.013439,-0.027953,0.020413,-0.020297,0.060604,-0.026912,-0.018858,-0.024159,0.034556,-0.004681,-0.079385,0.025447,-0.036582,-0.026748,-0.002426,-0.01561,-0.007601,0.007285,0.002834,0.006736,-0.003803,0.029364,-0.034202,0.01329,-0.03283,0.00622,0.019821,0.005239,-0.005108,-0.004175,-0.019418,-0.003939,-0.0229,0.005322,-0.006389,-0.016694,0.020352,0.000532,-0.005358,0.007688,0.015439,-0.014903,0.000497,-0.025091,0.038066,0.022247,0.025744,-0.044186,-0.013244,-0.01435,0.032862,0.004652,0.002907,0.052804,0.040742,0.001959,0.038512,-0.037992,0.009148,0.009935,-0.012512,-0.019181,-0.02082,-0.010559,0.004297,-0.031179,-0.03984,0.013303,0.006313,0.010052,0.026313,0.012935,-0.003577,0.018719,-0.009603,-0.006088,-0.005305,-0.00056,0.016964,0.01316,-0.020031,0.016817,-0.021971,-0.009791,-0.004445,0.00135,-0.009765,-0.009284,0.030867,-0.00231,-0.024532,0.013115,0.010341,0.006994,0.028502,-0.038407,0.001474,-0.001461,0.012973,-0.013424,0.017586,-0.023397,-0.008244,0.001646,0.006405,0.015847,0.011986,-0.004791,0.019177,-0.000444,0.008817,-0.030391,0.030161,0.012279,0.0412,-0.001849,0.010755,-0.001938,0.009961,0.022877,0.016852,0.019603,-0.013305,-0.011957,0.017533,-0.028892,-0.001102,-0.005012,-0.01334,-0.006471,-0.009103,0.011448,0.008719,0.011907,-0.027063,0.008273,0.014869,-0.020488,0.008205,0.017412,-0.012122,-0.019606,6.3e-05,-0.016888,0.000609,-0.007586,-0.02095,-0.006462,0.00882,-0.017223,-0.010221,0.016537,-0.019464,0.001446,-0.033243,0.017079,0.001037,-0.036752,0.013987,-0.00093,0.032308,0.023817,-0.014823,-0.002498,-0.016409,0.019117,0.010393,-0.020819,0.010697,0.00703,-0.019943,-0.012122,-0.022144,-0.005367,0.028425,0.023097,0.004683,-0.00022,-0.012699,0.000804,0.025886,0.010371,-0.019809,0.000561,0.009143,0.004792,-0.00835,-0.003197,-0.005574,-0.024619,0.017152,-0.012928,0.017486,-0.016929,0.008582,-0.007906,-0.015085,0.019877,0.013868,-0.012204,0.016049,0.017897,-0.000649,0.005307,-0.033497,-0.002593,0.013232,0.003024,0.002759,-0.002712,0.005477,-0.011919,-0.006065,-0.009448,0.006449,0.003561,0.021671,-0.013557,-0.00211,-0.009508,0.020472,0.011725,-0.001872,0.008712,0.01369,0.002172,0.002079,-0.006013,0.00149,0.014787,0.005351,-0.026147,...,0.011632,0.003777,-0.005038,-0.03486,-0.002287,0.007412,-0.032065,0.027521,0.00441,0.004578,-0.007357,-0.010225,0.024198,-0.008371,0.007081,-0.011657,0.003902,0.002629,-0.002359,0.003715,0.000919,-0.024047,0.023534,0.00192,0.005026,-0.025874,0.002473,0.009828,-0.00022,-0.013283,0.015758,-0.019447,0.003965,-0.007609,0.000406,-0.008155,0.001179,-0.024954,0.003644,0.008312,0.000676,0.012392,-0.009195,-0.015123,-0.005614,-0.01256,-0.016877,0.010155,0.002459,0.010004,0.023314,0.008574,0.008594,-0.005049,0.036177,-0.0035,0.001582,0.002943,-0.003729,-0.006037,-0.002205,0.005887,0.009146,-0.002269,0.001287,-0.010818,-0.025416,0.017802,0.026037,0.00656,-0.004174,0.000747,-0.015709,0.000676,-0.025741,0.004742,0.012904,-0.00106,0.013402,0.017817,0.010493,0.003192,-0.012465,0.003589,0.001525,-0.002632,-0.012802,-0.018991,-0.006782,-0.013642,0.020988,-0.003163,0.00317,-0.014955,-0.020833,0.006626,0.014323,0.01657,0.001981,-0.011016,-0.006053,0.011569,0.032834,0.005437,-0.01757,0.032496,0.024372,-0.003924,0.012155,0.013369,-0.007649,-0.012178,-0.001225,-0.003112,-0.002941,-0.027923,-0.018719,-0.001747,0.006152,-0.014483,0.006486,-0.001865,-0.015074,-0.01919,-0.0011,-0.021225,0.01264,-0.002907,0.016307,0.017844,-0.001223,0.003435,0.003767,0.007851,0.005853,0.024788,-0.006201,0.015758,-0.019047,-0.003009,-0.006989,-0.007274,0.008466,-0.011538,-0.013219,-0.006061,0.013187,0.022545,0.001105,-0.022129,-0.025426,-0.019197,0.008071,-0.002727,0.009418,0.01047,-0.015868,0.014608,0.01331,-0.012707,3.2e-05,-0.014194,-0.008931,-0.000238,-0.012185,0.01785,-0.024195,0.001021,0.006956,-0.011032,-0.003599,0.011939,0.001227,-0.005888,0.009995,-0.009991,-0.010683,-0.002204,-0.005606,-0.012877,0.013541,-0.009793,-0.006724,-0.005561,0.013113,0.020208,-0.020939,-0.007329,-0.002547,-0.001549,0.003672,0.00689,0.001792,-0.000765,0.010997,0.012701,0.005545,0.010882,-0.01839,-0.002396,0.008529,-0.015515,0.00328,0.000177,-0.005979,-0.000474,0.009878,0.002668,-0.015074,0.023535,0.025727,-0.005711,-0.003026,-0.0021,0.010756,-0.007389,0.022679,-0.021783,0.011469,0.023369,0.013543,0.005819,-0.008193,-0.022173,0.010043,-0.010266,0.004841,0.003978,0.006775,0.023316,-0.002508,-0.010891,-0.00632,-0.007378,-0.009789,-0.001304,-0.019433,0.00726,-0.013169,-0.005807,0.003505,0.002077,0.0087,0.003708,-0.009396,0.001097,0.005384,-0.021981,0.014758,0.001323
4,0.260418,0.001437,0.023826,-0.039866,-0.012193,0.048333,0.003216,0.018025,0.000457,0.010451,-0.007496,0.005901,-0.013798,-0.00127,0.006453,-0.006204,-0.013362,-0.00464,-0.011439,0.004546,-0.020052,0.021943,-0.038509,-0.031898,0.021489,-0.04358,0.026812,0.028345,-0.051297,-0.026968,0.002224,0.008726,0.006622,0.004064,0.009595,-0.014266,0.000759,-0.018837,-0.017229,-0.012619,-0.015413,0.001253,-0.002926,-0.005068,-0.006741,0.008884,-0.026707,0.007758,-0.002768,0.019606,0.0084,0.002017,0.007639,-0.024668,-0.019798,-0.009077,0.010443,0.014548,-0.003935,-0.001725,-0.012165,-0.014666,0.00495,0.020164,-0.020817,-0.003486,-0.001153,-0.021603,0.006628,0.014381,0.002429,0.008681,0.005371,-0.006455,0.007451,-0.007448,-0.008729,-0.008689,0.027924,0.003964,0.004692,-0.009452,0.040757,-0.002294,-0.031132,-0.027936,0.01816,0.000445,0.027245,-0.01469,-0.009801,0.025528,-0.010282,-0.003054,0.008385,0.020047,0.018788,-0.015323,0.011298,0.001274,-0.012685,0.011211,-0.003496,-0.015086,0.018461,0.010039,0.004739,0.008245,-0.009951,0.010161,0.003167,0.008002,0.006856,0.045457,-0.003717,0.005907,-0.006409,-0.005648,-0.00528,0.002772,-0.019114,0.002834,-0.023933,0.020473,0.008406,-0.004248,-0.01397,-0.01335,-0.001464,0.030525,0.036413,-0.008728,0.009513,-0.005477,-0.002815,-0.016502,-0.020021,-0.002263,-0.007754,0.028613,-0.027242,0.006785,0.017183,-0.017848,-0.007099,0.008683,-0.009221,-0.0066,0.011027,0.008383,-0.006325,0.003703,0.001017,0.01697,-0.007225,0.003562,-0.00077,-0.013412,9e-06,0.003014,-0.002322,0.00144,0.002704,-0.001626,0.020536,0.004499,-0.015401,0.015077,-0.007936,-0.013811,0.008415,0.013475,0.00319,0.039058,-0.003731,-0.018056,0.005108,-0.003523,0.003485,0.012334,0.026674,-0.011207,0.011113,-0.015886,0.008407,-0.005337,0.011466,-0.003606,0.00555,-0.013253,0.005936,-0.012032,-0.019458,0.022411,0.026451,-0.010068,0.012942,0.007071,0.010529,0.005094,0.005497,-0.017846,0.014543,0.000704,0.002868,0.001769,0.000755,-0.0167,0.006314,-0.026375,0.02485,0.010919,0.008715,-0.025685,0.006094,-0.010598,0.022431,0.002813,-0.008159,-0.01669,0.007257,-0.000645,-0.005431,0.006583,-0.019347,-0.005865,0.004368,-0.007054,-0.008473,-0.013201,0.004146,0.006203,-0.024055,-0.035922,-0.018692,0.003655,0.002455,-0.013312,-0.0142,-0.000274,0.010439,0.015272,0.003749,-0.002744,0.001232,-0.000504,-0.007763,0.004023,0.007308,-0.010887,...,-0.013173,0.023503,-0.010245,-0.015603,0.026,0.029594,0.001302,-0.021453,0.02307,0.006232,0.005747,0.006323,-0.008617,0.011267,0.015093,-0.005216,0.015048,0.002781,-0.02322,0.005438,-0.001666,0.002513,-0.011097,0.01738,-0.008317,-0.004583,-0.002354,0.007639,0.013353,-0.013146,-0.025517,-0.0271,-0.006591,0.001843,0.001062,-0.012657,-0.007179,-0.039001,-0.003399,0.005394,0.009915,-0.027925,0.000765,0.012588,-0.008022,-0.001207,-0.010596,-0.002761,-0.007922,0.002595,-0.031436,0.004379,5.4e-05,-0.008197,-0.018943,-0.010019,0.006205,0.005405,0.009652,-0.023458,0.025697,-0.005892,-0.01169,-0.027872,0.001346,-0.011951,0.004023,0.006672,0.034805,-0.01774,0.004024,0.00501,-0.003977,0.034318,0.02068,-0.008413,-0.002519,0.011755,0.000651,-0.033324,-0.013947,0.011879,-0.003168,0.000963,0.014483,-0.010325,0.006459,-0.030672,0.010891,0.004653,-0.025613,0.017819,-0.015316,0.014326,0.029078,-0.001413,-0.015053,-0.015853,-0.004021,0.030505,0.009326,4.9e-05,0.009161,-0.010304,-0.004189,-0.015463,0.016571,0.012624,0.003678,-0.001421,0.015006,0.008807,-0.007519,0.026629,-0.007716,-0.015358,0.023818,-0.00792,0.023507,-0.028177,0.000231,0.011322,0.025646,-0.005576,0.006567,-0.002166,-0.010547,0.01199,0.004171,-0.003129,-0.00584,0.003658,-0.031407,0.022655,7.8e-05,0.016811,0.03095,-0.00353,0.004136,-0.004726,-0.011563,0.007177,-0.017104,-0.04369,0.024385,0.016168,-0.006112,0.012056,0.01702,-0.0144,0.022438,-0.026379,0.012208,-0.009011,-0.007607,-0.017701,0.02037,-0.007433,-0.001069,0.011731,0.015423,0.010314,0.025385,-0.005858,-0.005249,0.002673,0.021611,-0.029679,0.001213,0.006744,0.044891,0.013353,0.02231,0.010267,-0.008566,-0.012184,-0.024157,0.003042,-0.014568,-0.005744,-0.005019,0.011744,0.016017,0.016955,-0.018329,0.018231,0.01226,0.034439,0.01607,0.018735,-0.004544,0.003598,0.008704,0.028522,-0.008638,0.006914,-0.01909,-0.023486,0.001516,-0.017873,-0.013283,0.001644,0.046562,0.006549,-0.00219,-0.007218,0.013065,0.001522,0.015876,0.017838,-0.023688,0.001774,-0.012914,-0.009435,0.027438,-0.015447,0.002116,-0.024751,0.020434,0.028441,0.027867,0.01051,0.012785,0.007194,0.015611,0.015381,0.003264,-0.041768,-0.013986,0.003217,-0.008579,-0.016507,-0.008806,-0.024715,-0.017433,0.04227,0.033567,0.011603,0.008257,0.020121,-0.00271,-0.004643,-0.003341,0.037405,-0.018459,-0.00043,0.024612,-0.003941,0.022521,-0.018837


# w2vによる特徴抽出

https://qiita.com/propella/items/febc423998fd210800ca
よりフォーク

In [26]:
#単語に対して分散表現を与える
from gensim.models.doc2vec import Doc2Vec, TaggedDocument
documents = [TaggedDocument(doc, [i]) for i, doc in enumerate(merge_df_new["cleaned_text"])]
model = Doc2Vec(documents, vector_size=100, window=5, min_count=1, workers=4)



In [None]:
#コサイン類似度が上位n個のものを抽出
n = 10
for i in range(len(merge_df_new)):
  print(i)
  for j in range(n):
    merge_df_new.loc[i, 'similar{}'.format(j)] = model.docvecs.most_similar(i)[j][0]

In [28]:
merge_df_new.head()

Unnamed: 0,id,goal,country,duration,category1,category2,html_content,state,cleaned_text,goal_min,goal_max,goal_per_day_max,goal_per_day_min,goal_1-1000,goal_100000+,goal_10001-11000,goal_1001-2000,goal_11001-12000,goal_12001-13000,goal_13001-14000,goal_14001-15000,goal_15001-16000,goal_16001-17000,goal_17001-18000,goal_18001-19000,goal_19001-20000,goal_20001-21000,goal_2001-3000,goal_21001-22000,goal_22001-23000,goal_23001-24000,goal_24001-25000,goal_25001-26000,goal_26001-27000,goal_27001-28000,goal_28001-29000,goal_29001-30000,goal_30001-31000,goal_3001-4000,goal_31001-32000,goal_32001-33000,goal_33001-34000,goal_34001-35000,goal_35001-36000,goal_36001-37000,goal_37001-38000,goal_38001-39000,goal_39001-40000,goal_40001-41000,goal_4001-5000,goal_41001-42000,goal_42001-43000,goal_43001-44000,goal_44001-45000,goal_45001-46000,goal_46001-47000,goal_47001-48000,goal_48001-49000,goal_49001-50000,goal_50001-51000,goal_5001-6000,goal_51001-52000,goal_52001-53000,goal_53001-54000,goal_54001-55000,goal_55001-56000,goal_56001-57000,goal_57001-58000,goal_58001-59000,goal_59001-60000,goal_60001-61000,goal_6001-7000,goal_61001-62000,goal_62001-63000,goal_63001-64000,goal_64001-65000,goal_65001-66000,goal_66001-67000,goal_67001-68000,goal_68001-69000,goal_69001-70000,goal_70001-71000,goal_7001-8000,goal_71001-72000,goal_72001-73000,goal_73001-74000,goal_74001-75000,goal_75001-76000,goal_76001-77000,goal_77001-78000,goal_78001-79000,goal_79001-80000,goal_80001-81000,goal_8001-9000,goal_81001-82000,goal_82001-83000,goal_83001-84000,goal_84001-85000,goal_85001-86000,goal_86001-87000,goal_87001-88000,goal_88001-89000,goal_89001-90000,goal_90001-91000,goal_9001-10000,goal_91001-92000,goal_92001-93000,goal_93001-94000,goal_94001-95000,goal_95001-96000,goal_96001-97000,goal_97001-98000,goal_98001-99000,goal_99001-100000,country_AT,country_AU,country_BE,country_CA,country_CH,country_DE,country_DK,country_ES,country_FR,country_GB,country_HK,country_IE,country_IT,country_JP,country_LU,country_MX,country_NL,country_NO,country_NZ,country_SE,country_SG,country_US,category1_art,category1_comics,category1_crafts,category1_dance,category1_design,category1_fashion,category1_film & video,category1_food,category1_games,category1_journalism,category1_music,category1_photography,category1_publishing,category1_technology,category1_theater,category2_3d printing,category2_academic,category2_accessories,category2_action,category2_animals,category2_animation,category2_anthologies,category2_apparel,category2_apps,category2_architecture,category2_art books,category2_audio,category2_bacon,category2_blues,category2_calendars,category2_camera equipment,category2_candles,category2_ceramics,category2_children's books,category2_childrenswear,category2_chiptune,category2_civic design,category2_classical music,category2_comedy,category2_comic books,category2_community gardens,category2_conceptual art,category2_cookbooks,category2_country & folk,category2_couture,category2_crochet,category2_digital art,category2_diy,category2_diy electronics,category2_documentary,category2_drama,category2_drinks,category2_electronic music,category2_embroidery,category2_events,category2_experimental,category2_fabrication tools,category2_faith,category2_family,category2_fantasy,category2_farmer's markets,category2_farms,category2_festivals,category2_fiction,category2_fine art,category2_flight,category2_food trucks,category2_footwear,category2_gadgets,category2_gaming hardware,category2_glass,category2_graphic design,category2_graphic novels,category2_hardware,category2_hip-hop,category2_horror,category2_illustration,category2_immersive,category2_indie rock,category2_installations,category2_interactive design,category2_jazz,category2_jewelry,category2_kids,category2_knitting,category2_latin,category2_letterpress,category2_literary journals,category2_literary spaces,category2_live games,category2_makerspaces,category2_metal,category2_mixed media,category2_mobile games,category2_movie theaters,category2_music videos,category2_musical,category2_narrative film,category2_nature,category2_nonfiction,category2_painting,category2_people,category2_performance art,category2_performances,category2_periodicals,category2_pet fashion,category2_photo,category2_photobooks,category2_places,category2_playing cards,category2_plays,category2_poetry,category2_pop,category2_pottery,category2_print,category2_printing,category2_product design,category2_public art,category2_punk,category2_puzzles,category2_quilts,category2_r&b,category2_radio & podcasts,category2_ready-to-wear,category2_residencies,category2_restaurants,category2_robots,category2_rock,category2_romance,category2_science fiction,category2_sculpture,category2_shorts,category2_small batch,category2_social practice,category2_software,category2_sound,category2_space exploration,category2_spaces,category2_stationery,category2_tabletop games,category2_television,category2_textiles,category2_thrillers,category2_toys,category2_translations,category2_typography,category2_vegan,category2_video,category2_video art,category2_video games,category2_wearables,category2_weaving,category2_web,category2_webcomics,category2_webseries,category2_woodworking,category2_workshops,category2_world music,category2_young adult,category2_zines,similar0,similar1,similar2,similar3,similar4,similar5,similar6,similar7,similar8,similar9
0,train_00000,13,21,45,0,77,"<div class=""contents""><div><p><a href=""http://dummy.com"">http://dummy.com<p>In its first year, The Shillito's Elves Display won an international \ndesign award for Shillito's department store. The elves display is arts\n and crafts at its finest. The mixed media exhibit displays the talents\n of local fine arts graduates, and the display, while ""folksy"", is as \ntechnologically advanced as Disney World's famous ""It's a Small World"" \nride. </p><p>The Shillito's Elves attracted close to 100...",1.0,"http://dummy.comIn its first year, The Shillito's Elves Display won an international \ndesign award for Shillito's department store. The elves display is arts\n and crafts at its finest. The mixed media exhibit displays the talents\n of local fine arts graduates, and the display, while ""folksy"", is as \ntechnologically advanced as Disney World's famous ""It's a Small World"" \nride. The Shillito's Elves attracted close to 100,000 people each\n year. It was one of the most beloved Christmas ...",20001,21000,466.666667,444.466667,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,17777.0,18927.0,18186.0,19377.0,3618.0,2223.0,14866.0,1928.0,4056.0,12259.0
1,train_00001,12,21,59,7,110,"<div class=""contents""><div><p>Cultural Pretzel Sports Bar is a place where people can come and watch their favorite local and world wide sports teams, while enjoying their favorite ethnic foods on a soft pretzel. Our menu includes a variety of appetizers and soft pretzels. Our pretzels include - Mexican Taco, Mexican Steak Fajita, Greek Gyro, Italian Sausage and Peppers, and American Steak Philly Soft Pretzels. With more to be added to the menu as the business grows.</p><p>Cultural Pretze...",0.0,"Cultural Pretzel Sports Bar is a place where people can come and watch their favorite local and world wide sports teams, while enjoying their favorite ethnic foods on a soft pretzel. Our menu includes a variety of appetizers and soft pretzels. Our pretzels include - Mexican Taco, Mexican Steak Fajita, Greek Gyro, Italian Sausage and Peppers, and American Steak Philly Soft Pretzels. With more to be added to the menu as the business grows.Cultural Pretzel plans to start with one Sports Bar ...",19001,20000,338.983051,322.050847,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,19176.0,16360.0,97.0,2171.0,18606.0,264.0,16191.0,15756.0,18700.0,1250.0
2,train_00002,14,21,38,0,87,"<div class=""contents""><div><p>I want to perform this piece guerilla style, off the back off a 24 Ft truck on Christmas Eve, amid last minute Christmas shopping in New York City.</p>\n<p>Our truck pulls in, the door rolls up and I perform. </p>\n<p>New York is a city where you just do it - no excuses. A place where the new becomes the normal real fast and where the artist is challenged to capture the attention and the hearts of the unshockable and unstoppable. In times of celebration and re...",0.0,"I want to perform this piece guerilla style, off the back off a 24 Ft truck on Christmas Eve, amid last minute Christmas shopping in New York City.\nOur truck pulls in, the door rolls up and I perform. \nNew York is a city where you just do it - no excuses. A place where the new becomes the normal real fast and where the artist is challenged to capture the attention and the hearts of the unshockable and unstoppable. In times of celebration and rest our intellectual faculties are more easil...",2001,3000,78.947368,52.657895,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,183.0,181.0,14.0,10.0,409.0,9.0,7.0,197.0,143.0,199.0
3,train_00003,3,21,30,0,77,"<div class=""contents""><div><div class=""template asset"" contenteditable=""false"" data-alt-text="""" data-caption="""" data-id=""_xxx_"">\n<figure>\n<img alt="""" class=""fit lazyload"" data-src=""http://dummy.com""/>\n</figure>\n</div>\n<h1 class=""page-anchor"" id=""_xxx_"">\n<figure>\n<img alt=""Canyon de Chelley, Dine' (Navajo) Reservation, Arizona. Photo by: Demian Dine' Yazhi'"" class=""fit lazyload"" data-src=""http://dummy.com""/>\n<figcaption class=""px2"">Canyon de Chelley, Dine' (Navajo) Reservation, Arizo...",1.0,"\n\n\n\n\n\n\n\nCanyon de Chelley, Dine' (Navajo) Reservation, Arizona. Photo by: Demian Dine' Yazhi'\n\n\nAnother goal of the project is to actively document the process through photography, digital video, and text/prose/poetry. By using a variety of media and content, I hope this will help the project to take a unique shape as the weeks unfold. Ultimately, the end goal of TRANSPLANT ///. is independent zine distribution and a potential gallery showing. At this point, my interests lie i...",1001,2000,66.666667,33.366667,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,392.0,405.0,718.0,588.0,164.0,5.0,197.0,117.0,447.0,218.0
4,train_00004,3,21,29,6,139,"<div class=""contents""><div><p>The story of the show, both on and off screen, is about daring to dream after something impossible.Even with an incredible amount of difficulty and opposition, the project continued to grow in size and depth. A year ago, we were finally able to release the pilot episode of Azusa Ghost Hunter's Society (check it out! <a href=""http://dummy.com"">\n<figure>\n<img alt="""" class=""fit lazyload"" data-src=""http://dummy.com""/>\n</figure>\n</div>\n<p>Which brings us to now...",1.0,"The story of the show, both on and off screen, is about daring to dream after something impossible.Even with an incredible amount of difficulty and opposition, the project continued to grow in size and depth. A year ago, we were finally able to release the pilot episode of Azusa Ghost Hunter's Society (check it out! \n\n\n\n\nWhich brings us to now! We have three more episodes in the works to finish out the season, and we need your help to bring them to life! All financial support will go t...",1001,2000,68.965517,34.517241,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,18547.0,18429.0,16105.0,15984.0,3194.0,4070.0,17278.0,2735.0,18813.0,6928.0


# データのマージ/kmeans用の前処理

In [29]:
#不要なカラムの定義
non_use_cols = ['id',	'html_content',	'cleaned_text', 'state']

#スケーリングするカラムの選択
sc_cols = ['duration', 'goal_max', 'goal_min', 'goal_per_day_max', 'goal_per_day_min']

In [30]:
#bertから抽出した特徴量を追加
full_merge_df = pd.merge(merge_df_new.drop(non_use_cols, axis=1), merge_text, left_index=True, right_index=True)

In [31]:
#tfidfから抽出した特徴量を追加
full_merge_df_fin = pd.merge(full_merge_df, svd_df_merge, left_index=True, right_index=True)

In [32]:
full_merge_df_fin.head()

Unnamed: 0,goal,country,duration,category1,category2,goal_min,goal_max,goal_per_day_max,goal_per_day_min,goal_1-1000,goal_100000+,goal_10001-11000,goal_1001-2000,goal_11001-12000,goal_12001-13000,goal_13001-14000,goal_14001-15000,goal_15001-16000,goal_16001-17000,goal_17001-18000,goal_18001-19000,goal_19001-20000,goal_20001-21000,goal_2001-3000,goal_21001-22000,goal_22001-23000,goal_23001-24000,goal_24001-25000,goal_25001-26000,goal_26001-27000,goal_27001-28000,goal_28001-29000,goal_29001-30000,goal_30001-31000,goal_3001-4000,goal_31001-32000,goal_32001-33000,goal_33001-34000,goal_34001-35000,goal_35001-36000,goal_36001-37000,goal_37001-38000,goal_38001-39000,goal_39001-40000,goal_40001-41000,goal_4001-5000,goal_41001-42000,goal_42001-43000,goal_43001-44000,goal_44001-45000,goal_45001-46000,goal_46001-47000,goal_47001-48000,goal_48001-49000,goal_49001-50000,goal_50001-51000,goal_5001-6000,goal_51001-52000,goal_52001-53000,goal_53001-54000,goal_54001-55000,goal_55001-56000,goal_56001-57000,goal_57001-58000,goal_58001-59000,goal_59001-60000,goal_60001-61000,goal_6001-7000,goal_61001-62000,goal_62001-63000,goal_63001-64000,goal_64001-65000,goal_65001-66000,goal_66001-67000,goal_67001-68000,goal_68001-69000,goal_69001-70000,goal_70001-71000,goal_7001-8000,goal_71001-72000,goal_72001-73000,goal_73001-74000,goal_74001-75000,goal_75001-76000,goal_76001-77000,goal_77001-78000,goal_78001-79000,goal_79001-80000,goal_80001-81000,goal_8001-9000,goal_81001-82000,goal_82001-83000,goal_83001-84000,goal_84001-85000,goal_85001-86000,goal_86001-87000,goal_87001-88000,goal_88001-89000,goal_89001-90000,goal_90001-91000,goal_9001-10000,goal_91001-92000,goal_92001-93000,goal_93001-94000,goal_94001-95000,goal_95001-96000,goal_96001-97000,goal_97001-98000,goal_98001-99000,goal_99001-100000,country_AT,country_AU,country_BE,country_CA,country_CH,country_DE,country_DK,country_ES,country_FR,country_GB,country_HK,country_IE,country_IT,country_JP,country_LU,country_MX,country_NL,country_NO,country_NZ,country_SE,country_SG,country_US,category1_art,category1_comics,category1_crafts,category1_dance,category1_design,category1_fashion,category1_film & video,category1_food,category1_games,category1_journalism,category1_music,category1_photography,category1_publishing,category1_technology,category1_theater,category2_3d printing,category2_academic,category2_accessories,category2_action,category2_animals,category2_animation,category2_anthologies,category2_apparel,category2_apps,category2_architecture,category2_art books,category2_audio,category2_bacon,category2_blues,category2_calendars,category2_camera equipment,category2_candles,category2_ceramics,category2_children's books,category2_childrenswear,category2_chiptune,category2_civic design,category2_classical music,category2_comedy,category2_comic books,category2_community gardens,category2_conceptual art,category2_cookbooks,category2_country & folk,category2_couture,category2_crochet,category2_digital art,category2_diy,category2_diy electronics,category2_documentary,category2_drama,category2_drinks,category2_electronic music,category2_embroidery,category2_events,category2_experimental,category2_fabrication tools,category2_faith,category2_family,category2_fantasy,category2_farmer's markets,category2_farms,category2_festivals,category2_fiction,category2_fine art,category2_flight,category2_food trucks,category2_footwear,category2_gadgets,category2_gaming hardware,category2_glass,category2_graphic design,category2_graphic novels,category2_hardware,category2_hip-hop,category2_horror,category2_illustration,category2_immersive,category2_indie rock,category2_installations,category2_interactive design,category2_jazz,category2_jewelry,category2_kids,category2_knitting,category2_latin,category2_letterpress,category2_literary journals,category2_literary spaces,category2_live games,category2_makerspaces,category2_metal,category2_mixed media,category2_mobile games,category2_movie theaters,category2_music videos,category2_musical,category2_narrative film,category2_nature,category2_nonfiction,category2_painting,category2_people,category2_performance art,category2_performances,category2_periodicals,category2_pet fashion,category2_photo,category2_photobooks,category2_places,category2_playing cards,category2_plays,category2_poetry,category2_pop,category2_pottery,category2_print,category2_printing,category2_product design,category2_public art,...,750,751,752,753,754,755,756,757,758,759,760,761,762,763,764,765,766,767,768,769,770,771,772,773,774,775,776,777,778,779,780,781,782,783,784,785,786,787,788,789,790,791,792,793,794,795,796,797,798,799,800,801,802,803,804,805,806,807,808,809,810,811,812,813,814,815,816,817,818,819,820,821,822,823,824,825,826,827,828,829,830,831,832,833,834,835,836,837,838,839,840,841,842,843,844,845,846,847,848,849,850,851,852,853,854,855,856,857,858,859,860,861,862,863,864,865,866,867,868,869,870,871,872,873,874,875,876,877,878,879,880,881,882,883,884,885,886,887,888,889,890,891,892,893,894,895,896,897,898,899,900,901,902,903,904,905,906,907,908,909,910,911,912,913,914,915,916,917,918,919,920,921,922,923,924,925,926,927,928,929,930,931,932,933,934,935,936,937,938,939,940,941,942,943,944,945,946,947,948,949,950,951,952,953,954,955,956,957,958,959,960,961,962,963,964,965,966,967,968,969,970,971,972,973,974,975,976,977,978,979,980,981,982,983,984,985,986,987,988,989,990,991,992,993,994,995,996,997,998,999
0,13,21,45,0,77,20001,21000,466.666667,444.466667,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.016099,0.012883,-0.012841,0.007548,-0.002943,0.012171,-0.006604,-0.005415,-0.007829,0.007166,-0.003168,-0.001466,0.008689,-0.018905,-0.011179,-0.008115,0.022747,-0.00931,0.004477,-0.006221,-0.006181,0.029164,0.012193,-0.006215,-0.008985,-0.011839,-0.000163,-0.000881,0.026042,-0.009521,-0.00824,0.006103,0.009046,0.029958,-0.001803,-0.011523,0.002099,0.012144,-0.013081,-0.023165,-0.00018,0.006197,-0.009419,0.01424,0.003808,0.009915,-0.015102,0.022243,0.016207,0.010521,-0.014451,-0.00739,0.00176,-0.006443,0.013258,0.003821,-0.018041,0.006343,-0.008321,-0.017759,0.037882,0.007056,0.006074,0.00841,-0.00243,0.004689,0.013723,0.001751,-0.005835,0.00829,-0.007839,-0.002283,0.020922,0.030412,0.017098,-0.002124,-0.012072,0.012636,-0.004065,0.012042,-0.016107,-0.003588,0.006715,-0.000571,-0.014769,-0.000543,0.01913,0.026,-0.011347,0.009438,0.006729,-0.018298,0.009277,0.004362,-0.036778,-0.011224,0.005278,-0.025055,-0.005119,0.005691,0.024141,-0.01107,-0.013339,0.002221,0.010723,0.002505,-0.016674,-0.007536,0.001639,-0.011075,0.008626,-0.007707,0.034665,-0.002003,-0.003024,-0.012765,0.020067,-0.029421,-0.02669,-0.006795,-0.016024,-0.02877,-0.023783,0.004518,0.016675,0.013916,0.002384,-0.011357,-0.003361,-0.001323,0.005599,0.017254,0.003251,-0.029765,0.017826,0.019395,0.012429,-0.013652,-0.005969,0.001635,-0.003851,0.007266,0.007584,0.024149,-0.016264,0.016645,0.007142,-0.001446,0.011135,0.00882,0.010148,-0.01518,-0.008931,0.001281,0.022528,0.006061,0.010228,0.021073,0.013032,0.009872,-0.002013,-0.010935,-0.022775,0.016848,0.00115,-0.009085,0.011367,0.014402,0.014905,0.010605,0.013383,0.017596,-0.00983,0.012473,0.01669,0.021795,0.020104,-0.002639,0.007445,-0.00202,0.03592,-0.008698,0.000678,0.010546,0.017188,0.007885,0.012775,0.003499,-0.001949,-0.008935,-0.018692,0.004765,0.002306,-0.035943,0.004474,-0.003377,-0.009865,-0.00065,-0.00639,0.006445,-0.015233,0.016457,0.000989,0.007472,0.008095,0.000736,0.007946,0.002536,-0.003446,0.007217,0.008118,-0.002294,0.008856,-0.002071,-0.005032,-0.005876,0.01849,-0.015047,-0.012355,-0.006415,-0.028527,0.012203,0.002919,0.008932,-0.007454,0.018613,-0.008403,0.001163,-0.01645,-0.011396,-0.003107,0.014947,0.01684,-0.026257,-0.008401,-0.012782,-0.010434,0.010039,0.011844,0.02103,0.000124,0.000489,-0.009038,-0.000686,0.007243,-0.002014,0.008054,-0.018337,-0.023733,-0.020279
1,12,21,59,7,110,19001,20000,338.983051,322.050847,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.014491,0.021563,-0.00191,-0.027161,-0.012628,-0.005645,-0.019387,0.009913,-0.000309,0.010775,-0.00722,-0.004204,-0.003175,0.000653,-0.002736,5.4e-05,-0.020718,0.004102,0.022705,0.013215,-0.000467,0.010435,-0.019733,-0.016565,0.02263,0.004184,0.015468,-0.003021,-0.007257,0.007486,0.022607,0.008557,-0.001968,-0.004975,-0.006968,-0.001328,-0.016286,-0.027568,-0.004201,0.000924,0.004066,-0.001837,0.015101,-0.00818,0.006889,-0.007366,0.012027,-0.019927,0.017396,0.001098,0.008229,-0.006866,-0.005379,0.009148,0.001501,-0.003874,0.001819,-0.012747,-0.017725,0.006927,-0.010464,-0.005854,-0.001681,-0.007335,-0.009632,0.008367,-0.018594,-0.002657,0.002032,0.017999,0.032068,-0.004056,0.02175,0.013154,0.009671,0.014351,0.00351,0.01613,0.014172,0.025033,0.002877,-0.010961,-0.016607,-0.010237,-0.021819,-0.011139,0.01957,0.007313,-0.005829,0.002248,0.014776,-0.02375,-0.007566,0.0181,0.022587,-0.01401,0.006129,-0.000616,-0.026692,0.024902,-0.029891,0.012419,-0.01117,0.006421,0.004966,0.015502,-0.016539,-0.000376,-0.004348,0.020437,0.009455,-0.00836,-0.000999,-0.0387,0.005629,0.015564,0.002159,0.001678,0.002856,-0.01193,0.000469,-0.003209,-0.018165,-0.016314,-0.001649,-0.008824,-0.00777,0.003651,-0.005602,-0.001789,-0.024382,-0.014518,0.007571,0.008288,-0.00601,0.006855,-0.015831,-0.012372,-0.0153,-0.006085,0.006057,0.004746,-0.013825,-0.003538,0.009069,-0.008544,-0.001935,-0.004956,-0.004616,-0.025658,-0.020609,0.000116,0.006831,0.014914,0.012233,-0.003559,-0.012581,-0.02491,0.003656,-0.005802,0.007581,0.008013,-0.008877,-0.020485,-7e-06,0.02812,-0.022953,0.000516,0.021637,-0.014669,-0.008374,-0.002591,0.000908,0.018143,-0.017998,-0.018524,-0.001669,-0.00564,-0.01516,-0.00566,-0.006,-0.002963,-0.009491,0.001823,-0.002844,0.003992,-0.017427,0.009456,0.003433,0.007122,-0.004276,-0.018932,0.001612,-0.037727,-0.006228,0.033435,-0.026799,-0.018439,-0.002599,0.001306,-0.007357,-0.004787,-0.00831,-0.024953,0.020005,0.002315,-0.00773,0.003005,-0.021059,-0.008973,-0.01052,0.018879,-0.017572,0.001697,0.017083,-0.015465,-0.010573,0.008283,-0.003409,0.000338,-0.013632,0.010031,0.002132,0.011786,-0.004094,-0.002239,-0.028196,0.002179,0.002188,0.002522,0.016844,-0.013167,0.007012,-0.001568,-0.026436,0.010996,0.011933,0.029659,0.00392,-0.004853,-0.004148,-0.008931,-0.000211,-0.00533,0.000174,0.008596,0.006749,-0.010743,-0.001232,0.001835
2,14,21,38,0,87,2001,3000,78.947368,52.657895,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.014857,-0.00216,-0.011976,0.020542,-0.006018,-0.027447,0.013445,-0.01198,0.01235,0.009707,0.013402,0.005683,0.000625,0.026848,-0.010496,0.008083,-0.010812,-0.001824,-0.028365,-0.02889,0.008116,0.008144,-0.002608,0.004059,0.003763,0.011824,-0.03439,0.008332,-0.010611,0.011242,-0.003349,-0.006388,0.017141,-0.002094,0.021249,-0.010146,-0.008463,0.006551,-0.013283,0.009914,-0.005801,0.029222,-0.015934,-0.000666,-0.002653,-0.011533,0.010184,-0.003417,0.006184,0.027988,0.00926,-0.008196,0.015286,0.007804,0.007631,0.020264,0.013792,0.00459,-0.012086,-0.025707,0.001059,-0.008521,0.010453,0.006803,0.007349,-0.01384,0.015168,-0.019589,0.00084,0.003193,-0.003203,0.005045,0.017933,0.000784,-0.012789,0.00148,0.018621,-0.017031,0.002626,0.003433,-0.004536,0.002009,-0.013262,0.007675,0.000336,-0.01075,-0.012059,-0.022031,0.000461,0.013457,-0.016934,-0.012933,0.003099,0.026767,0.013726,-0.017949,-0.011543,0.020636,-0.000441,0.011238,-0.011171,-0.00765,0.015625,0.003788,-0.020689,0.019662,-0.008173,0.014061,-0.000284,-0.026717,0.008861,-0.009344,-0.007306,-0.018563,0.019679,0.003151,-0.013251,-0.005034,0.014641,-0.005812,0.011181,-0.002103,0.003715,-0.015333,-0.010421,0.010473,-0.00678,-0.016673,-0.009246,0.007189,0.020128,0.004302,-0.012103,-0.005518,-0.001214,0.001717,0.021088,0.008352,-0.000897,-0.016625,0.00088,-0.017332,0.01251,0.008588,0.008806,0.007567,0.018045,0.003331,0.010538,-0.008543,-0.004654,0.000713,-0.014124,-0.010727,0.006192,0.0016,-0.008668,0.004956,-0.004512,-0.014023,-0.012967,-0.000638,0.017548,-0.00768,-0.007315,-0.001778,-0.000527,0.030791,0.002955,-6.9e-05,0.004696,0.009216,-0.002777,-0.006202,-0.00383,0.004999,0.01092,-0.0008,0.002981,0.013403,-0.006788,0.009266,-0.00161,0.006845,-0.001608,-0.006379,-0.004918,0.006208,-0.019745,-0.001083,0.01084,-0.018603,0.021087,-0.013267,0.013273,0.000572,0.012304,0.015473,-0.001938,-0.016747,-0.011603,0.00049,0.006754,-0.015257,-0.004887,0.012116,0.022651,-0.007946,0.000725,-0.012088,-0.008467,0.005077,0.001769,-0.011165,-0.006992,0.009142,-0.004191,-0.012172,-0.006984,0.014484,-0.022477,-0.005632,0.018116,0.003595,-0.004487,-0.016404,-0.008032,-0.005169,-0.005786,-0.010108,0.011953,0.006167,0.006354,0.011018,-0.000981,-0.001572,-0.005907,0.00932,0.013183,-0.007182,0.012934,0.014778,0.017162,-0.000349,0.000987,0.015633,0.008954,-0.010348,0.006575,-0.014112
3,3,21,30,0,77,1001,2000,66.666667,33.366667,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,0.011632,0.003777,-0.005038,-0.03486,-0.002287,0.007412,-0.032065,0.027521,0.00441,0.004578,-0.007357,-0.010225,0.024198,-0.008371,0.007081,-0.011657,0.003902,0.002629,-0.002359,0.003715,0.000919,-0.024047,0.023534,0.00192,0.005026,-0.025874,0.002473,0.009828,-0.00022,-0.013283,0.015758,-0.019447,0.003965,-0.007609,0.000406,-0.008155,0.001179,-0.024954,0.003644,0.008312,0.000676,0.012392,-0.009195,-0.015123,-0.005614,-0.01256,-0.016877,0.010155,0.002459,0.010004,0.023314,0.008574,0.008594,-0.005049,0.036177,-0.0035,0.001582,0.002943,-0.003729,-0.006037,-0.002205,0.005887,0.009146,-0.002269,0.001287,-0.010818,-0.025416,0.017802,0.026037,0.00656,-0.004174,0.000747,-0.015709,0.000676,-0.025741,0.004742,0.012904,-0.00106,0.013402,0.017817,0.010493,0.003192,-0.012465,0.003589,0.001525,-0.002632,-0.012802,-0.018991,-0.006782,-0.013642,0.020988,-0.003163,0.00317,-0.014955,-0.020833,0.006626,0.014323,0.01657,0.001981,-0.011016,-0.006053,0.011569,0.032834,0.005437,-0.01757,0.032496,0.024372,-0.003924,0.012155,0.013369,-0.007649,-0.012178,-0.001225,-0.003112,-0.002941,-0.027923,-0.018719,-0.001747,0.006152,-0.014483,0.006486,-0.001865,-0.015074,-0.01919,-0.0011,-0.021225,0.01264,-0.002907,0.016307,0.017844,-0.001223,0.003435,0.003767,0.007851,0.005853,0.024788,-0.006201,0.015758,-0.019047,-0.003009,-0.006989,-0.007274,0.008466,-0.011538,-0.013219,-0.006061,0.013187,0.022545,0.001105,-0.022129,-0.025426,-0.019197,0.008071,-0.002727,0.009418,0.01047,-0.015868,0.014608,0.01331,-0.012707,3.2e-05,-0.014194,-0.008931,-0.000238,-0.012185,0.01785,-0.024195,0.001021,0.006956,-0.011032,-0.003599,0.011939,0.001227,-0.005888,0.009995,-0.009991,-0.010683,-0.002204,-0.005606,-0.012877,0.013541,-0.009793,-0.006724,-0.005561,0.013113,0.020208,-0.020939,-0.007329,-0.002547,-0.001549,0.003672,0.00689,0.001792,-0.000765,0.010997,0.012701,0.005545,0.010882,-0.01839,-0.002396,0.008529,-0.015515,0.00328,0.000177,-0.005979,-0.000474,0.009878,0.002668,-0.015074,0.023535,0.025727,-0.005711,-0.003026,-0.0021,0.010756,-0.007389,0.022679,-0.021783,0.011469,0.023369,0.013543,0.005819,-0.008193,-0.022173,0.010043,-0.010266,0.004841,0.003978,0.006775,0.023316,-0.002508,-0.010891,-0.00632,-0.007378,-0.009789,-0.001304,-0.019433,0.00726,-0.013169,-0.005807,0.003505,0.002077,0.0087,0.003708,-0.009396,0.001097,0.005384,-0.021981,0.014758,0.001323
4,3,21,29,6,139,1001,2000,68.965517,34.517241,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.013173,0.023503,-0.010245,-0.015603,0.026,0.029594,0.001302,-0.021453,0.02307,0.006232,0.005747,0.006323,-0.008617,0.011267,0.015093,-0.005216,0.015048,0.002781,-0.02322,0.005438,-0.001666,0.002513,-0.011097,0.01738,-0.008317,-0.004583,-0.002354,0.007639,0.013353,-0.013146,-0.025517,-0.0271,-0.006591,0.001843,0.001062,-0.012657,-0.007179,-0.039001,-0.003399,0.005394,0.009915,-0.027925,0.000765,0.012588,-0.008022,-0.001207,-0.010596,-0.002761,-0.007922,0.002595,-0.031436,0.004379,5.4e-05,-0.008197,-0.018943,-0.010019,0.006205,0.005405,0.009652,-0.023458,0.025697,-0.005892,-0.01169,-0.027872,0.001346,-0.011951,0.004023,0.006672,0.034805,-0.01774,0.004024,0.00501,-0.003977,0.034318,0.02068,-0.008413,-0.002519,0.011755,0.000651,-0.033324,-0.013947,0.011879,-0.003168,0.000963,0.014483,-0.010325,0.006459,-0.030672,0.010891,0.004653,-0.025613,0.017819,-0.015316,0.014326,0.029078,-0.001413,-0.015053,-0.015853,-0.004021,0.030505,0.009326,4.9e-05,0.009161,-0.010304,-0.004189,-0.015463,0.016571,0.012624,0.003678,-0.001421,0.015006,0.008807,-0.007519,0.026629,-0.007716,-0.015358,0.023818,-0.00792,0.023507,-0.028177,0.000231,0.011322,0.025646,-0.005576,0.006567,-0.002166,-0.010547,0.01199,0.004171,-0.003129,-0.00584,0.003658,-0.031407,0.022655,7.8e-05,0.016811,0.03095,-0.00353,0.004136,-0.004726,-0.011563,0.007177,-0.017104,-0.04369,0.024385,0.016168,-0.006112,0.012056,0.01702,-0.0144,0.022438,-0.026379,0.012208,-0.009011,-0.007607,-0.017701,0.02037,-0.007433,-0.001069,0.011731,0.015423,0.010314,0.025385,-0.005858,-0.005249,0.002673,0.021611,-0.029679,0.001213,0.006744,0.044891,0.013353,0.02231,0.010267,-0.008566,-0.012184,-0.024157,0.003042,-0.014568,-0.005744,-0.005019,0.011744,0.016017,0.016955,-0.018329,0.018231,0.01226,0.034439,0.01607,0.018735,-0.004544,0.003598,0.008704,0.028522,-0.008638,0.006914,-0.01909,-0.023486,0.001516,-0.017873,-0.013283,0.001644,0.046562,0.006549,-0.00219,-0.007218,0.013065,0.001522,0.015876,0.017838,-0.023688,0.001774,-0.012914,-0.009435,0.027438,-0.015447,0.002116,-0.024751,0.020434,0.028441,0.027867,0.01051,0.012785,0.007194,0.015611,0.015381,0.003264,-0.041768,-0.013986,0.003217,-0.008579,-0.016507,-0.008806,-0.024715,-0.017433,0.04227,0.033567,0.011603,0.008257,0.020121,-0.00271,-0.004643,-0.003341,0.037405,-0.018459,-0.00043,0.024612,-0.003941,0.022521,-0.018837


In [33]:
#sc_colsのスケーリング
from sklearn.preprocessing import StandardScaler

for c in sc_cols:
  std = StandardScaler()
  full_merge_df_fin[c] = std.fit_transform(pd.DataFrame(full_merge_df_fin[c]))

# kmeansによるクラスタリング

In [40]:
from sklearn.cluster import KMeans
non_use_cols_for_km = [
    'goal', 
    'country', 
    'category1', 
    'category2', 
    'similar0', 'similar1', 'similar2', 'similar3', 'similar4', 'similar5', 'similar6', 'similar7', 'similar8', 'similar9']

In [41]:
# エルボー方による推定。クラスター数を1から20に増やして、それぞれの距離の総和を求める
"""
dist_list =[]
for i in range(1,50):
    print('今はクラスター数{}のクラスタリングを実行しています。'.format(i))
    kmeans= KMeans(n_clusters=i, init='random', random_state=0)
    kmeans.fit(full_merge_df_fin.drop(non_use_cols_for_km, axis=1))
    dist_list.append(kmeans.inertia_)
    
# グラフを表示
plt.plot(range(1,50), dist_list,marker='+')
plt.xlabel('Number of clusters')
plt.ylabel('Distortion')
"""

"\ndist_list =[]\nfor i in range(1,50):\n    print('今はクラスター数{}のクラスタリングを実行しています。'.format(i))\n    kmeans= KMeans(n_clusters=i, init='random', random_state=0)\n    kmeans.fit(full_merge_df_fin.drop(non_use_cols_for_km, axis=1))\n    dist_list.append(kmeans.inertia_)\n    \n# グラフを表示\nplt.plot(range(1,50), dist_list,marker='+')\nplt.xlabel('Number of clusters')\nplt.ylabel('Distortion')\n"

In [43]:
#クラスタリング
clusters_list=[5, 10, 15, 20, 30, 50, 100]

for n_clusters in clusters_list:
  print('今クラスター数[{}]のクラスタリングをしています。'.format(n_clusters))
  kmeans = KMeans(init='random', n_clusters=n_clusters, random_state=0)
  kmeans.fit(full_merge_df_fin.drop(non_use_cols_for_km, axis=1))
  full_merge_df_fin['cluster_number_{}'.format(n_clusters)] =pd.Series(kmeans.labels_, name='cluster_number_{}'.format(5))

今クラスター数[5]のクラスタリングをしています。
今クラスター数[10]のクラスタリングをしています。
今クラスター数[15]のクラスタリングをしています。
今クラスター数[20]のクラスタリングをしています。
今クラスター数[30]のクラスタリングをしています。
今クラスター数[50]のクラスタリングをしています。
今クラスター数[100]のクラスタリングをしています。


# aggrigation特徴量の作成

In [44]:
#aggrigationの際にgroup化するカラム
group_cols = ['goal',	'country', 'category1',	'category2', 'cluster_number_5', 'cluster_number_10', 'cluster_number_15', 'cluster_number_20', 'cluster_number_30', 'cluster_number_50', 'cluster_number_100', 'similar0', 'similar1', 'similar2', 'similar3', 'similar4', 'similar5', 'similar6', 'similar7', 'similar8', 'similar9']

In [45]:
#関数定義
def agg_func_duration(input_df, cols):
  agg_func = ["mean", "median", "max", "min", "std"]
  tmp = input_df.groupby([c])["duration"].agg(agg_func)
  output_df = pd.merge(input_df, tmp, how="left", on=[c])[agg_func].add_suffix("_agg_func_duration")

  return output_df

def agg_func_state(input_df, cols):
  agg_func = ["mean", "median", "max", "min", "std"]
  tmp = input_df.groupby([c])["duration"].agg(agg_func)
  output_df = pd.merge(input_df, tmp, how="left", on=[c])[agg_func].add_suffix("_agg_func_state")

  return output_df

def agg_func_goal_per_day_max(input_df, cols):
  agg_func = ["mean", "median", "max", "min", "std"]
  tmp = input_df.groupby([c])["goal_per_day_max"].agg(agg_func)
  output_df = pd.merge(input_df, tmp, how="left", on=[c])[agg_func].add_suffix("_agg_func_state")

  return output_df

def agg_func_goal_per_day_min(input_df, cols):
  agg_func = ["mean", "median", "max", "min", "std"]
  tmp = input_df.groupby([c])["goal_per_day_min"].agg(agg_func)
  output_df = pd.merge(input_df, tmp, how="left", on=[c])[agg_func].add_suffix("_agg_func_state")

  return output_df

In [46]:
#実行の準備
full_merge_df_fin["state"] = train['state']
agg_df = agg_func_duration(full_merge_df_fin, group_cols[0])

In [47]:
#関数の実行
for c in group_cols[1:len(group_cols)]:
  agg_df = pd.merge(agg_df, agg_func_duration(full_merge_df_fin, c), left_index=True, right_index=True)

for c in group_cols:
  agg_df = pd.merge(agg_df, agg_func_state(full_merge_df_fin, c), left_index=True, right_index=True)

for c in group_cols:
  agg_df = pd.merge(agg_df, agg_func_goal_per_day_max(full_merge_df_fin, c), left_index=True, right_index=True)

for c in group_cols:
  agg_df = pd.merge(agg_df, agg_func_goal_per_day_min(full_merge_df_fin, c), left_index=True, right_index=True)

In [48]:
agg_df

Unnamed: 0,mean_agg_func_duration_x,median_agg_func_duration_x,max_agg_func_duration_x,min_agg_func_duration_x,std_agg_func_duration_x,mean_agg_func_duration_y,median_agg_func_duration_y,max_agg_func_duration_y,min_agg_func_duration_y,std_agg_func_duration_y,mean_agg_func_duration_x.1,median_agg_func_duration_x.1,max_agg_func_duration_x.1,min_agg_func_duration_x.1,std_agg_func_duration_x.1,mean_agg_func_duration_y.1,median_agg_func_duration_y.1,max_agg_func_duration_y.1,min_agg_func_duration_y.1,std_agg_func_duration_y.1,mean_agg_func_duration_x.2,median_agg_func_duration_x.2,max_agg_func_duration_x.2,min_agg_func_duration_x.2,std_agg_func_duration_x.2,mean_agg_func_duration_y.2,median_agg_func_duration_y.2,max_agg_func_duration_y.2,min_agg_func_duration_y.2,std_agg_func_duration_y.2,mean_agg_func_duration_x.3,median_agg_func_duration_x.3,max_agg_func_duration_x.3,min_agg_func_duration_x.3,std_agg_func_duration_x.3,mean_agg_func_duration_y.3,median_agg_func_duration_y.3,max_agg_func_duration_y.3,min_agg_func_duration_y.3,std_agg_func_duration_y.3,mean_agg_func_duration_x.4,median_agg_func_duration_x.4,max_agg_func_duration_x.4,min_agg_func_duration_x.4,std_agg_func_duration_x.4,mean_agg_func_duration_y.4,median_agg_func_duration_y.4,max_agg_func_duration_y.4,min_agg_func_duration_y.4,std_agg_func_duration_y.4,mean_agg_func_duration_x.5,median_agg_func_duration_x.5,max_agg_func_duration_x.5,min_agg_func_duration_x.5,std_agg_func_duration_x.5,mean_agg_func_duration_y.5,median_agg_func_duration_y.5,max_agg_func_duration_y.5,min_agg_func_duration_y.5,std_agg_func_duration_y.5,mean_agg_func_duration_x.6,median_agg_func_duration_x.6,max_agg_func_duration_x.6,min_agg_func_duration_x.6,std_agg_func_duration_x.6,mean_agg_func_duration_y.6,median_agg_func_duration_y.6,max_agg_func_duration_y.6,min_agg_func_duration_y.6,std_agg_func_duration_y.6,mean_agg_func_duration_x.7,median_agg_func_duration_x.7,max_agg_func_duration_x.7,min_agg_func_duration_x.7,std_agg_func_duration_x.7,mean_agg_func_duration_y.7,median_agg_func_duration_y.7,max_agg_func_duration_y.7,min_agg_func_duration_y.7,std_agg_func_duration_y.7,mean_agg_func_duration_x.8,median_agg_func_duration_x.8,max_agg_func_duration_x.8,min_agg_func_duration_x.8,std_agg_func_duration_x.8,mean_agg_func_duration_y.8,median_agg_func_duration_y.8,max_agg_func_duration_y.8,min_agg_func_duration_y.8,std_agg_func_duration_y.8,mean_agg_func_duration_x.9,median_agg_func_duration_x.9,max_agg_func_duration_x.9,min_agg_func_duration_x.9,std_agg_func_duration_x.9,mean_agg_func_duration_y.9,median_agg_func_duration_y.9,max_agg_func_duration_y.9,min_agg_func_duration_y.9,std_agg_func_duration_y.9,mean_agg_func_duration,median_agg_func_duration,max_agg_func_duration,min_agg_func_duration,std_agg_func_duration,mean_agg_func_state_x,median_agg_func_state_x,max_agg_func_state_x,min_agg_func_state_x,std_agg_func_state_x,mean_agg_func_state_y,median_agg_func_state_y,max_agg_func_state_y,min_agg_func_state_y,std_agg_func_state_y,mean_agg_func_state_x.1,median_agg_func_state_x.1,max_agg_func_state_x.1,min_agg_func_state_x.1,std_agg_func_state_x.1,mean_agg_func_state_y.1,median_agg_func_state_y.1,max_agg_func_state_y.1,min_agg_func_state_y.1,std_agg_func_state_y.1,mean_agg_func_state_x.2,median_agg_func_state_x.2,max_agg_func_state_x.2,min_agg_func_state_x.2,std_agg_func_state_x.2,mean_agg_func_state_y.2,median_agg_func_state_y.2,max_agg_func_state_y.2,min_agg_func_state_y.2,std_agg_func_state_y.2,mean_agg_func_state_x.3,median_agg_func_state_x.3,max_agg_func_state_x.3,min_agg_func_state_x.3,std_agg_func_state_x.3,mean_agg_func_state_y.3,median_agg_func_state_y.3,max_agg_func_state_y.3,min_agg_func_state_y.3,std_agg_func_state_y.3,mean_agg_func_state_x.4,median_agg_func_state_x.4,max_agg_func_state_x.4,min_agg_func_state_x.4,std_agg_func_state_x.4,mean_agg_func_state_y.4,median_agg_func_state_y.4,max_agg_func_state_y.4,min_agg_func_state_y.4,std_agg_func_state_y.4,mean_agg_func_state_x.5,median_agg_func_state_x.5,max_agg_func_state_x.5,min_agg_func_state_x.5,std_agg_func_state_x.5,mean_agg_func_state_y.5,median_agg_func_state_y.5,max_agg_func_state_y.5,min_agg_func_state_y.5,std_agg_func_state_y.5,mean_agg_func_state_x.6,median_agg_func_state_x.6,max_agg_func_state_x.6,min_agg_func_state_x.6,std_agg_func_state_x.6,mean_agg_func_state_y.6,median_agg_func_state_y.6,max_agg_func_state_y.6,min_agg_func_state_y.6,std_agg_func_state_y.6,mean_agg_func_state_x.7,median_agg_func_state_x.7,max_agg_func_state_x.7,min_agg_func_state_x.7,std_agg_func_state_x.7,mean_agg_func_state_y.7,median_agg_func_state_y.7,max_agg_func_state_y.7,min_agg_func_state_y.7,std_agg_func_state_y.7,mean_agg_func_state_x.8,median_agg_func_state_x.8,max_agg_func_state_x.8,min_agg_func_state_x.8,std_agg_func_state_x.8,mean_agg_func_state_y.8,median_agg_func_state_y.8,max_agg_func_state_y.8,min_agg_func_state_y.8,std_agg_func_state_y.8,mean_agg_func_state_x.9,median_agg_func_state_x.9,max_agg_func_state_x.9,min_agg_func_state_x.9,std_agg_func_state_x.9,mean_agg_func_state_y.9,median_agg_func_state_y.9,max_agg_func_state_y.9,min_agg_func_state_y.9,std_agg_func_state_y.9,mean_agg_func_state_x.10,median_agg_func_state_x.10,max_agg_func_state_x.10,min_agg_func_state_x.10,std_agg_func_state_x.10,mean_agg_func_state_y.10,median_agg_func_state_y.10,max_agg_func_state_y.10,min_agg_func_state_y.10,std_agg_func_state_y.10,mean_agg_func_state_x.11,median_agg_func_state_x.11,max_agg_func_state_x.11,min_agg_func_state_x.11,std_agg_func_state_x.11,mean_agg_func_state_y.11,median_agg_func_state_y.11,max_agg_func_state_y.11,min_agg_func_state_y.11,std_agg_func_state_y.11,mean_agg_func_state_x.12,median_agg_func_state_x.12,max_agg_func_state_x.12,min_agg_func_state_x.12,std_agg_func_state_x.12,mean_agg_func_state_y.12,median_agg_func_state_y.12,max_agg_func_state_y.12,min_agg_func_state_y.12,std_agg_func_state_y.12,mean_agg_func_state_x.13,median_agg_func_state_x.13,max_agg_func_state_x.13,min_agg_func_state_x.13,std_agg_func_state_x.13,mean_agg_func_state_y.13,median_agg_func_state_y.13,max_agg_func_state_y.13,min_agg_func_state_y.13,std_agg_func_state_y.13,mean_agg_func_state_x.14,median_agg_func_state_x.14,max_agg_func_state_x.14,min_agg_func_state_x.14,std_agg_func_state_x.14,mean_agg_func_state_y.14,median_agg_func_state_y.14,max_agg_func_state_y.14,min_agg_func_state_y.14,std_agg_func_state_y.14,mean_agg_func_state_x.15,median_agg_func_state_x.15,max_agg_func_state_x.15,min_agg_func_state_x.15,std_agg_func_state_x.15,mean_agg_func_state_y.15,median_agg_func_state_y.15,max_agg_func_state_y.15,min_agg_func_state_y.15,std_agg_func_state_y.15,mean_agg_func_state_x.16,median_agg_func_state_x.16,max_agg_func_state_x.16,min_agg_func_state_x.16,std_agg_func_state_x.16,mean_agg_func_state_y.16,median_agg_func_state_y.16,max_agg_func_state_y.16,min_agg_func_state_y.16,std_agg_func_state_y.16,mean_agg_func_state_x.17,median_agg_func_state_x.17,max_agg_func_state_x.17,min_agg_func_state_x.17,std_agg_func_state_x.17,mean_agg_func_state_y.17,median_agg_func_state_y.17,max_agg_func_state_y.17,min_agg_func_state_y.17,std_agg_func_state_y.17,mean_agg_func_state_x.18,median_agg_func_state_x.18,max_agg_func_state_x.18,min_agg_func_state_x.18,std_agg_func_state_x.18,mean_agg_func_state_y.18,median_agg_func_state_y.18,max_agg_func_state_y.18,min_agg_func_state_y.18,std_agg_func_state_y.18,mean_agg_func_state_x.19,median_agg_func_state_x.19,max_agg_func_state_x.19,min_agg_func_state_x.19,std_agg_func_state_x.19,mean_agg_func_state_y.19,median_agg_func_state_y.19,max_agg_func_state_y.19,min_agg_func_state_y.19,std_agg_func_state_y.19,mean_agg_func_state_x.20,median_agg_func_state_x.20,max_agg_func_state_x.20,min_agg_func_state_x.20,std_agg_func_state_x.20,mean_agg_func_state_y.20,median_agg_func_state_y.20,max_agg_func_state_y.20,min_agg_func_state_y.20,std_agg_func_state_y.20,mean_agg_func_state_x.21,median_agg_func_state_x.21,max_agg_func_state_x.21,min_agg_func_state_x.21,std_agg_func_state_x.21,mean_agg_func_state_y.21,median_agg_func_state_y.21,max_agg_func_state_y.21,min_agg_func_state_y.21,std_agg_func_state_y.21,mean_agg_func_state_x.22,median_agg_func_state_x.22,max_agg_func_state_x.22,min_agg_func_state_x.22,std_agg_func_state_x.22,mean_agg_func_state_y.22,median_agg_func_state_y.22,max_agg_func_state_y.22,min_agg_func_state_y.22,std_agg_func_state_y.22,mean_agg_func_state_x.23,median_agg_func_state_x.23,max_agg_func_state_x.23,min_agg_func_state_x.23,std_agg_func_state_x.23,mean_agg_func_state_y.23,median_agg_func_state_y.23,max_agg_func_state_y.23,min_agg_func_state_y.23,std_agg_func_state_y.23,mean_agg_func_state_x.24,median_agg_func_state_x.24,max_agg_func_state_x.24,min_agg_func_state_x.24,std_agg_func_state_x.24,mean_agg_func_state_y.24,median_agg_func_state_y.24,max_agg_func_state_y.24,min_agg_func_state_y.24,std_agg_func_state_y.24,mean_agg_func_state_x.25,median_agg_func_state_x.25,max_agg_func_state_x.25,min_agg_func_state_x.25,std_agg_func_state_x.25,mean_agg_func_state_y.25,median_agg_func_state_y.25,max_agg_func_state_y.25,min_agg_func_state_y.25,std_agg_func_state_y.25,mean_agg_func_state_x.26,median_agg_func_state_x.26,max_agg_func_state_x.26,min_agg_func_state_x.26,std_agg_func_state_x.26,mean_agg_func_state_y.26,median_agg_func_state_y.26,max_agg_func_state_y.26,min_agg_func_state_y.26,std_agg_func_state_y.26,mean_agg_func_state_x.27,median_agg_func_state_x.27,max_agg_func_state_x.27,min_agg_func_state_x.27,std_agg_func_state_x.27,mean_agg_func_state_y.27,median_agg_func_state_y.27,max_agg_func_state_y.27,min_agg_func_state_y.27,std_agg_func_state_y.27,mean_agg_func_state_x.28,median_agg_func_state_x.28,max_agg_func_state_x.28,min_agg_func_state_x.28,std_agg_func_state_x.28,mean_agg_func_state_y.28,median_agg_func_state_y.28,max_agg_func_state_y.28,min_agg_func_state_y.28,std_agg_func_state_y.28,mean_agg_func_state_x.29,median_agg_func_state_x.29,max_agg_func_state_x.29,min_agg_func_state_x.29,std_agg_func_state_x.29,mean_agg_func_state_y.29,median_agg_func_state_y.29,max_agg_func_state_y.29,min_agg_func_state_y.29,std_agg_func_state_y.29,mean_agg_func_state_x.30,median_agg_func_state_x.30,max_agg_func_state_x.30,min_agg_func_state_x.30,std_agg_func_state_x.30,mean_agg_func_state_y.30,median_agg_func_state_y.30,max_agg_func_state_y.30,min_agg_func_state_y.30,std_agg_func_state_y.30,mean_agg_func_state,median_agg_func_state,max_agg_func_state,min_agg_func_state,std_agg_func_state
0,1.020501,1.020501,1.020501,1.020501,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,-0.111216,-0.220204,2.261207,-2.618901,0.911437,0.197392,-0.220204,4.742618,-2.618901,1.140077,0.982883,1.020501,4.742618,-2.618901,1.290113,1.173576,1.434070,4.742618,-1.791764,1.197820,1.173576,1.434070,4.742618,-1.791764,1.197820,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,1.875055,2.178493,2.261207,0.855074,0.513863,0.824056,1.020501,2.261207,-1.626337,1.414060,0.441506,0.441506,1.020501,-0.137490,0.818824,-0.054777,-0.220204,1.020501,-0.799200,0.767055,1.378928,1.020501,2.178493,0.937788,0.693678,-0.501431,-0.799200,1.020501,-1.460909,0.962114,0.606933,1.020501,1.020501,-0.220204,0.716322,-0.220204,-0.220204,1.020501,-1.460909,1.754622,0.400149,-0.220204,2.261207,-0.220204,1.038049,1.020501,1.020501,1.020501,1.020501,,1.020501,1.020501,1.020501,1.020501,,0.258354,-0.220204,2.261207,-0.964627,0.889830,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,-0.111216,-0.220204,2.261207,-2.618901,0.911437,0.197392,-0.220204,4.742618,-2.618901,1.140077,0.982883,1.020501,4.742618,-2.618901,1.290113,1.173576,1.434070,4.742618,-1.791764,1.197820,1.173576,1.434070,4.742618,-1.791764,1.197820,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,1.875055,2.178493,2.261207,0.855074,0.513863,0.824056,1.020501,2.261207,-1.626337,1.414060,0.441506,0.441506,1.020501,-0.137490,0.818824,-0.054777,-0.220204,1.020501,-0.799200,0.767055,1.378928,1.020501,2.178493,0.937788,0.693678,-0.501431,-0.799200,1.020501,-1.460909,0.962114,0.606933,1.020501,1.020501,-0.220204,0.716322,-0.220204,-0.220204,1.020501,-1.460909,1.754622,0.400149,-0.220204,2.261207,-0.220204,1.038049,1.020501,1.020501,1.020501,1.020501,,1.020501,1.020501,1.020501,1.020501,,0.196629,0.255796,0.521505,-0.054198,0.146281,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.132644,-0.275622,10.707018,-0.353121,0.498883,-0.187126,-0.275622,3.178595,-0.349430,0.341657,-0.181078,-0.253480,2.588131,-0.354351,0.216750,-0.208305,-0.275622,2.588131,-0.354351,0.202709,-0.228965,-0.275622,0.698644,-0.354351,0.144083,-0.228965,-0.275622,0.698644,-0.354351,0.144083,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.112440,-0.142768,0.329604,-0.349430,0.169180,0.068439,-0.251776,1.604023,-0.334669,0.669853,-0.086102,-0.086102,0.049133,-0.221338,0.191252,-0.118379,-0.113244,0.078657,-0.325683,0.211805,0.209153,0.049133,0.642282,-0.063956,0.379338,0.020509,-0.305145,0.983608,-0.319907,0.560438,-0.065679,0.049133,0.088498,-0.334669,0.233782,-0.128006,-0.128006,0.049133,-0.305145,0.250513,-0.199354,-0.275622,0.049133,-0.334669,0.152957,0.049133,0.049133,0.049133,0.049133,,0.049133,0.049133,0.049133,0.049133,,0.202338,0.258802,0.512372,-0.037030,0.139598,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.135602,-0.273669,10.760287,-0.332851,0.500612,-0.191517,-0.273669,3.181483,-0.332847,0.340144,-0.180040,-0.252158,2.477550,-0.332852,0.212371,-0.201179,-0.272681,2.477550,-0.332852,0.194251,-0.218660,-0.273669,0.672976,-0.332852,0.143510,-0.218660,-0.273669,0.672976,-0.332852,0.143510,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.096860,-0.125775,0.347532,-0.332847,0.169319,0.076647,-0.269099,1.639253,-0.332833,0.681992,-0.078371,-0.078371,0.061581,-0.218324,0.197922,-0.115900,-0.106044,0.081312,-0.332824,0.217822,0.223327,0.061581,0.655457,-0.047058,0.378157,0.014354,-0.303251,0.979062,-0.332818,0.564538,-0.056743,0.061581,0.101023,-0.332833,0.239913,-0.135611,-0.135611,0.061581,-0.332803,0.278871,-0.193145,-0.273669,0.061581,-0.332833,0.154833,0.061581,0.061581,0.061581,0.061581,,0.061581,0.061581,0.061581,0.061581,
1,2.178493,2.178493,2.178493,2.178493,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.107058,-0.220204,2.261207,-2.618901,1.016086,0.176685,-0.220204,2.261207,-2.618901,1.052416,0.197392,-0.220204,4.742618,-2.618901,1.140077,0.982883,1.020501,4.742618,-2.618901,1.290113,1.173576,1.434070,4.742618,-1.791764,1.197820,1.173576,1.434070,4.742618,-1.791764,1.197820,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,1.875055,2.178493,2.261207,0.855074,0.513863,1.654640,2.178493,2.261207,0.524219,0.979846,0.110651,-0.096133,2.178493,-1.543623,1.541525,0.259535,-0.220204,2.178493,-0.220204,1.072730,0.965359,0.896431,2.261207,-0.220204,1.301175,1.174113,2.178493,2.261207,-0.302918,1.330661,2.178493,2.178493,2.178493,2.178493,,2.178493,2.178493,2.178493,2.178493,,2.178493,2.178493,2.178493,2.178493,,2.219850,2.219850,2.261207,2.178493,0.058487,2.178493,2.178493,2.178493,2.178493,,0.242664,-0.220204,4.329049,-2.618901,1.028299,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.107058,-0.220204,2.261207,-2.618901,1.016086,0.176685,-0.220204,2.261207,-2.618901,1.052416,0.197392,-0.220204,4.742618,-2.618901,1.140077,0.982883,1.020501,4.742618,-2.618901,1.290113,1.173576,1.434070,4.742618,-1.791764,1.197820,1.173576,1.434070,4.742618,-1.791764,1.197820,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,1.875055,2.178493,2.261207,0.855074,0.513863,1.654640,2.178493,2.261207,0.524219,0.979846,0.110651,-0.096133,2.178493,-1.543623,1.541525,0.259535,-0.220204,2.178493,-0.220204,1.072730,0.965359,0.896431,2.261207,-0.220204,1.301175,1.174113,2.178493,2.261207,-0.302918,1.330661,2.178493,2.178493,2.178493,2.178493,,2.178493,2.178493,2.178493,2.178493,,2.178493,2.178493,2.178493,2.178493,,2.219850,2.219850,2.261207,2.178493,0.058487,2.178493,2.178493,2.178493,2.178493,,0.241578,0.226273,17.349745,-0.155793,0.857872,-0.000641,-0.216576,17.349745,-0.354351,0.663338,0.233995,-0.068960,58.977496,-0.349430,1.502638,0.650141,0.226273,58.977496,-0.336514,3.175402,-0.181078,-0.253480,2.588131,-0.354351,0.216750,-0.208305,-0.275622,2.588131,-0.354351,0.202709,-0.228965,-0.275622,0.698644,-0.354351,0.144083,-0.228965,-0.275622,0.698644,-0.354351,0.144083,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.112440,-0.142768,0.329604,-0.349430,0.169180,-0.032091,-0.063956,0.317113,-0.349430,0.334412,-0.129535,-0.066458,-0.047872,-0.337353,0.138837,-0.251003,-0.275622,-0.063956,-0.334669,0.111374,-0.251869,-0.280672,-0.063956,-0.334669,0.096837,-0.255055,-0.290384,-0.063956,-0.349430,0.107154,-0.063956,-0.063956,-0.063956,-0.063956,,-0.063956,-0.063956,-0.063956,-0.063956,,-0.063956,-0.063956,-0.063956,-0.063956,,-0.169789,-0.169789,-0.063956,-0.275622,0.149671,-0.063956,-0.063956,-0.063956,-0.063956,,0.243790,0.229220,16.529612,-0.134480,0.816636,-0.000649,-0.214506,17.416177,-0.332852,0.664832,0.236176,-0.066597,58.239854,-0.332847,1.490582,0.653640,0.229220,58.239854,-0.332834,3.139052,-0.180040,-0.252158,2.477550,-0.332852,0.212371,-0.201179,-0.272681,2.477550,-0.332852,0.194251,-0.218660,-0.273669,0.672976,-0.332852,0.143510,-0.218660,-0.273669,0.672976,-0.332852,0.143510,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.096860,-0.125775,0.347532,-0.332847,0.169319,-0.017615,-0.047058,0.327061,-0.332847,0.330938,-0.131433,-0.072919,-0.047058,-0.332835,0.134919,-0.246096,-0.273669,-0.047058,-0.332833,0.117715,-0.242652,-0.264342,-0.047058,-0.332833,0.101173,-0.244800,-0.273684,-0.047058,-0.332847,0.106717,-0.047058,-0.047058,-0.047058,-0.047058,,-0.047058,-0.047058,-0.047058,-0.047058,,-0.047058,-0.047058,-0.047058,-0.047058,,-0.152975,-0.152975,-0.047058,-0.258893,0.149790,-0.047058,-0.047058,-0.047058,-0.047058,
2,0.441506,0.441506,0.441506,0.441506,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,0.102029,-0.220204,4.659904,-2.536187,1.200040,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,0.110651,0.110651,0.441506,-0.220204,0.467899,-0.170576,-0.220204,0.441506,-1.047341,0.565849,-0.282239,-0.013420,0.441506,-1.543623,0.884108,0.110651,0.110651,0.441506,-0.220204,0.467899,0.524219,0.110651,2.095780,-0.220204,1.093157,0.441506,0.441506,0.441506,0.441506,,0.441506,0.441506,0.441506,0.441506,,-0.275346,-0.220204,0.441506,-1.047341,0.745953,0.110651,0.110651,0.441506,-0.220204,0.467899,0.441506,0.441506,0.441506,0.441506,,-0.074289,-0.220204,4.659904,-2.536187,0.931173,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,0.102029,-0.220204,4.659904,-2.536187,1.200040,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,0.110651,0.110651,0.441506,-0.220204,0.467899,-0.170576,-0.220204,0.441506,-1.047341,0.565849,-0.282239,-0.013420,0.441506,-1.543623,0.884108,0.110651,0.110651,0.441506,-0.220204,0.467899,0.524219,0.110651,2.095780,-0.220204,1.093157,0.441506,0.441506,0.441506,0.441506,,0.441506,0.441506,0.441506,0.441506,,-0.275346,-0.220204,0.441506,-1.047341,0.745953,0.110651,0.110651,0.441506,-0.220204,0.467899,0.441506,0.441506,0.441506,0.441506,,-0.266549,-0.275622,0.964353,-0.334337,0.062541,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.132644,-0.275622,10.707018,-0.353121,0.498883,-0.111421,-0.265781,2.588131,-0.353121,0.468439,-0.181078,-0.253480,2.588131,-0.354351,0.216750,-0.160593,-0.246099,1.407202,-0.349430,0.230062,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.189198,-0.231337,0.774561,-0.345740,0.157121,-0.107806,-0.107806,0.078657,-0.294268,0.263698,0.001119,-0.275622,0.521505,-0.334669,0.417605,0.135150,0.113618,0.648033,-0.334669,0.521999,-0.270184,-0.270184,-0.246099,-0.294268,0.034061,-0.217165,-0.270184,-0.009913,-0.318380,0.141398,-0.294268,-0.294268,-0.294268,-0.294268,,-0.294268,-0.294268,-0.294268,-0.294268,,-0.301520,-0.294268,-0.275622,-0.334669,0.030184,-0.314469,-0.314469,-0.294268,-0.334669,0.028567,-0.294268,-0.294268,-0.294268,-0.294268,,-0.267605,-0.273669,0.555034,-0.312909,0.041797,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.135602,-0.273669,10.760287,-0.332851,0.500612,-0.114987,-0.273669,2.625311,-0.332851,0.467144,-0.180040,-0.252158,2.477550,-0.332852,0.212371,-0.162666,-0.244087,1.361445,-0.332847,0.228541,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.193558,-0.239411,0.681495,-0.332844,0.156136,-0.102410,-0.102410,0.081312,-0.286131,0.259821,0.002754,-0.273669,0.529259,-0.332833,0.415288,0.132085,0.121564,0.618043,-0.332833,0.511519,-0.265109,-0.265109,-0.244087,-0.286131,0.029729,-0.209974,-0.265109,-0.007434,-0.302245,0.137235,-0.286131,-0.286131,-0.286131,-0.286131,,-0.286131,-0.286131,-0.286131,-0.286131,,-0.302470,-0.288445,-0.286131,-0.332833,0.026321,-0.309482,-0.309482,-0.286131,-0.332833,0.033023,-0.286131,-0.286131,-0.286131,-0.286131,
3,-0.220204,-0.220204,-0.220204,-0.220204,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,-0.111216,-0.220204,2.261207,-2.618901,0.911437,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,-0.369089,-0.220204,-0.220204,-0.964627,0.332916,-0.261561,-0.261561,0.937788,-1.460909,0.979846,-0.082348,-0.220204,0.193365,-0.220204,0.238774,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.054777,-0.220204,0.606933,-0.220204,0.369907,-0.220204,-0.220204,-0.220204,-0.220204,,-0.385631,-0.261561,0.027937,-1.047341,0.463000,-0.468345,-0.220204,-0.137490,-1.047341,0.503128,-0.145838,-0.220204,4.659904,-2.618901,0.965364,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.090545,-0.220204,4.659904,-2.618901,1.047584,-0.111216,-0.220204,2.261207,-2.618901,0.911437,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,-0.369089,-0.220204,-0.220204,-0.964627,0.332916,-0.261561,-0.261561,0.937788,-1.460909,0.979846,-0.082348,-0.220204,0.193365,-0.220204,0.238774,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.054777,-0.220204,0.606933,-0.220204,0.369907,-0.220204,-0.220204,-0.220204,-0.220204,,-0.385631,-0.261561,0.027937,-1.047341,0.463000,-0.468345,-0.220204,-0.137490,-1.047341,0.503128,-0.294839,-0.305145,1.407202,-0.344289,0.066360,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.132644,-0.275622,10.707018,-0.353121,0.498883,-0.187126,-0.275622,3.178595,-0.349430,0.341657,-0.181078,-0.253480,2.588131,-0.354351,0.216750,-0.160593,-0.246099,1.407202,-0.349430,0.230062,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.189198,-0.231337,0.774561,-0.345740,0.157121,-0.150781,-0.275622,0.437153,-0.334669,0.329575,-0.311936,-0.305145,-0.303803,-0.333651,0.014490,-0.309363,-0.305145,-0.288275,-0.334669,0.023483,-0.305145,-0.305145,-0.275622,-0.334669,0.029523,-0.305145,-0.305145,-0.305145,-0.305145,,-0.305145,-0.305145,-0.305145,-0.305145,,-0.164910,-0.305145,0.373889,-0.342049,0.303153,-0.305145,-0.305145,-0.305145,-0.305145,,-0.056280,-0.220740,0.521505,-0.305145,0.387313,-0.196417,-0.305145,0.035800,-0.319907,0.201242,-0.298082,-0.303251,0.555477,-0.322881,0.033279,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.135602,-0.273669,10.760287,-0.332851,0.500612,-0.191517,-0.273669,3.181483,-0.332847,0.340144,-0.180040,-0.252158,2.477550,-0.332852,0.212371,-0.162666,-0.244087,1.361445,-0.332847,0.228541,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.193558,-0.239411,0.681495,-0.332844,0.156136,-0.151114,-0.273669,0.427853,-0.332833,0.324580,-0.315347,-0.318027,-0.292503,-0.332832,0.020644,-0.306070,-0.303251,-0.282125,-0.332833,0.025471,-0.303251,-0.303251,-0.273669,-0.332833,0.029582,-0.303251,-0.303251,-0.303251,-0.303251,,-0.303251,-0.303251,-0.303251,-0.303251,,-0.161260,-0.303251,0.377129,-0.332840,0.302690,-0.303251,-0.303251,-0.303251,-0.303251,,-0.057170,-0.217845,0.510262,-0.303251,0.380472,-0.198915,-0.303251,0.039324,-0.332818,0.206850
4,-0.302918,-0.302918,-0.302918,-0.302918,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.015340,-0.220204,4.659904,-2.536187,1.007883,-0.035978,-0.220204,3.998195,-2.039905,1.003031,-0.119153,-0.220204,3.584626,-2.536187,0.878242,-0.427494,-0.220204,1.103215,-2.536187,0.595937,-0.427494,-0.220204,1.103215,-2.536187,0.595937,-0.435693,-0.220204,1.020501,-2.536187,0.597287,-0.435693,-0.220204,1.020501,-2.536187,0.597287,-0.472661,-0.220204,1.020501,-2.536187,0.574132,-0.476481,-0.220204,1.020501,-2.536187,0.576814,-0.633772,-0.633772,-0.302918,-0.964627,0.467899,-0.261561,-0.261561,-0.220204,-0.302918,0.058487,-0.282239,-0.261561,-0.220204,-0.385631,0.079192,-0.302918,-0.302918,-0.302918,-0.302918,,-0.247775,-0.302918,1.020501,-1.460909,1.241624,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.247775,-0.220204,-0.220204,-0.302918,0.047755,-0.145838,-0.220204,4.659904,-2.618901,0.965364,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.015340,-0.220204,4.659904,-2.536187,1.007883,-0.035978,-0.220204,3.998195,-2.039905,1.003031,-0.119153,-0.220204,3.584626,-2.536187,0.878242,-0.427494,-0.220204,1.103215,-2.536187,0.595937,-0.427494,-0.220204,1.103215,-2.536187,0.595937,-0.435693,-0.220204,1.020501,-2.536187,0.597287,-0.435693,-0.220204,1.020501,-2.536187,0.597287,-0.472661,-0.220204,1.020501,-2.536187,0.574132,-0.476481,-0.220204,1.020501,-2.536187,0.576814,-0.633772,-0.633772,-0.302918,-0.964627,0.467899,-0.261561,-0.261561,-0.220204,-0.302918,0.058487,-0.282239,-0.261561,-0.220204,-0.385631,0.079192,-0.302918,-0.302918,-0.302918,-0.302918,,-0.247775,-0.302918,1.020501,-1.460909,1.241624,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.247775,-0.220204,-0.220204,-0.302918,0.047755,-0.294839,-0.305145,1.407202,-0.344289,0.066360,-0.000641,-0.216576,17.349745,-0.354351,0.663338,0.062893,-0.216576,17.349745,-0.349430,0.739416,-0.118436,-0.246099,3.267165,-0.349180,0.411444,-0.139603,-0.231337,2.799011,-0.349430,0.258752,-0.160873,-0.246099,2.799011,-0.344938,0.253115,-0.160873,-0.246099,2.799011,-0.344938,0.253115,-0.212706,-0.253480,0.742929,-0.344510,0.141236,-0.212706,-0.253480,0.742929,-0.344510,0.141236,-0.224763,-0.275622,0.742929,-0.344510,0.140402,-0.214876,-0.269296,0.742929,-0.342589,0.148051,-0.270387,-0.270387,-0.237664,-0.303109,0.046277,-0.230319,-0.230319,-0.157529,-0.303109,0.102941,-0.051053,-0.211304,0.521505,-0.303109,0.384175,-0.303109,-0.303109,-0.303109,-0.303109,,-0.212617,-0.303109,-0.029595,-0.305145,0.158504,-0.303109,-0.303109,-0.303109,-0.303109,,-0.303109,-0.303109,-0.303109,-0.303109,,-0.303109,-0.303109,-0.303109,-0.303109,,-0.303109,-0.303109,-0.303109,-0.303109,,0.974873,0.875784,2.351945,-0.303109,1.330298,-0.298082,-0.303251,0.555477,-0.322881,0.033279,-0.000649,-0.214506,17.416177,-0.332852,0.664832,0.064095,-0.214506,17.416177,-0.332847,0.744667,-0.118431,-0.244087,3.261363,-0.332847,0.411999,-0.141380,-0.236897,2.709957,-0.332847,0.257501,-0.166886,-0.267092,2.709957,-0.332843,0.250487,-0.166886,-0.267092,2.709957,-0.332843,0.250487,-0.218823,-0.269441,0.665632,-0.332842,0.139007,-0.218823,-0.269441,0.665632,-0.332842,0.139007,-0.230700,-0.273669,0.665632,-0.332842,0.137569,-0.221373,-0.273669,0.665632,-0.332841,0.145151,-0.275265,-0.275265,-0.248301,-0.302230,0.038134,-0.228786,-0.228786,-0.155342,-0.302230,0.103865,-0.049437,-0.210279,0.525038,-0.302230,0.385444,-0.302230,-0.302230,-0.302230,-0.302230,,-0.217446,-0.302230,-0.017304,-0.332803,0.174001,-0.302230,-0.302230,-0.302230,-0.302230,,-0.302230,-0.302230,-0.302230,-0.302230,,-0.302230,-0.302230,-0.302230,-0.302230,,-0.302230,-0.302230,-0.302230,-0.302230,,0.978965,0.880018,2.359105,-0.302230,1.333424
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
19586,-0.302918,-0.302918,-0.302918,-0.302918,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.055309,-0.220204,4.742618,-2.618901,1.020367,0.156565,-0.220204,4.659904,-2.536187,1.082846,-0.119153,-0.220204,3.584626,-2.536187,0.878242,0.196400,-0.220204,3.584626,-2.536187,0.992576,0.198594,-0.220204,3.584626,-2.536187,0.992289,0.198594,-0.220204,3.584626,-2.536187,0.992289,0.287894,-0.137490,2.261207,-1.543623,0.962403,0.287894,-0.137490,2.261207,-1.543623,0.962403,0.287894,-0.137490,2.261207,-1.543623,0.962403,-0.302918,-0.302918,-0.302918,-0.302918,0.000000,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.606201,-0.468345,-0.302918,-1.047341,0.390890,-0.302918,-0.302918,-0.302918,-0.302918,,-0.137490,-0.261561,1.020501,-1.047341,0.856929,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.027205,0.027937,0.193365,-0.302918,0.252695,0.083215,-0.220204,4.659904,-2.536187,0.975628,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.055309,-0.220204,4.742618,-2.618901,1.020367,0.156565,-0.220204,4.659904,-2.536187,1.082846,-0.119153,-0.220204,3.584626,-2.536187,0.878242,0.196400,-0.220204,3.584626,-2.536187,0.992576,0.198594,-0.220204,3.584626,-2.536187,0.992289,0.198594,-0.220204,3.584626,-2.536187,0.992289,0.287894,-0.137490,2.261207,-1.543623,0.962403,0.287894,-0.137490,2.261207,-1.543623,0.962403,0.287894,-0.137490,2.261207,-1.543623,0.962403,-0.302918,-0.302918,-0.302918,-0.302918,0.000000,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.606201,-0.468345,-0.302918,-1.047341,0.390890,-0.302918,-0.302918,-0.302918,-0.302918,,-0.137490,-0.261561,1.020501,-1.047341,0.856929,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.302918,-0.302918,-0.302918,-0.302918,,-0.027205,0.027937,0.193365,-0.302918,0.252695,-0.210986,-0.216576,1.850050,-0.314434,0.118223,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.143427,-0.253480,9.476884,-0.350133,0.447636,-0.083593,-0.231337,3.042334,-0.349430,0.459714,-0.139603,-0.231337,2.799011,-0.349430,0.258752,-0.123211,-0.208806,1.407202,-0.349430,0.226591,-0.123313,-0.208806,1.407202,-0.349430,0.226625,-0.123313,-0.208806,1.407202,-0.349430,0.226625,-0.069910,-0.167370,0.639598,-0.349430,0.246600,-0.069910,-0.167370,0.639598,-0.349430,0.246600,-0.069910,-0.167370,0.639598,-0.349430,0.246600,-0.211485,-0.211485,-0.211485,-0.211485,0.000000,-0.211485,-0.211485,-0.211485,-0.211485,,-0.211485,-0.211485,-0.211485,-0.211485,,-0.130683,-0.211485,0.095058,-0.275622,0.198111,-0.211485,-0.211485,-0.211485,-0.211485,,-0.225144,-0.214031,-0.187052,-0.285463,0.042227,-0.211485,-0.211485,-0.211485,-0.211485,,-0.211485,-0.211485,-0.211485,-0.211485,,-0.211485,-0.211485,-0.211485,-0.211485,,-0.125670,-0.211485,0.091309,-0.256835,0.189273,-0.210024,-0.214506,1.442485,-0.292967,0.094789,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.143601,-0.258883,9.527715,-0.332848,0.447000,-0.083550,-0.237746,3.046316,-0.332847,0.455785,-0.141380,-0.236897,2.709957,-0.332847,0.257501,-0.120738,-0.199730,1.353385,-0.332847,0.225154,-0.120812,-0.199730,1.353385,-0.332847,0.225164,-0.120812,-0.199730,1.353385,-0.332847,0.225164,-0.065126,-0.164382,0.643365,-0.332847,0.246455,-0.065126,-0.164382,0.643365,-0.332847,0.246455,-0.065126,-0.164382,0.643365,-0.332847,0.246455,-0.210424,-0.210424,-0.210424,-0.210424,0.000000,-0.210424,-0.210424,-0.210424,-0.210424,,-0.210424,-0.210424,-0.210424,-0.210424,,-0.134802,-0.210424,0.094462,-0.288445,0.202345,-0.210424,-0.210424,-0.210424,-0.210424,,-0.224577,-0.212465,-0.199700,-0.273679,0.033325,-0.210424,-0.210424,-0.210424,-0.210424,,-0.210424,-0.210424,-0.210424,-0.210424,,-0.210424,-0.210424,-0.210424,-0.210424,,-0.121457,-0.210424,0.098211,-0.252158,0.191379
19587,-0.220204,-0.220204,-0.220204,-0.220204,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.017138,-0.220204,4.659904,-2.536187,0.925905,-0.086383,-0.220204,2.261207,-2.536187,0.710982,0.296580,-0.220204,4.742618,-2.618901,1.115978,-0.125521,-0.220204,4.659904,-2.536187,0.814004,0.043195,-0.220204,4.659904,-2.122619,0.785988,0.043195,-0.220204,4.659904,-2.122619,0.785988,0.043195,-0.220204,4.659904,-2.122619,0.785988,-0.196706,-0.220204,1.185929,-2.122619,0.385864,-0.198951,-0.220204,1.020501,-1.626337,0.381174,-0.406310,-0.220204,-0.220204,-0.964627,0.372212,1.020501,1.020501,2.261207,-0.220204,1.754622,-0.344274,-0.220204,0.193365,-0.964627,0.345309,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,-0.087862,-0.220204,0.193365,-0.220204,0.190421,0.292621,-0.220204,2.261207,-0.220204,1.101056,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.007512,-0.302918,2.178493,-0.799200,0.984324,0.049235,-0.220204,3.419199,-2.122619,0.895374,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.017138,-0.220204,4.659904,-2.536187,0.925905,-0.086383,-0.220204,2.261207,-2.536187,0.710982,0.296580,-0.220204,4.742618,-2.618901,1.115978,-0.125521,-0.220204,4.659904,-2.536187,0.814004,0.043195,-0.220204,4.659904,-2.122619,0.785988,0.043195,-0.220204,4.659904,-2.122619,0.785988,0.043195,-0.220204,4.659904,-2.122619,0.785988,-0.196706,-0.220204,1.185929,-2.122619,0.385864,-0.198951,-0.220204,1.020501,-1.626337,0.381174,-0.406310,-0.220204,-0.220204,-0.964627,0.372212,1.020501,1.020501,2.261207,-0.220204,1.754622,-0.344274,-0.220204,0.193365,-0.964627,0.345309,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,-0.087862,-0.220204,0.193365,-0.220204,0.190421,0.292621,-0.220204,2.261207,-0.220204,1.101056,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.220204,-0.220204,-0.220204,-0.220204,,-0.007512,-0.302918,2.178493,-0.799200,0.984324,-0.036354,-0.039436,1.027617,-0.232534,0.148217,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.141905,-0.256835,5.540454,-0.349430,0.395621,-0.183626,-0.242027,1.850050,-0.349430,0.213956,0.037466,-0.180944,4.949989,-0.349430,0.489325,0.089641,-0.128006,3.431652,-0.349430,0.505257,-0.055168,-0.128006,1.533730,-0.349430,0.248036,-0.055168,-0.128006,1.533730,-0.349430,0.248036,-0.055168,-0.128006,1.533730,-0.349430,0.248036,0.039367,-0.009913,1.533730,-0.344062,0.262413,-0.091427,-0.111136,0.580551,-0.339589,0.159041,0.639598,0.019610,2.588131,-0.068960,1.300587,-0.172291,-0.172291,-0.039436,-0.305145,0.187885,-0.201838,-0.272342,0.141921,-0.328764,0.167888,-0.009913,-0.009913,0.019610,-0.039436,0.041752,0.189004,-0.039436,1.246166,-0.246099,0.608562,0.051324,-0.068960,0.964353,-0.349430,0.526230,-0.039436,-0.039436,-0.039436,-0.039436,,-0.039436,-0.039436,-0.039436,-0.039436,,-0.039436,-0.039436,-0.039436,-0.039436,,-0.046320,-0.216576,0.949083,-0.349180,0.452757,-0.034207,-0.037015,0.935053,-0.212924,0.135023,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.141473,-0.254531,5.583484,-0.332847,0.395369,-0.183670,-0.241026,1.442485,-0.332847,0.197070,0.040520,-0.182146,4.105285,-0.332847,0.486959,0.089533,-0.128014,3.343851,-0.332847,0.506194,-0.051938,-0.125760,1.505495,-0.332847,0.246221,-0.051938,-0.125760,1.505495,-0.332847,0.246221,-0.051938,-0.125760,1.505495,-0.332847,0.246221,0.041301,-0.013344,1.505495,-0.332842,0.261089,-0.089664,-0.117795,0.554649,-0.332838,0.157756,0.640198,0.022148,2.595759,-0.079262,1.305477,-0.162745,-0.162745,-0.037015,-0.288475,0.177809,-0.201943,-0.272024,0.148923,-0.332827,0.171702,-0.007434,-0.007434,0.022148,-0.037015,0.041835,0.193260,-0.037015,1.253821,-0.244087,0.610856,0.057071,-0.066597,0.968764,-0.332847,0.524356,-0.037015,-0.037015,-0.037015,-0.037015,,-0.037015,-0.037015,-0.037015,-0.037015,,-0.037015,-0.037015,-0.037015,-0.037015,,-0.043715,-0.214506,0.952444,-0.332847,0.452156
19588,-0.220204,-0.220204,-0.220204,-0.220204,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.055309,-0.220204,4.742618,-2.618901,1.020367,0.089972,-0.220204,2.261207,-2.618901,1.104731,-0.390712,-0.220204,2.261207,-2.618901,0.629676,0.105572,-0.220204,2.261207,-2.122619,1.054277,0.105572,-0.220204,2.261207,-2.122619,1.054277,0.137119,-0.220204,2.261207,-2.122619,1.221303,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,0.137119,-0.220204,2.261207,-2.122619,1.221303,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.171308,-0.220204,2.261207,-2.122619,1.105515,0.606933,-0.013420,2.261207,-0.220204,1.105308,0.051570,-0.220204,1.020501,-0.385631,0.537563,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.184174,-0.220204,2.261207,-1.212768,1.227152,0.179579,-0.261561,2.261207,-1.957192,1.728235,0.216997,-0.220204,2.261207,-0.633772,1.029461,-0.106473,-0.220204,0.937788,-0.633772,0.469854,0.395554,-0.220204,2.261207,-0.302918,1.063507,-0.074289,-0.220204,4.659904,-2.536187,0.931173,-0.019053,-0.220204,4.742618,-2.618901,0.983125,0.055309,-0.220204,4.742618,-2.618901,1.020367,0.089972,-0.220204,2.261207,-2.618901,1.104731,-0.390712,-0.220204,2.261207,-2.618901,0.629676,0.105572,-0.220204,2.261207,-2.122619,1.054277,0.105572,-0.220204,2.261207,-2.122619,1.054277,0.137119,-0.220204,2.261207,-2.122619,1.221303,1.133152,1.434070,4.742618,-2.122619,1.214957,1.133152,1.434070,4.742618,-2.122619,1.214957,0.137119,-0.220204,2.261207,-2.122619,1.221303,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.171308,-0.220204,2.261207,-2.122619,1.105515,0.606933,-0.013420,2.261207,-0.220204,1.105308,0.051570,-0.220204,1.020501,-0.385631,0.537563,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.184174,-0.220204,2.261207,-1.212768,1.227152,0.179579,-0.261561,2.261207,-1.957192,1.728235,0.216997,-0.220204,2.261207,-0.633772,1.029461,-0.106473,-0.220204,0.937788,-0.633772,0.469854,0.395554,-0.220204,2.261207,-0.302918,1.063507,-0.266549,-0.275622,0.964353,-0.334337,0.062541,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.143427,-0.253480,9.476884,-0.350133,0.447636,-0.029176,-0.268371,9.476884,-0.349430,0.923141,-0.162132,-0.275622,2.912886,-0.349430,0.283757,-0.033271,-0.206383,2.588131,-0.349430,0.457915,-0.033271,-0.206383,2.588131,-0.349430,0.457915,-0.182348,-0.281398,0.783934,-0.348921,0.244398,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.227147,-0.275622,0.783934,-0.354351,0.149385,-0.182348,-0.281398,0.783934,-0.348921,0.244398,-0.305145,-0.305145,-0.275622,-0.334669,0.041752,-0.215996,-0.242027,0.078657,-0.344510,0.136541,0.125402,-0.290384,1.604023,-0.334669,0.803769,-0.129362,-0.174400,0.226273,-0.275622,0.170460,-0.172291,-0.172291,-0.068960,-0.275622,0.146133,0.208790,-0.275622,2.096077,-0.334168,0.870399,-0.285411,-0.304636,-0.153312,-0.349430,0.073189,-0.193039,-0.263544,0.226273,-0.332560,0.192364,-0.062016,-0.246099,0.521505,-0.332560,0.335759,-0.025546,-0.229301,2.056713,-0.334669,0.588322,-0.267605,-0.273669,0.555034,-0.312909,0.041797,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.143601,-0.258883,9.527715,-0.332848,0.447000,-0.030915,-0.273160,9.527715,-0.332847,0.925431,-0.167973,-0.273669,2.862054,-0.332847,0.281778,-0.031761,-0.197473,2.625311,-0.332847,0.460757,-0.031761,-0.197473,2.625311,-0.332847,0.460757,-0.183499,-0.298745,0.784703,-0.332847,0.245278,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.217289,-0.273669,0.784703,-0.332852,0.148792,-0.183499,-0.298745,0.784703,-0.332847,0.245278,-0.303251,-0.303251,-0.273669,-0.332833,0.041835,-0.216954,-0.273669,0.081312,-0.332842,0.138131,0.133602,-0.281072,1.619552,-0.332833,0.806545,-0.124958,-0.174357,0.239071,-0.273669,0.173773,-0.170133,-0.170133,-0.066597,-0.273669,0.146422,0.212037,-0.273669,2.083029,-0.317806,0.865914,-0.292325,-0.325410,-0.163781,-0.332847,0.067010,-0.188614,-0.261831,0.229220,-0.332830,0.191643,-0.059032,-0.244087,0.525038,-0.332830,0.334331,-0.019339,-0.222225,2.063288,-0.332833,0.588514
19589,-0.220204,-0.220204,-0.220204,-0.220204,0.0,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.141818,-0.220204,3.088344,-2.453474,1.024294,-0.180314,-0.220204,2.261207,-2.453474,1.011184,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,0.551791,-0.220204,2.261207,-0.385631,1.482707,0.193365,0.193365,0.606933,-0.220204,0.584874,1.020501,1.020501,2.261207,-0.220204,1.754622,0.327774,-0.220204,1.930352,-1.047341,1.194500,0.379470,-0.220204,2.261207,-0.302918,1.255097,0.193365,-0.220204,2.261207,-0.468345,1.160942,0.193365,-0.220204,1.434070,-0.220204,0.716322,0.914155,0.772360,2.261207,-0.220204,1.166541,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.007259,-0.344274,2.261207,-1.543623,1.608670,0.094585,-0.220204,4.577190,-2.288046,0.958105,-0.019053,-0.220204,4.742618,-2.618901,0.983125,-0.141818,-0.220204,3.088344,-2.453474,1.024294,-0.180314,-0.220204,2.261207,-2.453474,1.011184,0.197392,-0.220204,4.742618,-2.618901,1.140077,-0.222810,-0.220204,3.088344,-2.536187,0.759481,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.228053,-0.220204,3.088344,-2.536187,0.753762,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.302361,-0.220204,2.261207,-2.536187,0.657124,-0.381242,-0.220204,2.261207,-2.370760,0.664513,0.551791,-0.220204,2.261207,-0.385631,1.482707,0.193365,0.193365,0.606933,-0.220204,0.584874,1.020501,1.020501,2.261207,-0.220204,1.754622,0.327774,-0.220204,1.930352,-1.047341,1.194500,0.379470,-0.220204,2.261207,-0.302918,1.255097,0.193365,-0.220204,2.261207,-0.468345,1.160942,0.193365,-0.220204,1.434070,-0.220204,0.716322,0.914155,0.772360,2.261207,-0.220204,1.166541,-0.220204,-0.220204,-0.220204,-0.220204,0.000000,0.007259,-0.344274,2.261207,-1.543623,1.608670,-0.128432,-0.128006,1.052923,-0.283674,0.102653,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.122974,-0.255157,4.696933,-0.349430,0.435576,-0.178605,-0.272568,2.292899,-0.349430,0.289099,-0.181078,-0.253480,2.588131,-0.354351,0.216750,-0.160593,-0.246099,1.407202,-0.349430,0.230062,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.160056,-0.246099,1.407202,-0.349430,0.230304,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.154942,-0.237664,1.407202,-0.349430,0.231847,-0.189198,-0.231337,0.774561,-0.345740,0.157121,-0.254534,-0.300928,-0.128006,-0.334669,0.110868,0.196749,0.196749,0.521505,-0.128006,0.459274,-0.231337,-0.231337,-0.128006,-0.334669,0.146133,0.231521,-0.172291,2.588131,-0.332560,0.990339,-0.188707,-0.187052,-0.119862,-0.260861,0.075109,-0.167183,-0.216576,0.108180,-0.300928,0.169524,-0.228104,-0.305145,0.007801,-0.344510,0.131740,-0.012027,-0.260861,0.669121,-0.331985,0.421659,-0.216576,-0.216576,-0.098483,-0.334669,0.104380,-0.085010,-0.087939,0.167226,-0.331388,0.206198,-0.126134,-0.125760,0.909748,-0.262259,0.090012,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.125558,-0.258893,4.611640,-0.332847,0.436518,-0.182705,-0.272634,2.299942,-0.332847,0.287048,-0.180040,-0.252158,2.477550,-0.332852,0.212371,-0.162666,-0.244087,1.361445,-0.332847,0.228541,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.162179,-0.244087,1.361445,-0.332847,0.228805,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.157684,-0.244073,1.361445,-0.332847,0.230639,-0.193558,-0.239411,0.681495,-0.332844,0.156136,-0.248318,-0.301136,-0.125760,-0.318057,0.106474,0.203333,0.203333,0.532426,-0.125760,0.465408,-0.221908,-0.221908,-0.125760,-0.318057,0.135974,0.236334,-0.170133,2.595759,-0.332818,0.992061,-0.183142,-0.184924,-0.118619,-0.244102,0.070442,-0.163139,-0.214506,0.125669,-0.301136,0.176925,-0.222961,-0.303251,0.022136,-0.332842,0.134168,-0.002240,-0.244102,0.672946,-0.316711,0.416968,-0.214506,-0.214506,-0.096179,-0.332833,0.104587,-0.088249,-0.102501,0.184833,-0.332829,0.212823


In [49]:
#データのマージ
full_merge_df_fin = pd.merge(full_merge_df_fin, agg_df, left_index=True, right_index=True)
full_merge_df_fin.drop(['state'], axis=1, inplace=True)

# データセットの整理

In [50]:
train_df = pd.DataFrame(full_merge_df_fin.loc[:len(train),])
test_df = pd.DataFrame(full_merge_df_fin.loc[len(train):19591,])

In [51]:
test_df = test_df.reset_index()
test_df.drop(['index'], axis=1, inplace=True)
test_df.head()

Unnamed: 0,goal,country,duration,category1,category2,goal_min,goal_max,goal_per_day_max,goal_per_day_min,goal_1-1000,goal_100000+,goal_10001-11000,goal_1001-2000,goal_11001-12000,goal_12001-13000,goal_13001-14000,goal_14001-15000,goal_15001-16000,goal_16001-17000,goal_17001-18000,goal_18001-19000,goal_19001-20000,goal_20001-21000,goal_2001-3000,goal_21001-22000,goal_22001-23000,goal_23001-24000,goal_24001-25000,goal_25001-26000,goal_26001-27000,goal_27001-28000,goal_28001-29000,goal_29001-30000,goal_30001-31000,goal_3001-4000,goal_31001-32000,goal_32001-33000,goal_33001-34000,goal_34001-35000,goal_35001-36000,goal_36001-37000,goal_37001-38000,goal_38001-39000,goal_39001-40000,goal_40001-41000,goal_4001-5000,goal_41001-42000,goal_42001-43000,goal_43001-44000,goal_44001-45000,goal_45001-46000,goal_46001-47000,goal_47001-48000,goal_48001-49000,goal_49001-50000,goal_50001-51000,goal_5001-6000,goal_51001-52000,goal_52001-53000,goal_53001-54000,goal_54001-55000,goal_55001-56000,goal_56001-57000,goal_57001-58000,goal_58001-59000,goal_59001-60000,goal_60001-61000,goal_6001-7000,goal_61001-62000,goal_62001-63000,goal_63001-64000,goal_64001-65000,goal_65001-66000,goal_66001-67000,goal_67001-68000,goal_68001-69000,goal_69001-70000,goal_70001-71000,goal_7001-8000,goal_71001-72000,goal_72001-73000,goal_73001-74000,goal_74001-75000,goal_75001-76000,goal_76001-77000,goal_77001-78000,goal_78001-79000,goal_79001-80000,goal_80001-81000,goal_8001-9000,goal_81001-82000,goal_82001-83000,goal_83001-84000,goal_84001-85000,goal_85001-86000,goal_86001-87000,goal_87001-88000,goal_88001-89000,goal_89001-90000,goal_90001-91000,goal_9001-10000,goal_91001-92000,goal_92001-93000,goal_93001-94000,goal_94001-95000,goal_95001-96000,goal_96001-97000,goal_97001-98000,goal_98001-99000,goal_99001-100000,country_AT,country_AU,country_BE,country_CA,country_CH,country_DE,country_DK,country_ES,country_FR,country_GB,country_HK,country_IE,country_IT,country_JP,country_LU,country_MX,country_NL,country_NO,country_NZ,country_SE,country_SG,country_US,category1_art,category1_comics,category1_crafts,category1_dance,category1_design,category1_fashion,category1_film & video,category1_food,category1_games,category1_journalism,category1_music,category1_photography,category1_publishing,category1_technology,category1_theater,category2_3d printing,category2_academic,category2_accessories,category2_action,category2_animals,category2_animation,category2_anthologies,category2_apparel,category2_apps,category2_architecture,category2_art books,category2_audio,category2_bacon,category2_blues,category2_calendars,category2_camera equipment,category2_candles,category2_ceramics,category2_children's books,category2_childrenswear,category2_chiptune,category2_civic design,category2_classical music,category2_comedy,category2_comic books,category2_community gardens,category2_conceptual art,category2_cookbooks,category2_country & folk,category2_couture,category2_crochet,category2_digital art,category2_diy,category2_diy electronics,category2_documentary,category2_drama,category2_drinks,category2_electronic music,category2_embroidery,category2_events,category2_experimental,category2_fabrication tools,category2_faith,category2_family,category2_fantasy,category2_farmer's markets,category2_farms,category2_festivals,category2_fiction,category2_fine art,category2_flight,category2_food trucks,category2_footwear,category2_gadgets,category2_gaming hardware,category2_glass,category2_graphic design,category2_graphic novels,category2_hardware,category2_hip-hop,category2_horror,category2_illustration,category2_immersive,category2_indie rock,category2_installations,category2_interactive design,category2_jazz,category2_jewelry,category2_kids,category2_knitting,category2_latin,category2_letterpress,category2_literary journals,category2_literary spaces,category2_live games,category2_makerspaces,category2_metal,category2_mixed media,category2_mobile games,category2_movie theaters,category2_music videos,category2_musical,category2_narrative film,category2_nature,category2_nonfiction,category2_painting,category2_people,category2_performance art,category2_performances,category2_periodicals,category2_pet fashion,category2_photo,category2_photobooks,category2_places,category2_playing cards,category2_plays,category2_poetry,category2_pop,category2_pottery,category2_print,category2_printing,category2_product design,category2_public art,...,mean_agg_func_state_y,median_agg_func_state_y,max_agg_func_state_y,min_agg_func_state_y,std_agg_func_state_y,mean_agg_func_state_x,median_agg_func_state_x,max_agg_func_state_x,min_agg_func_state_x,std_agg_func_state_x,mean_agg_func_state_y.1,median_agg_func_state_y.1,max_agg_func_state_y.1,min_agg_func_state_y.1,std_agg_func_state_y.1,mean_agg_func_state_x.1,median_agg_func_state_x.1,max_agg_func_state_x.1,min_agg_func_state_x.1,std_agg_func_state_x.1,mean_agg_func_state_y.2,median_agg_func_state_y.2,max_agg_func_state_y.2,min_agg_func_state_y.2,std_agg_func_state_y.2,mean_agg_func_state_x.2,median_agg_func_state_x.2,max_agg_func_state_x.2,min_agg_func_state_x.2,std_agg_func_state_x.2,mean_agg_func_state_y.3,median_agg_func_state_y.3,max_agg_func_state_y.3,min_agg_func_state_y.3,std_agg_func_state_y.3,mean_agg_func_state_x.3,median_agg_func_state_x.3,max_agg_func_state_x.3,min_agg_func_state_x.3,std_agg_func_state_x.3,mean_agg_func_state_y.4,median_agg_func_state_y.4,max_agg_func_state_y.4,min_agg_func_state_y.4,std_agg_func_state_y.4,mean_agg_func_state_x.4,median_agg_func_state_x.4,max_agg_func_state_x.4,min_agg_func_state_x.4,std_agg_func_state_x.4,mean_agg_func_state_y.5,median_agg_func_state_y.5,max_agg_func_state_y.5,min_agg_func_state_y.5,std_agg_func_state_y.5,mean_agg_func_state_x.5,median_agg_func_state_x.5,max_agg_func_state_x.5,min_agg_func_state_x.5,std_agg_func_state_x.5,mean_agg_func_state_y.6,median_agg_func_state_y.6,max_agg_func_state_y.6,min_agg_func_state_y.6,std_agg_func_state_y.6,mean_agg_func_state_x.6,median_agg_func_state_x.6,max_agg_func_state_x.6,min_agg_func_state_x.6,std_agg_func_state_x.6,mean_agg_func_state_y.7,median_agg_func_state_y.7,max_agg_func_state_y.7,min_agg_func_state_y.7,std_agg_func_state_y.7,mean_agg_func_state_x.7,median_agg_func_state_x.7,max_agg_func_state_x.7,min_agg_func_state_x.7,std_agg_func_state_x.7,mean_agg_func_state_y.8,median_agg_func_state_y.8,max_agg_func_state_y.8,min_agg_func_state_y.8,std_agg_func_state_y.8,mean_agg_func_state_x.8,median_agg_func_state_x.8,max_agg_func_state_x.8,min_agg_func_state_x.8,std_agg_func_state_x.8,mean_agg_func_state_y.9,median_agg_func_state_y.9,max_agg_func_state_y.9,min_agg_func_state_y.9,std_agg_func_state_y.9,mean_agg_func_state_x.9,median_agg_func_state_x.9,max_agg_func_state_x.9,min_agg_func_state_x.9,std_agg_func_state_x.9,mean_agg_func_state_y.10,median_agg_func_state_y.10,max_agg_func_state_y.10,min_agg_func_state_y.10,std_agg_func_state_y.10,mean_agg_func_state_x.10,median_agg_func_state_x.10,max_agg_func_state_x.10,min_agg_func_state_x.10,std_agg_func_state_x.10,mean_agg_func_state_y.11,median_agg_func_state_y.11,max_agg_func_state_y.11,min_agg_func_state_y.11,std_agg_func_state_y.11,mean_agg_func_state_x.11,median_agg_func_state_x.11,max_agg_func_state_x.11,min_agg_func_state_x.11,std_agg_func_state_x.11,mean_agg_func_state_y.12,median_agg_func_state_y.12,max_agg_func_state_y.12,min_agg_func_state_y.12,std_agg_func_state_y.12,mean_agg_func_state_x.12,median_agg_func_state_x.12,max_agg_func_state_x.12,min_agg_func_state_x.12,std_agg_func_state_x.12,mean_agg_func_state_y.13,median_agg_func_state_y.13,max_agg_func_state_y.13,min_agg_func_state_y.13,std_agg_func_state_y.13,mean_agg_func_state_x.13,median_agg_func_state_x.13,max_agg_func_state_x.13,min_agg_func_state_x.13,std_agg_func_state_x.13,mean_agg_func_state_y.14,median_agg_func_state_y.14,max_agg_func_state_y.14,min_agg_func_state_y.14,std_agg_func_state_y.14,mean_agg_func_state_x.14,median_agg_func_state_x.14,max_agg_func_state_x.14,min_agg_func_state_x.14,std_agg_func_state_x.14,mean_agg_func_state_y.15,median_agg_func_state_y.15,max_agg_func_state_y.15,min_agg_func_state_y.15,std_agg_func_state_y.15,mean_agg_func_state_x.15,median_agg_func_state_x.15,max_agg_func_state_x.15,min_agg_func_state_x.15,std_agg_func_state_x.15,mean_agg_func_state_y.16,median_agg_func_state_y.16,max_agg_func_state_y.16,min_agg_func_state_y.16,std_agg_func_state_y.16,mean_agg_func_state_x.16,median_agg_func_state_x.16,max_agg_func_state_x.16,min_agg_func_state_x.16,std_agg_func_state_x.16,mean_agg_func_state_y.17,median_agg_func_state_y.17,max_agg_func_state_y.17,min_agg_func_state_y.17,std_agg_func_state_y.17,mean_agg_func_state_x.17,median_agg_func_state_x.17,max_agg_func_state_x.17,min_agg_func_state_x.17,std_agg_func_state_x.17,mean_agg_func_state_y.18,median_agg_func_state_y.18,max_agg_func_state_y.18,min_agg_func_state_y.18,std_agg_func_state_y.18,mean_agg_func_state_x.18,median_agg_func_state_x.18,max_agg_func_state_x.18,min_agg_func_state_x.18,std_agg_func_state_x.18,mean_agg_func_state_y.19,median_agg_func_state_y.19,max_agg_func_state_y.19,min_agg_func_state_y.19,std_agg_func_state_y.19,mean_agg_func_state_x.19,median_agg_func_state_x.19,max_agg_func_state_x.19,min_agg_func_state_x.19,std_agg_func_state_x.19,mean_agg_func_state_y.20,median_agg_func_state_y.20,max_agg_func_state_y.20,min_agg_func_state_y.20,std_agg_func_state_y.20,mean_agg_func_state_x.20,median_agg_func_state_x.20,max_agg_func_state_x.20,min_agg_func_state_x.20,std_agg_func_state_x.20,mean_agg_func_state_y.21,median_agg_func_state_y.21,max_agg_func_state_y.21,min_agg_func_state_y.21,std_agg_func_state_y.21,mean_agg_func_state_x.21,median_agg_func_state_x.21,max_agg_func_state_x.21,min_agg_func_state_x.21,std_agg_func_state_x.21,mean_agg_func_state_y.22,median_agg_func_state_y.22,max_agg_func_state_y.22,min_agg_func_state_y.22,std_agg_func_state_y.22,mean_agg_func_state_x.22,median_agg_func_state_x.22,max_agg_func_state_x.22,min_agg_func_state_x.22,std_agg_func_state_x.22,mean_agg_func_state_y.23,median_agg_func_state_y.23,max_agg_func_state_y.23,min_agg_func_state_y.23,std_agg_func_state_y.23,mean_agg_func_state_x.23,median_agg_func_state_x.23,max_agg_func_state_x.23,min_agg_func_state_x.23,std_agg_func_state_x.23,mean_agg_func_state_y.24,median_agg_func_state_y.24,max_agg_func_state_y.24,min_agg_func_state_y.24,std_agg_func_state_y.24,mean_agg_func_state,median_agg_func_state,max_agg_func_state,min_agg_func_state,std_agg_func_state
0,47,8,-0.220204,3,88,-0.314798,-0.315146,-0.187052,-0.184924,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.220204,-0.220204,-0.220204,-0.220204,0.0,0.259535,-0.220204,1.020501,-0.220204,0.657561,-0.220204,-0.220204,-0.220204,-0.220204,,0.524219,-0.220204,2.261207,-0.220204,1.109721,0.027937,-0.220204,0.524219,-0.220204,0.429793,0.077565,-0.220204,1.268643,-1.460909,1.101366,-0.495916,-0.220204,-0.220204,-1.047341,0.477548,0.540762,-0.220204,2.178493,-0.633772,1.259043,-0.174965,-0.187052,4.949989,-0.275622,0.224284,0.074193,-0.187052,3.267165,-0.34943,0.649347,-0.159056,-0.237664,2.689935,-0.34943,0.299519,-0.186524,-0.246099,1.620991,-0.34943,0.228696,-0.139603,-0.231337,2.799011,-0.34943,0.258752,-0.07807,-0.246099,3.267165,-0.34943,0.433627,-0.07807,-0.246099,3.267165,-0.34943,0.433627,-0.07807,-0.246099,3.267165,-0.34943,0.433627,-0.07807,-0.246099,3.267165,-0.34943,0.433627,-0.07807,-0.246099,3.267165,-0.34943,0.433627,-0.101153,-0.248666,3.267165,-0.34943,0.410065,0.359127,-0.083721,1.879573,-0.275622,1.021151,-0.231337,-0.231337,-0.187052,-0.275622,0.062628,0.314842,0.314842,0.816737,-0.187052,0.709787,0.285498,-0.305145,2.588131,-0.34451,1.288662,-0.187052,-0.187052,-0.187052,-0.187052,,-0.23429,-0.275622,-0.06896,-0.334669,0.107669,-0.060633,-0.187052,0.255796,-0.250641,0.275873,-0.055674,-0.098483,0.403412,-0.327288,0.275592,-0.172291,-0.187052,-0.098483,-0.231337,0.067646,-0.062859,-0.296061,0.816737,-0.328764,0.494947,-0.174829,-0.184924,4.105285,-0.258893,0.187311,0.078461,-0.184924,3.261363,-0.332847,0.655767,-0.161297,-0.24408,2.696746,-0.332847,0.299845,-0.188704,-0.244087,1.625683,-0.332847,0.228872,-0.14138,-0.236897,2.709957,-0.332847,0.257501,-0.073847,-0.244087,3.261363,-0.332847,0.435466,-0.073847,-0.244087,3.261363,-0.332847,0.435466,-0.073847,-0.244087,3.261363,-0.332847,0.435466,-0.073847,-0.244087,3.261363,-0.332847,0.435466,-0.073847,-0.244087,3.261363,-0.332847,0.435466,-0.09663,-0.246951,3.261363,-0.332847,0.411188,0.362338,-0.081388,1.885797,-0.273669,1.023174,-0.236685,-0.236685,-0.184924,-0.288445,0.073201,0.317966,0.317966,0.820855,-0.184924,0.711193,0.298324,-0.303251,2.625311,-0.332842,1.302111,-0.184924,-0.184924,-0.184924,-0.184924,,-0.227329,-0.258893,-0.066597,-0.332833,0.105031,-0.05598,-0.184924,0.258802,-0.241819,0.27409,-0.055009,-0.096179,0.416561,-0.314355,0.278345,-0.175058,-0.184924,-0.096179,-0.244073,0.074439,-0.056261,-0.281646,0.820855,-0.332827,0.493441
1,58,9,-0.7992,12,18,-0.268232,-0.268351,-0.094632,-0.101314,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.7992,-0.7992,-0.7992,-0.7992,,-0.330489,-0.7992,1.020501,-1.212768,1.188125,-0.509702,-0.509702,-0.220204,-0.7992,0.409412,-0.7992,-0.7992,-0.7992,-0.7992,,-0.509702,-0.509702,-0.220204,-0.7992,0.409412,-0.633772,-0.633772,-0.468345,-0.7992,0.23395,-0.509702,-0.509702,-0.220204,-0.7992,0.409412,-0.7992,-0.7992,-0.7992,-0.7992,,-0.153734,-0.157529,1.185778,-0.295304,0.098587,0.008182,-0.260861,88.205491,-0.34943,2.449515,-0.141905,-0.256835,5.540454,-0.34943,0.395621,-0.183626,-0.242027,1.85005,-0.34943,0.213956,-0.139603,-0.231337,2.799011,-0.34943,0.258752,-0.123211,-0.208806,1.407202,-0.34943,0.226591,-0.123313,-0.208806,1.407202,-0.34943,0.226625,-0.123313,-0.208806,1.407202,-0.34943,0.226625,-0.159814,-0.232977,1.407202,-0.344938,0.219132,-0.172623,-0.246099,1.407202,-0.342589,0.215284,-0.125611,-0.187052,0.521505,-0.334669,0.1962,-0.094632,-0.094632,-0.094632,-0.094632,,-0.158959,-0.158959,-0.094632,-0.223286,0.090972,-0.094632,-0.094632,-0.094632,-0.094632,,0.234117,-0.094632,0.915148,-0.118165,0.589907,-0.007988,-0.007988,0.078657,-0.094632,0.122533,-0.094632,-0.094632,-0.094632,-0.094632,,-0.007988,-0.007988,0.078657,-0.094632,0.122533,-0.180207,-0.180207,-0.094632,-0.265781,0.121021,-0.111319,-0.111319,-0.094632,-0.128006,0.023599,-0.094632,-0.094632,-0.094632,-0.094632,,-0.152082,-0.155342,0.998538,-0.273689,0.084684,0.005496,-0.272681,88.412333,-0.332847,2.445671,-0.141473,-0.254531,5.583484,-0.332847,0.395369,-0.18367,-0.241026,1.442485,-0.332847,0.19707,-0.14138,-0.236897,2.709957,-0.332847,0.257501,-0.120738,-0.19973,1.353385,-0.332847,0.225154,-0.120812,-0.19973,1.353385,-0.332847,0.225164,-0.120812,-0.19973,1.353385,-0.332847,0.225164,-0.161743,-0.231414,1.31539,-0.332843,0.217417,-0.173398,-0.244087,1.31539,-0.332841,0.212825,-0.124049,-0.184924,0.525038,-0.332833,0.19732,-0.101314,-0.101314,-0.101314,-0.101314,,-0.15657,-0.15657,-0.101314,-0.211826,0.078143,-0.101314,-0.101314,-0.101314,-0.101314,,0.230799,-0.101314,0.929311,-0.135601,0.605173,-0.010001,-0.010001,0.081312,-0.101314,0.129136,-0.101314,-0.101314,-0.101314,-0.101314,,-0.010001,-0.010001,0.081312,-0.101314,0.129136,-0.184203,-0.184203,-0.101314,-0.267092,0.117223,-0.113537,-0.113537,-0.101314,-0.12576,0.017286,-0.101314,-0.101314,-0.101314,-0.101314,
2,58,9,-0.220204,14,95,-0.268232,-0.268351,-0.157529,-0.155342,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,...,-0.220204,-0.220204,-0.220204,-0.220204,,0.08308,-0.220204,0.689647,-0.220204,0.525303,-0.220204,-0.220204,-0.220204,-0.220204,,-0.165061,-0.220204,-0.054777,-0.220204,0.09551,-0.220204,-0.220204,-0.220204,-0.220204,0.0,0.606933,-0.220204,2.261207,-0.220204,1.432643,-0.220204,-0.220204,-0.220204,-0.220204,,-0.716486,-0.220204,-0.220204,-1.957192,0.764822,-0.153734,-0.157529,1.185778,-0.295304,0.098587,0.008182,-0.260861,88.205491,-0.34943,2.449515,-0.122974,-0.255157,4.696933,-0.34943,0.435576,-0.178605,-0.272568,2.292899,-0.34943,0.289099,0.037466,-0.180944,4.949989,-0.34943,0.489325,0.089641,-0.128006,3.431652,-0.34943,0.505257,-0.176696,-0.237664,1.85005,-0.347159,0.19064,-0.176696,-0.237664,1.85005,-0.347159,0.19064,-0.154565,-0.216576,1.11197,-0.347159,0.199849,-0.169672,-0.237664,0.964353,-0.338886,0.196454,-0.174981,-0.237664,0.964353,-0.34451,0.189041,0.358073,-0.071068,1.85005,-0.275622,1.001805,-0.25594,-0.275622,-0.157529,-0.334669,0.090195,-0.157529,-0.157529,-0.157529,-0.157529,,-0.217296,-0.216576,-0.157529,-0.277782,0.06013,-0.157529,-0.157529,-0.157529,-0.157529,,-0.145228,-0.157529,-0.032056,-0.246099,0.107551,-0.187052,-0.187052,-0.157529,-0.216576,0.041752,-0.182132,-0.157529,-0.098483,-0.290384,0.098288,-0.157529,-0.157529,-0.157529,-0.157529,,0.05082,-0.06896,0.639598,-0.216576,0.34495,-0.152082,-0.155342,0.998538,-0.273689,0.084684,0.005496,-0.272681,88.412333,-0.332847,2.445671,-0.125558,-0.258893,4.61164,-0.332847,0.436518,-0.182705,-0.272634,2.299942,-0.332847,0.287048,0.04052,-0.182146,4.105285,-0.332847,0.486959,0.089533,-0.128014,3.343851,-0.332847,0.506194,-0.183157,-0.244087,1.442485,-0.332845,0.183431,-0.183157,-0.244087,1.442485,-0.332845,0.183431,-0.161181,-0.228417,0.998464,-0.332845,0.196005,-0.178497,-0.24408,0.953988,-0.332837,0.19649,-0.182756,-0.244087,0.953988,-0.332842,0.183989,0.358907,-0.069765,1.863604,-0.288445,1.010832,-0.273649,-0.332773,-0.155342,-0.332833,0.102457,-0.155342,-0.155342,-0.155342,-0.155342,,-0.212584,-0.214506,-0.155342,-0.267905,0.056306,-0.155342,-0.155342,-0.155342,-0.155342,,-0.142401,-0.155342,-0.027773,-0.244087,0.108736,-0.184924,-0.184924,-0.155342,-0.214506,0.041835,-0.175068,-0.155342,-0.096179,-0.273684,0.090382,-0.155342,-0.155342,-0.155342,-0.155342,,0.037096,-0.135552,0.643365,-0.214506,0.352779
3,3,3,-1.543623,0,31,-0.501058,-0.502326,-0.237664,-0.269409,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-1.543623,-1.543623,-1.543623,-1.543623,,-0.302918,-0.220204,1.020501,-1.543623,0.624475,-0.881914,-0.881914,-0.220204,-1.543623,0.935799,-1.543623,-1.543623,-1.543623,-1.543623,,0.138222,-0.220204,2.178493,-1.543623,1.886767,-1.543623,-1.543623,-1.543623,-1.543623,,0.077565,-0.220204,2.261207,-1.543623,1.376133,-0.881914,-0.881914,-0.220204,-1.543623,0.935799,-0.294839,-0.305145,1.407202,-0.344289,0.06636,-0.058953,-0.242027,3.853412,-0.34943,0.50206,-0.132644,-0.275622,10.707018,-0.353121,0.498883,-0.134178,-0.275622,5.146811,-0.34943,0.54822,-0.139603,-0.231337,2.799011,-0.34943,0.258752,-0.160873,-0.246099,2.799011,-0.344938,0.253115,-0.160873,-0.246099,2.799011,-0.344938,0.253115,-0.255668,-0.300928,0.875784,-0.344938,0.115744,-0.255668,-0.300928,0.875784,-0.344938,0.115744,-0.262301,-0.305145,0.816737,-0.344938,0.10641,-0.208278,-0.237664,0.226273,-0.318771,0.105505,-0.15637,-0.280798,0.167226,-0.334669,0.237272,-0.214786,-0.283674,0.290454,-0.334669,0.185986,-0.237664,-0.237664,-0.237664,-0.237664,,-0.215362,-0.246099,0.226273,-0.334669,0.160221,-0.212358,-0.212358,-0.187052,-0.237664,0.035788,-0.237664,-0.237664,-0.237664,-0.237664,,0.008077,-0.237664,0.551028,-0.289133,0.470913,-0.237664,-0.237664,-0.237664,-0.237664,,-0.218709,-0.246099,0.000507,-0.334669,0.128307,-0.271405,-0.271405,-0.237664,-0.305145,0.047717,-0.298082,-0.303251,0.555477,-0.322881,0.033279,-0.058638,-0.244087,3.8931,-0.332847,0.505488,-0.135602,-0.273669,10.760287,-0.332851,0.500612,-0.137779,-0.297329,5.090554,-0.332847,0.548592,-0.14138,-0.236897,2.709957,-0.332847,0.257501,-0.166886,-0.267092,2.709957,-0.332843,0.250487,-0.166886,-0.267092,2.709957,-0.332843,0.250487,-0.263724,-0.303251,0.820914,-0.332843,0.110515,-0.263724,-0.303251,0.820914,-0.332843,0.110515,-0.26494,-0.303251,0.554886,-0.332843,0.102106,-0.208552,-0.236897,0.22922,-0.310084,0.103271,-0.158582,-0.291041,0.170057,-0.332833,0.239104,-0.223503,-0.332781,0.284534,-0.332833,0.190167,-0.269409,-0.269409,-0.269409,-0.269409,,-0.216807,-0.244087,0.22922,-0.332833,0.162665,-0.227167,-0.227167,-0.184924,-0.269409,0.05974,-0.269409,-0.269409,-0.269409,-0.269409,,0.004176,-0.269409,0.554619,-0.272681,0.4767,-0.269409,-0.269409,-0.269409,-0.269409,,-0.219748,-0.269409,0.006484,-0.332833,0.131752,-0.28633,-0.28633,-0.269409,-0.303251,0.02393
4,0,21,-0.220204,10,59,-0.547623,-0.549121,-0.334669,-0.332833,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,...,-0.716486,-0.261561,-0.220204,-2.122619,0.938232,0.259535,-0.220204,2.261207,-1.543623,1.120763,0.281986,-0.220204,2.261207,-2.039905,1.338234,-0.211933,-0.220204,1.020501,-1.047341,0.561601,0.027937,-0.220204,1.020501,-0.220204,0.55486,-0.92327,-0.92327,-0.220204,-1.626337,0.994286,-0.220204,-0.220204,-0.220204,-0.220204,0.0,-0.199526,-0.220204,-0.13749,-0.220204,0.041357,-0.323382,-0.334669,0.521505,-0.354351,0.04346,-0.000641,-0.216576,17.349745,-0.354351,0.663338,-0.143427,-0.25348,9.476884,-0.350133,0.447636,-0.029176,-0.268371,9.476884,-0.34943,0.923141,-0.162132,-0.275622,2.912886,-0.34943,0.283757,-0.148449,-0.275622,4.949989,-0.344062,0.318522,-0.098701,-0.237664,2.166371,-0.344062,0.336731,-0.098701,-0.237664,2.166371,-0.344062,0.336731,-0.231717,-0.275622,1.407202,-0.344062,0.132051,-0.246075,-0.297765,0.344366,-0.344062,0.117042,-0.246075,-0.297765,0.344366,-0.344062,0.117042,0.114741,-0.275622,1.141493,-0.334669,0.643237,-0.258114,-0.270128,-0.157529,-0.334669,0.073639,-0.12357,-0.214031,0.268449,-0.334669,0.26747,-0.210619,-0.289133,0.373889,-0.334669,0.186832,-0.058065,-0.305145,2.689935,-0.34943,0.797197,-0.157568,-0.312526,0.774561,-0.334669,0.355916,0.094402,-0.305145,1.604023,-0.334669,0.847093,-0.247234,-0.247234,-0.1598,-0.334669,0.123651,-0.231337,-0.231337,-0.128006,-0.334669,0.146133,-0.27586,-0.319907,-0.128006,-0.335621,0.09958,-0.332821,-0.332833,-0.331975,-0.332852,4.4e-05,-0.000649,-0.214506,17.416177,-0.332852,0.664832,-0.143601,-0.258883,9.527715,-0.332848,0.447,-0.030915,-0.27316,9.527715,-0.332847,0.925431,-0.167973,-0.273669,2.862054,-0.332847,0.281778,-0.154625,-0.273669,4.105285,-0.332842,0.313475,-0.102618,-0.244073,2.076063,-0.332842,0.334797,-0.102618,-0.244073,2.076063,-0.332842,0.334797,-0.236914,-0.273669,0.850703,-0.332842,0.121503,-0.247838,-0.30223,0.288443,-0.332842,0.114109,-0.247838,-0.30223,0.288443,-0.332842,0.114109,0.124034,-0.258893,1.146254,-0.332833,0.647908,-0.260931,-0.277774,-0.155342,-0.332833,0.075333,-0.145846,-0.212465,0.17438,-0.332833,0.220902,-0.207225,-0.272681,0.377129,-0.332833,0.186893,-0.056808,-0.303251,2.727317,-0.332847,0.805852,-0.156628,-0.313109,0.782817,-0.332833,0.358675,0.102999,-0.303251,1.639253,-0.332833,0.861939,-0.264548,-0.264548,-0.196263,-0.332833,0.096569,-0.229297,-0.229297,-0.12576,-0.332833,0.146422,-0.273669,-0.318042,-0.12576,-0.332834,0.099587


# lgbによる予測

In [52]:
target = train['state']

In [53]:
# 3分割交差検証を指定し、インスタンス化
from sklearn.model_selection import KFold
from sklearn.metrics import accuracy_score

kf = KFold(n_splits=5)  # 3分割交差検証のためにインスタンス化

# スコアとモデルを格納するリスト
score_list = []
models = []

print('input size is {}行, {}カラム'.format(len(train_df), len(train_df.columns)))
for fold_, (train_index, valid_index) in enumerate(kf.split(train, target)):
    train_x = train_df.iloc[train_index]
    valid_x = train_df.iloc[valid_index]
    train_y = target[train_index]
    valid_y = target[valid_index]
    
    print(f'fold{fold_ + 1} start')

    gbm = lgb.LGBMClassifier(objective='binary',num_boost_round=50000, learning_rate=0.1)
    gbm.fit(train_x, train_y, eval_set = [(valid_x, valid_y)],
                early_stopping_rounds=100,
                verbose= 100) # 学習の状況を表示しない
    
    oof = gbm.predict(valid_x, num_iteration=gbm.best_iteration_)
    score_list.append(round(accuracy_score(valid_y, oof)*100,2))
    models.append(gbm)  # 学習が終わったモデルをリストに入れておく
    print(f'fold{fold_ + 1} end\n' )
print(score_list, '平均score', np.mean(score_list), "%")  

input size is 9792行, 2497カラム
fold1 start
Training until validation scores don't improve for 100 rounds.
[100]	valid_0's binary_logloss: 0.431735
Early stopping, best iteration is:
[69]	valid_0's binary_logloss: 0.430195
fold1 end

fold2 start
Training until validation scores don't improve for 100 rounds.
[100]	valid_0's binary_logloss: 0.422785
[200]	valid_0's binary_logloss: 0.431981
Early stopping, best iteration is:
[117]	valid_0's binary_logloss: 0.419698
fold2 end

fold3 start
Training until validation scores don't improve for 100 rounds.
[100]	valid_0's binary_logloss: 0.423383
[200]	valid_0's binary_logloss: 0.432444
Early stopping, best iteration is:
[131]	valid_0's binary_logloss: 0.420504
fold3 end

fold4 start
Training until validation scores don't improve for 100 rounds.
[100]	valid_0's binary_logloss: 0.402257
[200]	valid_0's binary_logloss: 0.401789
Early stopping, best iteration is:
[125]	valid_0's binary_logloss: 0.396278
fold4 end

fold5 start
Training until validation

In [54]:
# testの予測
test_pred = np.zeros((len(test), 5))  # 行:len(test), 列:3のall zeroの配列を用意

for fold_, gbm in enumerate(models):  # 学習ずみのmodelをgbmに入れる
    pred_ = gbm.predict(test_df, num_iteration=gbm.best_iteration_)  # testの予測
    test_pred[:, fold_] = pred_  # １回目は0列目、2回目は1列目、2回目は3列目に格納

pred = (np.mean(test_pred, axis=1) > 0.5).astype(int)  # 平均をとって、0と１に変換

# submission

In [55]:
sub = pd.DataFrame(test['id'])

In [56]:
sub['state'] = pred
sub.head()

Unnamed: 0,id,state
0,test_00000,1
1,test_00001,1
2,test_00002,1
3,test_00003,0
4,test_00004,0


In [57]:
sub.to_csv('sub/14_lgb6.csv',index=False, header=None)