From 594fa47d5efcb64119ff899f8a982f13fc3182de Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Wed, 17 Oct 2018 19:05:39 +0000 Subject: [PATCH 1/2] Done --- __pycache__/__init__.cpython-36.pyc | Bin 141 -> 163 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 155 -> 177 bytes .../__pycache__/build.cpython-36.pyc | Bin 414 -> 331 bytes q01_load_data/build.py | 9 ++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 161 -> 183 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1525 -> 1547 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 156 -> 178 bytes .../__pycache__/build.cpython-36.pyc | Bin 660 -> 672 bytes q02_data_split/build.py | 14 +++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 162 -> 184 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3134 -> 3156 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 159 -> 181 bytes .../__pycache__/build.cpython-36.pyc | Bin 924 -> 744 bytes q03_data_encoding/build.py | 12 +++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 165 -> 187 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2197 -> 2219 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 157 -> 179 bytes .../__pycache__/build.cpython-36.pyc | Bin 1006 -> 1163 bytes q03_ohe_encoder/build.py | 18 ++++++++++++++---- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 163 -> 185 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1478 -> 1500 bytes 21 files changed, 46 insertions(+), 7 deletions(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index b0c3719c2f46201b3baa3fcef746c16a601c9e9f..423888ac994efa6162f7380336a29d9df9d2d32b 100644 GIT binary patch delta 57 zcmeBWT+GN}%*)GFA$&Y~B8RzZfPO}PZmND!Vs2$(c2Q<=MqXl`g_(YMeo=ODL1J>M MesX?F>O?<#0RQh3Hvj+t delta 35 qcmZ3?*vrUa%*)I5Qh!m@L=JO)EB%c8+*JMaqSVU7lKk9>DfR%jdkbO! diff --git a/q01_load_data/__pycache__/__init__.cpython-36.pyc b/q01_load_data/__pycache__/__init__.cpython-36.pyc index 4596200714efc1a2bd21ca0d0f36671155da8439..cedda302b131361af9e244d49a616e662cf41f2a 100644 GIT binary patch delta 57 zcmbQuxRH^=n3tEULil*}L=JP+IQ@+L+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNt+00>+YZvX%Q delta 35 qcmdnUIGd5fn3tF9rT(I*i5%wq9{L&ixvBc;MX8mECHc7%Q+xruJqwxu diff --git a/q01_load_data/__pycache__/build.cpython-36.pyc b/q01_load_data/__pycache__/build.cpython-36.pyc index 98e98a79cdf9a026efe48fdde2a84d1da49836cc..8c55f6b27936036c36f65bfa9e222d26f7bce246 100644 GIT binary patch delta 227 zcmbQoe42^Vn3tEUO89v6zKNVp^^6P*3@kwG48+BJK%#^pi?N0wg)xPxmnoP*liBYV zqqQdEE#~6X0!^k{Oa&=X97U;#De=k0Wk6w;g2a-Hl?+8}K%Kv$^)vEwQ}v4yb1M_G zi!zHd@)Gkb%=E+ai?WLg5|dN)lk-zj^>a&eN;1n5i!u{SQsXB}GMf0ZgY0Gk5)6z* s96(Z&`4(G2VqQvOaS_OAU@@=_NCZgFEe@O9{FKt1R6CGnun8Qj0Gcm2F8}}l delta 296 zcmYjNJ5Iwu5Z&1|j-3xBXJD%oNHicMf@qNtsoYo#GY~9qZ0#-*NI{&yMJ_;rM8O@n z0XNu|DpyFwI2FY_&AidPnKwW3UFAoU$?)^|qxfCtvo|S(NH{Jy{2@aS6|4jT%1*w* z3Mz>T6Wr@$r7*=o2R(Zubau6c6Ae*$YB#`>n*oECF}Zig9Vq;4mOrW`jB0<-* zI*GEyV(7?V8O-f@O)>Sxwlx(aN1j6YxI}vHWm*#!MUEyI7PRyw+=v%!FQ<#f()7X6 ziwTWgf6uOa13qOCunz~|CY)&%)0R&#-ep|wxSha17;__Lr?$bTn$CI;zW+z2{s7B( BOcMYA diff --git a/q01_load_data/build.py b/q01_load_data/build.py index 7cd3700..421b7a2 100644 --- a/q01_load_data/build.py +++ b/q01_load_data/build.py @@ -1,4 +1,11 @@ +# %load q01_load_data/build.py import pandas as pd # Write your code below - +# path = 'data/student-mat.csv' + +def load_data(path): + return pd.read_csv(path, sep = ';') +# load_data(path) + + diff --git a/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc b/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc index d07fd2f92eb40b45050574e400ae0ba39249b5e5..6e6da1276c4949c55a827ab9dbdab5683f3c1cef 100644 GIT binary patch delta 57 zcmZ3;xSf&1n3tEUM)-L2L=JP+6#b0++*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNt<01UDdivR!s delta 35 qcmdnaxR8;q5 diff --git a/q01_load_data/tests/__pycache__/test.cpython-36.pyc b/q01_load_data/tests/__pycache__/test.cpython-36.pyc index 9aa6996833ac66f36d6c99e9f80a514b1a8a8440..d4d20046aa1c5169b72585406a15a3a8b9094300 100644 GIT binary patch delta 59 zcmey$-Oa;c%*)GFBYZr1Bgacd)dc;F{M=OiqQu delta 38 tcmeC?`O3{<%*)FqWWFeBBgacdelPuu{M=Oi^rFRq0+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNt600{LHa{vGU delta 35 qcmdnQIERtLn3tF9rT(I*i5%wqp86U2xvBc;MX8mECHc7%Q~UtDlnb5! diff --git a/q02_data_split/__pycache__/build.cpython-36.pyc b/q02_data_split/__pycache__/build.cpython-36.pyc index e6bd2ebf2f76eee17541ce631c667ecb332558ff..76b1e39e89e4ed65a87c16f264b2acf43198e024 100644 GIT binary patch delta 366 zcmYjLJxc>Y5Z&3^`wExT20Od6IWQn1qGiCsM$othjwN$3XL29xonT}S3oT6%VxyIR z!(ZTkxPK7rEUny2%^*anESrP?OBy%y9aWP3ndaxf{W^!8OViX0V45QTx^tW6s zFB}bocEF)qRCYA?-PJeXskAh&tz0J&MNM;*P0)=(Hh=y>yHPqvNrrc`=$Ptm6cM~Ibxv;lFB70b9N{bj9 z1ws4;f5FCI*gr^XX`_2rg9lvtRxg*b2%Kw6mKtw2N%>7I+QmO*Ujy1+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNt901Chpe*gdg delta 35 qcmdnWIG>Tjn3tF9rT(I*i5%wqKKdE?xvBc;MX8mECHc7%Qvw0KnG31_ diff --git a/q03_data_encoding/__pycache__/build.cpython-36.pyc b/q03_data_encoding/__pycache__/build.cpython-36.pyc index 302366cb1c8d346c67f347e326ce7abc487c2dcb..18640a0e2bbe501cadec72acf7c5482bf8dd46a1 100644 GIT binary patch delta 320 zcmYjNy-LJD5Z;|!ez}NXEp|exEri2DZ0v0;lvo_gWy9qz*(|#`A&~Qmdjd)83)tBC z41$gQK7r3*bNJ=QXK9+eJ-*-Xp5l+4M+gDTD@=2W(2+ga!a!DZ zfEDcNmJIZd(*dgzZb(M2Gfz)YpZi>?y3fgJv1(v+=kGS7y0uB@aDkO z5zc(i*|Kc})BL#U`C3utxpR{Q0+`Y%=wy6= zSC#v6)2QBpR5nmt7Tj1+g@vNjKB{$qV8i~`2@-Uo6W4O<{z2@N(M8i1n_67DmzV5MC zwX(DEL3o61ZS)naoFzgallf=%xAXaJy*b6xN~P2|dvAZe78g?!A!LDHfXf$<49(Dl zj7AxzI7b6Q$swANOLR{sMrI65U=}605onHOJtqTu$qZ^dulY7+l_1PIR~clx~%(v*kH diff --git a/q03_data_encoding/build.py b/q03_data_encoding/build.py index bb4c8ca..283b82b 100644 --- a/q03_data_encoding/build.py +++ b/q03_data_encoding/build.py @@ -1,3 +1,4 @@ +# %load q03_data_encoding/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset from sklearn.preprocessing import LabelEncoder @@ -5,10 +6,19 @@ import pandas as pd df = load_data('data/student-mat.csv') -x_train, x_test, y_train, y_test = split_dataset(df) +X_train, X_test, y_train, y_test = split_dataset(df) # Write your code below +def label_encode(X_train,X_test): + + le = LabelEncoder() + + X_train = X_train.apply(le.fit_transform) + X_test = X_test.apply(le.fit_transform) + return X_train, X_test + +# label_encode(X_train,X_test) diff --git a/q03_data_encoding/tests/__pycache__/__init__.cpython-36.pyc b/q03_data_encoding/tests/__pycache__/__init__.cpython-36.pyc index 7d18c185f615d8dacd541c2aac10e2127c6a6058..c084ebf12f5a9ad01b907e6a357b64d84a9fa352 100644 GIT binary patch delta 57 zcmZ3=xSNr~n3tDpd)@Kqi5%vt8TuLdxvBa^iMf@D*+rSf8F`6$7H0b4`9;~q1&PV2 M`pNkzsT2Le0WHfEK>z>% delta 35 qcmdnZxRjB@n3tF9rT(I*i5%wqLHZf_xvBc;MX8mECHc7%Q^EniqYJ_S diff --git a/q03_data_encoding/tests/__pycache__/test.cpython-36.pyc b/q03_data_encoding/tests/__pycache__/test.cpython-36.pyc index 8ade2b73d89dd5f9591f59a4f4d14aa50d93bd2e..6faf62bd22873e799b74c5a08b681fea2f72db60 100644 GIT binary patch delta 65 zcmbO#xLT0In3tDpd)@KqjT{P0YAN~|`MIh3MTxnUiP=S&#Tj{tc@}2+;rT_`#RZAU Vsrt$JDXIFCU$V<@4rj7s0|3ja7Bm0= delta 43 zcmZ22I8~6tn3tDJ*J4rBMh*og0YCkW{M=Oi^rFkFa) diff --git a/q03_ohe_encoder/__pycache__/build.cpython-36.pyc b/q03_ohe_encoder/__pycache__/build.cpython-36.pyc index 1433b7bfe437842ddac619a606d8eb33eef1b873..dc2b7838d18207c9ebb7074bfb898905974df371 100644 GIT binary patch delta 650 zcmYjO&1w`u5bmGZ`Ps~FHa{9c)I(5Mg4shrJctnz^Z^1I+UU~R?#<3-=ZBtIaAB4R z6Y&r{taJ4(d;pKW!(7Fy51vI{DF&9z_96HBy2TdazXa+G^X^qOAR{&=IH z1wABCx2ZRWRC%g-NyQD-I3nGZ#g_*ye)m**#NG4v)V8Jvfc70drJ>6+S=YmyKl8lIZ!YSO-s*M~1*6Z`;*Jq=Pu?vD{Z|ZK z%vLw|geQq~PJB@ZDr-|J0^kr#=}$*AL?|NBl&R;*+w;$>i9_?4uek)NBY zUzC_znV4OaS)7rVm}g<8AD&;7U0jfuoT{IkpOQLxE@K!Y|Ku->pSeMrz&eZgCVyh; zU=*BO&1}dhGR=U7DzPG delta 243 zcmcb^eTR;*+w;$vW7_~oOYk)NBY zpI($&nOKsat3O$RRethiMl(i%$y`jIxj|~c3XAwBb1-)>3QeBKY-lJ96urfloLG{Y zo?lcMpP84ET5*fHxTHvvsYn#0LkzABYykh{&&+v-;vhjOR2hggNK6n&@B(o$3y|Po g;$SHfoIHu;kBSILk_$vgfC!K>h=Y)wwuw~>0EbC5N&o-= From a36c4473273e8494ddec22812ea6bbd09c1195cb Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Thu, 25 Oct 2018 17:12:49 +0000 Subject: [PATCH 2/2] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 164 -> 186 bytes .../__pycache__/build.cpython-36.pyc | Bin 921 -> 904 bytes q04_data_visualisation/build.py | 14 +++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 170 -> 192 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1259 -> 1281 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 169 -> 191 bytes .../__pycache__/build.cpython-36.pyc | Bin 810 -> 811 bytes q05_linear_regression_model/build.py | 14 +++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 175 -> 197 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1588 -> 1610 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 162 -> 184 bytes .../__pycache__/build.cpython-36.pyc | Bin 1086 -> 1018 bytes q06_cross_validation/build.py | 9 +++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 168 -> 190 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2082 -> 2104 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 161 -> 183 bytes .../__pycache__/build.cpython-36.pyc | Bin 1168 -> 1190 bytes q07_regression_pred/build.py | 12 ++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 167 -> 189 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3674 -> 3696 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 158 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 1359 -> 1382 bytes q08_linear_model/build.py | 13 ++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 164 -> 186 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3958 -> 3980 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 192 bytes .../__pycache__/build.cpython-36.pyc | Bin 1339 -> 1329 bytes q09_advanced_model_q01_lasso/build.py | 12 ++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 176 -> 198 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 4099 -> 4121 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 192 bytes .../__pycache__/build.cpython-36.pyc | Bin 1339 -> 1364 bytes q09_advanced_model_q02_ridge/build.py | 13 ++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 176 -> 198 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 4079 -> 4101 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 165 -> 187 bytes .../__pycache__/build.cpython-36.pyc | Bin 911 -> 842 bytes q10_data_missing_values/build.py | 9 +++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 171 -> 193 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2358 -> 2380 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 177 -> 199 bytes .../__pycache__/build.cpython-36.pyc | Bin 1081 -> 1100 bytes q11_feature_selection_q01_plot_corr/build.py | 35 +++++++++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 183 -> 205 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1488 -> 1510 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 183 -> 205 bytes .../__pycache__/build.cpython-36.pyc | Bin 1715 -> 1472 bytes .../build.py | 15 +++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 189 -> 211 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2604 -> 2626 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 163 -> 185 bytes .../__pycache__/build.cpython-36.pyc | Bin 995 -> 1048 bytes q12_feature_selection/build.py | 10 +++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 169 -> 191 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2699 -> 2721 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 160 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 556 -> 1373 bytes q13_plot_residuals/build.py | 36 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 166 -> 188 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1475 -> 1497 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 158 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 2166 -> 2115 bytes q14_benchmarking/build.py | 18 +++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 164 -> 186 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2092 -> 2114 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 1461 bytes q15_select_best_model/build.py | 16 ++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 191 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1994 bytes 69 files changed, 210 insertions(+), 16 deletions(-) create mode 100644 q15_select_best_model/__pycache__/build.cpython-36.pyc create mode 100644 q15_select_best_model/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q15_select_best_model/tests/__pycache__/test.cpython-36.pyc diff --git a/q04_data_visualisation/__pycache__/__init__.cpython-36.pyc b/q04_data_visualisation/__pycache__/__init__.cpython-36.pyc index d44a511ba9fc7f538b045ab1a267d7e0fc7a3439..179b2e1bba03dfb312194037f1b69457eaada21f 100644 GIT binary patch delta 57 zcmZ3&xQmg)n3tEULil*}L=JP+bp4F{+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNs!01dqplK=n! delta 35 qcmdnRxP+0zn3tF9rT(I*i5%wqf%+NwxvBc;MX8mECHc7%Q^EkhObfmM diff --git a/q04_data_visualisation/__pycache__/build.cpython-36.pyc b/q04_data_visualisation/__pycache__/build.cpython-36.pyc index 2bfbd4e9d4e48bf9ff2e2bf665199d203cc772e7..c689d6ae2bd4f6a5cf7bd06a37ec4162108458b6 100644 GIT binary patch delta 299 zcmbQq-oegk%*)I5cFOVSClfjUO2{xUFqAOVFr+Z1u%SJ(#FrE$X6D^u z12R&JOK!1O!UTW}pa57m*nT8}8>E%PCO1E&G$+-L3CJrJ01`ZmK*+?!$ivLRD8R_a F3;=bHPB8!g delta 317 zcmeBRpUKW?%*)HQ-eOVIhKZbiqxBdV7)ltj7@HXw8A_OH7*ZHhSW}o&SbAB2e1|&6-EOo9-wS72asT3 z_!fIbd`VGaX5K9}AS1Q7Xsv+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsE01;CYs{jB1 delta 35 qcmX@WxQda(n3tF9rT(I*i5%wq;rbc*xvBc;MX8mECHc7%Q(^$YRtweu diff --git a/q04_data_visualisation/tests/__pycache__/test.cpython-36.pyc b/q04_data_visualisation/tests/__pycache__/test.cpython-36.pyc index 5353356812e3190f1d8c90fdc95d0d7f053a87cf..3788e3c16b103874295603dbfd0fb234a860e037 100644 GIT binary patch delta 98 zcmaFO*~rCV%*)GFA$&Y~BZm`{TBd$Rer~FMQDSaoVs=qxaYkNZo`soycz#iKaY15o us(x~QN~-?k^~~~{E17mO%0vm~CYBWB=>(P8D(w><|dXD}6qdOFWTG0K diff --git a/q05_linear_regression_model/__pycache__/__init__.cpython-36.pyc b/q05_linear_regression_model/__pycache__/__init__.cpython-36.pyc index 06a2a9b901d2940b1616332fc3af2e6292737630..c1dab24092e8299fbc3ded00c931aee34583c199 100644 GIT binary patch delta 57 zcmZ3n3tF9rT(I*i5%wqVfq>QxvBc;MX8mECHc7%Q=$RD{|nLp diff --git a/q05_linear_regression_model/__pycache__/build.cpython-36.pyc b/q05_linear_regression_model/__pycache__/build.cpython-36.pyc index c40d112c5d846cc979296e4912c2f11a9f286eee..59af3126d366fc94a24085fc3340418561c81338 100644 GIT binary patch delta 280 zcmZ3*wwjI8n3tDp_4MP>D<*P2uV-OkU|?+%?!0nHB4EIH4HV3%}lk- zHO#>bnv8y$Ohq8YQOs$XC7LX^7$a^mRz|VqWabs6rr%=C%}+_qS;rKN+Z6KesfeWbz~?>B*gp7Lo!W``Lg5 z10x$F4`UHGkmaYzcgudV0+Zfk4yI!O#6 delta 280 zcmZ3@wu+6@n3tF9y~U!a%!!=O>zNrC7(mz=h>N9wL!m?BZeMVFF zHZue>XfpdnF%=nUGDfi%C+8Ps=A~;g6@hd{vE-&E=4rCrV$ID@NzJ*%7;%fSGK!jy1+*JLd#N5in?4r!#jJ(7=3p4%j{34$0;)2BFRQ+V2cKykx zndB#{Gg*m=gB-*HBp8?k7>js;w5G@{`^o#6^foVNQe|Yh#gtbt`69Er1_w|IEDyE^ ZiQoZB+~TkSx~eoM)sAVh0*fpo3jmQsKxhB} delta 312 zcmYj~Jxc>Y5QcYlZ|_4AL=-fISn4$%m_ih>u~i!zxh5RhHRimJu)7L@6N}VW-9NCi z6np=I{bDWTFQjr78yV(dKHhm}6?}%#u-{)hK6y;+yazok~uh|nA)%!=~*!~+V)gdiMkwVlNo8L zI>Id-Kc#^l*J@f#V&Bs0YG(aEo%OVoLOC1dBdk}-tcpF$%Ua07!mWk5N4E zM#<_jxvxu^Oq85wrY@82i|%zlaJsRDTkTv3^f1)mBcUm9wT_dnW%~!4Sg3)6Gx~=e SY;AakKOYNu4&67~1^Np^4^Ykk diff --git a/q06_cross_validation/build.py b/q06_cross_validation/build.py index 406a734..d2d414d 100644 --- a/q06_cross_validation/build.py +++ b/q06_cross_validation/build.py @@ -1,3 +1,4 @@ +# %load q06_cross_validation/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -18,4 +19,12 @@ model =linear_regression(x_train,y_train) # Write your code below + +def cross_validation_regressor(model, X,y): + r2_score = cross_val_score(model,X,y,scoring='r2') + return r2_score.mean() + +# cross_validation_regressor(model, x_train,y_train) + + diff --git a/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc b/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc index b571b36039256ecb659b19941ead2c342e31d840..d696aaacf2dcaade5daf1d204fcbbfb09427c841 100644 GIT binary patch delta 57 zcmZ3%xQ~&;n3tEULil*}L=JP+Z2gS<+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsk01zP)qW}N^ delta 35 qcmdnTxPpj diff --git a/q06_cross_validation/tests/__pycache__/test.cpython-36.pyc b/q06_cross_validation/tests/__pycache__/test.cpython-36.pyc index e065247889afd73fa150bc5ca136b8b2492d5d10..b41c1362a9edbee1d5cce0c310cca930985e5cd0 100644 GIT binary patch delta 279 zcmZ1^utR{un3tEULil*}MvhaAj8U5}GYT^kE-pw+PSsD&Pf69Ee1J`Uvm~<|qkte#QxQlfgbp^lR*hJCE|JbbnQ0_M> diff --git a/q07_regression_pred/__pycache__/__init__.cpython-36.pyc b/q07_regression_pred/__pycache__/__init__.cpython-36.pyc index 3e7e4674f103511456d5015475ef0cbf23edade2..1d41f19fee7a8218dd632e604f7b7a4f16eab144 100644 GIT binary patch delta 57 zcmZ3;xSf&1n3tEULil*}L=JP+6#b0++*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNt<01NUHhX4Qo delta 35 qcmdnaxR8;q5 diff --git a/q07_regression_pred/__pycache__/build.cpython-36.pyc b/q07_regression_pred/__pycache__/build.cpython-36.pyc index dfa0411c934d2ac90e55ee4d32c73e0e7f34e120..d8af45c117d8cfc5c81582cd2bca0ddaca4d4e76 100644 GIT binary patch delta 113 zcmbQhxr~$3n3tF9(Zb`=iwhEy zQ}vVcQ&ROOJ2J~pwqP>mmSA9DDCPnZ3{0ELn0_0p8x;= delta 35 qcmdnXxSWy0n3tF9rT(I*i5%wqA^I8lxvBc;MX8mECHc7%Qz8MtQ47id diff --git a/q07_regression_pred/tests/__pycache__/test.cpython-36.pyc b/q07_regression_pred/tests/__pycache__/test.cpython-36.pyc index 203c5fffc9b57db56ac2473265e2f03506fa63eb..95935bda1986d1decc9f7720ed53dfefd5d982e4 100644 GIT binary patch delta 225 zcmca5^FfBgn3tEULil*}Mh;_UwKV;V{M=OiqQuJ8KWlWv;1e2nw-!2lued_fuRV*RGeJRb{N5x+8oDznvqck zC?hr5fQx;yH|J3{RghwNsL&Y*R}sinn5@K|sUi)Ml>-q9AVLX5sDKDH5TOntG$ya- eE@q6{tju$pQ9uSHA`c=IK?EOAPJFT|pD6$le>e63 delta 181 zcmew$b4!N9n3tF9rT(I*jU2|z`~mtI`MIh3=|!oPi6!~Dn-iE-7#VL(Ze{t;C_TA= zO>y!v)+20k3=9lKAnp?cQ)+Vw`)Ni-*~t!^&)C#J3KW1$#mT;0MjZ?=vjS diff --git a/q08_linear_model/__pycache__/__init__.cpython-36.pyc b/q08_linear_model/__pycache__/__init__.cpython-36.pyc index b91b141617b95b635e59b43a1e9967e108638c18..47d323d760c30b26894cc3f8f1055b06296aa350 100644 GIT binary patch delta 57 zcmbQoxP_6!n3tEULil*}L=JP+ME#8X+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNrp0177)djJ3c delta 35 qcmdnOIFFITn3tF9rT(I*i5%wq-ufB&xvBc;MX8mECHc7%Qvv|JLJOt< diff --git a/q08_linear_model/__pycache__/build.cpython-36.pyc b/q08_linear_model/__pycache__/build.cpython-36.pyc index 438fb9485b4b16efb7c4d78b935df99cb4da3c8f..13ab053703c02056a11f0063650aeb7992f97775 100644 GIT binary patch delta 420 zcmYk1yGjE=6oz+ZXZDr^uMth7AYK-W1qHDPHj1SnDuRk(*qtPr-E5qh2!UBFQd`JA zg_VdeVP`)NkkSXRa>ha|&Ijil{{Q^vGnfSaPOTQKlaDL@=HG+Iie*`jt^-~COhZ`G zl5h+QB!EN`NPBEwqXHLB;TE2N!v5Xcg)h(@mcDd_BfU22fCMBku@lrm34Ve_pw(Cg zZTr*;o#RVCW;y4r2a+l~BUB-lajKe-ZHGX)ah?vdJ`Y`nbq3}dm{)QLJx8Y5Qg{T_P&y6)L_yHis&^7C^jM%8pO&%3n2*M$gVMxGjVSf1G`wHwz}5J z&QkmV_BQtW1M(xRoVC(o9)@>jcxPr7f5p*ur4n!KzI0aKqFek}MhG#8Lx}toppZtI zOo{On*4}SU4O0Yitm%|qc*Zw@2~DJ#4s@s^j-NdfD|+qen3F!{^of`f^!vJWNzYK? zog|)Rz3zQFv^2{FAQhI#Es2}pm|)8WH(Wd5iq~GIGtaLkZ9cvPqW@ddjj~r7C|#av9|B&+3by#p%1Xz}hxPUw07+G`b{{>{jY0mQx>TWRH PgUP$0*vG{ITf_7Rlh9hU diff --git a/q08_linear_model/build.py b/q08_linear_model/build.py index 85d49da..22f94d1 100644 --- a/q08_linear_model/build.py +++ b/q08_linear_model/build.py @@ -1,3 +1,4 @@ +# %load q08_linear_model/build.py import pandas as pd import numpy as np from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data @@ -17,4 +18,14 @@ # Write your code below - +def linear_model(x_train, x_test, y_train, y_test): + + G = linear_regression(x_train, y_train) + y_pred, rmse, mae, r2 = regression_predictor(G, x_test, y_test) + val = cross_validation_regressor(model, x_train, y_train) + stats = pd.DataFrame([(val,mae,mse,r2)], columns = ['cross_val','mae','rmse','r2']) + return G, y_pred, stats + +# linear_model(x_train, x_test, y_train, y_test) + + diff --git a/q08_linear_model/tests/__pycache__/__init__.cpython-36.pyc b/q08_linear_model/tests/__pycache__/__init__.cpython-36.pyc index 5f231d25458b7d9ddd095d46081a461751daeff2..de7c851b239d68fa481b8446179a881d1c156584 100644 GIT binary patch delta 57 zcmZ3&xQmg)n3tEULil*}L=JP+bp4F{+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNs!01dqplK=n! delta 35 qcmdnRxP+0zn3tF9rT(I*i5%wqf%+NwxvBc;MX8mECHc7%Q^EkhObfmM diff --git a/q08_linear_model/tests/__pycache__/test.cpython-36.pyc b/q08_linear_model/tests/__pycache__/test.cpython-36.pyc index cbaeda35dafd76d9b3875e0d9e56e950079bc591..767e28052a1a6f7ee96a602d4db23d1528b2feec 100644 GIT binary patch delta 78 zcmew+*CWqi%*)GFA$&Y~BS##wTC#pder~FMQDSaoVs=qxaYkNZo`soycz#iKaY15o is(x~QN~->3Szh_gQ<*b48KXA;=MiOMjG8RUp9lc`5E*X( delta 56 zcmeB?|0c&_%*)H=Yqcn9BS##wfUkZ=er~FMdQoa+Vo83k{^SF^@|#yPXL2&$+APW| M%EWkUvNnGr0QC+L*#H0l diff --git a/q09_advanced_model_q01_lasso/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q01_lasso/__pycache__/__init__.cpython-36.pyc index b8b8fc73c23c3602d2cc8046c670d9178deb30ae..240d92c77db314282892da501b67d9f8e98ecbcb 100644 GIT binary patch delta 57 zcmZ3*cz}_^n3tEULil*}L=JP+T>Xsv+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsE01;CYs{jB1 delta 35 qcmX@WxQda(n3tF9rT(I*i5%wq;rbc*xvBc;MX8mECHc7%Q(^$YRtweu diff --git a/q09_advanced_model_q01_lasso/__pycache__/build.cpython-36.pyc b/q09_advanced_model_q01_lasso/__pycache__/build.cpython-36.pyc index ad763a5d1b8809864ca92cb9383d06dcf0025f16..8b1b5d639ef429609eb9d72c71f160bfb6338fe4 100644 GIT binary patch delta 348 zcmYk0KTE?v7{>2kk|u3Mw1U`TaVc~$prReb)lJY2LLADGOIzC{7w%G_a2<+sr+f;> z;-+7~#V>G+-^0nfOCQY=dxc{%febOs2y-Tcxf`^qD@S>%KE^}P_wM>oJ2Wk(H1cD?r5wG`RO5^$8i})r zh)gCX;>A2&WV!6uglo=4)hW6k!ds1P+Fgzck+2Axtf-r|Xc%Zmmb8>_KpYwMI}4{g zOF}`jC7p|BIn8N4xC|e;n9G93Nf>jMgw+~%s~^-m)=o;LX8nAA`*wg$bJpS@)CfXZ`PP9)5+vLA4rAkKa45^MKU0K}SoXj#xMg~=~Y CXj&ow diff --git a/q09_advanced_model_q01_lasso/build.py b/q09_advanced_model_q01_lasso/build.py index c832d59..77fec51 100644 --- a/q09_advanced_model_q01_lasso/build.py +++ b/q09_advanced_model_q01_lasso/build.py @@ -1,3 +1,4 @@ +# %load q09_advanced_model_q01_lasso/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -20,4 +21,15 @@ # Write your solution here +def lasso(x_train, x_test, y_train, y_test,alpha=0.1): + G = Lasso(alpha = alpha) + G.fit(x_train, y_train) + val = cross_validation_regressor(G,x_train,y_train) + y_pred, mse, mae, r2 = regression_predictor(G, x_test, y_test) + stats = pd.DataFrame([(val,mae,r2,np.sqrt(mse))], columns = ['cross_val','mae','r2','rmse']) + return G, y_pred, stats + +# lasso(x_train, x_test, y_train, y_test) + + diff --git a/q09_advanced_model_q01_lasso/tests/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q01_lasso/tests/__pycache__/__init__.cpython-36.pyc index 80296f75275fe1779be1cb1510cdcbebf24a3c57..580b97b43fd9da72cadaffbb63a6a9784e75daba 100644 GIT binary patch delta 57 zcmdnMc#M(5n3tEULil*}L=JP+V*QN#+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsc02JvH!vFvP delta 35 qcmX@cxPg(wn3tF9rT(I*i5%wqvHBVLxvBc;MX8mECHc7%Q<4C~U<>X5 diff --git a/q09_advanced_model_q01_lasso/tests/__pycache__/test.cpython-36.pyc b/q09_advanced_model_q01_lasso/tests/__pycache__/test.cpython-36.pyc index 3d92981a85fdfdd93eb4850d6b323ecab8bd7161..be1b7b72ad26fadc865297fc82dd5aad186fb9d4 100644 GIT binary patch delta 200 zcmZoxn5n>F%*)GFA$&Y~BZnumYQBC(er~FMQDSaoVs=qxaYkNZo`soycz#iKaY15o zs(x~QO6ukWW<6%csLlOsFPIorH&<}7GIDD%FfbIUf(Y%&y*yHr7jfOk5L?E52Tg2} zyb4H*I*8B&5jr434@BsL2!qXbyvG^EqFD1va|5`hjWE>fRt$UlV}Y^@+j Pt@z}L9Kw?y^P2$xX@xgN diff --git a/q09_advanced_model_q02_ridge/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q02_ridge/__pycache__/__init__.cpython-36.pyc index 222893d6c4bc0f716c4fdbff600e66340545b3cd..60aedf7349109ef3c4c3c5a65c36f9b80b3bd3b8 100644 GIT binary patch delta 57 zcmZ3*cz}_^n3tEULil*}L=JP+T>Xsv+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsE01;CYs{jB1 delta 35 qcmX@WxQda(n3tF9rT(I*i5%wq;rbc*xvBc;MX8mECHc7%Q(^$YRtweu diff --git a/q09_advanced_model_q02_ridge/__pycache__/build.cpython-36.pyc b/q09_advanced_model_q02_ridge/__pycache__/build.cpython-36.pyc index 29083a5660093320a13d952ea9eeaf0c4458cabd..5352fe7b0b3d0c039d0d885b98e6d7cd7de67c0c 100644 GIT binary patch delta 369 zcmYk1yGjE=6ozMZ_MVG~QG^(SO(2a63Th!X7J`MK5rnk}!_MToH_jwNWJQ9t)jox# zSo#81R#wya0KS2hGo2jx;Q#s0?cM+Kz5QCvKmYu={dx5m#*;F|r;mkK_%nOr6z&rq zm_y7=W-*&NLzB7B#zUpB3a6+HNDp#NF^cCMbF0#?eU86B=E3mO{h8XFod4SmBuY$++- Q<0NDAn4cJB(`sY$5Bm^g9{>OV delta 347 zcmYk1Jxjx25XW;*UYevyEvWbsu}+0d1-q3Zh@Ze05W0lW=P_2Aq+C+5kWS7{*~Cd) z9L3SE;q-umU&6u3dpgN+Ke+#K_rLpeKU}Bp`|iu&d9-|UH~_CRIO&$wO{22!p>ish z8&3u|6X4bZTQ)1RYE;cD{agzh^%n#~>0zAlJdKJnE=6caa~$2qQ)ysY2&t#BkPHtI zG))UZnv;x+yU<39YFYQ$>9L6uo(S}nU@f8<3O>?l7S~9@wvtV?yLi=bpQ_)B-gTae zUV>r~mwDQ&zx7W2!@7GIPqldJxkVCg qE9@xjDyTgxuYc%}ChcLG^Z8U9sdoxB<*`+ej}0~>KW4KwYq39_K2d1^ diff --git a/q09_advanced_model_q02_ridge/build.py b/q09_advanced_model_q02_ridge/build.py index 0fb3e1a..14ee6e0 100644 --- a/q09_advanced_model_q02_ridge/build.py +++ b/q09_advanced_model_q02_ridge/build.py @@ -1,3 +1,4 @@ +# %load q09_advanced_model_q02_ridge/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -20,6 +21,16 @@ # Write your code below - +def ridge(x_train, x_test, y_train, y_test,alpha=0.1): + + G = Ridge(alpha = alpha, normalize= True, random_state=9) + G.fit(x_train, y_train) + val = cross_validation_regressor(G,x_train,y_train) + y_pred, mse, mae, r2 = regression_predictor(G, x_test, y_test) + stats = pd.DataFrame([(val,mae,r2,np.sqrt(mse))], columns = ['cross_val','mae','r2','rmse']) + return G, y_pred, stats +# ridge(x_train, x_test, y_train, y_test,alpha=0.1) + + diff --git a/q09_advanced_model_q02_ridge/tests/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q02_ridge/tests/__pycache__/__init__.cpython-36.pyc index 602e1f5d5c4f60e2bd8813680dc29fba2e27d856..cdef0de364231a417488cf62822833d41c492b21 100644 GIT binary patch delta 57 zcmdnMc#M(5n3tEULil*}L=JP+V*QN#+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsc02JvH!vFvP delta 35 qcmX@cxPg(wn3tF9rT(I*i5%wqvHBVLxvBc;MX8mECHc7%Q<4C~U<>X5 diff --git a/q09_advanced_model_q02_ridge/tests/__pycache__/test.cpython-36.pyc b/q09_advanced_model_q02_ridge/tests/__pycache__/test.cpython-36.pyc index 37f31c3afe884d721a91308abc3e21f01dc3af87..603ba9ecb9fa9de8b44c101ad274536f522f3050 100644 GIT binary patch delta 208 zcmaDa->Sf2%*)GFA$&Y~BZnumYQBC(er~FMQDSaoVs=qxaYkNZo`soycz#iKaY15o zs(x~QO6ukWW+`UIsLj=EFPIorH>Ys2GIDD%FfbIUf(Y%&2^>8+2Yx6|5 z7fg(5o2xik8M(C?7#NDwK!ncZejcgGOStZ1h^^qhgC;gfUKON814L+n2wf1N4XT*pr?7#o6rAk9D?a%gzc~Q?vN6j5 diff --git a/q10_data_missing_values/__pycache__/__init__.cpython-36.pyc b/q10_data_missing_values/__pycache__/__init__.cpython-36.pyc index 9f50df257f7dadafbe3ce884c55c000ecc154d68..3f4c741a47c2dd333dba6ae87e587e46493a296f 100644 GIT binary patch delta 57 zcmZ3=xSNr~n3tEULil*}L=JP+4E>D!+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNuK01j3YmjD0& delta 35 qcmdnZxRjB@n3tF9rT(I*i5%wqLHZf_xvBc;MX8mECHc7%Q^EniqYJ_S diff --git a/q10_data_missing_values/__pycache__/build.cpython-36.pyc b/q10_data_missing_values/__pycache__/build.cpython-36.pyc index 5c075f43b94e582040d94a38ff22b71e81107625..5e9f8f87792f07861ba4588c43d9c31988c179da 100644 GIT binary patch delta 281 zcmeBYKgFhO%*)F)?cRy#BTNhoj~S2v3y|#q#KlDul?&NYSb`ZeIVWC-uw@2{0o5`% zgXCm@L=8h0Lo-7yBamh+Vaj4|W~^nZVXR?FV*+Yn^wVUy#gUR)oLrQdlo~ZTmQm7? z`4)Rcd`VGaW?m5+P=65zkXXr3#08{&rRrzo=ceixCFWKpW*21^XXGX3S(xdE=NDxc z7bGU9>L=%?q)wj5=qJVxR9+0y&%nsR$irB~17v9mO%`PO$;%F8-eO8gE8+w)CQCC* iX@Dfb79bJaAXOYTx%nxjIjMFaFBJ<-E?^d6WB~w1xjh#E delta 392 zcmaJ+F-yZh6ux(j$ypQ8v2U()fCgzO9Uf=!|h7R=ICVq zia+62XMccBzKaN*e8=~_ci+AHc<A`9)(42}ZQ8!+@>T9g zIH!RdG*XhWJu+-nG#V=FuAhrA9xD?Ip5@9a{sb&gs9Y6<3I=LnBI0qbjJ%le lYOXobgDBQb(&+Y@@9V9z7LpD6unLT>z%pfq4W^3{gC7+MR|)_C diff --git a/q10_data_missing_values/build.py b/q10_data_missing_values/build.py index 582edbb..d84b74d 100644 --- a/q10_data_missing_values/build.py +++ b/q10_data_missing_values/build.py @@ -1,3 +1,4 @@ +# %load q10_data_missing_values/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset from greyatomlib.multivariate_regression_project.q03_data_encoding.build import label_encode @@ -11,3 +12,11 @@ # Write your code below +def describe_df(x_train): + describe = x_train.describe() + value_counts = x_train.apply(pd.value_counts) + return describe, value_counts + +# describe_df(x_train) + + diff --git a/q10_data_missing_values/tests/__pycache__/__init__.cpython-36.pyc b/q10_data_missing_values/tests/__pycache__/__init__.cpython-36.pyc index 2fdd38ba92c3ca5f1d29fa65d48fd61e792f83c8..653358f4d03d717caf34856ad495fab398d1a4f4 100644 GIT binary patch delta 57 zcmZ3@c#x69n3tEULil*}L=JP+JpGLP+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNtv01@mHuK)l5 delta 35 qcmX@exSEl}n3tF9rT(I*i5%wq5&9YVxvBc;MX8mECHc7%Q(^(Ztqa-! diff --git a/q10_data_missing_values/tests/__pycache__/test.cpython-36.pyc b/q10_data_missing_values/tests/__pycache__/test.cpython-36.pyc index 17019265bc29ee0e0ca9f98bf98dfee0d9486c8d..0f864dd899d6851d8608dc0ad6e75272352134f8 100644 GIT binary patch delta 66 zcmdlcbVi87n3tEULil*}Mve?7)hzvt{M=OiqQujv`vV^n3tEU&t*~6Mve?7fe`(S{M=Oi^rFXJA>0BJ8eqXXtSTj1#XH`xTq7AL5tpL=I>Rf_X{luO W#-FyVSZVIZoZUozS1UG28`{5H9bvox delta 418 zcmZ8byH3L}6!mqS)=kr@JcSAqOj+nqF@cymF@OXM6b1rL+eAqnx#m%niXn5S{s9{! zV&Wf|82tzE35WqZ3?O9ro_o%@y63*q7wWWYHRrAK&{g)6vjO+l2%!u`C`S`4A=9si z8BE~}Ppk=%nBg1%WhAn)qLW10vXtSdoI?%(T#mKsMAaMtV(18Y z_Pz&Os@x0vqwp?JrIYwT9J2SWzQ_Yb1(&`I`OtF}x#U6!q77l|qGlhkzNhR|ghMH? zQLHqUii`&Q#2_7 zfWo}~4m6<-%OKXY=7FdfSWt6`FVmRIIK0?Q$EH)I9~6tvUw8?&&3uvbr{fwK#n3tEULil*}Mvf3BwKDyT{M=OiqQuQf4~6mr3oPGef>W6+|pLuRnc>O1x?zgj|RV z2yGx4WN<|oz9CDea;Bt06U_{{$K2wz=V}oxofhCo zoC#qrC$#Ld8P)vR z`frnb&R5#Hd8UnZ-e=Mh$!PREG08|J1*dHd?0Cb|gO&}h8|AFD!D3tBnGH41d1{2B z{#`E{j(5%vc2&H!vFSwE_)eL#IKP12v}c5jXR%bAWsQ`+Md}bd{(LvQ5(OWEnME>F znZ7EM^6Yf@N~oEZNy>+*V0>7A^d8n9$di-9fAa&mUGqLD>3v8DcVO+|9>hLG2dks{ z);)V{Nh#_5A~7--CePj+%SBUBf4e&}H}+Zm!#l1|yK;`V}R-gn=|jC^`i>K~P$zfr2JY5Qd5a zI0X{O9VHzl;tx>s6Sk(|FNB6!I{^wL?liMAvoo{bezRXIUuva?wOaY+(~sfz&!rqs zN(dnb!~&7;Kq)k~6dqY4G9_bsWcSDnjWF1bvcR*a_zWvYxyqa2Dg39ngJT?%6F;_M z`>hqDk<;^Ir;gr`IvTsD2=?9BJMl;E6EwwRPnCM*8CvE{AmBrw0LdI}rw8<})h+xe6kEP=F295hUTAPoOkTK)EvFf=N+^gmb!ez%#bh6>LZq z&$hBbs**!05~^5R%&X4Y{Dt*s;x|*8?Z>or$Fv4P#~TF`5zAGQvUb1SVN?yEYonR+ zh^Ddy#6mC5>%SfeLf6y~Vz$fqPzVrioM$&x+PM_|hEVqT}GdfG?|p6=4Q0Okr5- zBx=%Dg66WrMW$`jJoJ_%wt-D96pOV330*DS+Z6kJ(YUs1A**-=S8Z_@;sF-s{Rg+g`8R8G zL)->OuVqvfDOYK--zbL0((c7-6{*sX=hSY@pV>cOYEs17h3m&0Sd$D$B5_B1M~2KK m*De@LD(wv~17JX4arSbY=866ptoEBg(I90lGXLP*!}u4PJO)|- diff --git a/q11_feature_selection_q02_best_k_features/build.py b/q11_feature_selection_q02_best_k_features/build.py index 95002c5..37651c0 100644 --- a/q11_feature_selection_q02_best_k_features/build.py +++ b/q11_feature_selection_q02_best_k_features/build.py @@ -1,3 +1,4 @@ +# %load q11_feature_selection_q02_best_k_features/build.py # Default imports from sklearn.feature_selection import SelectPercentile from sklearn.feature_selection import f_regression @@ -20,8 +21,18 @@ np.random.seed(9) # Write your code below - - +def percentile_k_features(x_train, y_train, k=50): + selector = SelectPercentile(f_regression,percentile=k) + selector.fit_transform(x_train, y_train) + scores = selector.scores_[selector.get_support()] + features = x_train.columns.values[selector.get_support()] + features_scores_list = list(zip(features,scores)) + df = pd.DataFrame(features_scores_list, columns=['Features','Scores']) + sorted_list = df.sort_values('Scores',ascending=False) + top_k_predictors = list(sorted_list['Features']) + return top_k_predictors + +# percentile_k_features(x_train, y_train, k=50) diff --git a/q11_feature_selection_q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc index 3a1830b270d6d769e5565023aecb9be5259bd743..13e3cf99b52e1ee0aefc61c802fa204ec3824c5b 100644 GIT binary patch delta 57 zcmdnXc$tyIn3tEULil*}L=JP+2K|iu+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNui035Cp_W%F@ delta 35 qcmcc2xR;T`n3tF9rT(I*i5%wqS^63IxvBc;MX8mECHc7%Q}O}F%M2m_ diff --git a/q11_feature_selection_q02_best_k_features/tests/__pycache__/test.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/tests/__pycache__/test.cpython-36.pyc index 7c11282368a691d1031e0ef3e349d85d1d4b9116..276e402fbc3a5d86bb5c80a84bb06c3cda1712f5 100644 GIT binary patch delta 85 zcmZ1@a!7>3n3tEULil*}Mvk>iYBl;9`MIh3MTxnUiP=S&#Tj{tc@}2+;rT_`#RZAU psrt$JDXIFC{W;|~KVf>x%ow%#6q^Ghqw;2MjwVLNsL6et^8nZB9IF5T delta 63 zcmV-F0Kosk6s!~oGYt(2=`W&Mu?VdK5N0oEZ*65SXL4nEVRUb8FO!Z4AG7)b3=Aa&= zews{0Y(N!7tUyAODV*vno C@;CJW delta 150 zcmbQi@tB>{n3tC;%XLvy@J3E0Mt1=Q28I%b8ipFi8m4CETIL$&USyHVrs}5`rB)`EF1f{C2@#lliCLSGY4Sg2DFAMyD$f7_ diff --git a/q12_feature_selection/build.py b/q12_feature_selection/build.py index 1bbe2b2..bf88c03 100644 --- a/q12_feature_selection/build.py +++ b/q12_feature_selection/build.py @@ -1,3 +1,4 @@ +# %load q12_feature_selection/build.py # import matplotlib.pyplot as plt from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -16,3 +17,12 @@ x_train,x_test = label_encode(x_train,x_test) # Write your code below + +def feature_selection(x_train, y_train, k=50): + plot_corr(x_train) + reduced_features = percentile_k_features(x_train,y_train,k) + return reduced_features + +# feature_selection(x_train, y_train, k=50) + + diff --git a/q12_feature_selection/tests/__pycache__/__init__.cpython-36.pyc b/q12_feature_selection/tests/__pycache__/__init__.cpython-36.pyc index 199811ee773001ca0c605ea752dff30b16fe2a41..5eef781505398c7b938c1e666d3c2b341df4d70c 100644 GIT binary patch delta 57 zcmZ3n3tF9rT(I*i5%wqVfq>QxvBc;MX8mECHc7%Q=$RD{|nLp diff --git a/q12_feature_selection/tests/__pycache__/test.cpython-36.pyc b/q12_feature_selection/tests/__pycache__/test.cpython-36.pyc index 3a7de81e6c075362fc5574bc7cd7fa1084aa1fb6..35d77b47824ad046c8146e90c7b7661e2dfa5ce5 100644 GIT binary patch delta 122 zcmeAcT`0<7%*)GFA$&Y~BgbkcwG91?{M=OiqQu^iMp!DWW4hbdzmjWR2 diff --git a/q13_plot_residuals/__pycache__/__init__.cpython-36.pyc b/q13_plot_residuals/__pycache__/__init__.cpython-36.pyc index 339472dc72a16004e01d1fdcf966768b0a1ec9f4..4e489764e6f22ebb7cd656fbc72185e2e2531cd7 100644 GIT binary patch delta 57 zcmZ3$xQ&s+n3tEULil*}L=JP+Wc`f%+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNsU01H_Yg8%>k delta 35 qcmdnSxPXzvn3tF9rT(I*i5%wqzWN#YxvBc;MX8mECHc7%Q-T1!@C&X0 diff --git a/q13_plot_residuals/__pycache__/build.cpython-36.pyc b/q13_plot_residuals/__pycache__/build.cpython-36.pyc index b3cfbafacaf9b3c23302f194e7c40a3e8bb72751..88511eea10c5509a9aab3f0c0c6160685c30ecd3 100644 GIT binary patch literal 1373 zcmb7D&2Aev5MFYBB}=m7D2eN)MXowjYHT3Mp=bgGX>UQ`915@ow)Aphugv`kNjZ@# zos?tqAi4C?OP`^Sz+2H%UZJNBDYZ>{DZC2~XZZ6C`OU|}e!u%u{M+}xL_zRJ@WF?1 z@Ccj!6^#f4kwHZmA->Vt65-vB&E`hE z?_l!Fq02haW+tFEUsT+T3w?3=3Aihk;Dj(#YJ;}5+^(2W<1aN{Mbz;TYeL{BgKN1#hF zbEjl?ytJ!LGJulq=!HLpgQ zjVokO+T?X^KpUIPeUHmLk1VV-py9x%I$+!25+PsfgXnjG+QE!}{xCUfDwrr<&H1@1 z^;ym92lpo5HR@cqynu--)1;b7Q(kaYasz*JzAjiZg~Ci;-aX7+jsC@-oXkoo#_ik= zKAyPks2-pR$dF{DN4ox3yEroX%sxah%(-bQS)PplC++yITLs#6G?n%;6fwOS`O3H%Lxj_Q}QeEtR<77KMRodU+eK6!u<%7`eAT@WKQPzaitH=A)=a|Jt`PcjG(FVH`p-y4 QdlY?|(H%OVUD}KO0#MVTdjJ3c literal 556 zcmY*VJx@Y06m8#kh=?r4(e*997~*D(i6JHq4C?e2Qs@;*`gqv(p%|QSHU0-T|58^c z{(_UY@Di~%_uP~F)zfyG&BjOfGe4t*e3PByA-_b|hX|Z-D#?WA9{0HaMslCiJCX)# ztdZW(cL7g;?)VkDzDHP+B|RdqzQI`@bN`)Eg51Nrzw$QR=fP^54R~0ykViF(mR`-` z6``mDZ%umZ7Vcgr2r0GkgBWS?0x!*5(1KS?9?xWH^6*+Q4tdm7s#H4llzWkK^3ufm zGihvula&G+>mf4+lnsqA5^VG=*#M-C7TXwWHV5prfgYDnX@G^k0c~=OGX>lRQ&vFU z0(Vni)hhHCQBLR2O*SqI$VLhl%#=k|RMLn!Q-T@5Zp>>f$|Yk0qrE0LD~ diff --git a/q13_plot_residuals/build.py b/q13_plot_residuals/build.py index 9cdb3e3..e25947e 100644 --- a/q13_plot_residuals/build.py +++ b/q13_plot_residuals/build.py @@ -1,5 +1,39 @@ +# %load q13_plot_residuals/build.py +from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data +from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset +from greyatomlib.multivariate_regression_project.q03_data_encoding.build import label_encode +from greyatomlib.multivariate_regression_project.q07_regression_pred.build import regression_predictor +from sklearn.linear_model import Ridge +import numpy as np +import pandas as pd -import matplotlib.pyplot as plt +from matplotlib import pyplot as plt + +from greyatomlib.multivariate_regression_project.q06_cross_validation.build import cross_validation_regressor +np.random.seed(9) + +df = load_data('data/student-mat.csv') + +x_train, x_test, y_train, y_test = split_dataset(df) + +x_train,x_test = label_encode(x_train,x_test) + +l2=Ridge(alpha=0.01) + +l2.fit(x_train,y_train) # Write your code below + +def plot_residuals(model, x_test, y_test): + y_pred, mse, mae, r2 = regression_predictor(model, x_test, y_test) + error_residuals=y_test-y_pred + plt.scatter(y_test,error_residuals) + plt.title('Residual Plot') + plt.xlabel('SalePrice') + plt.ylabel('Errors') + plt.show() + +# plot_residuals(l2, x_test, y_test) + + diff --git a/q13_plot_residuals/tests/__pycache__/__init__.cpython-36.pyc b/q13_plot_residuals/tests/__pycache__/__init__.cpython-36.pyc index 3aa40f003ac9ed7ca53d9580f2b40524a62da90c..de5efcf9b1617e546afc620b54528c029ec48e8f 100644 GIT binary patch delta 57 zcmZ3+xQCI$n3tEULil*}L=JP+O#O`f+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNr(01odHn*aa+ delta 35 qcmdnPxQvm*n3tF9rT(I*i5%wq!TK5bxvBc;MX8mECHc7%Qz8Jr`U}PY diff --git a/q13_plot_residuals/tests/__pycache__/test.cpython-36.pyc b/q13_plot_residuals/tests/__pycache__/test.cpython-36.pyc index 89ecb4e3b62bb3c40148c8459b358afd6936e702..b3b620aad28e9257d2f2026bac28decf2bb0a9d1 100644 GIT binary patch delta 71 zcmX@ieUqERn3tEULil*}Mvf^=YN`4e`MIh3MTxnUiP=S&#Tj{tc@}2+;rT_`#RZAU bsrt$JDXIFCH!{m_KFuV?#27XC5z9jWUpyHQ delta 44 zcmcb~eVCiWn3tF9rT(I*jT}>$`2F=W@^e%5(~D9o6HD@QHy>m&V`98D`3K8G08CX7 AI{*Lx diff --git a/q14_benchmarking/__pycache__/__init__.cpython-36.pyc b/q14_benchmarking/__pycache__/__init__.cpython-36.pyc index 453edefacf2fed8cd72ca5b14c268f798bc1dbac..49d647a2559b38cdb494c0c778bfe7daffb34e85 100644 GIT binary patch delta 57 zcmbQoxP_6!n3tEULil*}L=JP+ME#8X+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNrp0177)djJ3c delta 35 qcmdnOIFFITn3tF9rT(I*i5%wq-ufB&xvBc;MX8mECHc7%Qvv|JLJOt< diff --git a/q14_benchmarking/__pycache__/build.cpython-36.pyc b/q14_benchmarking/__pycache__/build.cpython-36.pyc index 28c02f81e980cbbac2a50fb3e6c6400240d89583..0ec668f50ce3582bd87a5c9711c214871d02952d 100644 GIT binary patch delta 565 zcmZXRL2DC16vt;~C+Q}eP2;x423iGM#r5FQD5YRg!HeM0Lm?HzusdnfY_jXj6b#Jb zq341!SHFOVp8N)S5&Q;gZ}k&+@ZiZep|k-9-jDzPy*Kk_m_My=t@Ve#U;p~z$KHJx zp>s61DClPp^6caKPt(S~o6F!9AfDUoC(|a62MIlKin>O+-a&`XF)BQbFLgs9?dgUl z+DULiPAadR!Y`V|qQd{>Tg9~^Q1q~(t9nt_bg)m4aj~SAUZJpJPDv-kB_4%UQHSBe zv#0?|8fW>mBzaO+<7^T$6)u}!*4c*;g%C=VuVvb`1UW@03B7V{|15+0ei^p@$+dmA@lj|>2a ztl$;W#0}h-selMu3-6Rq&4Y?u@hK QDCJKGIJse7x_2@C2Mq+7CjbBd delta 612 zcmZ9Jzi-qq6vyrSXw&w_T&8(3%GnbnOmY5TDu^`-$HO1MYSbT%} zmOM8)_iUoJM>cufnRuDm2tw^ zZ9v0d1pje`cgxL!+8z)-q2Na$<6g5=-51wyug~JZvW)Xd|l~p z+RT`x<&9wyrx9@Qi<%!1y`z5n*UQ0v62o9b;gIko9>kM~hwljuiTq}*$lqpfeN}Nx z-wHC@YSat|JGNf6FzqO}-^-uLYx~jF#M&~kD=+7FUTK^zX<62?qD8YgCb^x`aLjX? g?UNLWU6iD)A!k>e`6Pm;SVgQSSDj7UbnZ6rAM{MG&;S4c diff --git a/q14_benchmarking/build.py b/q14_benchmarking/build.py index 4a4557b..62e1fcf 100644 --- a/q14_benchmarking/build.py +++ b/q14_benchmarking/build.py @@ -1,3 +1,4 @@ +# %load q14_benchmarking/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -26,5 +27,22 @@ # Write your code below +def create_stats(x_train, x_test, y_train, y_test): + + l1,y_pred_l1,lasso_stats = lasso(x_train, x_test, y_train, y_test, alpha=0.1) + l2,y_pred_l2,ridge_stats = ridge(x_train, x_test, y_train, y_test, alpha=0.1) + + features= feature_selection(x_train, y_train, k=50) + x_trainft=x_train[features].copy() + x_testft=x_test[features].copy() + + l1ft,y_pred_l1ft,lasso_statsft = lasso(x_trainft, x_testft, y_train, y_test, alpha=0.1) + l2ft,y_pred_l2ft,ridge_statsft = ridge(x_trainft, x_testft, y_train, y_test, alpha=0.1) + + complete_stats = pd.concat([lasso_stats,lasso_statsft,ridge_stats,ridge_statsft]) + + return complete_stats + +# create_stats(x_train, x_test, y_train, y_test) diff --git a/q14_benchmarking/tests/__pycache__/__init__.cpython-36.pyc b/q14_benchmarking/tests/__pycache__/__init__.cpython-36.pyc index defa63dc0453c646fc0d879d36fc778a5d140e09..51a88705729b8e9e356dd34771f9af47ab731325 100644 GIT binary patch delta 57 zcmZ3&xQmg)n3tEULil*}L=JP+bp4F{+*JLd#N5in?4r!#jJ(7=3p4%j{G#mQg2d!h M{p9?V)QNs!01dqplK=n! delta 35 qcmdnRxP+0zn3tF9rT(I*i5%wqf%+NwxvBc;MX8mECHc7%Q^EkhObfmM diff --git a/q14_benchmarking/tests/__pycache__/test.cpython-36.pyc b/q14_benchmarking/tests/__pycache__/test.cpython-36.pyc index cc77345a80d2a31276437a4b20a95a08f4c2fe16..340c264e181bb7cb55669dfcda1c820b7b512657 100644 GIT binary patch delta 116 zcmZ1@a7ci|n3tEULil*}MviMts>%8p`MIh3MTxnUiP=S&#Tj{tc@}2+;rT_`#RZAU zsrt$JDXE*^GS#veN3rIW<`z`mV#+IsVk=0@OGzxg#Z-_IC77F7Qjn8hl9QRFS5OIJ M0i_}IkuttExn3tDpxBsH3jU3mQ1bp=~@^e%5(~D9o6HD@Q^(Pmy%5PR?j%8uIHMx;p fOy-tgZemG6PJT&FW|Ce(C5Uy44N6bm%-##K5=>)~+NtA70Fmmea8{zdP7A>b#l z^dBHN;#i^zQ;Z!Zl2ic=JPu@7MKtm_lyQ~N#N$Y&RYo(9W7(s9@QdYu4n==4THNBv z2Dk*~=?2pS5r~5gJ`3q>dPwikyCM>|#o>mW5oh5U@4ZCy10Mf`#{Jij4;o{e$%gTq zGs8d`>Q zn3)v%s&Hj+Umq5f2nDe8ZyDBkO1# zn{W|z5$q%$#eh=hv531QCmr@E&5238AL)WkxXw({C0*KWwH|n;UDoyHga-dsujCXr9Q7&{neM#pBr_dTULmv zEBCZoN>g4jRk|80F;_zCvZ?b{H7?rp^7wJCg#?(-gf@8vPI5Y1mXc4})tlalEVU_` zsy+S0-N#)nMlU{f7Ab&od-6m!1(W)8vOlg|J;s=Z?7GzB%tngUb72E1YUP@&T#YPg zxy_zJx4(yb2peB9xfEK(ZZ9sHx?pD9R|BuY)geQhthObvF#s^o5gZcpMy>L)=Hi-W zyBg(&rduCCkuRGKy~nM0>HAlA3>0tg;|*#E0ms7&jv>$f0Vj8cvIO>3&Abn&$r#Y2Yc#6Cq8n*HOqJVJ>eUkp1>q5r8sqM(9UZ>-u@|0 L0jI$M9)jgnJ|4{g1dl-k3@`#24nSPY0whuxf*CX!{Z=v*frJsnuN?i1{M=OiqQu?^^5T^nX}@3ICvm~JCgSDS*1%zU0Q)9LH;K5p*naRD4c(+|N2hZ62kmlN*3b*RTZ z?!(vT0k6O};8h4NEVnSK_}y^&1m@#|gdwyeX!;2l;}|j{zmqr4$Ti*@!pWX9g9U(m z#UHpk&di=OEaCSQ(p~ysrVpN9fH+3*2y`k^2t-GZ_-E0J z=Vt|zr6)z!c1vFiIVgQp`A@Ju43tgovK6+GnRexb@!KCo$4{`i!LhM zO$%v~bEXoMRf!WNv`+FY9;Hhy{*jbKUs);gGpjkEV0{|64Pved}PK=MruIT3WroE+Fc=VB(j72oaRrFX1 zQ>ZLDXR;8FqeMsee*g-IXp$G8t%&ABlI$c}JdbocC^zPkzSJ)>NUf|d%D|>r>5e(A zJp-1Xkfro-tu|5XuuH4*+}r}UT(^C<(#3WQrFwC%L!d`Dqj@@~u@w~Ze8E&j zrXOy~bX|Paf(J8>{&*vvgD;_UWc^{v)amtxuy)fRD^e&RZZ@WsG0Qm9Y6tquiUKE3 zv8)MRx_m&Z7qL++$!G-toFJ`Et~vnVkz%6SgI-Apn;-UehTqOJ>N~79`Xew+Vqdqp Qcta8b3cU@oM%KLl09*Jp6#xJL literal 0 HcmV?d00001