From 0fb464153a11ea93c788abbb374ccbcd9a7e8cab Mon Sep 17 00:00:00 2001 From: sagarpatil232 Date: Mon, 26 Nov 2018 17:04:24 +0000 Subject: [PATCH 1/3] Done --- __pycache__/__init__.cpython-36.pyc | Bin 141 -> 161 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 155 -> 175 bytes .../__pycache__/build.cpython-36.pyc | Bin 414 -> 368 bytes q01_load_data/build.py | 10 +++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 161 -> 181 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1525 -> 1545 bytes 6 files changed, 9 insertions(+), 1 deletion(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index b0c3719c2f46201b3baa3fcef746c16a601c9e9f..51294e0e4e4741df5656dbfcb0701016f40251e0 100644 GIT binary patch delta 55 zcmeBWT*$~_%*)H=p!O$vB8R!MpMFMuZmNE9VtQgxL1IZ}j*+pEet3RSc5y*sa;koE KeoE>@KYIYt-4YrA delta 35 qcmZ3;*vrUa%*)I5Qh!m@L=JO)EB%c8+*JMaqSVU7lKk9>N%jD@F$-P* diff --git a/q01_load_data/__pycache__/__init__.cpython-36.pyc b/q01_load_data/__pycache__/__init__.cpython-36.pyc index 4596200714efc1a2bd21ca0d0f36671155da8439..fa84581e8c27cb86e450c1d3bc9f8bf65142923f 100644 GIT binary patch delta 55 zcmbQuxSo;2n3tE!LG4fUL=JQ182ya=+*JMI#Pr0Xg2a-{93x{R{qX#v?BasNeTggzw3Do;5Qa>X2SqXbJp8DBR{7;yB7`{S@cWD)YFG*cl%0HqCDalX zCb-kdT49QV4*Kp?l-bn=j!KBilU)OEt_O@##^m1VyEt}wfvuVOpab2MP$lSETP9Ij ztcH#>&Vs&eD5fV~8{1Gda^xw@9v4W@y^PgiUgfBRW#z39-I w)%V$TZ@{Mv0lTmVuHdXxF}3`H_AcXc+uI8K!jy1+*JMI#Pr0Xg2a-{93x{R{qX#v?BasN7gCqJqSd%p4=#N<@{ MO-x^z0VQD*@&Et; delta 38 tcmeC=`O3{<%*)FqWWFeBBgacdelPuu{M=Oi^rF Date: Mon, 26 Nov 2018 17:18:47 +0000 Subject: [PATCH 2/3] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 156 -> 176 bytes .../__pycache__/build.cpython-36.pyc | Bin 660 -> 654 bytes q02_data_split/build.py | 14 +++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 162 -> 182 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3134 -> 3154 bytes 5 files changed, 13 insertions(+), 1 deletion(-) diff --git a/q02_data_split/__pycache__/__init__.cpython-36.pyc b/q02_data_split/__pycache__/__init__.cpython-36.pyc index 5d17273741a726a430cdf3ccf2eb63426483d618..2f5206b0a1cd14806858edf36ea3fb141a43cbb2 100644 GIT binary patch delta 55 zcmbQkxPg(wn3tE!LG4fUL=JQ1SpAIr+*JMI#Pr0Xg2a-{93x{R{qX#v?BasNMa-;7-|@@7*ZHhn3|bt8Eb$nNrqac62=&8s-|78rB-NG?rinO*X$MCU@hPj6gHeXUznGllCvQfILm6 zD9)19;*$8{%&OEVo}$FOl>FTI;*!LYRG<_~N>P465i>~LWDiCI4PGGYSCoE6er~FM zabkL6Q9)u!W{#1uk$!l7QFd`bVsff}a(+tcU|g(7-|@@7*c?+l?h0)wlbwLNix(jB8jqrMVLw$ zYZz;oQkYVhQ&@UgVpwXKYguYpYuRd;YglSnYuM6Qf*CZ~{a!Kx%}k#)69i7$ztjTq zG?{L3mZTP!#205)rQYHxO3X{i&y6oGNfaqbefb{@{=cPFq(-700n-z z>1X8Urs}5`rB)`Eo>$pT@ diff --git a/q02_data_split/build.py b/q02_data_split/build.py index c2e7147..c0f75f9 100644 --- a/q02_data_split/build.py +++ b/q02_data_split/build.py @@ -1,8 +1,20 @@ +# %load q02_data_split/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from sklearn.model_selection import train_test_split import pandas as pd df = load_data('data/student-mat.csv') # Write your code below +def split_dataset(df): + X = df.drop('G3',1) + y = df['G3'] + x_train, x_test, y_train, y_test = train_test_split(X,y,test_size=0.20, random_state=42) + return x_train, x_test, y_train, y_test - + + + + + + + diff --git a/q02_data_split/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_split/tests/__pycache__/__init__.cpython-36.pyc index e780e63f202604d8b01427afe772dd73a1ea13a3..b4c872200046894a548f70024f542015f65eb73e 100644 GIT binary patch delta 55 zcmZ3)xQ&s+n3tE!LG4fUL=JQ1Wc`f%+*JMI#Pr0Xg2a-{93x{R{qX#v?BasN=JGO delta 35 qcmdnSxQLO%n3tF9rT(I*i5%wq{`wjDxvBc;MX8mECHc7%lR^N#R12~I diff --git a/q02_data_split/tests/__pycache__/test.cpython-36.pyc b/q02_data_split/tests/__pycache__/test.cpython-36.pyc index a1b3fc579e35798e380953fe62d7efac2225573f..95dd866976c48c2070884f75b967ec1360b94fc0 100644 GIT binary patch delta 58 zcmdldaY=&1n3tE!LG4fUMh;~r<#_#!{M=Oi;>7gCqJqSd%p4=#N<@{ N%~nh-TmT;w5~u(G delta 38 tcmca4u}^}-n3tF9i20(ZjU38M{NDN*`MIh3=|!oPi6!~DoBfzrxB%um3(o)m From f19ea9d6911c78511d0815fc7beed4f623f97fa5 Mon Sep 17 00:00:00 2001 From: sagarpatil232 Date: Mon, 26 Nov 2018 17:36:03 +0000 Subject: [PATCH 3/3] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 159 -> 179 bytes .../__pycache__/build.cpython-36.pyc | Bin 924 -> 939 bytes q03_data_encoding/build.py | 18 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 165 -> 185 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2197 -> 2217 bytes 5 files changed, 17 insertions(+), 1 deletion(-) diff --git a/q03_data_encoding/__pycache__/__init__.cpython-36.pyc b/q03_data_encoding/__pycache__/__init__.cpython-36.pyc index 884722b9e5eb21d01be2d88d202ca11e74eb4609..aad7023cedfb85cc4d15a2ad325f55fbbaf0689c 100644 GIT binary patch delta 55 zcmbQwxS5f|n3tE!LG4fUL=JQ11pSQs+*JMI#Pr0Xg2a-{93x{R{qX#v?BasNTjn3tF9rT(I*i5%wqKKdE?xvBc;MX8mECHc7%lL7&~PYb31 diff --git a/q03_data_encoding/__pycache__/build.cpython-36.pyc b/q03_data_encoding/__pycache__/build.cpython-36.pyc index 302366cb1c8d346c67f347e326ce7abc487c2dcb..23a801e133ddd515c1f495482898327857e5a1c3 100644 GIT binary patch delta 517 zcmYjNO-sW-5Z&FRn^;?|(u1D#XfFm@@FXJW*@Gf25eZAO)zo~syOkCaddM%3Ui||i z_&+>(-(Mo)!AVO|mU;8$4YT`pUaU8(-fK4NUxz<8*T!@GW44A6G9k_&WCW0-5h_tZ za=gff!cdutjEoYE%%TR&EU2m}n$r>k)=IpCN?cfzgWNhtxBG>inMrVna|XM zX){zjennyf?0w%l_i4->$?llQmfFN4X fU6}d@o7IGU9H+rJ;wJQo+V(lUMlj31J1 delta 502 zcmY+9J4*vW5XX1tUNIz^fcU6PC7cja*jNM$6~V^FLJ5c***$aNUhZBbkqaq;Aa;^g z8#@vF9)5*wt^5jB&IS`A!~B{3?L6O|XQ#MZE*I;2udOe5Dt?YkLWqTah%O&cGBPGZ z==U?qXimDoV3UmDh+MLvkr`bRnZ+PCe9fuc$f0XbnZbv1pQB52ocy|AZoQu`x<;_Ba8PThjgM=48q z@ikYL?06|x5U0uxq~KoIGJ`N_x5|EyT^(nbCH+K1YH1$2rgAQ>@EOF)#(>LALC6&i z-iTPi-ajXeP7?9PwcrCUOQOc)1-2#!;I0?(SC&u+*sunxberx_QJp-(M_*aEY&sAH z{8e`9#mtimQl^0U%IVJrVxR{)gBid8fv95Hbozo+bgM!$N?0%C`}%yjj8dZ73fiCo Ezx2k4ivR!s diff --git a/q03_data_encoding/build.py b/q03_data_encoding/build.py index bb4c8ca..2abf4bc 100644 --- a/q03_data_encoding/build.py +++ b/q03_data_encoding/build.py @@ -1,3 +1,4 @@ +# %load q03_data_encoding/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset from sklearn.preprocessing import LabelEncoder @@ -8,7 +9,22 @@ x_train, x_test, y_train, y_test = split_dataset(df) # Write your code below +def label_encode(X, X_test): + X_transform = X.copy() + X_test_transform = X_test.copy() + le = LabelEncoder() + numeric_cols = x_train._get_numeric_data().columns + all_cols = x_train.columns + cat_cols = list(set(all_cols) - set(numeric_cols)) + for item in cat_cols: + le.fit_transform(X_transform[item]) + le.fit_transform(X_test_transform[item]) + return X_transform, X_test_transform - + + + + + diff --git a/q03_data_encoding/tests/__pycache__/__init__.cpython-36.pyc b/q03_data_encoding/tests/__pycache__/__init__.cpython-36.pyc index 7d18c185f615d8dacd541c2aac10e2127c6a6058..c78155a3e48b9c093dfecc68776a30b8d8ed9753 100644 GIT binary patch delta 55 zcmZ3=xRa5?n3tE!LG4fUL=JQ1H2sYH+*JMI#Pr0Xg2a-{93x{R{qX#v?BasN7gCqJqSd%p4=#N<@{ T