From 72c955751b96fd3ab7f2f0e267ef543adb4e4201 Mon Sep 17 00:00:00 2001 From: SL345 Date: Sun, 1 Jul 2018 04:32:19 +0000 Subject: [PATCH 01/16] Done --- __pycache__/__init__.cpython-36.pyc | Bin 141 -> 153 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 155 -> 167 bytes .../__pycache__/build.cpython-36.pyc | Bin 414 -> 331 bytes q01_load_data/build.py | 7 ++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 161 -> 173 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1525 -> 1537 bytes 6 files changed, 6 insertions(+), 1 deletion(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index b0c3719c2f46201b3baa3fcef746c16a601c9e9f..d71579303f602449092171d97ddac5732659d59f 100644 GIT binary patch delta 47 zcmeBWoXN;x%*)H=5NQ!Tk;7ctO+O<)H&s8_$JoSFKRmxEySN}RIaNP7KP7ddpFIF3 C3k~f6 delta 35 qcmbQq*vrUa%*)I5Qh!m@L=JO)EB%c8+*JMaqSVU7lKk9>QT70~2@6gD diff --git a/q01_load_data/__pycache__/__init__.cpython-36.pyc b/q01_load_data/__pycache__/__init__.cpython-36.pyc index 4596200714efc1a2bd21ca0d0f36671155da8439..c48523c46c3cf95307918baf7a6a8a0fc7bef4cd 100644 GIT binary patch delta 47 zcmbQuxSWy0n3tE!A<`mxB8Rzjh<-+XZmNE;kFklVet3RSc5y*sa;koEeoE>@KVJYW C#SSF^ delta 35 qcmZ3^IGd5fn3tF9rT(I*i5%wq9{L&ixvBc;MX8mECHc7%qkI9n%L|48 diff --git a/q01_load_data/__pycache__/build.cpython-36.pyc b/q01_load_data/__pycache__/build.cpython-36.pyc index 98e98a79cdf9a026efe48fdde2a84d1da49836cc..8728b494e50d81fce249a09217e9039649d8fd57 100644 GIT binary patch delta 200 zcmbQoe42^Vn3tE!J<=k2>O@ZeBq0U{h7yJ>#u|nc#uTPrrdq}t#$X0bX1`yI)|!mB zn2S>jG?{KO6{JLQ6s0Dn#3vV*0r@Nii6t4gm{QVKG8C}`P52e4pOK%NsvqoQY+|Y( zo?nz*T#%TYs-K*nk~*22(aE0`sHm6)NH8$+F&1$GX-(!^Yz2vVDT&2JAaSr5*eoQ1 Y11NEe!zMRBr8FnijtR&s1`!<00CgxYApigX delta 283 zcmYk1F-`+95Jf$<+3Y4+O3r|*6d)Q91rjX?LAA}wFau$=&RVvSKnmgnTjT;1NEBRw zD{uq1RJlSbys2oOX8vgYpZVeMqBtna@#oP;^}8xA-}V_}fi3QK4>3Y56h z^G0BXqaFtJnyLI^1IG%Y@MPDJHrJyB#iP7;`YukLUSMZxA9SD_1(ihCStTR4SdATN ztb@L7DP~?9+fp@ghvX^Lj|-&d!N%$^uL{&bCqqMD%uQ0j=6p8q49y-Kz39-H)%V$z tOuEk!80^9xxH45r#LT7>w0C)Gx7ya=AEs##^ApqIQ%k4A51uFF;t#>wOH}{> diff --git a/q01_load_data/build.py b/q01_load_data/build.py index 7cd3700..05616f4 100644 --- a/q01_load_data/build.py +++ b/q01_load_data/build.py @@ -1,4 +1,9 @@ +# %load q01_load_data/build.py import pandas as pd # Write your code below - +def load_data(path): + df = pd.read_csv(path, sep=';') + return df + + diff --git a/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc b/q01_load_data/tests/__pycache__/__init__.cpython-36.pyc index d07fd2f92eb40b45050574e400ae0ba39249b5e5..dce1a54346ff785e78ee2e62914bfed7c5c4ecbd 100644 GIT binary patch delta 47 zcmZ3;xR#N_n3tE!Bhn&zB8Rzjlzv8jZmNE;kFklVet3RSc5y*sa;koEeoE>@zhD3` C*A7Jh delta 35 qcmZ3>xR8;e$!beMider~FMu#d5cseX8VQFd`bVsff}a(+tcCZ?~< E0Bc$g%K!iX delta 38 tcmZqV`O3{<%*)FqWWFeBBgacdelPuu{M=Oi^rF Date: Tue, 3 Jul 2018 07:10:23 +0000 Subject: [PATCH 02/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 156 -> 168 bytes .../__pycache__/build.cpython-36.pyc | Bin 660 -> 663 bytes q02_data_split/build.py | 10 +++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 162 -> 174 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3134 -> 3146 bytes 5 files changed, 9 insertions(+), 1 deletion(-) diff --git a/q02_data_split/__pycache__/__init__.cpython-36.pyc b/q02_data_split/__pycache__/__init__.cpython-36.pyc index 5d17273741a726a430cdf3ccf2eb63426483d618..0bdf1bcfdcd4c58cbc5bdf8324cdcc2baeb9a038 100644 GIT binary patch delta 47 zcmbQkxPp@KR*C1 CKn^JY delta 35 qcmZ3%IERtLn3tF9rT(I*i5%wqp86U2xvBc;MX8mECHc7%qx=B7A`6ND diff --git a/q02_data_split/__pycache__/build.cpython-36.pyc b/q02_data_split/__pycache__/build.cpython-36.pyc index e6bd2ebf2f76eee17541ce631c667ecb332558ff..1960bc3dd5d57544a345432495583d33dc77f81c 100644 GIT binary patch delta 313 zcmbQjI-Ql%n3tC;T+urE>_pC)@*E5d46H!x48+BLK%#~riy;LFTbY0)%fy4i^{i=3 zk_@#>C5$zUHB2c?Da^ghF)X#rwJf!)wQM!aH7qr(HEd}twd^(Q!3>&gelHn;#-z`h z2?8hWH5sEgOHzwV;)^q@QeXZDf+CQ8noLnFnK}8%Ma&=$$1SFmv|Ef3w-_s<*dyXg ziV`#PqS$~8pvK85jDniCSW*&85?3-5@c@tFt7o!GY}X10ErrgEQS;yY-IwHtP>9k*R!QD zNix(jl`z&Y)-a_or7)+k^s>aT)H2ty)UwvH)iBqv)UejDrLhDvXtMjgWCR+LK5Hfj zoV0(b1>|Wm-Qp}sEiQ>K&a6tk#Z#1+my(|wUtE${lKS#L5EOBM6-BXR=Hw?AF@rel zx0q7WZZSsOVyxu3#av;Y7A diff --git a/q02_data_split/build.py b/q02_data_split/build.py index c2e7147..c3ea615 100644 --- a/q02_data_split/build.py +++ b/q02_data_split/build.py @@ -1,8 +1,16 @@ +# %load q02_data_split/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from sklearn.model_selection import train_test_split import pandas as pd df = load_data('data/student-mat.csv') # Write your code below +def split_dataset(df): + X = df.iloc[:,:-1] + y = df.iloc[:,-1] + X_train,X_test,y_train,y_test = train_test_split(X,y,test_size=0.2) + data = (X_train,X_test,y_train,y_test) + return data - + + diff --git a/q02_data_split/tests/__pycache__/__init__.cpython-36.pyc b/q02_data_split/tests/__pycache__/__init__.cpython-36.pyc index e780e63f202604d8b01427afe772dd73a1ea13a3..9003b7a15da417c72d483d419551bc8d93488b84 100644 GIT binary patch delta 47 zcmZ3)xQ>y-n3tE!A<`mxB8Rzjw0=f@ZmNE;kFklVet3RSc5y*sa;koEeoE>@zYqX0 CA`U?S delta 35 qcmZ3-xQLO%n3tF9rT(I*i5%wq{`wjDxvBc;MX8mECHc7%qe1|^EDNFl diff --git a/q02_data_split/tests/__pycache__/test.cpython-36.pyc b/q02_data_split/tests/__pycache__/test.cpython-36.pyc index a1b3fc579e35798e380953fe62d7efac2225573f..7d0c7acd02294641e92f9822e66ecb879007e1ad 100644 GIT binary patch delta 50 zcmdldaY};2n3tE!A<`mxBZo4Rbhv&-er~FMu#d5cseX8VQFd`bVsff}a(+tcW-BHZ FE&yc64toFq delta 43 zcmX>lu}^}-n3tF9i20(ZjU38M0^a%=`MIh3=|!oPi6!~D`jhu@%WqC&dcp|+D%lQc From 143133a1aa2b758a57aafeed90f428b79161de2c Mon Sep 17 00:00:00 2001 From: SL345 Date: Tue, 3 Jul 2018 07:58:58 +0000 Subject: [PATCH 03/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 159 -> 171 bytes .../__pycache__/build.cpython-36.pyc | Bin 924 -> 781 bytes q03_data_encoding/build.py | 9 ++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 165 -> 177 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2197 -> 2209 bytes 5 files changed, 8 insertions(+), 1 deletion(-) diff --git a/q03_data_encoding/__pycache__/__init__.cpython-36.pyc b/q03_data_encoding/__pycache__/__init__.cpython-36.pyc index 884722b9e5eb21d01be2d88d202ca11e74eb4609..60754790d9c3baf0d591f71d6a2d4b99afd2ba39 100644 GIT binary patch delta 47 zcmbQwxSEl}n3tE!A<`mxB8RzjgnmYTZmNE;kFklVet3RSc5y*sa;koEeoE>@zd!&k Cu?{r= delta 35 qcmZ3@IG>Tjn3tF9rT(I*i5%wqKKdE?xvBc;MX8mECHc7%qXGfECkvJU diff --git a/q03_data_encoding/__pycache__/build.cpython-36.pyc b/q03_data_encoding/__pycache__/build.cpython-36.pyc index 302366cb1c8d346c67f347e326ce7abc487c2dcb..0601354adbfaa616b3573d0a9f6a850a5ccc1e3a 100644 GIT binary patch delta 357 zcmYjNyGq1B6rGv8b+ZKg09yk>id7rMLR+y}L>Y@^*qPw2n`D^Dih(R!Y;7TFEo^OU z{RbQS`4lVf6lyr!!#!NieZ2%vel&{Xt&jcV+t=slbL}C72*f#r-UDjU9MyP(=469c zq{Thuw4`-%vT|E@j8c4=I@DuQE*j;6k;eI~p45t!IeN|#*k7PU$T-jZHVNC@LbvRl@DZs=66|0U|AK}lAYco+uejG VMa7p3accjjhd={t5n7PM`2p8BU+Dk< delta 501 zcmY+9J4*vW5XX1to{>Zo5FeGPgcBr%jYY6gL>n6mB_MKS_mT_ua`z$^xsW0VHWrfB z%Ff2dZ{bJS*2>D>%2`oShWRu5+j-vF_fBQ2R-4=0e(1d3RbD10A;d!8MVB`yIhm3% z6h%%MEy(~Ftdc40kux?na${g3vlx^{pgEN*B@FB@W-#OWm;Wbif>};UvGRWwo%}^@ zab7Qj)`Ypc|7T+jLT-;=glNdHj`n@Mc8d#`q5D1wE0a0#ns=m9C@zLM=4AA zNslW__Wg`2NHS%IQgA=&m|>K5JGCIp&-Zi8l0hnBRrw7)Q#q&S_zV+eW58vuAmWOK zk3=kB?~lV)KaF{-C-}(E)3`M|fVJ5(^_J)GS5{F7*suhPbe(Qc(U`r{r$Sk{Y&H@u z{wh236Xr_=8B@Rl@zi Date: Tue, 14 Aug 2018 13:07:19 +0000 Subject: [PATCH 04/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 157 -> 169 bytes .../__pycache__/build.cpython-36.pyc | Bin 1006 -> 1175 bytes q03_ohe_encoder/build.py | 28 +++++++++++------- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 163 -> 175 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1478 -> 1490 bytes 5 files changed, 18 insertions(+), 10 deletions(-) diff --git a/q03_ohe_encoder/__pycache__/__init__.cpython-36.pyc b/q03_ohe_encoder/__pycache__/__init__.cpython-36.pyc index e4ec35b27b6016dd979d13f661e08f8147e0e802..4d2ad26522f9b87b903cac156f42ebde2de00687 100644 GIT binary patch delta 47 zcmbQsxRQ~>n3tE!A<`mxB8Rzjn0`inZmNE;kFklVet3RSc5y*sa;koEeoE>@KYsu% CyACY? delta 35 qcmZ3_J1R;?aUVikAq5QCXIqNwR6OyUuQ50~>Nk zdy;}>LH~$9!2jTFuj0Xrzd*saHAp*;@0<6%dA#>#=9l%kzJJ(i*}uQ(H^-ci@8rfp zO^y&rcD4WPNE*UcpzIZhhGMF*g11~WMN4dmO=(K&oT#?iQjJMx1uHlvnAcU^A;_An zpM&UKefoNL&>u%L)gQb(eDbt^66w<<_I%a%BdPjDo!u)g;NjA)T2dsF=oW51L#mdA zFcB{h$w#D|Oo&9gpgA4VU9wNf!o27)Fc{l~gi}kn0?{ zkz-FwszjK0vLGOUJtUCEcy4 jhg5uE54vLW_Rt4O delta 494 zcmYjNJx}B?5cNkko6T;Puu$AprvrgVfwrK4f&vM|b?BsPkneO+w4Oi^n?$yeSSc%t zrKLa-LZYPOU);|?Zt3|AHxZvRn&&sRXWrPio#*!QMiBVf*1dRSgglW?<{;m}(B^u1 za~r5^&8YB!gFmBx9MKg$5s1EYW&4uA9E9MX%+KhI?h(8G&AgC=rsgGDkiC9S8U2FenKl0 znmWi>g|gFDR61oGH-O)n%eIL|iq!MR1X3CN?U` zby}#g?Yz^-we(Q9hp_=|Z2z^{B+haP=YkidD#o}kXau~V#r5@ zgg)llLm)KhQ6F6mFo_oHpZsCnx@D5fL|ax$+se=llhv!v eQd`aAks8#$o$p^MQXL}nXyYFBn8!l)h5rYg1$+Pi diff --git a/q03_ohe_encoder/build.py b/q03_ohe_encoder/build.py index 36e4b90..f2175c1 100644 --- a/q03_ohe_encoder/build.py +++ b/q03_ohe_encoder/build.py @@ -1,19 +1,27 @@ +# %load q03_ohe_encoder/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset from sklearn.preprocessing import OneHotEncoder -import pandas as pd import numpy as np +import pandas as pd +path = 'data/student-mat.csv' +df = load_data(path) +x_train, x_test, y_train, y_test = split_dataset(df) +category_index1 = [x for x in range(len(df.columns)) if df[df.columns[x]].dtype == 'object'] -df = load_data('data/student-mat.csv') - -x_train, x_test, y_train, y_test = split_dataset(df) - -category_index = [x for x in range(len(df.columns)) if df[df.columns[x]].dtype == 'object'] +def ohe_encode(x_train, x_test,category_index = category_index1): + cat_col_list = x_train.iloc[:,category_index] + for cat_col in cat_col_list: + # encoding in dummy variable + dummies = pd.get_dummies(x_train[cat_col], prefix=cat_col) + x_train = pd.concat([x_train, dummies], axis=1) -# Write your code below + dummies1 = pd.get_dummies(x_test[cat_col], prefix=cat_col) + x_test = pd.concat([x_test, dummies1], axis=1) - + # removing the variable + x_train.drop(cat_col, axis=1, inplace=True) + x_test.drop(cat_col, axis=1, inplace=True) + return x_train,x_test - - diff --git a/q03_ohe_encoder/tests/__pycache__/__init__.cpython-36.pyc b/q03_ohe_encoder/tests/__pycache__/__init__.cpython-36.pyc index 8c87a88f1c4ac0875da221298faa5cf1f1990908..e41b4b06ac5ba60cee051aecbbf88e75c7f15ade 100644 GIT binary patch delta 47 zcmZ3?xSo;2n3tE!A<`mxB8RzjjDALbZmNE;kFklVet3RSc5y*sa;koEeoE>@zfb@$ Coeo6+ delta 35 qcmZ3_xR{Z{n3tF9rT(I*i5%wq0s0yFxvBc;MX8mECHc7%qe20_gA1kr diff --git a/q03_ohe_encoder/tests/__pycache__/test.cpython-36.pyc b/q03_ohe_encoder/tests/__pycache__/test.cpython-36.pyc index 1956a19a3862d792c03ff34e686b4f3716827383..58c26b56e875c4e729488322670d71bd1ae0e259 100644 GIT binary patch delta 228 zcmX@ceTkdHn3tE!A<`mxBS#*iaTIGxNo7H*Cetk@J%d|}6)PEvco`TNenseKhYU3*%>QkW#SvBEHF=m^v5*Cs#8YG73#z z%PcJ_0+JJjD*!9yn|zl!&rl2`D2XZqkp_tg00|JUm<331FmbRH2~4hG`J*BXlH>vr R;vfQ~3}Q91Bj&Jb0RRG*F4q76 delta 220 zcmcb_eTR;*+w;$vW7_~oOYk)NBY zpI($&nOKsat3UYyi~Qu1jAo1ilbAkpgOq^P74c90$JD_nG`XGGkWqN@PG)IQQIMP% zTme`q|KyjO>aWM;!;9%llDH5FA!SY8%1SH7?A|yZrNEyUx KWJj!E)dB#T{Viqy From a5e263d32b1c588635f011a7a7c5c239beb3fd85 Mon Sep 17 00:00:00 2001 From: SL345 Date: Tue, 14 Aug 2018 14:04:40 +0000 Subject: [PATCH 05/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 169 -> 181 bytes .../__pycache__/build.cpython-36.pyc | Bin 810 -> 798 bytes q05_linear_regression_model/build.py | 8 +++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 175 -> 187 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1588 -> 1600 bytes 5 files changed, 7 insertions(+), 1 deletion(-) diff --git a/q05_linear_regression_model/__pycache__/__init__.cpython-36.pyc b/q05_linear_regression_model/__pycache__/__init__.cpython-36.pyc index 06a2a9b901d2940b1616332fc3af2e6292737630..cbc02e75b4f2b61b9bf7395d21eab32d96754f50 100644 GIT binary patch delta 47 zcmZ3hZmNE;kFklVet3RSc5y*sa;koEeoE>@zi0q6 Ce-2#$ delta 35 qcmdnWxRQ~>n3tF9rT(I*i5%wqVfq>QxvBc;MX8mECHc7%qoM)7jSId2 diff --git a/q05_linear_regression_model/__pycache__/build.cpython-36.pyc b/q05_linear_regression_model/__pycache__/build.cpython-36.pyc index c40d112c5d846cc979296e4912c2f11a9f286eee..3d11d4f63127d625ed8e119abb63794fdcdfe21d 100644 GIT binary patch delta 233 zcmZ3*Hjj4hP_K5hBqQuO+TkMq(Mif&{?n;ItcA%PH@%kD0xvBcWKE@`d`r-LS z*~JBk$*KCu`6;RTllz$DCwDShND2T|7PA2f21YhU9>yY0Aj?ma@0R^!1tz`898A~U yi$Jos*nk$K7MFnK!NwyI93TZ8Ho5sJr8%i~Oh8^SACTZ-@zeE5w CVGeZw delta 35 qcmdnZxSo;2n3tF9rT(I*i5%wqG5Q(#xvBc;MX8mECHc7%qY?qZmkZVa diff --git a/q05_linear_regression_model/tests/__pycache__/test.cpython-36.pyc b/q05_linear_regression_model/tests/__pycache__/test.cpython-36.pyc index 54551b93750f647d6e93e9edd56a0f2642a67061..d3b6e4f486542468a8c9e63c23879fe8a6327a16 100644 GIT binary patch delta 55 zcmdnObAX4#n3tE!A<`mxBS!+0Op1O+er~FMu#d5cseX8VQFd`bVsff}a(+sx{$v?e L`OVXr<}w2SwfYc? delta 43 zcmX@WvxSGln3tF9y~U!ajT{L~0ulNd`MIh3=|!oPi6!~D`jh)v Date: Tue, 14 Aug 2018 14:19:40 +0000 Subject: [PATCH 06/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 162 -> 174 bytes .../__pycache__/build.cpython-36.pyc | Bin 1086 -> 1019 bytes q06_cross_validation/build.py | 6 +++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 168 -> 180 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2082 -> 2094 bytes 5 files changed, 5 insertions(+), 1 deletion(-) diff --git a/q06_cross_validation/__pycache__/__init__.cpython-36.pyc b/q06_cross_validation/__pycache__/__init__.cpython-36.pyc index 9a1c3aaa4d67dd0ebf5ed2b2e34d7c0807004b94..94af4136c34b164988baa7a51aa67335d8b8ebc4 100644 GIT binary patch delta 47 zcmZ3)xQ>y-n3tE!A<`mxB8Rzjw0=f@ZmNE;kFklVet3RSc5y*sa;koEeoE>@zYqX0 CA`U?S delta 35 qcmZ3-xQLO%n3tF9rT(I*i5%wq{`wjDxvBc;MX8mECHc7%qe1|^EDNFl diff --git a/q06_cross_validation/__pycache__/build.cpython-36.pyc b/q06_cross_validation/__pycache__/build.cpython-36.pyc index 2e1c378d0210faf52111a997f473e84d10da11f6..7a3800f0757d0574794e50313cebad58f6168225 100644 GIT binary patch delta 289 zcmdnT@td8~n3tF9|Z3o!ho@mbiy_Xm_iiM!d7k4NSbBIOk(2xgqcwctXQND2>S+h zmSXRNT<`(X_yF2?HzLR|hr_w&ely?xdr<2&8XE_P&x7c-)`Lf%F?L4RbVw|l!jwx` z05B^gmqI#A{vfPVumTER2$A|mT-9i6B`T>vA;%z#%q*E$gLNHeGEXC8 zW2=zseVX#&-M}})Tu-ub=poN8X6XI)&@oC$U179Gf=;U9EOgLKbEy)9D}*_^H={g} zFHCP!F6DDVG~cww&=Vid=L7YlpvQQ s^zS39<4J}d8D%W`^S^)$1$v9BYr^``f6}TL!7=^sHc=-~eu!P*KQHHE00000 diff --git a/q06_cross_validation/build.py b/q06_cross_validation/build.py index 406a734..11f033d 100644 --- a/q06_cross_validation/build.py +++ b/q06_cross_validation/build.py @@ -1,3 +1,4 @@ +# %load q06_cross_validation/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -18,4 +19,7 @@ model =linear_regression(x_train,y_train) # Write your code below - +def cross_validation_regressor(model, x_train,y_train): + r2_score = cross_val_score(model,x_train,y_train,scoring='r2') + return np.mean(r2_score) + diff --git a/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc b/q06_cross_validation/tests/__pycache__/__init__.cpython-36.pyc index b571b36039256ecb659b19941ead2c342e31d840..543cff697c52eed58eda610578b2ce12f5536e05 100644 GIT binary patch delta 47 zcmZ3%xP_6!n3tE!A<`mxB8RzjqJBnxZmNE;kFklVet3RSc5y*sa;koEeoE>@zbF7R C1P)mM delta 35 qcmdnOxPpQ6qvCcjydS&mUa5U8{Wq#iDLg8;WE+NQ@6iNCI&&8<5~&;$Y!m zF5;Wa%ofWR#hO=|TTodf2b74ipX|@Bw|Nd58zZCC Date: Tue, 14 Aug 2018 14:26:51 +0000 Subject: [PATCH 07/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 161 -> 173 bytes .../__pycache__/build.cpython-36.pyc | Bin 1168 -> 1184 bytes q07_regression_pred/build.py | 8 ++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 167 -> 179 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3674 -> 3686 bytes 5 files changed, 8 insertions(+) diff --git a/q07_regression_pred/__pycache__/__init__.cpython-36.pyc b/q07_regression_pred/__pycache__/__init__.cpython-36.pyc index 3e7e4674f103511456d5015475ef0cbf23edade2..2794900dbd3cdd687b1bbc147d701be55aea4046 100644 GIT binary patch delta 47 zcmZ3;xR#N_n3tE!A<`mxB8Rzjlzv8jZmNE;kFklVet3RSc5y*sa;koEeoE>@zhD3_ Crw%;; delta 35 qcmZ3>xR8;G)*8Tr{N;!9GCOK!1Mg6YYx8RcZc^)vEwQ}u&=j7?1S z!}E)>iwhEyQ}vVcQ&ROOJ2J~pwqP=5l-QiZw4YJ9h?{|d;TAhkcTr+yUJ(zFH`#?n eSDqQjC>8?}B1}AtJRl4tIhX{P_?Wnucvt|JR3cjd delta 147 zcmZ3$If0YYn3tF9rsbk2){UHZ8I2huZZTHgVylcVC`wJa#hhE53M3L!Z!r}atz;+? zWME+U<*lEQpPQ;p3`mGD@i6j$Fp%V65@6zE;$q@q1^_01Dh&Vt diff --git a/q07_regression_pred/build.py b/q07_regression_pred/build.py index 3f2eee3..fe464d9 100644 --- a/q07_regression_pred/build.py +++ b/q07_regression_pred/build.py @@ -1,3 +1,4 @@ +# %load q07_regression_pred/build.py from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score @@ -20,3 +21,10 @@ # Write your code below +def regression_predictor(model, x_test, y_test): + y_pred = model.predict(x_test) + mse = mean_squared_error(y_test,y_pred) + mae = mean_absolute_error(y_test,y_pred) + r2 = r2_score(y_test,y_pred) + return y_pred , mse, mae, r2 + diff --git a/q07_regression_pred/tests/__pycache__/__init__.cpython-36.pyc b/q07_regression_pred/tests/__pycache__/__init__.cpython-36.pyc index f1435e528c2d79d16299d3cf5270ab25f34f4b3c..1bc36467a31788f0491f299446919ddef096beed 100644 GIT binary patch delta 47 zcmZ3^xS5f|n3tE!A<`mxB8Rzjf__GRZmNE;kFklVet3RSc5y*sa;koEeoE>@zeoTw Ci4Ii& delta 35 qcmdnYxSWy0n3tF9rT(I*i5%wqA^I8lxvBc;MX8mECHc7%qap#m-wU1h41}u)R*K-#$Mr~H+xy>jb U0}_!35sDy!4=5)-S(VQe0J%dltN;K2 delta 202 zcmaDRb4!N9n3tF9rT(I*jU2|z0s;CN`MIh3=|!oPi6!~D`jhQ>o} F2mt3xF;xHn From d859c5787d9d3b1c98670ea6b5c66ffa951a0287 Mon Sep 17 00:00:00 2001 From: SL345 Date: Wed, 15 Aug 2018 07:27:13 +0000 Subject: [PATCH 08/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 158 -> 170 bytes .../__pycache__/build.cpython-36.pyc | Bin 1359 -> 1382 bytes q08_linear_model/build.py | 10 +++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 164 -> 176 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 3958 -> 3970 bytes 5 files changed, 9 insertions(+), 1 deletion(-) diff --git a/q08_linear_model/__pycache__/__init__.cpython-36.pyc b/q08_linear_model/__pycache__/__init__.cpython-36.pyc index b91b141617b95b635e59b43a1e9967e108638c18..43dc77e922ce36f707548fb710a5dd238530370b 100644 GIT binary patch delta 47 zcmbQoxQda(n3tE!A<`mxB8RzjxPC@{ZmNE;kFklVet3RSc5y*sa;koEeoE>@zW@L( CHV!cW delta 35 qcmZ3*IFFITn3tF9rT(I*i5%wq-ufB&xvBc;MX8mECHc7%qXGcC&iwhEyQ}vU92I)_p$Ra;^J(Gr- z2vB7)50GGB0_3D3kilScz>Yy8B!CjPIBbCaDa}c>W16hZssaFaUs!Me delta 322 zcmaFHb)JjUn3tDJ-D**k(niiYM#iAY9gO;ZHS9GUHJmAob69G*N|>`)YPeFE(iu~j zdzosvYglU7YPi#wgBdhg{4`l^u_nitCFa~>&Mi&_5{ap|n2L;w7#SECG#PKPX6B`& zR!kOUa&=>LFX8|S-eRkaFDOb)DdGfjinu@oH;{;8&#jD4$xJS}#adjFSW>)_p-2oU z{L4c>BR@A)KfNfmGO;8-SAX(;X8Fk{m^9RcfwILsK!Smhi;0Ixgo%$yfT>6V$k&v) z#a57*my%dq#JgFH`8s1bKTxzt07M9a2q7SGi#0btB^Bsupwo*)K%%Jb0h@zc2tX C7!FAQ delta 35 qcmdnMxP+0zn3tF9rT(I*i5%wqf%+NwxvBc;MX8mECHc7%qrw2a+6$@x diff --git a/q08_linear_model/tests/__pycache__/test.cpython-36.pyc b/q08_linear_model/tests/__pycache__/test.cpython-36.pyc index cbaeda35dafd76d9b3875e0d9e56e950079bc591..438527cd07a37da1e6ac6cd84d0dc0d755ab5a50 100644 GIT binary patch delta 68 zcmew+*Cfwj%*)H=5NQ#;kt2>-CQ?5mKQ~oB*vHt!R6jhwD7&~IF*#K~IX@*;f3hsE Y{N}05nVgJKoB#8OGBHL?7UfR_0I!@BB>(^b delta 51 zcmZpY|0c&_%*)H=Yqcn9BS#!Fzps8qer~FMdQoa+Vo84P=0@gDPR3iCxp_sI7;jBh H Date: Wed, 15 Aug 2018 08:00:19 +0000 Subject: [PATCH 09/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 1339 -> 1377 bytes q09_advanced_model_q01_lasso/build.py | 12 +++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 176 -> 188 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 4099 -> 4111 bytes 5 files changed, 11 insertions(+), 1 deletion(-) diff --git a/q09_advanced_model_q01_lasso/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q01_lasso/__pycache__/__init__.cpython-36.pyc index b8b8fc73c23c3602d2cc8046c670d9178deb30ae..5e6a70e2fe5db756c6167fca12d4198661dd1744 100644 GIT binary patch delta 47 zcmZ3*xQ&s+n3tE!A<`mxB8RzjvVKN>ZmNE;kFklVet3RSc5y*sa;koEeoE>@zZd{B C`VL_L delta 35 qcmdnSxQda(n3tF9rT(I*i5%wq;rbc*xvBc;MX8mECHc7%qhbKR5LZ7{}+Cmu!+v)>>;lNL>XHaxu{AP4pmmDy3LqVHN7IGu?JgHen_$2ot32 z#fzt0{Q@4vqhFz)U_jb_jh=ks$$|fGo|k$4GxIyXj-#D4jlce}?=OBv6ZkSBgb37Y zls!WmrAJ#^zDML4t;6ao27$Q6GW2fI7Zp68Rwe6qEi z>3oKEd3Vmn-6ehU*o#71TiwF}yN)1`K#WRY147uu-Hd-dVsBw|3!6Tu@u||9_3oVS tzcFiAGq?K&RYzu{&+hiv?9qFgagY8v|KS0qK74`yIxX}|+T9lq{{j_sd2Ijy delta 478 zcmYjNO=}cE5be+T%5DbsOO@boI9t?;i0U-!WlkQD+nb{eu+mJ{Pd)RXh zve%rvNlw9I{z>2RH#}J#FVfVb>UF<*Ree|77Wq!UU(8 zBVK5#ndXoiW$gQvQ~%uy>e;*sz%wg4Z?l}SN1}B zK6IcK6?^ffQr0%mkAmc4*n-hV9Iap__F0XzjHB3J1U9kybGUul)Monx%!P7Iy|`n8 zXRv`ck1%ZfQ9_q#56?roMPcLj9^a?SYe@za#)Q C+zxpF delta 35 qcmdnPxPg(wn3tF9rT(I*i5%wqvHBVLxvBc;MX8mECHc7%qmlr@?hD!g diff --git a/q09_advanced_model_q01_lasso/tests/__pycache__/test.cpython-36.pyc b/q09_advanced_model_q01_lasso/tests/__pycache__/test.cpython-36.pyc index 3d92981a85fdfdd93eb4850d6b323ecab8bd7161..e0cf1bf291c8ec4e7d9c5ca6431df948aa85e3a5 100644 GIT binary patch delta 190 zcmZox=vUw{=H=ybh_r~_$l=K>ovNRapPQ;5>|<v}u3{EfAp#BJ@Fo y0f;c1e2`y!b0Y5sMzLG0d8N4pl|{-x@hG-}#JrTm;v)6Q>ikm})h6%Z4+a26PBH-i From 0359912f6427bd0b56417fad88a151d2035c0480 Mon Sep 17 00:00:00 2001 From: SL345 Date: Wed, 15 Aug 2018 11:43:34 +0000 Subject: [PATCH 10/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 170 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 1339 -> 1531 bytes q09_advanced_model_q02_ridge/build.py | 21 +++++++++++++----- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 176 -> 188 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 4079 -> 4091 bytes 5 files changed, 16 insertions(+), 5 deletions(-) diff --git a/q09_advanced_model_q02_ridge/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q02_ridge/__pycache__/__init__.cpython-36.pyc index 222893d6c4bc0f716c4fdbff600e66340545b3cd..5f2508e0107b77905b35b71da30db14f970eab7d 100644 GIT binary patch delta 47 zcmZ3*xQ&s+n3tE!A<`mxB8RzjvVKN>ZmNE;kFklVet3RSc5y*sa;koEeoE>@zZd{B C`VL_L delta 35 qcmdnSxQda(n3tF9rT(I*i5%wq;rbc*xvBc;MX8mECHc7%qhbKRfgc5cTfbj_o)!ZQAq;2|*+zA84euhzmkUpkAoB6eyTVVaaaWq;{OnZjnHa zsw$k2dZ=>c4l$c4YbUO4bC;KFR^p&sq?%$uFrH}gIETWxLBYSGVG{Te*S`R!c! zT=XB}QC}}wuU_W$w4TqVv&0dO2(r1nkv51UtNr=@f(XY1eIlYUNt=?%=9uic>0-K+ zE~hKflZ$d`O!uf|#5EC%+DDSE3V+8*W-flb*koodmweDs$0r=5=tzJ9Ok>LNx2nia zw7et(SnsHA0dlfHo}AWD9?EteS(%>@w9_YjDu~siS?LNY*f||}rPp^$r=(+wJVsNW zjeO+&5^s+xSXt3Q$;!%@VjSr3zds6fbm>KNQ$jmTQVf^alyk+KCbof=9E(B>(Mrva_gYwRDA%EyoZ delta 608 zcmYjN&1(}u6rYcs{YW+;Z4w))v_he{7Xx||DS{;j4_+*SOCSu+Bu&UBadukTGD{EZ zwTH474_*{6o;~_Uh~R0!llV{Q#W(52dA!H(egEG4t$(fUJ!~{;pB{Zo3lE`R=)VU( zdIFliyWV?sh>@(%TC)uimKZP=QHj${N#$mVhhExFJ83t)C7Eo?PDzHuMMOi?Mf?`0 zTf%>VlIHb~m(>VAyNqF~5Bk(i7hp6pp1^_#dPNIn*bEzFNJ%i##IQA{g|8`KY-mY` zUJ(>w5fwG<&6x4EKMM>HGm)tY@4YA31PlL)6m{qbOnppYeenE9g|IBSq?Ymd>X_ST zu~ZqKPcNj66<>&DHp(^EGVv^XJv!xc>!~c4mS$X9q8=#h`mtrxg^*`SsN5Bnj;C4$ zfE05sSqU2*a?J;dXVA7-SucO1bQ0U(Y@`*hev><`nk!{$Dkf4j09PBdx5M1_{4-KJ z5czY|KVD|CKT-0W>t)uje$w6Qgzn!{+mP;p=I$pEZsHiEgYV*XCc!F#aMJtojSg_z z6z>% diff --git a/q09_advanced_model_q02_ridge/build.py b/q09_advanced_model_q02_ridge/build.py index 0fb3e1a..05b822e 100644 --- a/q09_advanced_model_q02_ridge/build.py +++ b/q09_advanced_model_q02_ridge/build.py @@ -1,3 +1,4 @@ +# %load q09_advanced_model_q01_lasso/build.py from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset @@ -8,18 +9,28 @@ from sklearn.linear_model import Ridge import numpy as np import pandas as pd +from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score from greyatomlib.multivariate_regression_project.q06_cross_validation.build import cross_validation_regressor np.random.seed(9) df = load_data('data/student-mat.csv') - + x_train, x_test, y_train, y_test = split_dataset(df) x_train,x_test = label_encode(x_train,x_test) -# Write your code below - - - +# Write your solution here +def ridge(x_train, x_test, y_train, y_test, alpha=0.1): + np.random.seed(9) + model =Ridge(alpha=alpha,normalize=True) + model.fit(x_train,y_train) + val = cross_validation_regressor(model,x_train,y_train) + y_pred = model.predict(x_test) + mse= np.sqrt(mean_squared_error(y_test, y_pred)) + mae= mean_absolute_error (y_test,y_pred) + r2= r2_score(y_test,y_pred) + d = {'cross_validation':[val],'rmse':[mse],'mae':[mae],'r2':[r2]} + stats = pd.DataFrame(data=d) + return model,y_pred,stats diff --git a/q09_advanced_model_q02_ridge/tests/__pycache__/__init__.cpython-36.pyc b/q09_advanced_model_q02_ridge/tests/__pycache__/__init__.cpython-36.pyc index 602e1f5d5c4f60e2bd8813680dc29fba2e27d856..67b8393d898371282d36dc66c4075bb3205f2772 100644 GIT binary patch delta 47 zcmdnMxQCI$n3tE!A<`mxB8RzjrhZ0#ZmNE;kFklVet3RSc5y*sa;koEeoE>@za#)Q C+zxpF delta 35 qcmdnPxPg(wn3tF9rT(I*i5%wqvHBVLxvBc;MX8mECHc7%qmlr@?hD!g diff --git a/q09_advanced_model_q02_ridge/tests/__pycache__/test.cpython-36.pyc b/q09_advanced_model_q02_ridge/tests/__pycache__/test.cpython-36.pyc index 37f31c3afe884d721a91308abc3e21f01dc3af87..321fc886f11dc86f939198dc5dee19bed12d015e 100644 GIT binary patch delta 198 zcmaDa|688Jn3tE!A<`mxBZnumbgF(ver~FMu#d5cseX8VQFd`bVsff}a(+tc<^*Ob zX2z(^)od@A7*#i?aI!LTYcVh|6sdv;?a2uoQj`0*?qi5e;=Y3+HkqeFUInC09Ykn? z2ptfi2O{)Agu{NkG(c{ebMMX~0U<`z^IDFel$*a{N!QWA@c)F!j@PhnJ@JcmCR E0JI}8{{R30 delta 212 zcmew@|6ZQMn3tF9rT(I*jU1lL{E_+@`MIh3=|!oPi6!~Dn{$|@m^p8;=cObT6(v?q zZe*9)yqfI@6QkPZ0!~&&Zfynzh9Wf(p)+|Ro7Ci4T=y}==5gP_5S!0aA+HM3rU4?f zK!h%c&<7C)Ai{9+T7L1(zPuY46>hQSmF5;y7AXV8qu2@(fsQFIQU@uL2Z^{%KFF&# O*_%IxQEl=H{$K!Wj5lon From 28ea9e8a9fdca954d97d213e0dd0b73fb70655d5 Mon Sep 17 00:00:00 2001 From: SL345 Date: Wed, 15 Aug 2018 14:17:17 +0000 Subject: [PATCH 11/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 165 -> 177 bytes .../__pycache__/build.cpython-36.pyc | Bin 911 -> 832 bytes q10_data_missing_values/build.py | 7 ++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 171 -> 183 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2358 -> 2370 bytes 5 files changed, 6 insertions(+), 1 deletion(-) diff --git a/q10_data_missing_values/__pycache__/__init__.cpython-36.pyc b/q10_data_missing_values/__pycache__/__init__.cpython-36.pyc index 9f50df257f7dadafbe3ce884c55c000ecc154d68..9b65e244389b59d6124f1182299b7eeb5bd208d3 100644 GIT binary patch delta 47 zcmZ3=xRH^=n3tE!A<`mxB8RzjoPI`rZmNE;kFklVet3RSc5y*sa;koEeoE>@ziLEVZ9I_uz4f>2U()fCgTNdzN;Lw2QPa}k{M zU%2`g-s&%Kb@E+B=;S-T@4fr(-p70I`lHd@HqC1H=*4^BjD511(5OBjq_30axGk5Z zS-=_hEYFs8xgxCsi0uLj4vZAKs~pV#X7vIr&`z0Coji4Rft)IYL*-Z}x?=-YD29v= zDh2d8eT8F3LlMaIJPCUeOBdD}fY5nk$pZC!pSYKCB;AWd=6)7OZutcplI7)TxkZhDQD;P(i}f8^K5D;oK+* shZ$;FK9bYvW=M^Lq8-J-^_ARHyQdAJ8mJ?t5PS(1xzK8$TO@zgPe? Cbq-|! delta 35 qcmdnaxSEl}n3tF9rT(I*i5%wq5&9YVxvBc;MX8mECHc7%qhbNTI}64D diff --git a/q10_data_missing_values/tests/__pycache__/test.cpython-36.pyc b/q10_data_missing_values/tests/__pycache__/test.cpython-36.pyc index 17019265bc29ee0e0ca9f98bf98dfee0d9486c8d..774d9369d1730f2a3c9ae3126825b04dbda3d3ed 100644 GIT binary patch delta 56 zcmdlcbV!K9n3tE!A<`mxBS!|4bb@|Her~FMu#d5cseX8VQFd`bVsff}a(+tc=6WUp MHpZyQ6F8Ou0Lz6DCIA2c delta 49 zcmX>kv`vV^n3tEU&t*~6Mve?7fe`(S{M=Oi^rF Date: Wed, 15 Aug 2018 14:27:36 +0000 Subject: [PATCH 12/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 177 -> 189 bytes .../__pycache__/build.cpython-36.pyc | Bin 1081 -> 997 bytes q11_feature_selection_q01_plot_corr/build.py | 15 +++++++++------ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 183 -> 195 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1488 -> 1500 bytes 5 files changed, 9 insertions(+), 6 deletions(-) diff --git a/q11_feature_selection_q01_plot_corr/__pycache__/__init__.cpython-36.pyc b/q11_feature_selection_q01_plot_corr/__pycache__/__init__.cpython-36.pyc index 35c8cae903f3144112ac43723fc1b6346aa0fe84..6e1b653c27603e5f1f5cf862bc7405bee13538fa 100644 GIT binary patch delta 47 zcmdnUxR;T`n3tE!A<`mxB8RzjmVQQlZmNE;kFklVet3RSc5y*sa;koEeoE>@zhnS6 CR}Osu delta 35 qcmdnXxRH^=n3tF9rT(I*i5%wqarzngxvBc;MX8mECHc7%qmlu_MGM{l diff --git a/q11_feature_selection_q01_plot_corr/__pycache__/build.cpython-36.pyc b/q11_feature_selection_q01_plot_corr/__pycache__/build.cpython-36.pyc index 35748ec9368f7249043702f94546923c07c4c418..2b368f87e54357cc3939022f08d142a89bdf55fa 100644 GIT binary patch delta 456 zcmYjLyG{Z@6rDRez_Pp_CiGO>NP!v(G$zJE<0Fwm9cdP35O9~>%&hSd2#IT9LqTZ$ z0YAZCSxaMK;|Ewdiw$!#=bSmY_uP5czY^7YCSx2n{HtjUp-;4Oh|;_2%BOktpurFW zJ43TvXYl}NjvG7|K%3A!Ezlw@@ifo#LV(*ia+tw%mV5?Up1;0KqolnkX-k2RhA>vu z!whE7#uGfz#%PEGG$Fn=BxAxb(`Fc=&RBo|G1NjPIWd7IdV^~@c;qyGX`hNSrYzER zEYFOGnrHhWS`?D5D@3Ttk)(+}w|r;c@+gsg_s)!knDs)kjL=jT#n!z@si8L{a*BSh zYkk+@wboI6W3zVdiW})!U0&Y}dC3 zoptXaQZ)Y0!dQIcpAt<-ZgpHS5@|IdG71(ST6H^$S$<&!^2!VKrsJ|(o9}4qC5s9S Os6cvII@WO>vZ+6&(P`QM delta 541 zcmZ8cJ#W-781`#Bmt2}luLU7g*lvoDC=z24LZS-`NU%V-CDguaPDy-n+)w4y!L8J# zLv{ZEvG5c48;o8N0}Eni;`K35VaxBw^L{*!zlUF<(c{4&{<`}ycL5>a$c@7>eul3- zy&k=IBqPzYkPl=m2NuRWPxJMBm~Y5LrgGiVG4+UuMI`#?kZ)dpx;(>;8B;nDzhfvlP*I zwq^;CGeO>vEO?oL3n%5YEl;KEy{lg7*WyQxiV%;qGKDEslO>MtDXq2twf4eYSQn<< zS4W!pEYL+Wm5x=iap9h-4(g_L!CaS((bPAvd1V~;16km>C`|DHQ{>d?s*DO8Esj4E zy@mPj_uKobmfKS;PYR>z@zf1r+ CIS!Qo delta 35 qcmX@ixSf&1n3tF9rT(I*i5%wqDf$`txvBc;MX8mECHc7%qcQ=+PYd<{ diff --git a/q11_feature_selection_q01_plot_corr/tests/__pycache__/test.cpython-36.pyc b/q11_feature_selection_q01_plot_corr/tests/__pycache__/test.cpython-36.pyc index 93b5347767868d7c98b1b5816f63e3fa98466c9c..4b1d1aa9dcd0f916fba682672ba9f28bd1610fbc 100644 GIT binary patch delta 62 zcmcb>eTSRFn3tE!A<`mxBS#36Opbm=er~FMu#d5cseX8VQFd`bVsff}a(+sx{^W%$ S@|(Mv9x^gUZO&y$W&{97m=jt6 delta 50 zcmcb^eSw?9n3tF9rT(I*jT|9N0txyV`MIh3=|!oPi6!~D`jgkP$Zwv`^pKJ9*5*o< GWJUn1bP-bk From 7b95a5608761f51a61b228694e3d150006be266f Mon Sep 17 00:00:00 2001 From: SL345 Date: Thu, 16 Aug 2018 04:21:58 +0000 Subject: [PATCH 13/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 183 -> 195 bytes .../__pycache__/build.cpython-36.pyc | Bin 1715 -> 1462 bytes .../build.py | 14 +++++++++++--- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 189 -> 201 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2604 -> 2616 bytes 5 files changed, 11 insertions(+), 3 deletions(-) diff --git a/q11_feature_selection_q02_best_k_features/__pycache__/__init__.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/__pycache__/__init__.cpython-36.pyc index cce1771df2aeb4fe480a861dd0b34c2812778bf4..202a7b8c486b0ff82c12bef5965b879451bba0eb 100644 GIT binary patch delta 47 zcmdnac$ksHn3tE!A<`mxB8Rzjfqq7QZmNE;kFklVet3RSc5y*sa;koEeoE>@zf1r+ CIS!Qo delta 35 qcmX@ixSf&1n3tF9rT(I*i5%wqDf$`txvBc;MX8mECHc7%qcQ=+PYd<{ diff --git a/q11_feature_selection_q02_best_k_features/__pycache__/build.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/__pycache__/build.cpython-36.pyc index b0c88c740ec407a51b8c32a0e223d58ea3040313..afd000e722fd59772d8dfa298a1894d114c960e5 100644 GIT binary patch delta 664 zcmYjNyN(kv6tz9?JeIK9W!Z`fq%@l%3jzs20ZN5vB7tOz(J*$xBr{{n_8=Bblp+${ zR`UgvTOuTWfWL6Vf3OXAvI!vTUf*+leD33W|3^0(_xqin*XEu47L|D2K?u2EFTk_` zXOO`)Vfd1)oZ4BC8r671FoL+n?gpKrm0P2QxA6aB&jco{z1rQ74PN;sT6Aik5$4PZ zb3rMngGHA)%ws;F&;)hJ$SK<3^(v~PDH;Z^hnRLGS1B(|mU9|Tcw#EWHT9>dfP08- zkczx2N<9H?lxU!`teg*fia_7W0Z03@%)~||rJe~@&_Hkh#U&v|NuqW(=S z8_xEfAMK-f*T%LIVY3@$&f@$D)TRR?WW0=};w)>W^c7Oa(Bto7^g$GSG<`Kbe>i$8 z)KbeN<)c(EK5D*t_nI%{e0=i+UItV|JtL7O z9%}l#F$QAhGdlsf2O@n?zzsDJfbi~jP#PzoTp4r0qzC|T6}1j|##(*B#*yM#D;uRM zIf_IQDb^K>H`dOY-%g|KfJU7sCM^g$dA|5$-Jfo?QyxdD?0~UEylWC|4cS6MXFF(W02D#?<0E|BH`>-;>P%m_`fxeQD_8z)s21LD>r=u*Fkd$m~iz@tJYS_Py zi@Kq66|~bts+ea*XC2PcT;ZaV=6?ilQOy-$hA9j%toIVtRU*n|kBdy(CRgY!`_qL+ zaiJL14gmU0TPe%6BM+m3X_6P(jh22V<^7l2p4?d$wzBBBSrKayT%qw;pNMbij=D~IoK-3#?tQ1ep$6!_`N0t z)h?7pIdnrZD4x)s_Kr=Hl3crBFsZaRzIA{B4zU60mt!%n>SjRZO1}-2k5bkliwkEH F<39{^=h*-N diff --git a/q11_feature_selection_q02_best_k_features/build.py b/q11_feature_selection_q02_best_k_features/build.py index 95002c5..e833253 100644 --- a/q11_feature_selection_q02_best_k_features/build.py +++ b/q11_feature_selection_q02_best_k_features/build.py @@ -1,3 +1,4 @@ +# %load q11_feature_selection_q02_best_k_features/build.py # Default imports from sklearn.feature_selection import SelectPercentile from sklearn.feature_selection import f_regression @@ -20,8 +21,15 @@ np.random.seed(9) # Write your code below - - - +def percentile_k_features(x_train, y_train, k=50): + selector = SelectPercentile(f_regression,percentile=k) + selector.fit_transform(x_train, y_train) + scores = selector.scores_[selector.get_support()] + features = x_train.columns.values[selector.get_support()] + features_scores_list = list(zip(features,scores)) + df = pd.DataFrame(features_scores_list, columns=['Features','Scores']) + sorted_list = df.sort_values('Scores',ascending=False) + top_k_predictors = list(sorted_list['Features']) + return top_k_predictors diff --git a/q11_feature_selection_q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc index 3a1830b270d6d769e5565023aecb9be5259bd743..5ac181f5ef5c5e5fc7fa188a8af8663f552ef51e 100644 GIT binary patch delta 47 zcmdnXc#@IBn3tE!A<`mxB8RzjnSMroZmNE;kFklVet3RSc5y*sa;koEeoE>@zkC2a C8xE}i delta 35 qcmX@fxR;T`n3tF9rT(I*i5%wqS^63IxvBc;MX8mECHc7%qw)d9Squ&U diff --git a/q11_feature_selection_q02_best_k_features/tests/__pycache__/test.cpython-36.pyc b/q11_feature_selection_q02_best_k_features/tests/__pycache__/test.cpython-36.pyc index 7c11282368a691d1031e0ef3e349d85d1d4b9116..3864008d3a7e71a51207e78c90c33548c66690ff 100644 GIT binary patch delta 75 zcmZ1@vO|Q!n3tE!A<`mxBga}MnIip+{M=OiU>{=>Q~mJ#qU_>=#N<@{~2^X_22x|cW+LM|Io{-TMQ2+n{ From 08a5e32b667861f390cc9a6d89e9e60bc47e74a2 Mon Sep 17 00:00:00 2001 From: SL345 Date: Thu, 16 Aug 2018 04:32:16 +0000 Subject: [PATCH 14/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 163 -> 175 bytes .../__pycache__/build.cpython-36.pyc | Bin 995 -> 1106 bytes q12_feature_selection/build.py | 15 +++++++++------ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 169 -> 181 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2699 -> 2711 bytes 5 files changed, 9 insertions(+), 6 deletions(-) diff --git a/q12_feature_selection/__pycache__/__init__.cpython-36.pyc b/q12_feature_selection/__pycache__/__init__.cpython-36.pyc index 886fe32a654f75efb74de32eefce46b1759dcd99..b02224b4a259fb4ef1ef41a36b1dacdf1ecb27b8 100644 GIT binary patch delta 47 zcmZ3?xSo;2n3tE!A<`mxB8RzjjDALbZmNE;kFklVet3RSc5y*sa;koEeoE>@zfb@$ Coeo6+ delta 35 qcmZ3_xR{Z{n3tF9rT(I*i5%wq0s0yFxvBc;MX8mECHc7%qe20_gA1kr diff --git a/q12_feature_selection/__pycache__/build.cpython-36.pyc b/q12_feature_selection/__pycache__/build.cpython-36.pyc index 7c97eeb95ec157d7f2aaeafb7f302dd15b650ec6..bdb40aac53c06d5fbaae91d438e792991639bae1 100644 GIT binary patch delta 475 zcmYk0u}&N@5I{Zl-mY)&j@&^YQU2hXED@ogh!jyqh=xc}1|+ncjdHr3bh8-amP6Ca`q*z7%mA0#ZZB}C1GN=Z zfFm91Q3VG9F5?Qm#8oZzvR#GaL` z0$?6WRzk@u@k5k?RM;JJ8;Cy-p$-S8#y)70E)!|bXh4D9c@C(*4aymWA?F@yRITF&DN?pwhRdaQ0CAF$UT3$PE YyY#ub7VB@;2x1!ed?iRO`4E=GBLP}-Z2$lO delta 369 zcmYk1y-ve05XXJC6Q`|HN`=@E8&Z)_fj$5%h>1$54Cqt|MY79R+*V13RthkL7eILf zHf9!{12K8+#49l2goQiZ-Ov9!-N~Q9N<0n1uz7d#iX%qIiu^O~_}E3da7hsbF)@Gu z71Nj+hOA~5bK{{`Gmm{EP}J&IeY~#)vcC@EM-7e^u zR+4I|hH5?ot}A~;dh*+yCodltFf1h;oOawRBRR<-rv-apIdelW>_OtWPLEr-w6L^r zk9?w|?2RNXr~jPwZ)QgKuM@qDvYF|Z=XAULg2Sy1*G;Rx5|EIDuDVsCDqVY2KC->{ zgic`B`txY2qSVs4vQ$m1SX^aEbUU@a1D$48EdPWu;QO0hw?KlVwX*;M+JQFz1=TuG A=>Px# diff --git a/q12_feature_selection/build.py b/q12_feature_selection/build.py index 1bbe2b2..c377046 100644 --- a/q12_feature_selection/build.py +++ b/q12_feature_selection/build.py @@ -1,18 +1,21 @@ -# import matplotlib.pyplot as plt +# %load q12_feature_selection/build.py +import matplotlib.pyplot as plt from greyatomlib.multivariate_regression_project.q01_load_data.build import load_data from greyatomlib.multivariate_regression_project.q02_data_split.build import split_dataset - from greyatomlib.multivariate_regression_project.q03_data_encoding.build import label_encode - from greyatomlib.multivariate_regression_project.q11_feature_selection_q02_best_k_features.build import percentile_k_features - from greyatomlib.multivariate_regression_project.q11_feature_selection_q01_plot_corr.build import plot_corr - - +import seaborn as sns import pandas as pd + df = load_data('data/student-mat.csv') x_train, x_test, y_train, y_test = split_dataset(df) x_train,x_test = label_encode(x_train,x_test) # Write your code below +def feature_selection(x_train, y_train, k=50): + plot_corr(x_train) + reduced_features = percentile_k_features(x_train,y_train,k) + return reduced_features + diff --git a/q12_feature_selection/tests/__pycache__/__init__.cpython-36.pyc b/q12_feature_selection/tests/__pycache__/__init__.cpython-36.pyc index 199811ee773001ca0c605ea752dff30b16fe2a41..bf18366b89534c14df3249ba7fc993af605d2279 100644 GIT binary patch delta 47 zcmZ3hZmNE;kFklVet3RSc5y*sa;koEeoE>@zi0q6 Ce-2#$ delta 35 qcmdnWxRQ~>n3tF9rT(I*i5%wqVfq>QxvBc;MX8mECHc7%qoM)7jSId2 diff --git a/q12_feature_selection/tests/__pycache__/test.cpython-36.pyc b/q12_feature_selection/tests/__pycache__/test.cpython-36.pyc index 3a7de81e6c075362fc5574bc7cd7fa1084aa1fb6..c50dd20eb3fd954c3a85067e819bd29650c2f2e6 100644 GIT binary patch delta 112 zcmeAcoi55@%*)H=5NQ#;kz+NJOq_m3er~FMu#d5cseX8VQFd`bVsff}a(+sx{^Wg} z@|zzqU14U7+Pt03fss*Z@(=cSr6|GN#FB!X{F0o^B)x)45G#reN;4PaltkH24&c1BLL|0CLsU- delta 94 zcmbO(+AYdq%*)I5Qh!m@Mvm1?0zvv2`MIh3=|!oPi6!~D`jaPe$ZvkfbcLDm*5<=( r4vdV-lLNWLCrfj9$lMalO)M$M$uG&tOwuc;1hH Date: Thu, 16 Aug 2018 04:44:07 +0000 Subject: [PATCH 15/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 160 -> 172 bytes .../__pycache__/build.cpython-36.pyc | Bin 556 -> 598 bytes q13_plot_residuals/build.py | 15 +++++++++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 166 -> 178 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1475 -> 1487 bytes 5 files changed, 13 insertions(+), 2 deletions(-) diff --git a/q13_plot_residuals/__pycache__/__init__.cpython-36.pyc b/q13_plot_residuals/__pycache__/__init__.cpython-36.pyc index 339472dc72a16004e01d1fdcf966768b0a1ec9f4..ee4484247ca5fd7c05ae4d416a21390a5db361c8 100644 GIT binary patch delta 47 zcmZ3$xQ3C#n3tE!A<`mxB8Rzjq<%(zZmNE;kFklVet3RSc5y*sa;koEeoE>@zaRiF CEDkvU delta 35 qcmZ3(xPXzvn3tF9rT(I*i5%wqzWN#YxvBc;MX8mECHc7%qk;guehZoa diff --git a/q13_plot_residuals/__pycache__/build.cpython-36.pyc b/q13_plot_residuals/__pycache__/build.cpython-36.pyc index b3cfbafacaf9b3c23302f194e7c40a3e8bb72751..16ae4c78de237fbb463f33183cfbbefffbcacc4d 100644 GIT binary patch literal 598 zcmY*Wv2NQi5G6&4l8rcMw~QI1r9$C$D~c8!3KT_#8b|?&tCui-4 zBu_SYo16;vc|I>$;J9M6z`vlmZwM>0qDSN}^Fc0E>>mmuk5r=B}~3%8>m;IwL`Ic`ktMe@~3 z1!A!Gx;(O>LmS?eXB}&d7aWsY3nF!;^d77j*qw;$60f}h!T%UJ10(oyd&cgvzRBZ` zFQ*r4ZMH>2Dmf4+lnsqA5^VG=*#M-C7TXwWHV5prfgYDnX@G^k0c~=OGX>lRQ&vFU z0(Vni)hhHCQBLR2O*SqI$VLhl%#=k|RMLn!Q-T@5Zp>>f$|Yk0qrE0LD~ diff --git a/q13_plot_residuals/build.py b/q13_plot_residuals/build.py index 9cdb3e3..7e89ede 100644 --- a/q13_plot_residuals/build.py +++ b/q13_plot_residuals/build.py @@ -1,5 +1,16 @@ - - +# %load q13_plot_residuals/build.py +import matplotlib +matplotlib.use('Agg') import matplotlib.pyplot as plt # Write your code below +def plot_residuals(y_test,y_pred,name): + residual = y_test - y_pred + plt.figure(figsize=(16,7)) + plt.scatter(y_test, residuals) + plt.title('Residual plot') + plt.xlabel('Grade') + plt.ylabel('Residuals') + plt.show() + + diff --git a/q13_plot_residuals/tests/__pycache__/__init__.cpython-36.pyc b/q13_plot_residuals/tests/__pycache__/__init__.cpython-36.pyc index 3aa40f003ac9ed7ca53d9580f2b40524a62da90c..d0d253fbaff2c32b68d39f86bf22484bd3f7d132 100644 GIT binary patch delta 47 zcmZ3+xQUU&n3tE!A<`mxB8RzjynaT0ZmNE;kFklVet3RSc5y*sa;koEeoE>@zX$*_ C4h~TO delta 35 qcmdnQxQvm*n3tF9rT(I*i5%wq!TK5bxvBc;MX8mECHc7%qapylhzqg+ diff --git a/q13_plot_residuals/tests/__pycache__/test.cpython-36.pyc b/q13_plot_residuals/tests/__pycache__/test.cpython-36.pyc index 89ecb4e3b62bb3c40148c8459b358afd6936e702..f59da8e80cf64ba727041d0cb1b9393979af389c 100644 GIT binary patch delta 61 zcmX@ieV&`cn3tE!A<`mxBgYgbnP~lt{M=OiU>{=>Q~mJ#qU_>=#N<@{$1pM_g@^e%5(~D9o6HD@Q^(XITmfw7xNsNi{*5r3A F4*{AH5x)Qc From d506245505052dedaf5be5d1ce2ed9a140bde191 Mon Sep 17 00:00:00 2001 From: SL345 Date: Thu, 16 Aug 2018 04:56:09 +0000 Subject: [PATCH 16/16] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 158 -> 170 bytes .../__pycache__/build.cpython-36.pyc | Bin 2166 -> 2044 bytes q14_benchmarking/build.py | 15 +++++++++++---- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 164 -> 176 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 2092 -> 2104 bytes 5 files changed, 11 insertions(+), 4 deletions(-) diff --git a/q14_benchmarking/__pycache__/__init__.cpython-36.pyc b/q14_benchmarking/__pycache__/__init__.cpython-36.pyc index 453edefacf2fed8cd72ca5b14c268f798bc1dbac..0cacb255da5369367ca93708f8eb41edb8110886 100644 GIT binary patch delta 47 zcmbQoxQda(n3tE!A<`mxB8RzjxPC@{ZmNE;kFklVet3RSc5y*sa;koEeoE>@zW@L( CHV!cW delta 35 qcmZ3*IFFITn3tF9rT(I*i5%wq-ufB&xvBc;MX8mECHc7%qXGcC&uIC`&P;O`4XpwvlaaRW2{oxLvbxth=?wf!iVQ z;+=T_M7Y|)$*x4*(?f3Sp#^1_R#0CXlLm`ZUU2NW!p52Ch0M0Na0M?}HJ9_CykFiI zrCfKP9H=@I9iw*z) delta 695 zcmZuu&x_MQ6rLYRo2F@-))l)Vs9Se!_fk;sBqDh6=D}MKLTF~YU6Llw%;GN0u!o*K zthoz%^DOws#G`+JAmTw}@lCR;T{Oe{^4>S!d*4j*tM|hn-S2eVx6j@OFI|MbptZ+_ z{4s?1emeR*WOvvtcAIUn(aH+8*$&%2xVyp_ot}L=8Gxz@@x-X#07#^e!ip#ww5pjS<*yTT=V75M886*Dj{>A6j~ zCo8hI=60#C=FOz4PlPp5x0T&lmgWhQEUb?H0r6{a-JegV`&r7SbIy(n1ct&H2{bJU9aAbu1ih&ISR}C0diKEia`C=(c vTkJ@zc2tX C7!FAQ delta 35 qcmdnMxP+0zn3tF9rT(I*i5%wqf%+NwxvBc;MX8mECHc7%qrw2a+6$@x diff --git a/q14_benchmarking/tests/__pycache__/test.cpython-36.pyc b/q14_benchmarking/tests/__pycache__/test.cpython-36.pyc index cc77345a80d2a31276437a4b20a95a08f4c2fe16..217519582dc0b6843010f72c1aa4c58b65e138cd 100644 GIT binary patch delta 106 zcmZ1@utR{un3tE!A<`mxBgZu+=}7&I{M=OiU>{=>Q~mJ#qU_>=#N<@{&2O1% zS&XAt^Gb6IDsM666-2QWB<7_g7T;njNQn~6O)M$M$uG&tOwuc;1hIh95PI@l_I?0Y CoF&fy delta 99 zcmdlXuttExn3tDpxBsH3jU3mQ1bp=~@^e%5(~D9o6HD@Q^(QN`%5Rorj%6{v#hO=| wTTpq6DX$=ktspTkC9(JxQ$flt!Q8}>f}H%4oXjM>f=UqU78{hFypp{i0I{