From 9604a0b64e3838d66c2a9e5f666f65fb3bd1c227 Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 11:08:35 +0000 Subject: [PATCH 1/5] Done --- __pycache__/__init__.cpython-36.pyc | Bin 154 -> 157 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 178 -> 171 bytes q01_plot_corr/__pycache__/build.cpython-36.pyc | Bin 558 -> 686 bytes q01_plot_corr/build.py | 9 +++++++-- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 167 -> 177 bytes .../test_q01_plot_corr.cpython-36.pyc | Bin 791 -> 1106 bytes 6 files changed, 7 insertions(+), 2 deletions(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index abc397ac59f40d351e1861264050586541adce96..33f226667fe2e201a50f2c304d2065de7ce7e382 100644 GIT binary patch delta 84 zcmbQmIG2&bn3tD}?by-ii5%t*UiumNxvBa^iMf@D*+rSf8F`6$7H0b4`9;~q1&PV2 m`pNkzsrqTDi6x~)sqw|BIjPAdnfZC~1x5K;K&Jl08aV*DLLOuQ delta 81 zcmbQsIE#_Pn3tC;r0Y!NL=JOXcW0}Z(Bjmh;+VvwjLhPU)a)3S)Z*-t{DPSDqSVU7 elKkA5f};Ga)Z`Kv9bb}~Tac4jk{UCyUJd|*uO3?f diff --git a/q01_plot_corr/__pycache__/__init__.cpython-36.pyc b/q01_plot_corr/__pycache__/__init__.cpython-36.pyc index 460f88abffae2c2371906282e6e7f121c82a6603..2880baf78f7d241b58be0fcfcd354e47c1abe355 100644 GIT binary patch delta 125 zcmWN@K?=e!5CFjBB0=a^+=`$c#BV6{u!MA_u}L;=(nFu&JG}V^eT1*Ehk<$Pmo~em zS+BmI?r9F;3Ij(1v2nJe_%bA$j(fPUj3rw~;J7Eak*$*u77FC5=Y(1Kz7!tq7IWZ= Zjzs{`CtndadH$JGIMNnwS!wTwE5Pl30=$Uy>i6k`^t~XmnkVQlU?^jSntU}E+nVrtGO-<5uXPLRGxBDPI zh(1Jaz1mms%99GZm~eh_PS4Nx_3^>MJpJ+g!&6GgPjc-r^k1OZV^oqzXh;EQX+v99 zu$C9Rjf$v^ix`N4bt2gaMJf{+$@nW2GYM}x2~=>*2m|6Y-)!^-)Luj zYLzRiR`eGSq;Mi%>A|Y9H+7|K*$$1X&xEOkQ%99OySjn>DqMCt5$Yf>QS2vFJF+Gt z*;5BQyh|$K5}u_;q@~&7y~Mrd zL;69v=$h01LVD?F10__$ym_7{jULD!hQsvf@p1eI0iNL1;>1rW?ID2zg&JyTsb_oj>IIV~>G|njPJ;Ca>gBp5RGlwXCq4EUYPk4;BapW9zt%H^OK9F8gmCFSj-g>!;C4IcgVE?BLpivv zZfy0ll<`=9Heb|6k~!)prggci+9uocqG*lre4(98>~glyt+T{RH!bG*LJsD+v$yRJ z8Q;08_-1`%^5&-WT$ha>6s=y)8!O}0iWSLepG#_xnd(=a=WyimEzy$Du}APbU{ zG0F0~-(ZIH{rqk;ntVSxp8h*DnJp`=MvIk6Nlz&40RbSx1P?H!cux^i-R{WHgxAP~ rd`pJI7+uZicwjPqsV2PBcK7zuSFlflPfq5oTI%v+_!DfHmPUU8ouh^r diff --git a/q01_plot_corr/build.py b/q01_plot_corr/build.py index edc724a..272c9a8 100644 --- a/q01_plot_corr/build.py +++ b/q01_plot_corr/build.py @@ -1,7 +1,9 @@ +# %load q01_plot_corr/build.py # Default imports import pandas as pd from matplotlib.pyplot import yticks, xticks, subplots, set_cmap -plt.switch_backend('agg') +# plt.switch_backend('agg') +# % matplotlib inline data = pd.read_csv('data/house_prices_multivariate.csv') @@ -9,8 +11,11 @@ def plot_corr(data, size=11): corr = data.corr() fig, ax = subplots(figsize=(size, size)) - set_cmap("YlOrRd") + set_cmap('YlOrRd') ax.matshow(corr) xticks(range(len(corr.columns)), corr.columns, rotation=90) yticks(range(len(corr.columns)), corr.columns) return ax +# plot_corr(data,size=11) + + diff --git a/q01_plot_corr/tests/__pycache__/__init__.cpython-36.pyc b/q01_plot_corr/tests/__pycache__/__init__.cpython-36.pyc index c4bc30d7704db1af3a7d76f564945a76f376cb2d..56433c4f12651ab4404774608ed769034111e1b7 100644 GIT binary patch delta 104 zcmZ3^xRH^=n3tD}^Vreoi5%u3arzngxvBa^iMf@D*+rSf8F`6$7H0b4`9;~q1&PV2 z`pNkzsrqTDi6x~)sqw|BIjPAdnfZC~1x5K;K&F17fnj_>PJT&za(+>feo1O^NwNOK GPB{RB3no(l delta 121 zcmdnUxSWy0n3tDp{>3Yi6FJN?LY%E)LW@(2ienO!GBS%ZQnO=RQj4=o@(W_pi&85S zOY(DL(oz#kN{dqCi&Jw_lS?x5^I{4O4C4!O@=M~A^NWgNN>YnUieuvAGxIV_;^XxS XDsOSvt(V#22 diff --git a/q01_plot_corr/tests/__pycache__/test_q01_plot_corr.cpython-36.pyc b/q01_plot_corr/tests/__pycache__/test_q01_plot_corr.cpython-36.pyc index 40d2b706881e3ab76930c2164e7d4894f4b4633f..281cf38a31d66935da26c3dd6f361afb90d709ae 100644 GIT binary patch literal 1106 zcmaKrTWb_C6vvaf?9Ohx)h90?ItUd8q~irdL8MSh!G}du5XOfPC)w_7=hh^%*rh&g zzl#T@hRm5lDCLCVfFakf^tS zcw`t+8+?@79B?fca5jN~UY%ElrIk|9**TVG)Z{r=$GVp3?4jU>$K$HelGQ3prDjEw zn{3Ke#*N%d^)$uER|RA4L)G`d$X0ve2r8TllDMcHT2J_(sAC7HpAh?Dc`D<0l^RRY6m0&aZzb%U@VQGH?dbsxymlnoN;)+!1=rT8g$Yx15VgIV#95NI5{MHAB*Y5O{5)Yi?F)yT(f**KXu#%y1v={YE;&R0!mwQNn1Yb&d+bj7VQ zg>pL0?QI@1JuHUg0?j@_&_qxmf&r?&BO-zbE608ss(pH>lH*wV74~p_j%J@CIO1q% z^#_gudIkg&u*Gr~nFs@X9Mt(lS*wj(nl9*%tuC*A62mdz&$s#8>`E)w87=Xi&Rx;e+0Coh^4}CPhiYw)^2m|48-Eg<|6@;s^zf{N za=LwX)Mt7ey1+qjDQi_}DSaYk)j(GUK9TaKQ{~=c5=_?jascCS7RsEU*)TIs`~TUQ zkL<>J)>t36%B}oRwXLqf$Lpr3{Rj#Z^7>)k8RVXKb>V_A6S9cM#|>U~MG5_+#jsU1 tD9qe~;6^Ku`0{3em-@m7;= Date: Tue, 16 Oct 2018 12:05:59 +0000 Subject: [PATCH 2/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 167 -> 177 bytes .../__pycache__/build.cpython-36.pyc | Bin 951 -> 765 bytes q02_best_k_features/build.py | 16 +++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 173 -> 183 bytes ...est_q02_percentile_k_features.cpython-36.pyc | Bin 0 -> 1970 bytes 5 files changed, 15 insertions(+), 1 deletion(-) create mode 100644 q02_best_k_features/tests/__pycache__/test_q02_percentile_k_features.cpython-36.pyc diff --git a/q02_best_k_features/__pycache__/__init__.cpython-36.pyc b/q02_best_k_features/__pycache__/__init__.cpython-36.pyc index 43047f0b7d121cffd870478bfcf87b31503ee2f1..8f69d00d01a94716bb508643dadb998bfed8e349 100644 GIT binary patch delta 104 zcmZ3^xRH^=n3tD}?by-ii5%u3arzngxvBa^iMf@D*+rSf8F`6$7H0b4`9;~q1&PV2 z`pNkzsrqTDi6x~)sqw|BIjPAdnfZC~1x5K;K&F17fl+)?YH>+?c05#3vHrwPIRJrE BCQ$$Y delta 121 zcmdnUxSWy0n3tC;r0Y!NL=N+e5NE5H(Bjmh;+VvwjLhPU)a)3S)Z*-t{DPSDqSVU7 zlKkA5wA93s(xTM(;?$hf&ryk0@&Ee@O9 S{FKt1R69ln28LoFW&i+(_A2!N diff --git a/q02_best_k_features/__pycache__/build.cpython-36.pyc b/q02_best_k_features/__pycache__/build.cpython-36.pyc index 8372777e40963b4c282006fe1233b5dbaa51cf8a..98975cbb18ae8011ae49b6ab140b4f734fc576b4 100644 GIT binary patch literal 765 zcmZWnJC74F5cYVVc}d4hA}w8-ECLBpAcRDJIw=JwU$OYsPO_VQVS58Xn<`w%58;RK z3+UWZMf?LAm|ac~iIHYJ9^2o{H{++1$?(UwuU9vekniL~9Q0qI>dpuvASVp^l`=;{ z<_dZM=3&Ii{UTribhljeLl&YR3SR`DfDHsJ$ZT*#6mtIYk>G|$>#ET*u2q^y9T!b* z(k)jhH*%in?F{VMLgq3t7g8m%G-)m|HeSX`u9Va|t;*wlL`$&bUIMf}>T6W}7EMbs zEO-Ti3gPcX@6c}!wVTHUhMcrrFvcR^7*sqO{F%v=824w zO33K;Vf+UXn~VdhG8{wn?(viOT51z-;@e9)x^B{3%Ms$H@W1hoc~whzt;B9 dJ=+s=w?}(XRHDh{%Py<#5`+-Kkd9&O{swFf)lC2Z literal 951 zcmaJ=y>HYo6!&vJFHJ=SEXM#sNR_gjD#3U;Ngc!j16nz>~^j&5%=Nw{-Sz{7;KM+eI&^u#Z@JzkrBIA|H3yy2yG!c9zxRiNa z?PrdGV%xgz<~;ccO>@@TjLdr?tZYSAc1w<7O;%3pT#`OnxvkSu96d!_yS3JI<+uK^ z)w->>Mn=lUnX`uXpj_oC{}R^tUBDC=FnaDYi`gG6Mq2BgiPF0uxZ^PQ+;4l&$Qo8b z8;l8bpX!~#A*tvA=4`Ut&j9(EW=0f@+`%q=G?%1BatMO`FGc{!(YP|JF<)UL;OfC( zaCEZwB$;rjl6f-asaoRZ(PWtyY_MpwKP=L6!qQRS1jSBHAKm~DhDDvFg&d)?!M=*9 zw&uLip5Sk|ko*rtL(d%CQM`-J3@N@2SAbNZPd?HUdrUfNoxwPCuqRAaka@5WoaLFS z#fH7`aQ!M67P(YeT`orVa4yXeE;)VlAC|xIQ6Nl#wVl|N}pGZzm0b`lN*UfvhOxJ_+vK^TSbHbi#Zm-B+Bq8eP+Jdxewz*o=-(FxPR|5jt;8PV}tU^>f! Nk4$N#sb~nH^$W>S=m!7* diff --git a/q02_best_k_features/build.py b/q02_best_k_features/build.py index 9b1046a..290b915 100644 --- a/q02_best_k_features/build.py +++ b/q02_best_k_features/build.py @@ -1,7 +1,8 @@ +# %load q02_best_k_features/build.py # Default imports import pandas as pd - +import numpy as np data = pd.read_csv('data/house_prices_multivariate.csv') from sklearn.feature_selection import SelectPercentile @@ -9,4 +10,17 @@ # Write your solution here: +def percentile_k_features(df,k = 20): + X = df.drop(['SalePrice'], axis = 1) + y = df['SalePrice'] + + selector = SelectPercentile(f_regression, k) + X_new = selector.fit_transform(X, y) + + featurelist = list(X.columns.values[np.argsort(selector.scores_)[-1:-X_new.shape[1]-1:-1]]) + + return featurelist + +# percentile_k_features(data,20) + diff --git a/q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc b/q02_best_k_features/tests/__pycache__/__init__.cpython-36.pyc index 86a25cff523fa394416e407b58545caf2749163a..58b4227f703bc913166594b9f9c87c6ba07293ca 100644 GIT binary patch delta 110 zcmZ3>xSf&1n3tD}?by-ii5%upDf$`txvBa^iMf@D*+rSf8F`6$7H0b4`9;~q1&PV2 z`pNkzsrqTDi6x~)sqw|BIjPAdnfZC~1x5K;K&F17fl+)?YH>+?c05#3v3?1VU#vf| GUk(6ymMGBx delta 100 zcmdnaxR#N_n3tE!{`%F(i5%tuQO;H|p~b01#W9IV8JWcyso60usm0kP`2{iQMX8mE xCHc8AX{m`NrA4Xn#i==|$t9Wjc`=0sChz{OH z9I;WkN?(Qtfrpq|uJ#qU;v74h&6aIJ#nBv}c*f_<`Mz(Czu4I5wg342=iL@#f3mf! zgZ>^44QPM?&sfeQ&KWr1W=`%#ZtZ)Sm$#x;?YFXa)RCPNAKD8Zb)f@3bfE`*7{JD) z6ZIsQU7YD3GT4NzmkhR~yKticw4ShV``p1)A-6ZDQYEr5X(r>-cr1mfl+@=qNwfY_ zsm;F768+7IG~+7EgqrB7Oh)q$K^QSSE-NkLsY(;6T_fS1fXWuC)qTZoUVj}m2(ieXHy#KT`BD=41^W-4%KiB3UQ{)|B;`_oJC$zDP zi%QtTp?Acpt|; z4t*DmVTLdGulxl&ag6(d1Ha7{m=05|{U1BG*n;?Cn8+I`7vEGAbN<1@Ul2GWAwUeP z98uT79oPvD)0r&L3q6I(V2TpkzR+4K^YA$$XWdK|p<_KQv$6Gvf!~V3&W zYjjRLoWFx+{`HCnkYj<84Q3*%qz<4AiqZtRFv)Q+sad(YBIIfdBZTfHQHl<4=%_B< zRF4c*+?WA+_MQkiLB@kS=1aFe1&hanu;ShYso%6>RW`7?+g1rc-A$ z-@il!&vjtVrZO0pDo_$zLeW4Jq&j%^IMwFaPHZgl%dKPt2l zMI!CMl+#sbv0jF+TaUscnl);#0QTt{0BbfAr_0zxr=}Vi;^y%AgSSHNm7rGuT#4+) z6#!SlLf{^(fTPlaa*SAE2RzDZMWMOWRFerCz&}=^q)14L(pX#pA8@6>+r5QAh(65TrP{E40upQ){x@dg@qxMu3AhdO+5c&9F pff&C!)}t?zx`oSYJnN{}ZNmEBG*#TAv!XZA3^@IKr^j!g{TulgELQ*k literal 0 HcmV?d00001 From a121b3f686b50e12447a97cc7e4dc85f10ebb9ea Mon Sep 17 00:00:00 2001 From: ramyakrishnan86 Date: Tue, 16 Oct 2018 12:59:54 +0000 Subject: [PATCH 3/5] Done --- q03_rf_rfe/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 168 bytes q03_rf_rfe/__pycache__/build.cpython-36.pyc | Bin 0 -> 668 bytes q03_rf_rfe/build.py | 15 +++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 174 bytes .../__pycache__/test_q03_rf_rfe.cpython-36.pyc | Bin 0 -> 1869 bytes 5 files changed, 15 insertions(+) create mode 100644 q03_rf_rfe/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_rf_rfe/__pycache__/build.cpython-36.pyc create mode 100644 q03_rf_rfe/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_rf_rfe/tests/__pycache__/test_q03_rf_rfe.cpython-36.pyc diff --git a/q03_rf_rfe/__pycache__/__init__.cpython-36.pyc b/q03_rf_rfe/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4302864a18e33741f75a11869dac87f95f20a477 GIT binary patch literal 168 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU!nRL`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNc_`t=4F<|$LkeT-r}&y%}*)KNwou6R}91q0E5vjEC2ui literal 0 HcmV?d00001 diff --git a/q03_rf_rfe/__pycache__/build.cpython-36.pyc b/q03_rf_rfe/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2fe057fbce6918af67f41334d5233659bd79bac4 GIT binary patch literal 668 zcmZWm&1&2*5SHYhb;52*O9_PDdh=yn2!tL=DTL;@l+B?$I8h3F?VVzY?BFdP(xh9^aD1m*-M=QCyqeLD^YVfh(I{ zdvznM5+3H2yUA&YmKSgFI9`fYn&!e-aQ<8i=Txo0R&>mTD?y1-&QaU~VIV7{Cz*`C zu`L}?KOtM@>5gn8&xXiH16{>CD&uEJ4`bpXUL^w^*ba4{j$X7(PRMQ~oi6ynrO@zh zB)T7eMN+Z&tlWO=Nly9GwyZ(;9toD-lnyjhKF>ldt?6upL3WG`k%l%*Dx>?Rbs?&i z53yFx^UU>KXRI&tBrsVA`XSIwNE#zS^T^ilo!BGH@MnolYoM^A*@(4O?z$E2%d_IW zv1`|f3W^G!6!&EAi73-zlg$b_6`x+5mbS(X#Z|AgoOhd$-Wg_?-%Sw+eMB>s(qlSh z_6gqegOGMO1K|SeWXLQCS>lMWJ{%)Iacd32w)6kKy{(!b{qsZXpt;g;*O4*vZBY;4 ZG1@}*3hVAQydE3pGK7pBvMHS=e*rEUwhsUR literal 0 HcmV?d00001 diff --git a/q03_rf_rfe/build.py b/q03_rf_rfe/build.py index e8a8d20..f3cc913 100644 --- a/q03_rf_rfe/build.py +++ b/q03_rf_rfe/build.py @@ -1,3 +1,4 @@ +# %load q03_rf_rfe/build.py # Default imports import pandas as pd @@ -9,3 +10,17 @@ # Your solution code here +def rf_rfe(df): + X = df.drop('SalePrice',axis=1) + y = df['SalePrice'] + + model = RandomForestClassifier() + rfe = RFE(model,n_features_to_select=len(X.columns)/2) + rfe = rfe.fit(X,y) + + return list(X.columns[rfe.support_]) + +# rf_rfe(data) + + + diff --git a/q03_rf_rfe/tests/__pycache__/__init__.cpython-36.pyc b/q03_rf_rfe/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..327168f97291ec8a98372855cabacce7a5795dc4 GIT binary patch literal 174 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU(xy*`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNX)PzmlW&A$7kkcmc+;F6;$5hu*uC&Da}c>16f)O#0&tkJ};C2 literal 0 HcmV?d00001 diff --git a/q03_rf_rfe/tests/__pycache__/test_q03_rf_rfe.cpython-36.pyc b/q03_rf_rfe/tests/__pycache__/test_q03_rf_rfe.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..f47ba47504f7d22a71e47f376854d5572705b8d6 GIT binary patch literal 1869 zcmaJ?-EP}96ecCvmSrbPx+YyZY!!xefPo-hTVU9LVQ7*zL4hnAlKvpth05sAjuQR2 zByBWCca^@(9%Oq6-R>%{u&bRTxwg|Klc2*x>F|)}`#w^S78bnvUw{7gvc}loZ0=e{ z|1m!LEgE3J6Bcl6t;9<0z~&5Wa1tl21vT^;)RKDI2pXJ8e(FN~f(K1#fD29VpapGM zfJOKOmS7of!KZK=R$vwG^p^uq)?^c-Te}QCgSGbz)}(!52W{YotaJAgXJ`8zUbxSt zHrqnWOAFuNi@NHCswdG~>`T)dCW%meJ&@7(D-cF>Px7Ib;XuWa)L}YIOgs`Q7DjGF zdK9$waD27R+2PKE zph^CVtarE*w4UciB-F=_`#_tWM3MI}gUV~}s=atrrf6gAL8>>8N4pBJbfIt=M`{b_ z^{P%a)2lp(Co(#t^uG*b_G_-96YSKF)M1`LMBse52$skA=yf!*BrC9hgY}*THj#y` z12w2)TO(?)twR$*_6m={Jt*;vI1ZjNM2Tz>&M!Ey%%fqdfh+Iho~eu z`5tF||Gw@x#Zsl5XZl&DjmRQdv`sz;CmPU&li={eq4XVI0r3$ApU-1Z%^t>+WOoP( zDvBW#79W3e0~j9-yMoD-e!_Kz$&_-$;>i>XTCJb=uzWncj+2sbG&9PpnQ&MAClZM# zx)n`RxN@@lZYX-~nxZR(eSyO@od%4LzyAMns{#9+M&X8GCQ=!Og%^f+hz=9-+hIr> zy85CPF{N4}vqFZTos(lp3TaXi+|<)ljmzB{-u3crXCbH$L Date: Tue, 16 Oct 2018 13:10:28 +0000 Subject: [PATCH 4/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 179 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 711 bytes q04_select_from_model/build.py | 17 +++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 185 bytes .../test_q04_select_from_model.cpython-36.pyc | Bin 0 -> 2089 bytes 5 files changed, 17 insertions(+) create mode 100644 q04_select_from_model/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_select_from_model/__pycache__/build.cpython-36.pyc create mode 100644 q04_select_from_model/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_select_from_model/tests/__pycache__/test_q04_select_from_model.cpython-36.pyc diff --git a/q04_select_from_model/__pycache__/__init__.cpython-36.pyc b/q04_select_from_model/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d79bb0f907b236046ea5b19d85f66b4aeec552d2 GIT binary patch literal 179 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUkUmd`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNC^5$X literal 0 HcmV?d00001 diff --git a/q04_select_from_model/__pycache__/build.cpython-36.pyc b/q04_select_from_model/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3945c94a25d926e3e88d4ab274db7ef6ede9b699 GIT binary patch literal 711 zcmZWmO>5jR5Y>n6^=@{Pwui!Ad)v#p(9-r$LLsoXhSEK>s05=}a^sC;Ig%W@#e3Rb z`$PIe`X_YFDSx4-jvWGl2xb_)VdgzOy_(G?Z*Ts7J0l3)pa%!;=mUg1h9r={3TezR z?rWlmri>0XRS}B;qbgw|8E;Y%?J*mRSR}s?n+Uo_i_tCYKnom>)>6sBudLA@jgShU z=bw2kj9wWloj+0BxvH$BJ^lGYaL=;~(>j?qwko8{b*p@J&27cKTo&%S!2Mo02}A^O z0^wGWI~IJ59PNn5d$gmTbaan*Q5S7!hdZ(-82PBfn;4K}kLC!vaTkN| z=#-7uT**&8|836(iX;A`a*I)jgf)$&0NUOxHY+Qid&_HA8mmL3D(AzfFsjwHV+Y@* z&t2Oz#`;A9!|=L*zXrSwvF^QK)Rme|OUZp}WnObF{~$Yq&Hv881}!to^_E}S%3ajF ze)lH(V(g`Bcp=7V~12%V;N^)B-A5q>p@#MZQYbW)&l7mYjY2d553#1Vtu3HV% rq;5iLB^Nn-ryaxkfn#{~gVak2>3h)KDtX*n?k13?c#2cdH;MiOpjyTq literal 0 HcmV?d00001 diff --git a/q04_select_from_model/build.py b/q04_select_from_model/build.py index 12dd1df..cb1948a 100644 --- a/q04_select_from_model/build.py +++ b/q04_select_from_model/build.py @@ -1,3 +1,4 @@ +# %load q04_select_from_model/build.py # Default imports from sklearn.feature_selection import SelectFromModel from sklearn.ensemble import RandomForestClassifier @@ -8,3 +9,19 @@ # Your solution code here +def select_from_model(data): + X = data.drop('SalePrice',axis=1) + y = data['SalePrice'] + + model = RandomForestClassifier() + + sfm = SelectFromModel(model) + sfm.fit_transform(X,y) + + feature_name = list(X.columns[sfm.get_support()]) + + return feature_name + +# select_from_model(data) + + diff --git a/q04_select_from_model/tests/__pycache__/__init__.cpython-36.pyc b/q04_select_from_model/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..e9120116f2c7176b92e4f93b0fbf961b693370d7 GIT binary patch literal 185 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CUupUo`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNqa=!UE{9S-frpl(4e@zQ3{WR`IDTTmafpe@*b zXMYMBV}=$UG@%7;=)e?A!wk&A9L&QtxDGd90d5XvgK5zaZTxR$(}G1*QHv9`Oc@SX{6*0~nPHqPM0oEC|QOxRah8m1YD1Sh8l!u0bb;cB3VA{u=P z-0uGL#|?O#A>7ukDKT(Xm4d^LuJzNfe0Enc%%dmn!AFlwLDHt z&>{6FfeSqX2wLBB{fktkQEN@7W+Rq68+U^y=|9W<&PLFFmKmPV7zf^6Z8j1`+C2%C z*4$KE@nPwry~!0WysOr5rB*eld_T`Jcr2m=a`?kg$R9Hm?ct!lt9G&kB7*1rL%=-5 zrdLpiGJ$~&4D5FnCJ_^dy$dy{V_$;?c-YsWi7>Z{8wBspMMNWpp6DUh9=3IC`W^~n z88&9WvbWa0ZJf6Z*pfBIrEr-uPx17K zAE;RGNiM&>-+P{^13l!C=tanqUSDvND-l-oi8G1B$o6qBz1N?Ac`|#3R6T>h=u(E4 z8mtbF3ZINV{5PD$HiP@q6pQ6}Y;^xpuvh=f$+>Khvoaf>pmH`FRW9hvPLOxDj~%oc zeKP?aM4#h1@DF*C3++SZ%gp#GH_@IyC{u9WqU)TdL(zfh+NzD6>X0DxD>02)v3x}! zCoc7MG^)U02*y_*1;%?H6D){LSj{RdZlQvVL~a@+zHx}7XBcR2kJe8iz{=p8qoMHo znevrDQpgGqKi2-styr6vEB;ZIBSXc>_gD`6+q&x(vlSzs>Zej0E+bLQS9}r>mbK+o zB6Q&<=%jFIkuIz7x&YOkE1;^j6UHarmk2S6(n7>+HhS<;m|bvo4!Q}A=FdSlp$Kcl|6DNoN3RFJ(cT_6UE~6(+b;)9* zZ~qS-m7DEuqwvB|@>GOj(F*A*$rI8$VMqn1`l9Frt2q)2Bo;}WCbQIt{HlS16iwyQ zV_ps4dO6#j3u-b?v0T`47}SSc0@sB-gu=^ZY$#?$@f5XJc;i4-`Wi?9DwO5%3p~7( zAjC_naOq+z>I$7?DHTHj>L&hN0$eV4+3pJOK^5M2bZj(5f?H%AdhHg Date: Tue, 6 Nov 2018 06:40:42 +0000 Subject: [PATCH 5/5] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 178 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 851 bytes q05_forward_selected/build.py | 33 ++++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 184 bytes .../test_q05_forward_selected.cpython-36.pyc | Bin 0 -> 2856 bytes 5 files changed, 33 insertions(+) create mode 100644 q05_forward_selected/__pycache__/__init__.cpython-36.pyc create mode 100644 q05_forward_selected/__pycache__/build.cpython-36.pyc create mode 100644 q05_forward_selected/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q05_forward_selected/tests/__pycache__/test_q05_forward_selected.cpython-36.pyc diff --git a/q05_forward_selected/__pycache__/__init__.cpython-36.pyc b/q05_forward_selected/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..969cd60bc49ef4c5249c4796c633159d7992c8e1 GIT binary patch literal 178 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU-9}G`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNOEb($y>7j538=R&8VQQL_*PlhUnvkpK3UI3UMfGo@$&7yFjJMDJg9p=BAhVUIDgIAfMrwuP+MlTr5n z$=$>T;5o735^{r;Wx?OLv%NzEwy;N_4YEm(jz|}EYnFn?+O;pe=6uKz4Z5=j5XG#& zB+wzY&nE{WS8s+6Tw!?H409?jQlm#9;#BIYb~H~-yWm2R9@SM_Y&5xI1%sHDmrUO0To{Y5**DPb(fb*Mwz+x^zYQ`Gpb)AXs_@w#NRr_O literal 0 HcmV?d00001 diff --git a/q05_forward_selected/build.py b/q05_forward_selected/build.py index 8816abd..1c6ba97 100644 --- a/q05_forward_selected/build.py +++ b/q05_forward_selected/build.py @@ -1,5 +1,7 @@ +# %load q05_forward_selected/build.py # Default imports import pandas as pd +import numpy as np from sklearn.linear_model import LinearRegression data = pd.read_csv('data/house_prices_multivariate.csv') @@ -8,3 +10,34 @@ # Your solution code here + +def forward_selected(df, model): + X = df.drop('SalePrice', axis=1) + y = df['SalePrice'] + X_list = list(X.columns) + best_X = [] + best_r2 = [] + + while len(X_list) > 0: + r2_X = [] + + for Xcol in X_list: + best_X.append(Xcol) + model.fit(X[best_X], y) + r2 = model.score(X[best_X], y) + r2_X.append((r2, Xcol)) + + best_X.remove(Xcol) + + r2_X.sort() + score, col = r2_X.pop() + + X_list.remove(col) + + best_X.append(col) + best_r2.append(score) + return best_X, best_r2 + +# forward_selected(data, model) + + diff --git a/q05_forward_selected/tests/__pycache__/__init__.cpython-36.pyc b/q05_forward_selected/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..64d29206523b2310e990b53c9eb2c56a0c050c63 GIT binary patch literal 184 zcmXr!<>g{Kb~Ks+2p)q77+?f49Dul(1xTbY1T$zd`mJOr0tq9CU#a>T`MIh3MTxnU ziP=S&#Tj{tc@}2+;rT_`#RZAUsrt$JDXIEtsfi_}MXB+{sX3|1C7Jno@dZWsSwNPO2Tq`eGnv007kk BGsyq| literal 0 HcmV?d00001 diff --git a/q05_forward_selected/tests/__pycache__/test_q05_forward_selected.cpython-36.pyc b/q05_forward_selected/tests/__pycache__/test_q05_forward_selected.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2abe7f1493d70ec733d3450557be9a7dfd2166a0 GIT binary patch literal 2856 zcmc&$&2Jk;6yGneH;(N%ZJK_Pu39QEYU8HmTUFhVHlZQ}(I6@Y&~~~rb~o7%cV_L9 zs7N4}|9}GrBo4r#2Lxw61Q()KLgK;!?S)E}DESAFfD7;KCQj0(MG;7>wQrtxX5P&F z-tWCP$4jMxx%B<(OO~SCR@OZQ&`-fDzXZV)rus^t5>-{0#&ll`bfSZ%7Fv zUF{8xRLCH&!2E6RX}cA&jcsQ`YzG@=JJ~L_o9$tH**=)Doe%cL3{5HQAvSVNVIy4a z>SPBqXO-&yW!S$`RTJwKF5?L*`LdRMs5ByRg$m|K?sGTh3`Vz_jmdb@7qgS3_*%Mn z5V3K_NPaqsGczwz`D!RK{d^R$)7+h(om@t*HJ9G`dg#ZWZr7VPm%jPx!|#5rH>Ycr zzec{jQ*S>1?)97X)^GLZ2cOK&{rov7zkl?@CpT_^^2KL&{&+LDTyLH$KYQ@~gP_z- z-`Ml%I4Hm5=WcyGvs`x(%GC!^JO!^j0fH+;WeU-l%Cu_=(V5N+XbqNQCbT)0XBM<3 zx*gg)x*l4KmB2;iWC(pTd6zp}6%6BpD*-)~33%l(5U~=gUG;7Csxqg=`c;*wyOl1i z46CmD-_VAYZc0*E!(RYT-(umK|J zr&4kepScX4Omv@zRV^`qGL6JQmRwgv35NaI0YU`4CTOrg=Y=OPg*1Hn$=dly%*z&a zdCiR&uQfQ0+k&r94%h?)isoQ1waZ7JaPB5#Ee2R*DxJ;xM_UWYejIbpOs99Sov=BH z2T?RjU3`2qphy3~#0E#8snii8psaU9<_3sHtp~b3vz+4nOb>6y8x%st?ohwYrOhHc zjAA>WzShBHY#p#oTG>f(tlpmmS2{}(o~4Nj31E@GHSHxgV7!3VJe#J>aS*u!Ar zzXIvl29SC|hI?P*RxhxCQ%8E7>ctWS)LJxUUVs#rc31UeAY%_wEX!qP9JQRWqe+pk zWJ3oE*nJ?WK9D!r4jiyIcJwg>1v9pyE}q;vYu20E00}1KG~6BqC4&T$e^;F|x)6Gx z=Q15jP}jga2&8>|MpR(@R?#w(!3?c&KZsWG(!y4fqe9SyB#+Qh*G+UN@#_GDPxk@v zzykqHtsa4mt|Ir;){#qX%vAdl%W*;)aK}jsjsq8mwvT$zaj=4AJz@aX5`!p)QS3so z55++gYe^&3Fu4jWz&KW7=CxGIuyXL4mY()hhZCzEdNH0-p!bv9#kS|Otc2zvv0%YX zb2%B3^FCZ^!cjlHS>YDBFEH5