From 00b53d2ef45db9e77fc99cfdfcdb79e7dc622914 Mon Sep 17 00:00:00 2001 From: Lavi1920 Date: Wed, 10 Oct 2018 03:49:22 +0000 Subject: [PATCH 1/4] Done --- __pycache__/__init__.cpython-36.pyc | Bin 168 -> 155 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 193 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 630 -> 604 bytes q01_calculate_statistics/build.py | 17 ++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 199 -> 186 bytes .../__pycache__/test_q01_plot.cpython-36.pyc | Bin 2949 -> 2936 bytes 6 files changed, 16 insertions(+), 1 deletion(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index cd8686b0f9f17c173480b2b430af88fa1427ca13..c589c20ba8ea8700ebbd04516b82d25ee5c27590 100644 GIT binary patch delta 50 zcmZ3%IGd5fn3tEUY1M}4i5%u~9{L&ixvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) F>;Qwd5K;gD delta 63 zcmbQuxPp91ulPqpoyj(sp;Ob zngee$&1PEXkhg`Vnto%NU$cj#Ug%8cUr8-M%!Fdy6)B59cm}!r@<_`dtB>R4p|Q>= z@J&B;!EB^6GQg?wo4CA^9lS|Fm5S2HZr4k+{uM$XEe)*YGrdVXyX6#lo_Jf#$-mI_ zJG)`X#E!MgnP5KOksaOfYmU!imnDt44qFT5Dzd@GtOq&7EIreqAS4z&XoIeW^wK%G z#f(uy%*_y*F99P<;JX^KR&D8j_#AU zQbDEgyh?*t&RA3e8XsgZJ{aXuqp<}Qs?TTZM#)Z19jbJYP<@z8r%&xR-v3|t2ygZ) z1VWE+KAT##-EeLCyR!xK@yYA4&*=&teINsC9Pcz zu5Uo0SA$p13^*#NeUQQUV3bFqQ@r|g{;XEgs?p*Yj}oe@(O7*p?BmJ*!pk(!0u|vU zE$Kt%9-zHm#924C!`?A`iF}Zqmfq#*Q8?J{!PE0=aNA*X*GsS*RRc!@I` RExbzArfvl-SV^DE{{XjqvDyFt diff --git a/q01_calculate_statistics/build.py b/q01_calculate_statistics/build.py index a556241..aa092bf 100644 --- a/q01_calculate_statistics/build.py +++ b/q01_calculate_statistics/build.py @@ -1,11 +1,26 @@ +# %load q01_calculate_statistics/build.py # Default Imports import numpy as np import pandas as pd data = pd.read_csv('data/house_prices_multivariate.csv') -sale_price = data.loc[:, "SalePrice"] +sp = data.loc[:, 'SalePrice'] #sale price # Return mean,median & mode for the SalePrice Column # Write your code here +def calculate_statistics(): + mean=np.mean(data.SalePrice) + med=np.median(data.SalePrice) + mod1 = np.asarray(data.SalePrice.mode(), dtype=np.int64) + mod = np.int_(mod1.item()) + return mean,med,mod + + +calculate_statistics() + + + + + diff --git a/q01_calculate_statistics/tests/__pycache__/__init__.cpython-36.pyc b/q01_calculate_statistics/tests/__pycache__/__init__.cpython-36.pyc index b1b01d55acae938b089c65022c1e5efe684e3182..c867380bb5807759266856b5c96317e39b750513 100644 GIT binary patch delta 50 zcmX@kxQmg)n3tDp-l`4J6FJP~()Ba)b5r$w63a3TEsYHH!}E)>iwhEyQ}vVcQ&J~p G#R34BE)ePf delta 63 zcmdnRc$|^Ln3tF9Mq+E!L=JQ968(()+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX?(%jU%l4AYzqSVU7lKfo# V#GD+3f};Ga)Z~)l&951IIROk?7=Hi& From 90c6a52e0c11c55f2be2dad4975808bca58b9d6e Mon Sep 17 00:00:00 2001 From: Lavi1920 Date: Wed, 10 Oct 2018 04:43:57 +0000 Subject: [PATCH 2/4] Done --- q02_plot/__pycache__/__init__.cpython-36.pyc | Bin 177 -> 164 bytes q02_plot/__pycache__/build.cpython-36.pyc | Bin 775 -> 873 bytes q02_plot/build.py | 20 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 183 -> 170 bytes .../__pycache__/test_q02_plot.cpython-36.pyc | Bin 969 -> 956 bytes 5 files changed, 19 insertions(+), 1 deletion(-) diff --git a/q02_plot/__pycache__/__init__.cpython-36.pyc b/q02_plot/__pycache__/__init__.cpython-36.pyc index 215eac083bf88e6537e6d7d6a5471a2c374ca81c..65bee38890a7b5726adb83e61d5059b054426ce6 100644 GIT binary patch delta 50 zcmdnUxP+0zn3tEUY1M}4i5%u~f%+NwxvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) F+yRJM5Ox3n delta 63 zcmZ3&xRH^=n3tDp*}dkdi5%wIarzngxvBbzNg0{?F8Rr&xv6<2#ro+*sg;Q(`MLUu SIXMaiMfq8&$tA@TW8DF%5EiQd diff --git a/q02_plot/__pycache__/build.cpython-36.pyc b/q02_plot/__pycache__/build.cpython-36.pyc index bed076d1cc99b8e94b503c07bb460492f8d4c6bc..2c727e5e682775a4086abffd5eb694fc536f2f71 100644 GIT binary patch literal 873 zcmZuv&2AGh5VrR(yW6Cq6{^IA13l%EO^YglR3Q*bPN+ia0b~v<$99w5db3;GNt>RK z7LGg!55bH0%86It#CTguL0Izm^Zfan89yBi(vR)85Boks-_gAVck~jreh-2pjwK?v zJH65;0U%F?RYW3;L{Rp)-(okEhe|*anrL%b{=amBq}4lFoz#>va0+2&_>h zctMw-m`t7>PA1@9bD`WINHSI8VkMSrGaOjIk%j~dXpv1dlzr0_(xX>vSuBP1mW>J^ zO2r^-NR^@+l{g#}MpPua>Ru+%raNsU#at};SEL@eC?|fNK))-Iy`k&k;Q8S=dsnM- z-B2bn2Bb1BG*d+bGq^u4AX1ltne1YGm^ZRE*=$uvK58~LaMwO$*4rQuPQ5+6hadYX zAhipc;WmjHy5v+_ui<2;qQ-^DVg}(3fw?jrt zDbJ=F Wt)zJ2=G7G$;}rKjC=l=Z@!%KM?d#|O literal 775 zcmZuvO>fgM7`B}>O+!10i3{R_xaHD}ah(tnh~tFRo0$~3_B-mxX)@a>6s@Pifx~_R zKY+iKE2sShPQ1=QR1=Q;`u(!~JWu>$Hp@<*eCOX7AwS8%h|qt9)4fHbh@ysYI;^aU zc#Ix1qdMUUB|xjOiuRPJkX92#75&Ooe90aYo~e;az7YOE(FMuJw|Evg&uRZi3L`rs zJe1B0ubtP@eSW5d7saaS9F(oq5?on##_Nr+8e8YmZTMs%47>|P84e30KuvJI#_2B5 zc(NxK(T?osj(J)!A0a4q!zjThz9uSCaR7D`|H;t%89%C$YqlSV{p(dEkT~zDL<%F> zn8x;W$rB~q3e+u1Nb<aDB27rURFw<~4{lPijzFtoyib6#O7|iU$)&keF5Aq}45|dZ;}@80y8<$!Xb|#uv*@8#QmYeH_AYjmyvwI;BVS z7(aW2Q9k8KE7quhonXix*20H=qnEfhcvv4+I}Y`;zo0_HeJE~zb@IIY-_w{6Xa@Co yYC))ScnjgZTv|~>ADKql6mJ+%4XPZN85a8V3?=IfybS+f;F8jePFY5eN527_GSx8v diff --git a/q02_plot/build.py b/q02_plot/build.py index 70276d6..642fb40 100644 --- a/q02_plot/build.py +++ b/q02_plot/build.py @@ -1,3 +1,4 @@ +# %load q02_plot/build.py # Default Imports import pandas as pd import matplotlib.pyplot as plt @@ -7,6 +8,23 @@ dataframe = pd.read_csv('data/house_prices_multivariate.csv') sale_price = dataframe.loc[:, 'SalePrice'] - # Draw the plot for the mean, median and mode for the dataset +def plot(): + plt.hist(sale_price) + #plotting the mean, median and mode + plt.axvline(x = np.mean(sale_price),c='#00FF00',label='mean') + plt.axvline(x = np.median(sale_price),c='#FFA500',label='median') + plt.axvline(x = np.array(sale_price.mode()).item(),c='#EE82EE',label='mode') + + #defining x and y label + plt.xlabel('SalePrice') + plt.ylabel('Frequency') + + plt.legend() + +plt.show() + + + + diff --git a/q02_plot/tests/__pycache__/__init__.cpython-36.pyc b/q02_plot/tests/__pycache__/__init__.cpython-36.pyc index 488a8902e9cb8aed0f38d008a72db519050c874f..fd4dae3b32e6e671d7e7ba352cf29d99a7892c1b 100644 GIT binary patch delta 50 zcmdnaxQda(n3tEUY1M}4i5%u~;rbc*xvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) Fd;yDc5RL!< delta 63 zcmZ3*xSf&1n3tF9Mq+E!L=JQ96#b0++*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX Date: Wed, 10 Oct 2018 05:03:07 +0000 Subject: [PATCH 3/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 192 -> 179 bytes .../__pycache__/build.cpython-36.pyc | Bin 494 -> 534 bytes q03_pearson_correlation/build.py | 15 +++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 198 -> 185 bytes .../test_q03_correlation.cpython-36.pyc | Bin 1680 -> 1667 bytes 5 files changed, 15 insertions(+) diff --git a/q03_pearson_correlation/__pycache__/__init__.cpython-36.pyc b/q03_pearson_correlation/__pycache__/__init__.cpython-36.pyc index 543c178c4df3a2d7e5b64ffe37ce6264e5b948ea..11176f74fad776dcb51f29ff24d0939d55fc27f6 100644 GIT binary patch delta 50 zcmX@WxS5f|n3tEUY1M}4i5%u~3HllNxvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) F!T^vK5V8OO delta 63 zcmdnYcz}_^n3tDp*}dkdi5%wIx%wITxvBbzNg0{?F8Rr&xv6<2#ro+*sg;Q(`MLUu SIXMaiMfq8&$tA@TW5WQm6&B|J diff --git a/q03_pearson_correlation/__pycache__/build.cpython-36.pyc b/q03_pearson_correlation/__pycache__/build.cpython-36.pyc index ba8cf119e61bb596104a35e0bb902136188759a1..aaa61aaab7c94e94ef03228822aaff04b5669aa1 100644 GIT binary patch delta 349 zcmYk1u}T9$5Qb-V_mcHAl@|I0a#);+AX*55ou~*wlobif?gn!vxnu7P2#Q4nYYF%c z_O?ENuaMTt#s|>G*;E;rZ+?cEpP3*2DlWDfjri~R3zy_n_$6W9~90i zQ`})DEE}VWW{Q)lSz)6mP<2-y1H#MU*&|s3r#uKYtAq+NtXRe?k?}FJd<`Dp9@>zI z6CZ}Z0}?jVJ{*ulQ#LG=G`aUCcirit)s^mgJ#d|-T4?LOJM}%|=KHOL&I$|b<_&y} zTz;?8>wMtSBR%RhcUzn3dG2q@LK~Nw+`7pg9`7vCTqy{EE9fQFM5u#epbPnLN(2-bGFuH@aqL$ s9!`cUhCcvZ8kr|D=~PR~_pBqCI<06~`X|TNpLn!0B>k{0Wf^A4A6aiiJpcdz diff --git a/q03_pearson_correlation/build.py b/q03_pearson_correlation/build.py index 33a762b..bfa2351 100644 --- a/q03_pearson_correlation/build.py +++ b/q03_pearson_correlation/build.py @@ -1,5 +1,7 @@ +# %load q03_pearson_correlation/build.py # Default Imports import pandas as pd +import numpy as np dataframe_1 = pd.read_csv('data/house_prices_multivariate.csv') dataframe_2 = pd.read_csv('data/house_prices_copy.csv') @@ -7,3 +9,16 @@ # Return the correlation value between the SalePrice column for the two loaded datasets # Your code here +def correlation(): + corrc=np.corrcoef(dataframe_1.SalePrice,dataframe_2.SalePrice)[0,1] + return corrc + +correlation() + + + + + + + + diff --git a/q03_pearson_correlation/tests/__pycache__/__init__.cpython-36.pyc b/q03_pearson_correlation/tests/__pycache__/__init__.cpython-36.pyc index d7eca9980cd94014cb671238783d84df5e9fb7da..2748494713e34828ea9dda3824a475bc9e746529 100644 GIT binary patch delta 50 zcmX@cxRa5?n3tEUY1M}4i5%u~Y5E!YxvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) FVgQpa5Xt}m delta 63 zcmdnVc#M(5n3tF9Mq+E!L=JQ9V*QN#+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX?(%jU%l4AYzqSVU7lKfo# W#GD+3f};Ga)Z~)l%?B6{vj70(Z5QJJ From 45177c389fbb83a9f6657ba7fbd0d247179f9346 Mon Sep 17 00:00:00 2001 From: Lavi1920 Date: Wed, 10 Oct 2018 05:09:03 +0000 Subject: [PATCH 4/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 193 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 505 -> 563 bytes q04_spearman_correlation/build.py | 11 +++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 199 -> 186 bytes ...st_q04_spearman_correlation.cpython-36.pyc | Bin 1717 -> 1704 bytes 5 files changed, 11 insertions(+) diff --git a/q04_spearman_correlation/__pycache__/__init__.cpython-36.pyc b/q04_spearman_correlation/__pycache__/__init__.cpython-36.pyc index 78682675323d8e4b951373280266bfae3fe10d8b..d3b8096e4f74af23fef52f058923e17aad84e8e9 100644 GIT binary patch delta 50 zcmX@exP_6!n3tEUY1M}4i5%u~iTWA&xvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) F!U2$)5VimS delta 63 zcmdnOc#x69n3tDp*}dkdi5%wIdHNaoxvBbzNg0{?F8Rr&xv6<2#ro+*sg;Q(`MLUu SIXMaiMfq8&$tA@TW5WTnz!vKO diff --git a/q04_spearman_correlation/__pycache__/build.cpython-36.pyc b/q04_spearman_correlation/__pycache__/build.cpython-36.pyc index 94f735a46faa9e694e8a6b3b49b480cf37144bf0..b1e0c1d66828ddc9e6b4bc4893b4c6f4349b9e8b 100644 GIT binary patch delta 370 zcmYjMyGjE=6rDS}n|&m)5cC7=wsB1?#6po+*hmmkL`E?VJ0m9UW0=_lB8C*Pv6Os* zm33-=WLqmgK`Za3%7ydba-YA}%AOxKo5B6t*UbkI@=Z2^qCZ2J4w4`O62f4ulv$`W zu~UaRKqQQ6!dd`x*Um=g2}jgk3G=1DAb`C+61qP)hjc?IeWN7TDbMut-uv~%yxL?T z&Jku8sUQW6Xkm@$g5J^@nZXOe3D6B~T@{yg!3+MNc`64j=J$9aukSRq8)7hyNe$4R7RJ4GHe~U52CGpuAhwJv5ewe$mJ>YPwLevHWGnt&@O5i xu$tnT;HIQXFee+QYFg4vvAT(eYPxRF_R?x=g5CRI@$eLNr#cVe0u7!nIXlo${c0Pc$ zZCxj7CAr=4G C!%C9? diff --git a/q04_spearman_correlation/build.py b/q04_spearman_correlation/build.py index 557be32..09f2e01 100644 --- a/q04_spearman_correlation/build.py +++ b/q04_spearman_correlation/build.py @@ -1,8 +1,19 @@ +# %load q04_spearman_correlation/build.py # Default Import import pandas as pd +import numpy as np +from scipy.stats import spearmanr dataframe_1 = pd.read_csv('data/house_prices_multivariate.csv') dataframe_2 = pd.read_csv('data/house_prices_copy.csv') # Your code here +def spearman_correlation(): + corr, p_value = spearmanr(dataframe_1.SalePrice, dataframe_2.SalePrice) + return corr + + +spearman_correlation() + + diff --git a/q04_spearman_correlation/tests/__pycache__/__init__.cpython-36.pyc b/q04_spearman_correlation/tests/__pycache__/__init__.cpython-36.pyc index 495646a3bc5e900ad0593288f8e14eb5f8ed301b..71bfb203741d3afb178e2366fb479e05ecdece41 100644 GIT binary patch delta 50 zcmX@kxQmg)n3tEUY1M}4i5%u~>G~P@xvBa-iDj9FmPQ8p;rT_`#RZAUsrt$JDX9~) FVgZw~5Y7Mq delta 63 zcmdnRc$|^Ln3tF9Mq+E!L=JQ968(()+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX