From 672200f0a5ae788607c48450b0670f291bcc0412 Mon Sep 17 00:00:00 2001 From: Jas-simran Date: Sat, 6 Oct 2018 10:21:58 +0000 Subject: [PATCH 1/4] Done --- __pycache__/__init__.cpython-36.pyc | Bin 168 -> 157 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 193 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 630 -> 554 bytes q01_calculate_statistics/build.py | 10 +++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 199 -> 188 bytes .../__pycache__/test_q01_plot.cpython-36.pyc | Bin 2949 -> 2938 bytes 6 files changed, 9 insertions(+), 1 deletion(-) diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index cd8686b0f9f17c173480b2b430af88fa1427ca13..ddb447527a66a275a1d695f82c895758ea009295 100644 GIT binary patch delta 52 zcmZ3%IG2&bn3tF9Z_6;>4WP_=2L$L(^;Wa_)*Czs}?=9Ludrx&GGCYI#q>L=#pC=?XsXR)LvmlRJ9 zW(*hR1^I~sNH8#SF>*2TFcoo6-peS-TEqqvntY2<+L#;202_`(Z~?_`ao7MIUYe6? S#{}eo&ER0O#O`f+*Ez9#A4mz%-o{HJpJ(eqU_>=#N<@{ HiCM7#vF;Jo delta 63 zcmdnPc$|^Ln3tF9Mq+E!L=JQ968(()+*JLM~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX_Hl#611*{G#mQg2d!h{p9?V K)XhH_dpQ9B=o6X% delta 66 zcmew*)+)|n%*)GlBe6AVBgauj?MnTO{M=Oi#H5T&eV6>?(%jU%l4AYzqSVU7lKfo# V#GD+3f};Ga)Z~)l&2JfdIROmk7=r)+ From 0625390fd09c66c2ddf49e541a900c9efb82827d Mon Sep 17 00:00:00 2001 From: Jas-simran Date: Sun, 4 Nov 2018 10:49:57 +0000 Subject: [PATCH 2/4] Done --- q02_plot/__pycache__/__init__.cpython-36.pyc | Bin 177 -> 166 bytes q02_plot/__pycache__/build.cpython-36.pyc | Bin 775 -> 795 bytes q02_plot/build.py | 11 +++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 183 -> 172 bytes .../__pycache__/test_q02_plot.cpython-36.pyc | Bin 969 -> 958 bytes 5 files changed, 11 insertions(+) diff --git a/q02_plot/__pycache__/__init__.cpython-36.pyc b/q02_plot/__pycache__/__init__.cpython-36.pyc index 215eac083bf88e6537e6d7d6a5471a2c374ca81c..a8384b8d5da72f475d5bc6d01d839b2d98e0a38b 100644 GIT binary patch delta 52 zcmdnUxQvm*n3tF9Z_n1uCj|K=Ji7!UkiZ&IJn*0l zDFG?aQ5Dk|BT34U2=^EyTqc6-F->J!W&#WRDG<>*c!cO!#A5Uj(TTtpXqFrxDmtIx z{**J#JI$OdtYc1Dr?{md+iX5O7R<4H+jLeItx;UsqUy9$*UTuepL2Un(+j5M(tmOv z@z04scm>bC1L9DL_Xv9)xDcueZi7K1E-K?a5}_a>x()wgBf#Q&SOVDS2upoLfqXCL zhXrJrVM4i%lfd@j>c=X>5Qag3tiK(@5J6U zN=NMdwfE{X3+QiEx3z%W2Y(s$bj literal 775 zcmZuvO>fgM7`B}>O+!10i3{R_xaHD}ah(tnh~tFRo0$~3_B-mxX)@a>6s@Pifx~_R zKY+iKE2sShPQ1=QR1=Q;`u(!~JWu>$Hp@<*eCOX7AwS8%h|qt9)4fHbh@ysYI;^aU zc#Ix1qdMUUB|xjOiuRPJkX92#75&Ooe90aYo~e;az7YOE(FMuJw|Evg&uRZi3L`rs zJe1B0ubtP@eSW5d7saaS9F(oq5?on##_Nr+8e8YmZTMs%47>|P84e30KuvJI#_2B5 zc(NxK(T?osj(J)!A0a4q!zjThz9uSCaR7D`|H;t%89%C$YqlSV{p(dEkT~zDL<%F> zn8x;W$rB~q3e+u1Nb<aDB27rURFw<~4{lPijzFtoyib6#O7|iU$)&keF5Aq}45|dZ;}@80y8<$!Xb|#uv*@8#QmYeH_AYjmyvwI;BVS z7(aW2Q9k8KE7quhonXix*20H=qnEfhcvv4+I}Y`;zo0_HeJE~zb@IIY-_w{6Xa@Co yYC))ScnjgZTv|~>ADKql6mJ+%4XPZN85a8V3?=IfybS+f;F8jePFY5eN527_GSx8v diff --git a/q02_plot/build.py b/q02_plot/build.py index 70276d6..39207c0 100644 --- a/q02_plot/build.py +++ b/q02_plot/build.py @@ -1,3 +1,4 @@ +# %load q02_plot/build.py # Default Imports import pandas as pd import matplotlib.pyplot as plt @@ -9,4 +10,14 @@ # Draw the plot for the mean, median and mode for the dataset +def plot(): + plt.figure() + plt.hist(Sales_price, bins=60) + plt.axvline(sale_price.mean(),color='r',linewidth=4) + plt.axvline(sale_price.median(),color='g',linewidth=4) + plt.axvline(sale_price.mode(),color='b',linewidth=4) + plt.show() + + + diff --git a/q02_plot/tests/__pycache__/__init__.cpython-36.pyc b/q02_plot/tests/__pycache__/__init__.cpython-36.pyc index 488a8902e9cb8aed0f38d008a72db519050c874f..b14c918eb242efc7505b8376f8e35e9562e06c48 100644 GIT binary patch delta 52 zcmdnaxQ3C#n3tF9Z_M~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX Date: Sun, 4 Nov 2018 10:54:17 +0000 Subject: [PATCH 3/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 192 -> 181 bytes .../__pycache__/build.cpython-36.pyc | Bin 494 -> 501 bytes q03_pearson_correlation/build.py | 10 ++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 198 -> 187 bytes .../test_q03_correlation.cpython-36.pyc | Bin 1680 -> 1669 bytes 5 files changed, 10 insertions(+) diff --git a/q03_pearson_correlation/__pycache__/__init__.cpython-36.pyc b/q03_pearson_correlation/__pycache__/__init__.cpython-36.pyc index 543c178c4df3a2d7e5b64ffe37ce6264e5b948ea..f323528f944282654ffc77b3748334a0b5d465c0 100644 GIT binary patch delta 52 zcmX@WxRsH^n3tF9Z_6mlo>) diff --git a/q03_pearson_correlation/__pycache__/build.cpython-36.pyc b/q03_pearson_correlation/__pycache__/build.cpython-36.pyc index ba8cf119e61bb596104a35e0bb902136188759a1..d6984d899d7b74ca8077f9c42486d6602acece53 100644 GIT binary patch delta 281 zcmaFI{FPbRn3tF9*!g?W2N)R`9y1^TCLr4Zh>P_mDyy@lvNkg?GEDRet!D;`f#jS) za&kbTgdv4dlA)HNgb_?L)-Yr-)i5?Q)-u&F1v6+e`9*OCC+4IE6lEr-YBJyAPDw0D zOe;#vO^r81<`~^#NzN}S0;*t2NsD4mNi!;90h+#&p@^kE-pw+PSsD&Pf49@%NS(90aVJs$N_|0j71=hCR-F+L1JD?V(~4ef|MwZ kqSVBc_~hcUB9Iq~m?!UKR1*aGs2HS}gNcigixq4gj+79e&82?_y;5{4|s zET$6XEXEYZ6sBILU&QUi)IlT&Z8BCS_#m%e&+!m*%GCl@#lz z7o}DvmgMK^C+6fR6cpuWr6!jYPqtwUVg)&xVe(8yc{XN{A*_@4F{<%{1dBn2axif* Hatq diff --git a/q03_pearson_correlation/build.py b/q03_pearson_correlation/build.py index 33a762b..2ab2739 100644 --- a/q03_pearson_correlation/build.py +++ b/q03_pearson_correlation/build.py @@ -1,3 +1,4 @@ +# %load q03_pearson_correlation/build.py # Default Imports import pandas as pd @@ -7,3 +8,12 @@ # Return the correlation value between the SalePrice column for the two loaded datasets # Your code here +def correlation(): + df=dataframe_1['SalePrice'] + df2=dataframe_2['SalePrice'] + corr=df.corr((df2)) + return corr + +correlation() + + diff --git a/q03_pearson_correlation/tests/__pycache__/__init__.cpython-36.pyc b/q03_pearson_correlation/tests/__pycache__/__init__.cpython-36.pyc index d7eca9980cd94014cb671238783d84df5e9fb7da..122cc57d825702e054b6cc126576475459bee043 100644 GIT binary patch delta 52 zcmX@cxSNr~n3tF9Z_M~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX?(%jU%l4AYzqSVU7lKfo# W#GD+3f};Ga)Z~)l&4(Bdvj70(`4{H^ From 656fbebb988d012fa968bd8949bcc901ea35d35c Mon Sep 17 00:00:00 2001 From: Jas-simran Date: Thu, 3 Jan 2019 09:25:24 +0000 Subject: [PATCH 4/4] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 193 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 505 -> 762 bytes q04_spearman_correlation/build.py | 18 ++++++++++++++++++ .../tests/__pycache__/__init__.cpython-36.pyc | Bin 199 -> 188 bytes ...st_q04_spearman_correlation.cpython-36.pyc | Bin 1717 -> 1706 bytes 5 files changed, 18 insertions(+) diff --git a/q04_spearman_correlation/__pycache__/__init__.cpython-36.pyc b/q04_spearman_correlation/__pycache__/__init__.cpython-36.pyc index 78682675323d8e4b951373280266bfae3fe10d8b..b995d78eb8b2df0b35447ab00748711201dc449f 100644 GIT binary patch delta 52 zcmX@exQ&s+n3tF9Z_l~Z4V6XSwVC9pN0=F9wee)4#4Zz#VXzWqW0e!$K_4$n}`0|W_@l#mfc z7F5zT$=Ft7s0A{R;U~yKNlsuIZO|Kzm-i*NJpIsgM&+$8gfe;6mA1I#y5LqF33Iu; z{jZN`+AD7pK8rsQN{I3t#e74suppL7GJ!Q&{buYBBRy6*fkm(e)aV>~@|P3I=H5H( z@#}l)YyM1E)J8q_GXX?4fidPpEy75|3CO{L*WxXYG4o&zD`w*!C$RE;Cp{ZMAM}Cu zl))HAa0j!j!al@V43D$qgqP~I@81QQ*XLR2ake4Y$rNYDKNiLjx$(nZCi0%S=(tvL z|NH8hvhBE>tQSsZyzo&_#<&RJpO- z7RDCB;Ch>d5;nbf_#`*2;=1B>E*h;>i9Su8o_0kkkJ>9Y`ky($x6LgCAUE*d#Jf+% zh}TI>?h-vh3-%DTyq4VP0n#kiipw1T6CESfKE>8=+sF` z;T#35G^5qd&a8Gb`_AO)d@er@KJ_7gmG93iRi1E>5cU&A*78=wtmT$l@gkP2%C2-7 z1_W}@S9~lS#>U$!ANMRoxFc{_AM4#Eba+iGgE}{!=)ZdM#b}nox3qasjd!TvwplII zr8jGbeGKZJ@Cl-K3c7AFkZ;k%@OC6_YLTpr(@x^5(8U0~g)oZ2>XHy_ZNejEQ~dPF ccJ1%lZ&xH?EYF;`>kiMSyfBSQA-T+d0JY~wzW@LL diff --git a/q04_spearman_correlation/build.py b/q04_spearman_correlation/build.py index 557be32..1920597 100644 --- a/q04_spearman_correlation/build.py +++ b/q04_spearman_correlation/build.py @@ -1,3 +1,4 @@ +# %load q04_spearman_correlation/build.py # Default Import import pandas as pd @@ -5,4 +6,21 @@ dataframe_2 = pd.read_csv('data/house_prices_copy.csv') # Your code here +def spearman_correlation(): + sale = pd.DataFrame(dataframe_1['SalePrice']) + sale2 = pd.DataFrame(dataframe_2['SalePrice']) + sale['rank'] = sale['SalePrice'].rank() + sale2['rank2'] = sale2['SalePrice'].rank() + df = pd.concat([sale,sale2], axis = 1) + df['d'] = abs(df['rank'] - df['rank2']) + df['d squared'] = df['d'] ** 2 + s= df['d squared'].sum() + n = len(df) + result = 1- (6*s)/(n*(n**2-1)) + return result + + + + + diff --git a/q04_spearman_correlation/tests/__pycache__/__init__.cpython-36.pyc b/q04_spearman_correlation/tests/__pycache__/__init__.cpython-36.pyc index 495646a3bc5e900ad0593288f8e14eb5f8ed301b..3b19623b46cf156027c8290477585134839700eb 100644 GIT binary patch delta 52 zcmX@kxQCI$n3tF9Z_M~`m;B_?+|<01V*T`@)XKz?{9OIS SoE(LMqWrAX