From 1ba6f721ae913d6863d6ecf5cacfb5bdc649733d Mon Sep 17 00:00:00 2001 From: tracedence Date: Fri, 18 Jan 2019 04:36:57 +0000 Subject: [PATCH 1/6] Done --- __pycache__/__init__.cpython-36.pyc | Bin 135 -> 153 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 180 bytes .../__pycache__/build.cpython-36.pyc | Bin 534 -> 624 bytes q01_Unique_users_subreddit/build.py | 15 ++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 186 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1390 bytes 6 files changed, 14 insertions(+), 1 deletion(-) create mode 100644 q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc create mode 100644 q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q01_Unique_users_subreddit/tests/__pycache__/test.cpython-36.pyc diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index 3337b5d62216137d54b5097104417c3e227d9f80..f188c6d1b57655be5d343252ce84840b3888b81d 100644 GIT binary patch delta 52 zcmZo?oXN;x%*)Fq6z&)^k;7cUO+O<)H&wr+C^0!TB{eTORX;qxD7&}-$kk8IPf4BV GYXty;8W58J delta 34 pcmbQq*v`md%*)Gl@O4=9L=JO46a9?*+*JLfjMCza#Jq{|RsgT|3kv`M diff --git a/q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc b/q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..e8efba7459a05da98d45487b39e6e772206cf623 GIT binary patch literal 180 zcmYL?u?hk)5JYoeA%cy6VdE;cBKiY1BG(AZnJgGJ*}L7OxKHwzZ2b!>bA>oCkC|y^ zJ)KTw_5N&%-UEKBO4t?asKA+{nOBFWkzxMh)4-JjL6XLjqi6|gmb;XL;+jj8`%Wia)qbpyG)psL{ala$T^8nu5ay30%Sl{#E7~{kV9QBcphHo#$eyJr0uV(7T0A3iD2gGe011@IUGpG) zkiGbmb%zN6io^Ls_r5BOk*B051tG2NYysujm z^Ui}avH>ym-Nu1Zbyy^kStW7@Qk9jzja-9?S!e2-4)8LuGF(NbwqklKT`e~nPXD=Q z--$a$rGLH_S8W3Y_Ev!cQ$carx@&JSEUH#P;Q*C1U{vc$f9C@1wT3_Ab8s|D(w;t{j1|XLL^I%+1ihFO&?jIFwq}CIG4nI0(Powr+X$ zX1!i7N5<7KtUP8`8YR8UFkhsmYmk^3E1vsn4bquagPrKogGSj{#|{5tWOLKO8z%7t aPB4u5J51^{ydU2BBZQph^n~Zrg#HB+Jgpx9 delta 376 zcmYjNJ4*vW5Z>qI42h3MqJ;zwHP<8rI}sJc#@0@Ruw*wT;a=I>Qz92EQd=Acg5n?W zr}!7Pv9PkUwsJQjWMICTZ)W(0nQ!t$yn}kZIw|+BE+7D(V9AilPmQOo!fR1@34B^y zdk@%@sPQw~Iy9ib80KIOXE29j#34rTb~D2|##A;rzhv$gk=uNAYyN16;I>+4!gvWUlFFI7y5;$!oiYLsy8O2K%q zpWbRGWnmHsjRO&BCyPdtO!!!ngsGvXoGI4T#D+H@*NpVfUc22XU*UFHz}=2xud)D8 z6|O?LVKTp>oy2TqsjL{PX_SS@RHG=-WdrSW?aV@I3D)hPdlbez3&gQ`?VqX(U0B1v DWr|-; diff --git a/q01_Unique_users_subreddit/build.py b/q01_Unique_users_subreddit/build.py index 82fe7e5..a8e9d31 100644 --- a/q01_Unique_users_subreddit/build.py +++ b/q01_Unique_users_subreddit/build.py @@ -1,7 +1,20 @@ +# %load q01_Unique_users_subreddit/build.py import pandas as pd import numpy as np from sklearn.model_selection import train_test_split -def q01_Unique_users_subreddit(): +def q01_Unique_users_subreddit(path): + + df = pd.read_csv(path, compression='zip') + variable1 = len(df['username'].unique()) + variable2 = len(df['subreddit'].unique()) + + return df,variable1, variable2 + + +path = 'data/subreddit-interactions-for-25000-users.zip' +q01_Unique_users_subreddit(path) + + diff --git a/q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc b/q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2dac1b976b7f2cfe4c0f521fbca48536668b5558 GIT binary patch literal 186 zcmYL@u?hk)5JYoeA;Nu#jjPy-=nvS4Tq7)+EE+Y*-R`EiPx6;+{R=B|g*Y&enW<)3 z*As2FM^p43@KaU7rdUP=&g{*!+C2>q^BLmPe!@Rx}bwv_!hIix3xtKs<8G1y)Ecgz2}jjqBqRdda=BbCm#aR1?t5!%BlG&no3{ZW-^iH;bMhFvehY#V zPAih*=vB1#a*q=3^PuwUAP+$&pbtPFI-OQg9=Sa$`3T0aTCK%1Q2V%DvAd_pt;R10F&W13P>rw2{rMq~MDU zHxHpdg|1T&h8Vh}AL$X<_l$o;Io%*j2nK=Nd`YL?I$8RN0)z~96oxuRvAFsC15{-M zkD7LB>1llV5j8*j_^q5&-l6rN~@+H@S&?P_1#bF9kxm1q*r23k~88z4wuh*|^x z|H^Eytwm;3Q3}{sitKf({?&7sW@XDorbOA+a3XIN(}&uKn$1ni~z8VY#Y5fZPn)A_qVpT zHXXatg`D@d_U`M59Q%;o;?}D@5i4Oj)x__MsuMbvI&NAM7x6O){Q}9SkSX%hOYl#B z_UEnhuM1P|#o~kseK3WG$QuuU?w+~`y7~h|GEfl=`S?2<*tBa(8(=B<}Rj7{{LvHpf>H>sQS5W*o+-aDB8h{udrqe=q>Wl7XR;|Oc>1!c^1-}lc%iK~=lSJc tPdg(k$7A>*s1S0n5u)?7fZq+4@~awc^stBK5mH=Z*%2MPFQTCN{{vRUbKL*{ literal 0 HcmV?d00001 From d86895fd58cc75926c80f607a1e10c4371a3009d Mon Sep 17 00:00:00 2001 From: tracedence Date: Fri, 18 Jan 2019 12:17:12 +0000 Subject: [PATCH 2/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 182 bytes .../__pycache__/build.cpython-36.pyc | Bin 479 -> 1147 bytes q02_top_subreddits_wordcloud/build.py | 26 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 188 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1195 bytes .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 187 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 850 bytes q03_plot_topK_subreddit_of_a_user/build.py | 12 +++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 193 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1240 bytes 10 files changed, 36 insertions(+), 2 deletions(-) create mode 100644 q02_top_subreddits_wordcloud/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_top_subreddits_wordcloud/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q02_top_subreddits_wordcloud/tests/__pycache__/test.cpython-36.pyc create mode 100644 q03_plot_topK_subreddit_of_a_user/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_plot_topK_subreddit_of_a_user/__pycache__/build.cpython-36.pyc create mode 100644 q03_plot_topK_subreddit_of_a_user/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q03_plot_topK_subreddit_of_a_user/tests/__pycache__/test.cpython-36.pyc diff --git a/q02_top_subreddits_wordcloud/__pycache__/__init__.cpython-36.pyc b/q02_top_subreddits_wordcloud/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..ad71a275f9482b746371e7f58f902e201c47b44f GIT binary patch literal 182 zcmYL?u?oUK5JWFvAwnAe!p0MAMf3-3EYb*z?k*V3WzXFUl27uNZ2b!>FNHWTkC|y^ zRhE-!wL7}3_kf>@9Jbju${=@evts{rI?R83&|f65PkKToZjpT@db60TMfti7 literal 0 HcmV?d00001 diff --git a/q02_top_subreddits_wordcloud/__pycache__/build.cpython-36.pyc b/q02_top_subreddits_wordcloud/__pycache__/build.cpython-36.pyc index 98c1cbb9a442dc1c36b3345272b08dbba074d6c2..d7245057a9a3af3f237df65af9d3901333014918 100644 GIT binary patch literal 1147 zcmaJ=y^h>A5GJYL{q@=T!v!hQZgH!P19yhuz(CTuNrC``0fsAb_b5}Oj-+g#v0JU% zYw{L(gSlL{Hi&osNF0XYHKM!Oukg4$*}u=u$4^@`N#x_aKgc zMyv8YzkfRsmvPUv0i)zZ!MbOV)eoJoEk5Ng-6I zam)gvfC*I4GnoDlFaaIV3BO2=_(+b)0XJCS6BgtgHRObv1ZFCTNJM%=j_Dy4_#7Ql zmL1Y27dS!}#Z7`C))XfodybA-C{O5^AM$2$$V7Pqbi%ZmozS?>54o6#=?xio3o(my z;d~j-1p>t6aH`w&ZovmGshWkS`##crVIdugQOL9(5*Etp#vL(=I$^PSrFPSRYp{?fj7 zQ45+zcU25&$HV17#E$0us2-j5clyx>V#h{kcd-GBVe%S!qK-ZBCvp!U-@m_Cm$sD^ zv_~xk6hT(dHZOe#+p4xgR!-KoZJ~(PF@NoYY+2`QBkNFIZ62~>Q>^5Q5RlERs6-yx{HU8 zHk-}G*u(3$s#~26dB=_5ejuHondw`=K}<*Qw>)&(2CcRLEqXNnu(}1jq_F!BWw}kE literal 479 zcmYjN%}yIJ5VpO$A&?D?Dg+WQfO5(5b48_xp1D+&sD)%X>k%yYFSfUkUh@uphrR$0 z<144WLQkD62WrdTjAuOlzL|^Zbnn;83BM`{c_sg?0{zc;;u1j-MK$4cu#B_87QBEG z*h94;8%p2ajQ9@bm>!#5zB|MUy=NwTLJ3S%xuLfOulbbkW90{^H*~0^U&*}sgFNJV zPV+1U*;$bwCK0{v62^{Kr)T1u?N&XAK0=5h_R9cDb?N7Ul1Vmi7qRshZTvBx<&l?G z$(Wf}nYoyYxQ@BUuy+PcEodyIwVelm*HjU!vAt!zYToafUFaxLM7{w5B!N GKl}$^<&X3L diff --git a/q02_top_subreddits_wordcloud/build.py b/q02_top_subreddits_wordcloud/build.py index ead5d42..899a6da 100644 --- a/q02_top_subreddits_wordcloud/build.py +++ b/q02_top_subreddits_wordcloud/build.py @@ -1,3 +1,4 @@ +# %load q02_top_subreddits_wordcloud/build.py import pandas as pd import numpy as np import matplotlib.pyplot as plt @@ -5,6 +6,29 @@ from sklearn.model_selection import train_test_split from greyatomlib.recommendor_system_project.q01_Unique_users_subreddit.build import q01_Unique_users_subreddit -def q02_top_subreddits_wordcloud(): +def q02_top_subreddits_wordcloud(path): + + # importing data + df, u_user, u_subreddit = q01_Unique_users_subreddit(path) + # Generating a DataFrame that comprise count of each username by subreddit + df_count_subreddit = df.groupby('subreddit')['username'].count().reset_index().sort_values('username',ascending = False) + # setting subreddit name as index of dataframe + df_count_subreddit.index = df_count_subreddit['subreddit'] + df_count_subreddit.drop('subreddit', inplace = True,axis = 1) + #creating dictionary of dataframe where key is subreddit name and value is frequency of particular subreddit + d = df_count_subreddit.to_dict()['username'] + # creating object of wordCloud + wordcloud = WordCloud() + # generating wordcloud with frequencies store in dictionary + wordcloud.generate_from_frequencies(frequencies=d) + plt.figure() + plt.imshow(wordcloud, interpolation='bilinear') + plt.axis('off') + plt.show() + + +path = 'data/subreddit-interactions-for-25000-users.zip' +q02_top_subreddits_wordcloud(path) +ls diff --git a/q02_top_subreddits_wordcloud/tests/__pycache__/__init__.cpython-36.pyc b/q02_top_subreddits_wordcloud/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..1c349b23e74cefbb35aedd66096e0458c7a22468 GIT binary patch literal 188 zcmYL@u?oUK5JWFvAwnAe!p0SCMf3-3EYb*z-Yyu;WzXFUl27uNZ2b!>FNHWTkC~}v zRhE-!wL7}3_kf>@9Jbju${=@evts{rI?R83YPd*XNP6;2+b!TOwIvGAh$v4swB(`LLShsaToX7q(UI(GB;mvTtvfURt C)ioLb literal 0 HcmV?d00001 diff --git a/q02_top_subreddits_wordcloud/tests/__pycache__/test.cpython-36.pyc b/q02_top_subreddits_wordcloud/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..205eba2124d8f4db3a73a088ec80f9ad8fd31668 GIT binary patch literal 1195 zcmaJ=O>fjN5ViBMNw>SLC<1|0P&gnF2_*PzlaUquIAc@j^B&hxM&oYoQFA zs=N|R9JjeFFx}q|)9gUg+h7FAC?}c2DR(YN<{}B`J?;aHfek(iZOVF9P>973HwVym zq3HySA%-sK4|-0H9OIr-P9Ks5B!fiVctNMmeX?*-2T18n6sB6DIeW7A9e5eRBcRw; zqBhTT96jaFqy6$k)ZoRQ!V_(vP0L~3uJ`2jkd<|%sAI=^TF9yOP^Og@HEhFnbZR+{J} zm#xqdZ=$*}QI(tGOEl~BydDv|owh23G-?e@?5K705q~FRZ#H0PAN+&UTVLhHW35nUIBtPs}PMEfEhyT4i25r?`Gmn z8@6?65ULHz8Xt}6>&HKAOUV@q-0{uc&y+aLO;gG8Fj>98>&1}VRt!m()P{{JXJwsB zcr~Sz*&T;JbQA*i zo)~15gaIPc9bK}IO#!i^1c~AiWVkYV-z1(QTd>hCQ9qy(FqBdXp CsWgrN literal 0 HcmV?d00001 diff --git a/q03_plot_topK_subreddit_of_a_user/__pycache__/build.cpython-36.pyc b/q03_plot_topK_subreddit_of_a_user/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..e02ab3659f26c601c2e0cd603f82d2e7e0e91259 GIT binary patch literal 850 zcmah{&5qMB5VoD9P5%}+A-HkOp-p#J+*SyL1P9Pw5JIw6vfS9+P3zdH?I60^p30R6 z;VpQMT#=CW6*w`D5Z%iPOY;-UneUr#=5#U{{`&FiVownIiSC>T@|R%lJve~`R*2#* z5*l?eUL~{#8BzTzr6~@tA~mRnbO`xC^hEzFrX!Kku^h?q9>XpEfU@B&R7B?)ZXbHf zOU=A=p1E3;9`2rQ=Ev-#E;o&2jg!_f*DS0QqV(-x%@mzmXmE0IZU8IyfMu0b27)zR55h za92nzN`09nHej~>OKX~Xv2ByWG}_aVl}>tAY9YVSku%n_&s;UqW&Jj;xxZ@TP_V`8 zmWU2VvRWC>ys6(E>NB%syo1dbO{v7J-nP&F`!)@V25AvF!uA2g>s)Zp z^M6uJOYJ4_^rg{mx-@or@_as@PrKR8uFEUz^$eyEW@X o>89JYX$OIG7{(nJmaa|DfI_3>i-7FHRfCcSbw+eKD26{oZilSlx+L&iprr|YR2l9P~oAHNa Fn=e)4HueAj literal 0 HcmV?d00001 diff --git a/q03_plot_topK_subreddit_of_a_user/tests/__pycache__/test.cpython-36.pyc b/q03_plot_topK_subreddit_of_a_user/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..200d9e7133e20d8291b54658458ad55d89a70e6a GIT binary patch literal 1240 zcmah|O=}x55S8}B-Z*yCrnC@f%jQt%La_@u6-r47A%}u5Ed-WQAzQMuiS{FsHZ&nU zIe(^qN!OnI7kcW09Cx@|&!D0pML|<~tZc1XU!( z-cvO9QjZehi$M8#kcNN>;11w!gQ<$rsM)iY_Mi{ddfrd_lpGMz5#1{yx{@3Z7Jm9j z&@Uv3mT(3cC)D-k(sDgFm7Fd;n1iY9(|0?pQl(|KtUfbSPqY*wv#gvk&T1nyIBjwR zz_OXq8UA?@yLQGrm@57 z+&#k~TP4IuFbso*L%fJyyu8+Nc(3mrb#YIl?kfPR>bBa7Pz1MXcE%bn!>yh02`@@x zvgIQfU%bB+R>&Ezm5tB1s-=lV85gCEb8e?c@w^fFu1DhO$H1VUfJyvDd>!G$8cuk6 z9dREGCfFK0(rx{d*)_4*gymKV3QBDMSBV?{aT2z}?xgKMADQbnd&lui&yP`KR z03=@tr3nh-(H$^7XwAuyABD|Kvf-k-$Selyx>%Chq!w2hS*f6`O)Y&{MxPsS}DV26AUI=cSSBdm#i-)z%R8u4H=5z?5xCr&y e Date: Fri, 18 Jan 2019 12:29:49 +0000 Subject: [PATCH 3/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 167 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 713 bytes q04_weightage/build.py | 20 +++++++++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 173 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1254 bytes 5 files changed, 19 insertions(+), 1 deletion(-) create mode 100644 q04_weightage/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_weightage/__pycache__/build.cpython-36.pyc create mode 100644 q04_weightage/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q04_weightage/tests/__pycache__/test.cpython-36.pyc diff --git a/q04_weightage/__pycache__/__init__.cpython-36.pyc b/q04_weightage/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a88547263d9ee9f22150793726a260aa717fa283 GIT binary patch literal 167 zcmXr!<>e9zcZ^{Gg2x~N1{i@12OutH0TL+;!3>&=ek&P@K*9*(SBQQ_er~FMNl{{Q zYD#Kea;koKeo=OD0g$VooS%}aUzD1hpPQSSmy%x;UtC#SlA0S|P?VpQnp~n^XkZdw po|>7SQIeRRsvjSpnU`4-AFo$Xd5gm)H$SB`C)EyQTQLwb007mKEIj}K literal 0 HcmV?d00001 diff --git a/q04_weightage/__pycache__/build.cpython-36.pyc b/q04_weightage/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a06bdeca8c8aa3df956ec67962f4a531aed84674 GIT binary patch literal 713 zcmZ`%y>8nu5GJYLICju2Y5N2oEV+MM5cFs07N97K0z?3T7B4m%k&;OYjRSj1hrUXO zzD6HHYp1+Ir=AobO@|P;&u&-gU4S%EmwXT*q){fv@+<#o%$iL%`43N!#r0H#9k4MQ2S?0~F}up8 z@FKsP;!GJ2sKTq-xY>DaXU|{F=kwVx?CeT4(@_^U!bssd)<_;1;Uz4 zqu{D=P@y_3WBUif-!Cm}gs*j_7TLqyWDj3(HncX(e2{KatUHYFp4&&POOH`PTfs@s R?D{rSn$j^Hv-BXOe*xcq#nb=* literal 0 HcmV?d00001 diff --git a/q04_weightage/build.py b/q04_weightage/build.py index f7c9792..7fe61f7 100644 --- a/q04_weightage/build.py +++ b/q04_weightage/build.py @@ -1,6 +1,24 @@ +# %load q04_weightage/build.py import pandas as pd import numpy as np from sklearn.model_selection import train_test_split from greyatomlib.recommendor_system_project.q01_Unique_users_subreddit.build import q01_Unique_users_subreddit -def q04_weightage(): +def q04_weightage(path): + + df, u_user, u_subreddit = q01_Unique_users_subreddit(path) + # minimum value in utc + mininum = min(df['utc']) + #maximum value in utc for normalization + maximum = max(df['utc']) + + # creating weight column + df['weight'] = ((df['utc'] - mininum)+1)/maximum + + return df + + +path = 'data/subreddit-interactions-for-25000-users.zip' +q04_weightage(path) + + diff --git a/q04_weightage/tests/__pycache__/__init__.cpython-36.pyc b/q04_weightage/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..cc04cfdcf70e179f82fb004173ff45c416097680 GIT binary patch literal 173 zcmXr!<>e9zcZ^{Gg2x~N1{i@12OutH0TL+;!3>&=ek&P@K*9*(SCoE6er~FMNl{{Q zYD#Kea;koKeo=OD0g$VooS%}aUzD1hpPQSSmy%x;UtC#SlA0S|P?VpQnp~n^XkZdw uo|>7SQIePrG$OUQq*y;bJ~J<~BtBlRpz;=nO>TZlX-=vg$j)LQW&i;GU@oNq literal 0 HcmV?d00001 diff --git a/q04_weightage/tests/__pycache__/test.cpython-36.pyc b/q04_weightage/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..8a875ad4ca9142346371aef698774398eebfc08c GIT binary patch literal 1254 zcmZuwNpBM|6t-u}G)-D4%L%06fW$~mCStiDgo>)Fw_K>GG(rs1v6D=gCAB?;M&*?9 zW4Q2xeC3qCz=`)}nko_4^7HfZw$Gnmbi3`n({~?#n1uW$Ys~`v0EYYof)PeD65?!R zG&e$n5@s?hGjl7nK_{R)ptowBW^U-#Hd|pEW;@%?J7I^CW5OKPx+bi}$+WvL!yQK7 z6W?7z3^MeoZjZT&#aPaGvNT{1wz}tom(f?AjwdP}bJ*C6rQ||IBN693;^$SIC1}5D zXmNErzYMwxLKXpqMJ>g?c7^?PJOxgrrD2hso}5lv%(D-$#ev7Oq?X4Wm1&Tt;ESjB;?&ID&H zRlT%O9BNi+S;*d~6usxK27^Jb0y@b4Je@5+|7w#ZhMo6MCfpNTRif}N;;iD*W2IM= z%FAPwOgz4Npytpw#2qjbcR~1$aA68NH%}9dsv^-A<`V9#_8Qls4Hva7C-DrJDG;gp zg&MJghbv4mlL&p(wB3UviN=IF(06F(Ut~8ehQ6)cC@PTik#0v(Ua~4fy%R-9m*zz5 zf=_WD1yW^AU^c=5fnn?SbPd<3cl=%LRz<4tNp&kN@cXHTpY~amW=tTa4Jxn4f?vj} z%(L{YzfP4+p7l3))~~&2w-o6(E#eIRUz%m1Gm8rrOKr?pc(2j>l}fXkTktD|4Pmv5 ij600skum$Vis}Mukli;88gG$y61QAH6uS$(WBvt;y-(Tz literal 0 HcmV?d00001 From 6d0f81323a0fa220555ac72004931d92161bca5c Mon Sep 17 00:00:00 2001 From: tracedence Date: Fri, 18 Jan 2019 12:53:51 +0000 Subject: [PATCH 4/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 181 bytes .../__pycache__/build.cpython-36.pyc | Bin 0 -> 678 bytes q05_groupby_users_subreddit/build.py | 12 +++++++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 187 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 1555 bytes 5 files changed, 11 insertions(+), 1 deletion(-) create mode 100644 q05_groupby_users_subreddit/__pycache__/__init__.cpython-36.pyc create mode 100644 q05_groupby_users_subreddit/__pycache__/build.cpython-36.pyc create mode 100644 q05_groupby_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q05_groupby_users_subreddit/tests/__pycache__/test.cpython-36.pyc diff --git a/q05_groupby_users_subreddit/__pycache__/__init__.cpython-36.pyc b/q05_groupby_users_subreddit/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..1dcad8bd716e578593f49920984d8216d52462b8 GIT binary patch literal 181 zcmYL?u?hk)5JYoeA;LBOg^dx!PDFpe#^M@b@v@7anrz%niu)vg$=1KHGFONL^O%`t zmUTUuHoK!KdJp)iDq&l!qXIMsGpqJbBg6d1r?nUMWRsj6Aq7XaVYz86)jCG9LXN$s zfGnWBCh`!4ujG<_ELLz9&av$wD~W>URtT|67N84V0+`4CHC}the5cLut;OaGw!<=2 literal 0 HcmV?d00001 diff --git a/q05_groupby_users_subreddit/__pycache__/build.cpython-36.pyc b/q05_groupby_users_subreddit/__pycache__/build.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a12cbcd4424e0e11096c2bf5f253129693ed28b9 GIT binary patch literal 678 zcmaJ<&5qMB5VoDPNxQAY4FPwg9-4%oy&!~k#eF5j0m(wL(s-Jt8#`Is(b84-6kdjR z;R$@@0Sha`!lHQ{vJ84qx0 zb*LtMLWgHTJyj8puny(qGvTqE@)^W1>nZl=d$NjtAPTuyQUAc1ywbvfb;7oF<*>KB z%3g|VsLGwoODIsvxB|>Wyv49jF*$N1J-wwzx~Gy#Rvhc#k zodu(F1$<_^jR7eu=cC^gb`_cd)<>mjx^{E$f$bDOF<`-oN=x{(3Vhh+Zs(cYqTB7W zFT~98lb<5pH40MnP=EwoK>DFEm$t=YS~L<;14W}0XxSKH57vPat!eg9xb!MJ6@M7T zAkT_BY3Zh`YMHbL|KvY!MZ+AXmMLwi|6Zgis1NG&YXs2X9+a25Eg(!e2ijjF3n v@^6>PU%xULeT~x|)tVTg#!22wC)o4xYh>+ecr%dM!C6dWx}XadMUxj6GXXKa@1Rbilx(#D_C{}LYBR! z-m#z#8p&f2zLAaaSZ(ksoI*WdQW8Z?wUBddgh(0{5Zk_uh|4g%rd!W0-Dx*I&}{Ps D1cNla literal 0 HcmV?d00001 diff --git a/q05_groupby_users_subreddit/tests/__pycache__/test.cpython-36.pyc b/q05_groupby_users_subreddit/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d5f6d50b9ba57e284a0b0df371902826806f85c0 GIT binary patch literal 1555 zcmaJ>&5j&35VreoIJch5F<`pFHpS&S_ zBFM$@)-O&t{fVUU4$dHpl-lW9m{P5EFRGmfV=(mbtNCNLR^8AqFWI1l(o7FaB{;7Q zOrMq-#td7jvJp(Y8cJEAxBZ7+o z*gSgn8^AMyCxCQlL~Fj#Y4SP$GI?IV7Ap#t(O>L* zShe})Kp_{aa*!r@UCKe|gm+2XnWQOAb)Kvpowrw{zN1#f;6~j8k$UO~^%)8TF^Ut= z?8CRBzjmfiVR}SM0qvvzMY~^rK#Uo1Ks*P-kSoFOR7FAH@R{|3>39 zylxeNz_T?fu^)$V=*H6fHXhpAU^duE-Qw$H#tIFWLoK<&8y(5{VXeevX}U(%%j{;2 z+%C859p#oepEmAPy{_9*!t+#1Swwx=@={x`=fwx3o(-m!uEgN6QXvFkV@$=TB|M1; Z;x3pr{&uA3JIqCm$YY=x{}}$6{|`-ipw9pR literal 0 HcmV?d00001 From 47beffd5a88b2ec1d138c8ef3fac01e07661afbc Mon Sep 17 00:00:00 2001 From: tracedence Date: Mon, 21 Jan 2019 05:37:26 +0000 Subject: [PATCH 5/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 0 -> 168 bytes q06_similarity/__pycache__/build.cpython-36.pyc | Bin 0 -> 1064 bytes q06_similarity/build.py | 6 +++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 0 -> 174 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 0 -> 2428 bytes q06_similarity/tests/test_sol.pkl | Bin 0 -> 81 bytes q06_similarity/tests/user_sol.pkl | Bin 0 -> 69 bytes 7 files changed, 5 insertions(+), 1 deletion(-) create mode 100644 q06_similarity/__pycache__/__init__.cpython-36.pyc create mode 100644 q06_similarity/__pycache__/build.cpython-36.pyc create mode 100644 q06_similarity/tests/__pycache__/__init__.cpython-36.pyc create mode 100644 q06_similarity/tests/__pycache__/test.cpython-36.pyc create mode 100644 q06_similarity/tests/test_sol.pkl create mode 100644 q06_similarity/tests/user_sol.pkl diff --git a/q06_similarity/__pycache__/__init__.cpython-36.pyc b/q06_similarity/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..4dedadc38dd6a65f01b9ab7833ea51a270287c49 GIT binary patch literal 168 zcmXr!<>e9zcZ^{Gg2x~N1{i@12OutH0TL+;!3>&=ek&P@K*9*(SEznQer~FMNl{{Q zYD#Kea;koKeo=OD0g$VooS%}aUzD1hpPQSSmy%x;UtC#SlA0S|P?VpQnp~n^XkZp! qoSB=MlUS5lQmG#wpP83g5+AQuPeC5O|>}e|z48s8uRoQWURj#k9a&I=9{QdHeSFGM$k&0 z2J`$Q#tt6OiNEX&m%4OdU1>Wd9iCmOS}Qe_RyI;`Bi#lM@4Q~#FAq%HcdJd=TQIh? z{mOt4()s*+TMg+CPl^(wJV3GkpmM=BI3uUwHe3@y1bs(QlXtYHw}R7X8?C7bMI>U8 zybn*~ZM+UeDl(D3rzF@CF*%~9cF{WCQnV#!1a&%ym?A#eCfm5CPX}a#$iL2!*(Yp{ z*!*kkSc;vKo5x5I_BL&A_H3(qCtJOD2nHU16qvV9k3k+BI%@_xJ{!1e-oQNc$s4YE zus*HOtZ6XkLmwUCt?cTTZk2VftAT~5qGpk(mp`(k z;m*jnEYWaWiu&Kc{D1-fdr};>4HP&86$sE36fatHWIOyUs#ZW@plX{2v}jFfH`YN@ zcBWlJ<%-wKpD&C^vFfD~i*Dn0zcvhs+v}(Tnvv_|GT9{=xs8&MyCkFL8d^>Yfkcb* zDcYCX0p>K2u={mu_J6v+TrT&=xm%pbZa(u#$F<bx0`t1@r6`{5srkcTo+M*%@BCdnqIT13PLi%K!iX literal 0 HcmV?d00001 diff --git a/q06_similarity/build.py b/q06_similarity/build.py index 387e3b0..547e5c9 100644 --- a/q06_similarity/build.py +++ b/q06_similarity/build.py @@ -1,3 +1,4 @@ +# %load q06_similarity/build.py import pandas as pd import numpy as np @@ -6,7 +7,7 @@ from greyatomlib.recommendor_system_project.q05_groupby_users_subreddit.build import q05_groupby_users_subreddit def q06_similarity(path, kind='subreddit', similarity_function=cosine_similarity): - "write your solution here" + 'write your solution here' df = q05_groupby_users_subreddit(path) df01 = df.iloc[:100,:] matrix= df01.pivot_table(values='weights',columns='subreddit',index='username') @@ -22,3 +23,6 @@ def q06_similarity(path, kind='subreddit', similarity_function=cosine_similarity a = q06_similarity('data/subreddit-interactions-for-25000-users.zip') print(a) + + + diff --git a/q06_similarity/tests/__pycache__/__init__.cpython-36.pyc b/q06_similarity/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9c29d902b216cd97fe6bd65a195efd3ee2828c67 GIT binary patch literal 174 zcmYL?u?oUK5JWFvAwnAe!p0Q@E0OpEHWn!qmT-Bm z%(^UR^Ll@FS?>`)6**MdI>`v`=oZD{>13S$_?+OviNK`s6sYqAHOo!=T)}f75b~T7 vb%6zSP@{ys@Rhv5eYHW2DYlJ78^B0S0Wo&b5SRV%nr;(^M@zf$RI}X|IF&Ct literal 0 HcmV?d00001 diff --git a/q06_similarity/tests/__pycache__/test.cpython-36.pyc b/q06_similarity/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000000000000000000000000000000000000..e46588d2ba2ae2bcc9ba57d7992e4db652f6c413 GIT binary patch literal 2428 zcmb_d-HsbI6t?F-*(AH&($WPASp}18Cgg~gMs(QBw+G^1VX*3x-*~!jdZBNTa z+pF}R=imi+n7QR@Ux6#m@ods$H$^I9Mn1NWkB@ymf5-l!+imY2|M2UXN624f<+GrD z4~m?EV1&_>1Xvp>&5XdHgqh4r&CCjHXcK5V&~|m3re5HI&Q4odJ7{0(wt^1moV1(u zf*vIg33HkEk}!{x>Gs?Vb{Ks`2CWNNj~oqX-JWn2iHR(Ed|`kNRK2H%UxzZuk~9*D zIs?s(xR6QC*Oj}Glw7EAETW8u{Am@XF?wBm=~gDiA9Jaad=gXefgd`3AIg0w@=p*7K$}xa6gXz)-1vR>1y#n> zRMt721AxZ>+fU?Y@(Ws6YZmqf3xnB99}bMua}v5&d|bEiURf{)X0*=9)P>U0^V`t! zmc1=TAT;-=wk20pIon@Hd#E5{IjjKMP!_3Qo~E_&eDoSKG=60!MzbM{R5X;;NN~my zb&%wWizrq}k;{W|Ar3zO>hSRJ0NqP}mXw1|ZI=S9YO5%DURx|lQ;=0w)~-|)<1pkE zBAFz41OsUivAT0P5RR)n4!W?-3K!5_mFnsPog6i{hSUjQ|xhBD77 zqkCko>Bn?`PRGV=GB+_J;i#=6f$Y67LCp3a{05n(IO{{wRS=B&R1W$dv(NeulV?1K z*1!@-a%raT`Q;ua2An6nzUMqps|Elr12n9%Ay7?OC=5W}OhyNe(< z+O7qSb9B%jLSr@PCS(kDj5)Uw=sRE;w3hUneX|Ug@o`k8s{brXD=z!2=;wv%XOW6e z`V$@cy2UCC;$3hnY!H{>i@T^m)~rOocP*kzk8&Rj8wB9!XZx>3U}3*R0ncrT0$yW^ zKz74{gEZjyH3f8zo6xhMn9SHCQyZ=|Yl(|<^u}q~Fy=>Cappfh;r%9QHiE|&gldol zg!(W|i-DtABz9486UAF75KTymlc?kas_AqU$_0@ybwkW&eaC+S^JE(Yp$_~#x^taQ z>ofibARV}n7X)+P9LNiudR^GFM&v)B`O#wTzo03QVVkiOm^=qit{`_baBD9Nb9_6) zx*djD!KxJ7oiN07Z$`u(E{`vs_y7fZTRAPA0+{;(Z>TLOdKr&;JDv@{tM!8$wO8ed z!UU<^B*({I>073@M^%zCfh5;l3BH{Oeio@BOOuhmdX=o-xc>T$>o;z8&<%ne+>xg# zk3{ZgT!|!>ei>Q4rg7kuQO+V+8zl>FHfN{RFV4)(%tD$UGE M;X)PUDrC?D0Ix$C^#A|> literal 0 HcmV?d00001 From d93f89e1923aad652706f359af0147b9eafeb8a2 Mon Sep 17 00:00:00 2001 From: tracedence Date: Mon, 21 Jan 2019 05:40:08 +0000 Subject: [PATCH 6/6] Done --- .../__pycache__/__init__.cpython-36.pyc | Bin 155 -> 173 bytes .../__pycache__/build.cpython-36.pyc | Bin 1491 -> 1509 bytes q07_recommendations/build.py | 7 ++++++- .../tests/__pycache__/__init__.cpython-36.pyc | Bin 161 -> 179 bytes .../tests/__pycache__/test.cpython-36.pyc | Bin 1817 -> 1835 bytes 5 files changed, 6 insertions(+), 1 deletion(-) diff --git a/q07_recommendations/__pycache__/__init__.cpython-36.pyc b/q07_recommendations/__pycache__/__init__.cpython-36.pyc index 6fe9d54f7238d290893446b11b1a71dfd848714d..b6a5c34238f6d0f4af730dfcc5e48c2cffcc5103 100644 GIT binary patch delta 52 zcmbQuxR#N_n3tDJDBLk-B8Ry`lzv8jZmNDsQDSmxN@`wms(yHWQFd_wkgK1ZpOQM! G*AD=U;t=Bi delta 34 pcmZ3>IGd5fn3tF9;OnsHi5%v99{L&ixvBa|8KuP;iFp&_{Q$Ox3tIpH diff --git a/q07_recommendations/__pycache__/build.cpython-36.pyc b/q07_recommendations/__pycache__/build.cpython-36.pyc index 5e2b99a4b34e86eaf886e03745d6e9b287f31e21..b4fabcd396b7feffeb11eee48b490dc3b003123b 100644 GIT binary patch delta 100 zcmcc2{gj)_n3tDJCfYSdiDe^~DU(9Denx(7s(wjPVsdIqYF=`xet3RSc5wlatDl^o zk~-O!$%#>T@&u*@j3Sc_nb$CiPQJ(dpOItoJ(fqpObiSR#auvwgOP)g2Lzb_<)RwS delta 96 zcmaFLeVLofn3tEU=wn#)Pv(tWrc8XU`WgATsrpG7rNtSEd6VOroVbM;7#NCyn4wB_ tvOlx@|j38B9K!SsjgOLXWnE*?P7$g7y diff --git a/q07_recommendations/build.py b/q07_recommendations/build.py index f3ed7f3..3b1d9f2 100644 --- a/q07_recommendations/build.py +++ b/q07_recommendations/build.py @@ -1,3 +1,4 @@ +# %load q07_recommendations/build.py import pandas as pd import numpy as np from sklearn.model_selection import train_test_split @@ -5,7 +6,7 @@ from greyatomlib.recommendor_system_project.q06_similarity.build import q06_similarity def q07_recommendations(path, user='--ANUSTART-', similarity_function=cosine_similarity, kind='subreddit', number=5): - "write your solution here" + 'write your solution here' new_df, matrix = q06_similarity(path, kind='subreddit', similarity_function=cosine_similarity) final_dict = dict() sorted_sub = matrix.loc[user,:].sort_values(ascending=False).index @@ -19,3 +20,7 @@ def q07_recommendations(path, user='--ANUSTART-', similarity_function=cosine_sim final = [x[0] for x in sorted_dict] recommend = [x for x in final if matrix.loc[user,x]==0.0] return recommend[0:number] + + + + diff --git a/q07_recommendations/tests/__pycache__/__init__.cpython-36.pyc b/q07_recommendations/tests/__pycache__/__init__.cpython-36.pyc index 9328f6934fa64c6d488fc03a92138a52774dabe3..d5af7c897f3f104eb07c81af24253b134e66493a 100644 GIT binary patch delta 52 zcmZ3;xS5f|n3tDJDBLk-B8Ry`f__GRZmNDsQDSmxN@`wms(yHWQFd_wkgK1ZpOQM! GHv|BX9uWHg delta 34 pcmdnYxR8;