diff --git a/__pycache__/__init__.cpython-36.pyc b/__pycache__/__init__.cpython-36.pyc index 3337b5d..7e61601 100644 Binary files a/__pycache__/__init__.cpython-36.pyc and b/__pycache__/__init__.cpython-36.pyc differ diff --git a/q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc b/q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000..493dd86 Binary files /dev/null and b/q01_Unique_users_subreddit/__pycache__/__init__.cpython-36.pyc differ diff --git a/q01_Unique_users_subreddit/__pycache__/build.cpython-36.pyc b/q01_Unique_users_subreddit/__pycache__/build.cpython-36.pyc index ca2efed..325bcbb 100644 Binary files a/q01_Unique_users_subreddit/__pycache__/build.cpython-36.pyc and b/q01_Unique_users_subreddit/__pycache__/build.cpython-36.pyc differ diff --git a/q01_Unique_users_subreddit/build.py b/q01_Unique_users_subreddit/build.py index 82fe7e5..5870cd5 100644 --- a/q01_Unique_users_subreddit/build.py +++ b/q01_Unique_users_subreddit/build.py @@ -1,7 +1,15 @@ +# %load q01_Unique_users_subreddit/build.py import pandas as pd import numpy as np from sklearn.model_selection import train_test_split +path = '.data/subreddit-interactions-for-2500-user.csv' + + +def q01_Unique_users_subreddit(path): + + data =pd.read_csv(path, compression= 'zip') + return data, len(data['username'].unique()), len(data['subreddit'].unique()) + -def q01_Unique_users_subreddit(): diff --git a/q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc b/q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc new file mode 100644 index 0000000..41b7b6c Binary files /dev/null and b/q01_Unique_users_subreddit/tests/__pycache__/__init__.cpython-36.pyc differ diff --git a/q01_Unique_users_subreddit/tests/__pycache__/test.cpython-36.pyc b/q01_Unique_users_subreddit/tests/__pycache__/test.cpython-36.pyc new file mode 100644 index 0000000..c06a84e Binary files /dev/null and b/q01_Unique_users_subreddit/tests/__pycache__/test.cpython-36.pyc differ