# Reconstructed from a git diff whose line breaks were lost. Each section
# below corresponds to one file touched by that diff.

# ---------------------------------------------------------------------------
# q01_load_data/build.py
# ---------------------------------------------------------------------------
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split

path = 'data/elecdemand.csv'


def q01_load_data(path):
    """Load the CSV at *path* and parse its ``Datetime`` column.

    Args:
        path: Location of the CSV file; passed unchanged to ``pd.read_csv``.

    Returns:
        A ``(shape, frame)`` tuple. ``frame`` is the loaded DataFrame with
        its ``Datetime`` column converted by ``pd.to_datetime``; ``shape``
        is ``frame.shape``.
    """
    raw = pd.read_csv(path)
    parsed = raw.assign(Datetime=pd.to_datetime(raw['Datetime']))
    return parsed.shape, parsed


# The diff also adds two binary fixtures next to this file (contents not
# shown): q01_load_data/tests/test_sol.pkl, q01_load_data/tests/user_sol.pkl

# ---------------------------------------------------------------------------
# q02_data_splitter/build.py
# (this file also imports pandas as pd and numpy as np, already in scope)
# ---------------------------------------------------------------------------
from sklearn.model_selection import TimeSeriesSplit
# As in the original q02 file, the loader comes from the packaged project
# module rather than from the definition above.
from greyatomlib.time_series_day_02_project.q01_load_data.build import q01_load_data

path = 'data/elecdemand.csv'


def q02_data_splitter(path):
    """Split the rows of the CSV at *path* with a two-fold time-series split.

    Seeds NumPy's global random state with 9, loads the data through
    ``q01_load_data``, and runs ``TimeSeriesSplit(n_splits=2)`` over it.

    Args:
        path: Location of the CSV file, forwarded to ``q01_load_data``.

    Returns:
        A list holding every item yielded by ``TimeSeriesSplit.split`` for
        the loaded frame.
    """
    np.random.seed(9)
    # Only the frame is needed here; the shape is discarded.
    _, frame = q01_load_data(path)
    return list(TimeSeriesSplit(n_splits=2).split(frame))


# The diff also adds two binary fixtures next to this file (contents not
# shown): q02_data_splitter/tests/test_sol.pkl,
# q02_data_splitter/tests/user_sol.pkl
# ---------------------------------------------------------------------------
# q03_time_plot/build.py (reconstructed from a git diff whose line breaks
# were lost)
# ---------------------------------------------------------------------------
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from greyatomlib.time_series_day_02_project.q01_load_data.build import q01_load_data

# Select the 'agg' backend as soon as the module is imported.
plt.switch_backend('agg')

path = 'data/elecdemand.csv'


def q03_time_plot(path):
    """Draw the ``Demand`` column against ``Datetime`` for the CSV at *path*.

    The data is loaded through ``q01_load_data``, plotted on a 16x6 figure
    with labelled axes and a title, and handed to ``plt.show()``.

    Args:
        path: Location of the CSV file, forwarded to ``q01_load_data``.

    Returns:
        None.
    """
    # Only the frame is needed here; the shape is discarded.
    _, frame = q01_load_data(path)

    _, axes = plt.subplots(figsize=(16, 6))
    axes.plot(frame['Datetime'], frame['Demand'])
    axes.set_xlabel('Time')
    axes.set_ylabel('Demand')
    axes.set_title('Electricity Demand in Australia for a year')

    # NOTE(review): with the 'agg' backend selected above this presumably
    # opens no window -- confirm whether callers rely on the current figure.
    plt.show()


# The diff also adds two binary fixtures at the repository root (contents
# not shown): test_sol.pkl, user_sol.pkl