Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 9 additions & 1 deletion q01_read_csv_data_to_df/build.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,16 @@
# %load q01_read_csv_data_to_df/build.py
# Default Imports
import pandas as pd

# Path has been given to you already to use in function.
path = "data/ipl_dataset.csv"
path = 'data/ipl_dataset.csv'

def read_csv_data_to_df(path):
    """Load a CSV file into a pandas DataFrame.

    Args:
        path: Location of the CSV file; passed straight to ``pd.read_csv``.

    Returns:
        pandas.DataFrame: The parsed contents of the file.
    """
    return pd.read_csv(path)
# Solution





12 changes: 10 additions & 2 deletions q02_get_unique_values/build.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,14 @@
# %load q02_get_unique_values/build.py
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("data/ipl_dataset.csv")

ipl_df = read_csv_data_to_df('data/ipl_dataset.csv')
import numpy as np
#Solution

def get_unique_venues():
    """Return the distinct values found in the ``venue`` column of ``ipl_df``.

    Returns:
        numpy.ndarray: The unique venue values as produced by ``np.unique``
        (which returns them sorted).
    """
    venue_values = ipl_df['venue'].values
    return np.unique(venue_values)


15 changes: 14 additions & 1 deletion q03_get_run_counts/build.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,21 @@
# %load q03_get_run_counts/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

import numpy as np
import pandas as pd
# Solution

def get_run_counts():
    """Count how often each distinct value occurs in the ``runs`` column.

    Returns:
        pandas.Series: Indexed by the distinct ``runs`` values of ``ipl_df``,
        with the number of occurrences of each value as the data.
    """
    run_values, frequencies = np.unique(
        ipl_df['runs'].values, return_counts=True
    )
    # Pair every distinct value with its frequency before building the Series.
    frequency_by_run = {
        value: frequency for value, frequency in zip(run_values, frequencies)
    }
    return pd.Series(frequency_by_run)



12 changes: 11 additions & 1 deletion q04_get_match_specific_df/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,17 @@
# %load q04_get_match_specific_df/build.py
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

# Solution
import pandas as pd

def get_match_specific_df(match_code):
    """Return the rows of ``ipl_df`` that belong to a single match.

    Args:
        match_code: Value of the ``match_code`` column identifying the match.

    Returns:
        pandas.DataFrame: All rows of ``ipl_df`` whose ``match_code`` equals
        the requested value.

    Raises:
        KeyError: If ``match_code`` does not occur in the data
            (raised by ``GroupBy.get_group``).
    """
    # Use the caller-supplied code instead of a hard-coded match id so the
    # function actually honours its parameter.
    return ipl_df.groupby('match_code').get_group(match_code)



13 changes: 12 additions & 1 deletion q05_create_bowler_filter/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,18 @@
# %load q05_create_bowler_filter/build.py
# Default imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

# Solution
import pandas as pd
def create_bowler_filter(bowler):
    """Build a boolean mask selecting the rows bowled by ``bowler``.

    Args:
        bowler: Name to match against the ``bowler`` column of ``ipl_df``.

    Returns:
        pandas.Series: Boolean Series aligned with ``ipl_df``; ``True`` where
        the ``bowler`` column equals the requested name.
    """
    # Compare against the argument rather than a fixed name so the filter
    # works for any bowler; the column is already a Series, no re-wrap needed.
    return ipl_df['bowler'] == bowler



9 changes: 8 additions & 1 deletion q06_get_match_innings_runs/build.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,18 @@
# %load q06_get_match_innings_runs/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('data/ipl_dataset.csv')

# Solution

import numpy as np

def get_match_innings_runs():
    """Total the ``runs`` column for every (match, inning) pair.

    Returns:
        pandas.DataFrame: Indexed by ``match_code`` and ``inning``, with a
        single ``runs`` column holding the summed runs of each group.
    """
    innings_groups = ipl_df.groupby(['match_code', 'inning'])
    # The string alias 'sum' selects pandas' own group-wise sum; passing the
    # Python builtin ``sum`` is deprecated in recent pandas releases.
    return innings_groups.agg({'runs': 'sum'})


12 changes: 11 additions & 1 deletion q07_get_run_counts_by_match/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,17 @@
# %load q07_get_run_counts_by_match/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

# Solution
import pandas as pd

def get_runs_counts_by_match():
    """Pivot ``ipl_df`` into per-match counts broken down by ``runs`` value.

    The pivot uses ``match_code`` as the row index and ``runs`` as the column
    key with a ``count`` aggregation, then keeps only the first seven columns
    of the result.

    NOTE(review): no ``values`` argument is given, so the count presumably
    covers every remaining column; the first seven columns are assumed to be
    the per-run counts of a single value column - confirm against the dataset.

    Returns:
        pandas.DataFrame: The first seven columns of the pivot table.
    """
    counts_by_match = pd.pivot_table(
        ipl_df,
        index='match_code',
        columns='runs',
        aggfunc='count',
    )
    return counts_by_match.iloc[:, :7]