Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
10 changes: 8 additions & 2 deletions q01_read_csv_data_to_df/build.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,14 @@
# %load q01_read_csv_data_to_df/build.py
# Default Imports
import pandas as pd

# Path has been given to you already to use in function.
path = "data/ipl_dataset.csv"
path = 'data/ipl_dataset.csv'

def read_csv_data_to_df(path: str = 'data/ipl_dataset.csv') -> pd.DataFrame:
    """Load a CSV file into a pandas DataFrame.

    Args:
        path: Location of the CSV file to read. Defaults to the IPL
            dataset path used throughout this project.

    Returns:
        The DataFrame produced by ``pd.read_csv(path)`` with pandas'
        default parsing options.
    """
    # Named for what it holds rather than for the pandas function that built it.
    dataframe = pd.read_csv(path)
    return dataframe



# Solution

11 changes: 9 additions & 2 deletions q02_get_unique_values/build.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,13 @@
# %load q02_get_unique_values/build.py
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('data/ipl_dataset.csv')

def get_unique_venues():
    """Return the distinct values found in the 'venue' column of ``ipl_df``.

    Reads the module-level ``ipl_df`` DataFrame; takes no arguments.
    """
    return ipl_df['venue'].unique()




#Solution
11 changes: 9 additions & 2 deletions q03_get_run_counts/build.py
Original file line number Diff line number Diff line change
@@ -1,8 +1,15 @@
# %load q03_get_run_counts/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

def get_run_counts():
    """Return how many times each distinct 'runs' value occurs in ``ipl_df``.

    The result is whatever ``Series.value_counts()`` yields for the 'runs'
    column of the module-level ``ipl_df`` DataFrame.
    """
    return ipl_df['runs'].value_counts()




# Solution

14 changes: 12 additions & 2 deletions q04_get_match_specific_df/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,17 @@
# %load q04_get_match_specific_df/build.py
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

def get_match_specific_df(match_code):
    """Return the rows of ``ipl_df`` whose 'match_code' equals ``match_code``.

    Args:
        match_code: Value compared (with ``==``) against the 'match_code'
            column of the module-level ``ipl_df`` DataFrame.

    Returns:
        The subset of ``ipl_df`` selected by that boolean mask.
    """
    # Build the row mask inline and use it to index the full frame.
    return ipl_df[ipl_df['match_code'] == match_code]




# Solution

9 changes: 7 additions & 2 deletions q05_create_bowler_filter/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,12 @@
# %load q05_create_bowler_filter/build.py
# Default imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')

def create_bowler_filter(bowler):
    """Return a boolean mask marking rows of ``ipl_df`` bowled by ``bowler``.

    Args:
        bowler: Value compared (with ``==``) against the 'bowler' column of
            the module-level ``ipl_df`` DataFrame.

    Returns:
        The element-wise comparison result; it is not applied to the frame.
    """
    return ipl_df['bowler'] == bowler


# Solution
8 changes: 5 additions & 3 deletions q06_get_match_innings_runs/build.py
Original file line number Diff line number Diff line change
@@ -1,11 +1,13 @@
# %load q06_get_match_innings_runs/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

# You have been given dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("data/ipl_dataset.csv")

# Solution
ipl_df = read_csv_data_to_df('data/ipl_dataset.csv')

def get_match_innings_runs():
    """Return the summed 'runs' for every (match_code, inning) pair in ``ipl_df``.

    The double-bracket selection ``[['runs']]`` keeps the result a DataFrame
    with a single 'runs' column rather than a Series.
    """
    per_match_inning = ipl_df.groupby(['match_code', 'inning'])
    return per_match_inning[['runs']].sum()



13 changes: 11 additions & 2 deletions q07_get_run_counts_by_match/build.py
Original file line number Diff line number Diff line change
@@ -1,7 +1,16 @@
# %load q07_get_run_counts_by_match/build.py
# Default Imports
from greyatomlib.pandas_project.q01_read_csv_data_to_df.build import read_csv_data_to_df

import pandas as pd
import numpy as np
# You have been given the dataset already in 'ipl_df'.
ipl_df = read_csv_data_to_df("./data/ipl_dataset.csv")
ipl_df = read_csv_data_to_df('./data/ipl_dataset.csv')
def get_runs_counts_by_match():
    """Return a per-match table counting deliveries by their 'runs' value.

    Pivots the module-level ``ipl_df`` DataFrame so that each row is a
    'match_code' and each column is a distinct value of 'runs'.

    Returns:
        The pivot table. Each cell is the count of 'batsman' entries for
        that match_code/runs combination.
    """
    # 'batsman' is only the column being counted; with aggfunc='count' the
    # cells are occurrence counts, not runs scored.
    return ipl_df.pivot_table(
        values='batsman',
        index=['match_code'],
        columns='runs',
        aggfunc='count',
    )



# Solution