diff --git a/Assignment2 pandas.ipynb b/Assignment2 pandas.ipynb new file mode 100644 index 0000000..9a08a8f --- /dev/null +++ b/Assignment2 pandas.ipynb @@ -0,0 +1,3138 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 80, + "metadata": {}, + "outputs": [], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "#%matplotlib notebook\n", + "%matplotlib inline" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "import the dataset into a dataframe" + ] + }, + { + "cell_type": "code", + "execution_count": 81, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
IdEmployeeNameJobTitleBasePayOvertimePayOtherPayBenefitsTotalPayTotalPayBenefitsYearNotesAgencyStatus
01NATHANIEL FORDGENERAL MANAGER-METROPOLITAN TRANSIT AUTHORITY167411.180.00400184.25NaN567595.43567595.432011NaNSan FranciscoNaN
12GARY JIMENEZCAPTAIN III (POLICE DEPARTMENT)155966.02245131.88137811.38NaN538909.28538909.282011NaNSan FranciscoNaN
23ALBERT PARDINICAPTAIN III (POLICE DEPARTMENT)212739.13106088.1816452.60NaN335279.91335279.912011NaNSan FranciscoNaN
34CHRISTOPHER CHONGWIRE ROPE CABLE MAINTENANCE MECHANIC77916.0056120.71198306.90NaN332343.61332343.612011NaNSan FranciscoNaN
45PATRICK GARDNERDEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT)134401.609737.00182234.59NaN326373.19326373.192011NaNSan FranciscoNaN
56DAVID SULLIVANASSISTANT DEPUTY CHIEF II118602.008601.00189082.74NaN316285.74316285.742011NaNSan FranciscoNaN
67ALSON LEEBATTALION CHIEF, (FIRE DEPARTMENT)92492.0189062.90134426.14NaN315981.05315981.052011NaNSan FranciscoNaN
78DAVID KUSHNERDEPUTY DIRECTOR OF INVESTMENTS256576.960.0051322.50NaN307899.46307899.462011NaNSan FranciscoNaN
89MICHAEL MORRISBATTALION CHIEF, (FIRE DEPARTMENT)176932.6486362.6840132.23NaN303427.55303427.552011NaNSan FranciscoNaN
910JOANNE HAYES-WHITECHIEF OF DEPARTMENT, (FIRE DEPARTMENT)285262.000.0017115.73NaN302377.73302377.732011NaNSan FranciscoNaN
1011ARTHUR KENNEYASSISTANT CHIEF OF DEPARTMENT, (FIRE DEPARTMENT)194999.3971344.8833149.90NaN299494.17299494.172011NaNSan FranciscoNaN
1112PATRICIA JACKSONCAPTAIN III (POLICE DEPARTMENT)99722.0087082.62110804.30NaN297608.92297608.922011NaNSan FranciscoNaN
1213EDWARD HARRINGTONEXECUTIVE CONTRACT EMPLOYEE294580.020.000.00NaN294580.02294580.022011NaNSan FranciscoNaN
1314JOHN MARTINDEPARTMENT HEAD V271329.030.0021342.59NaN292671.62292671.622011NaNSan FranciscoNaN
1415DAVID FRANKLINBATTALION CHIEF, (FIRE DEPARTMENT)174872.6474050.3037424.11NaN286347.05286347.052011NaNSan FranciscoNaN
1516RICHARD CORRIEACOMMANDER III, (POLICE DEPARTMENT)198778.0173478.2013957.65NaN286213.86286213.862011NaNSan FranciscoNaN
1617AMY HARTDEPARTMENT HEAD V268604.570.0016115.86NaN284720.43284720.432011NaNSan FranciscoNaN
1718SEBASTIAN WONGCAPTAIN, EMERGENCYCY MEDICAL SERVICES140546.87119397.2618625.08NaN278569.21278569.212011NaNSan FranciscoNaN
1819MARTY ROSSBATTALION CHIEF, (FIRE DEPARTMENT)168692.6369626.1238115.47NaN276434.22276434.222011NaNSan FranciscoNaN
1920ELLEN MOFFATTASSISTANT MEDICAL EXAMINER257510.59880.1616159.50NaN274550.25274550.252011NaNSan FranciscoNaN
2021VENUS AZARASSISTANT MEDICAL EXAMINER257510.480.0016679.79NaN274190.27274190.272011NaNSan FranciscoNaN
2122JUDY MELINEKASSISTANT MEDICAL EXAMINER257510.44377.2115883.56NaN273771.21273771.212011NaNSan FranciscoNaN
2223GEORGE GARCIACAPTAIN, FIRE SUPPRESSION140546.8893200.5839955.25NaN273702.71273702.712011NaNSan FranciscoNaN
2324VICTOR WYRSCHBATTALION CHIEF, (FIRE DEPARTMENT)168692.6377896.1424083.86NaN270672.63270672.632011NaNSan FranciscoNaN
2425JOSEPH DRISCOLLCAPTAIN, FIRE SUPPRESSION140546.8697868.7731909.28NaN270324.91270324.912011NaNSan FranciscoNaN
2526GREGORY SUHRCHIEF OF POLICE256470.410.0011522.18NaN267992.59267992.592011NaNSan FranciscoNaN
2627JOHN HANLEYCAPTAIN, FIRE SUPPRESSION92080.8040008.00133695.76NaN265784.56265784.562011NaNSan FranciscoNaN
2728RAYMOND GUZMANBATTALION CHIEF, (FIRE DEPARTMENT)168692.5980706.8816063.99NaN265463.46265463.462011NaNSan FranciscoNaN
2829DENISE SCHMITTDEPUTY CHIEF III (POLICE DEPARTMENT)261717.600.002357.00NaN264074.60264074.602011NaNSan FranciscoNaN
2930MONICA FIELDSDEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT)246225.600.0015140.54NaN261366.14261366.142011NaNSan FranciscoNaN
..........................................
148624148625Lorraine RosenthalSenior Clerk0.000.0012.890.0012.8912.892014NaNSan FranciscoNaN
148625148626Renato C GurionRegistered Nurse0.000.006.001.246.007.242014NaNSan FranciscoNaN
148626148627Paulet GainesAccount Clerk0.000.000.000.000.000.002014NaNSan FranciscoNaN
148627148628Brett A LundbergGeneral Laborer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148628148629Mark W McclureGeneral Laborer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148629148630Elizabeth IniguezTranscriber Typist0.000.000.000.000.000.002014NaNSan FranciscoNaN
148630148631Randy J KeysCarpenter0.000.000.000.000.000.002014NaNSan FranciscoNaN
148631148632Andre M JohnsonCommunications Dispatcher 10.000.000.000.000.000.002014NaNSan FranciscoNaN
148632148633Sharon D Owens-WebsterProtective Services Worker0.000.000.000.000.000.002014NaNSan FranciscoNaN
148633148634Edward FerdinandGeneral Laborer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148634148635David M TurnerTransit Car Cleaner0.000.000.000.000.000.002014NaNSan FranciscoNaN
148635148636James S KibblewhiteGeneral Laborer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148636148637Andrew J EnziArborist Technician0.000.000.000.000.000.002014NaNSan FranciscoNaN
148637148638Kadeshra D GreenTransit Fare Inspector0.000.000.000.000.000.002014NaNSan FranciscoNaN
148638148639Lennard B HutchinsonElectrician0.000.000.000.000.000.002014NaNSan FranciscoNaN
148639148640Richard A TalbertCustodian0.000.000.000.000.000.002014NaNSan FranciscoNaN
148640148641Charlene D MccullyParking Control Officer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148641148642Raphael Marquis GoinsMuseum Guard0.000.000.000.000.000.002014NaNSan FranciscoNaN
148642148643Dominic C MarquezSign Worker0.000.000.000.000.000.002014NaNSan FranciscoNaN
148643148644Kim BrewerParking Control Officer0.000.000.000.000.000.002014NaNSan FranciscoNaN
148644148645Randy D WinnStationary Eng, Sewage Plant0.000.000.000.000.000.002014NaNSan FranciscoNaN
148645148646Carolyn A WilsonHuman Services Technician0.000.000.000.000.000.002014NaNSan FranciscoNaN
148646148647Not providedNot providedNaNNaNNaNNaN0.000.002014NaNSan FranciscoNaN
148647148648Joann AndersonCommunications Dispatcher 20.000.000.000.000.000.002014NaNSan FranciscoNaN
148648148649Leon WalkerCustodian0.000.000.000.000.000.002014NaNSan FranciscoNaN
148649148650Roy I TilleryCustodian0.000.000.000.000.000.002014NaNSan FranciscoNaN
148650148651Not providedNot providedNaNNaNNaNNaN0.000.002014NaNSan FranciscoNaN
148651148652Not providedNot providedNaNNaNNaNNaN0.000.002014NaNSan FranciscoNaN
148652148653Not providedNot providedNaNNaNNaNNaN0.000.002014NaNSan FranciscoNaN
148653148654Joe LopezCounselor, Log Cabin Ranch0.000.00-618.130.00-618.13-618.132014NaNSan FranciscoNaN
\n", + "

148654 rows × 13 columns

\n", + "
" + ], + "text/plain": [ + " Id EmployeeName \\\n", + "0 1 NATHANIEL FORD \n", + "1 2 GARY JIMENEZ \n", + "2 3 ALBERT PARDINI \n", + "3 4 CHRISTOPHER CHONG \n", + "4 5 PATRICK GARDNER \n", + "5 6 DAVID SULLIVAN \n", + "6 7 ALSON LEE \n", + "7 8 DAVID KUSHNER \n", + "8 9 MICHAEL MORRIS \n", + "9 10 JOANNE HAYES-WHITE \n", + "10 11 ARTHUR KENNEY \n", + "11 12 PATRICIA JACKSON \n", + "12 13 EDWARD HARRINGTON \n", + "13 14 JOHN MARTIN \n", + "14 15 DAVID FRANKLIN \n", + "15 16 RICHARD CORRIEA \n", + "16 17 AMY HART \n", + "17 18 SEBASTIAN WONG \n", + "18 19 MARTY ROSS \n", + "19 20 ELLEN MOFFATT \n", + "20 21 VENUS AZAR \n", + "21 22 JUDY MELINEK \n", + "22 23 GEORGE GARCIA \n", + "23 24 VICTOR WYRSCH \n", + "24 25 JOSEPH DRISCOLL \n", + "25 26 GREGORY SUHR \n", + "26 27 JOHN HANLEY \n", + "27 28 RAYMOND GUZMAN \n", + "28 29 DENISE SCHMITT \n", + "29 30 MONICA FIELDS \n", + "... ... ... \n", + "148624 148625 Lorraine Rosenthal \n", + "148625 148626 Renato C Gurion \n", + "148626 148627 Paulet Gaines \n", + "148627 148628 Brett A Lundberg \n", + "148628 148629 Mark W Mcclure \n", + "148629 148630 Elizabeth Iniguez \n", + "148630 148631 Randy J Keys \n", + "148631 148632 Andre M Johnson \n", + "148632 148633 Sharon D Owens-Webster \n", + "148633 148634 Edward Ferdinand \n", + "148634 148635 David M Turner \n", + "148635 148636 James S Kibblewhite \n", + "148636 148637 Andrew J Enzi \n", + "148637 148638 Kadeshra D Green \n", + "148638 148639 Lennard B Hutchinson \n", + "148639 148640 Richard A Talbert \n", + "148640 148641 Charlene D Mccully \n", + "148641 148642 Raphael Marquis Goins \n", + "148642 148643 Dominic C Marquez \n", + "148643 148644 Kim Brewer \n", + "148644 148645 Randy D Winn \n", + "148645 148646 Carolyn A Wilson \n", + "148646 148647 Not provided \n", + "148647 148648 Joann Anderson \n", + "148648 148649 Leon Walker \n", + "148649 148650 Roy I Tillery \n", + "148650 148651 Not provided \n", + "148651 148652 Not provided \n", + "148652 148653 Not provided 
\n", + "148653 148654 Joe Lopez \n", + "\n", + " JobTitle BasePay \\\n", + "0 GENERAL MANAGER-METROPOLITAN TRANSIT AUTHORITY 167411.18 \n", + "1 CAPTAIN III (POLICE DEPARTMENT) 155966.02 \n", + "2 CAPTAIN III (POLICE DEPARTMENT) 212739.13 \n", + "3 WIRE ROPE CABLE MAINTENANCE MECHANIC 77916.00 \n", + "4 DEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT) 134401.60 \n", + "5 ASSISTANT DEPUTY CHIEF II 118602.00 \n", + "6 BATTALION CHIEF, (FIRE DEPARTMENT) 92492.01 \n", + "7 DEPUTY DIRECTOR OF INVESTMENTS 256576.96 \n", + "8 BATTALION CHIEF, (FIRE DEPARTMENT) 176932.64 \n", + "9 CHIEF OF DEPARTMENT, (FIRE DEPARTMENT) 285262.00 \n", + "10 ASSISTANT CHIEF OF DEPARTMENT, (FIRE DEPARTMENT) 194999.39 \n", + "11 CAPTAIN III (POLICE DEPARTMENT) 99722.00 \n", + "12 EXECUTIVE CONTRACT EMPLOYEE 294580.02 \n", + "13 DEPARTMENT HEAD V 271329.03 \n", + "14 BATTALION CHIEF, (FIRE DEPARTMENT) 174872.64 \n", + "15 COMMANDER III, (POLICE DEPARTMENT) 198778.01 \n", + "16 DEPARTMENT HEAD V 268604.57 \n", + "17 CAPTAIN, EMERGENCYCY MEDICAL SERVICES 140546.87 \n", + "18 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.63 \n", + "19 ASSISTANT MEDICAL EXAMINER 257510.59 \n", + "20 ASSISTANT MEDICAL EXAMINER 257510.48 \n", + "21 ASSISTANT MEDICAL EXAMINER 257510.44 \n", + "22 CAPTAIN, FIRE SUPPRESSION 140546.88 \n", + "23 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.63 \n", + "24 CAPTAIN, FIRE SUPPRESSION 140546.86 \n", + "25 CHIEF OF POLICE 256470.41 \n", + "26 CAPTAIN, FIRE SUPPRESSION 92080.80 \n", + "27 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.59 \n", + "28 DEPUTY CHIEF III (POLICE DEPARTMENT) 261717.60 \n", + "29 DEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT) 246225.60 \n", + "... ... ... 
\n", + "148624 Senior Clerk 0.00 \n", + "148625 Registered Nurse 0.00 \n", + "148626 Account Clerk 0.00 \n", + "148627 General Laborer 0.00 \n", + "148628 General Laborer 0.00 \n", + "148629 Transcriber Typist 0.00 \n", + "148630 Carpenter 0.00 \n", + "148631 Communications Dispatcher 1 0.00 \n", + "148632 Protective Services Worker 0.00 \n", + "148633 General Laborer 0.00 \n", + "148634 Transit Car Cleaner 0.00 \n", + "148635 General Laborer 0.00 \n", + "148636 Arborist Technician 0.00 \n", + "148637 Transit Fare Inspector 0.00 \n", + "148638 Electrician 0.00 \n", + "148639 Custodian 0.00 \n", + "148640 Parking Control Officer 0.00 \n", + "148641 Museum Guard 0.00 \n", + "148642 Sign Worker 0.00 \n", + "148643 Parking Control Officer 0.00 \n", + "148644 Stationary Eng, Sewage Plant 0.00 \n", + "148645 Human Services Technician 0.00 \n", + "148646 Not provided NaN \n", + "148647 Communications Dispatcher 2 0.00 \n", + "148648 Custodian 0.00 \n", + "148649 Custodian 0.00 \n", + "148650 Not provided NaN \n", + "148651 Not provided NaN \n", + "148652 Not provided NaN \n", + "148653 Counselor, Log Cabin Ranch 0.00 \n", + "\n", + " OvertimePay OtherPay Benefits TotalPay TotalPayBenefits Year \\\n", + "0 0.00 400184.25 NaN 567595.43 567595.43 2011 \n", + "1 245131.88 137811.38 NaN 538909.28 538909.28 2011 \n", + "2 106088.18 16452.60 NaN 335279.91 335279.91 2011 \n", + "3 56120.71 198306.90 NaN 332343.61 332343.61 2011 \n", + "4 9737.00 182234.59 NaN 326373.19 326373.19 2011 \n", + "5 8601.00 189082.74 NaN 316285.74 316285.74 2011 \n", + "6 89062.90 134426.14 NaN 315981.05 315981.05 2011 \n", + "7 0.00 51322.50 NaN 307899.46 307899.46 2011 \n", + "8 86362.68 40132.23 NaN 303427.55 303427.55 2011 \n", + "9 0.00 17115.73 NaN 302377.73 302377.73 2011 \n", + "10 71344.88 33149.90 NaN 299494.17 299494.17 2011 \n", + "11 87082.62 110804.30 NaN 297608.92 297608.92 2011 \n", + "12 0.00 0.00 NaN 294580.02 294580.02 2011 \n", + "13 0.00 21342.59 NaN 292671.62 292671.62 2011 \n", + 
"14 74050.30 37424.11 NaN 286347.05 286347.05 2011 \n", + "15 73478.20 13957.65 NaN 286213.86 286213.86 2011 \n", + "16 0.00 16115.86 NaN 284720.43 284720.43 2011 \n", + "17 119397.26 18625.08 NaN 278569.21 278569.21 2011 \n", + "18 69626.12 38115.47 NaN 276434.22 276434.22 2011 \n", + "19 880.16 16159.50 NaN 274550.25 274550.25 2011 \n", + "20 0.00 16679.79 NaN 274190.27 274190.27 2011 \n", + "21 377.21 15883.56 NaN 273771.21 273771.21 2011 \n", + "22 93200.58 39955.25 NaN 273702.71 273702.71 2011 \n", + "23 77896.14 24083.86 NaN 270672.63 270672.63 2011 \n", + "24 97868.77 31909.28 NaN 270324.91 270324.91 2011 \n", + "25 0.00 11522.18 NaN 267992.59 267992.59 2011 \n", + "26 40008.00 133695.76 NaN 265784.56 265784.56 2011 \n", + "27 80706.88 16063.99 NaN 265463.46 265463.46 2011 \n", + "28 0.00 2357.00 NaN 264074.60 264074.60 2011 \n", + "29 0.00 15140.54 NaN 261366.14 261366.14 2011 \n", + "... ... ... ... ... ... ... \n", + "148624 0.00 12.89 0.00 12.89 12.89 2014 \n", + "148625 0.00 6.00 1.24 6.00 7.24 2014 \n", + "148626 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148627 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148628 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148629 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148630 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148631 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148632 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148633 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148634 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148635 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148636 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148637 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148638 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148639 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148640 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148641 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148642 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148643 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148644 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148645 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148646 NaN NaN NaN 0.00 0.00 2014 \n", + "148647 0.00 0.00 0.00 
0.00 0.00 2014 \n", + "148648 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148649 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148650 NaN NaN NaN 0.00 0.00 2014 \n", + "148651 NaN NaN NaN 0.00 0.00 2014 \n", + "148652 NaN NaN NaN 0.00 0.00 2014 \n", + "148653 0.00 -618.13 0.00 -618.13 -618.13 2014 \n", + "\n", + " Notes Agency Status \n", + "0 NaN San Francisco NaN \n", + "1 NaN San Francisco NaN \n", + "2 NaN San Francisco NaN \n", + "3 NaN San Francisco NaN \n", + "4 NaN San Francisco NaN \n", + "5 NaN San Francisco NaN \n", + "6 NaN San Francisco NaN \n", + "7 NaN San Francisco NaN \n", + "8 NaN San Francisco NaN \n", + "9 NaN San Francisco NaN \n", + "10 NaN San Francisco NaN \n", + "11 NaN San Francisco NaN \n", + "12 NaN San Francisco NaN \n", + "13 NaN San Francisco NaN \n", + "14 NaN San Francisco NaN \n", + "15 NaN San Francisco NaN \n", + "16 NaN San Francisco NaN \n", + "17 NaN San Francisco NaN \n", + "18 NaN San Francisco NaN \n", + "19 NaN San Francisco NaN \n", + "20 NaN San Francisco NaN \n", + "21 NaN San Francisco NaN \n", + "22 NaN San Francisco NaN \n", + "23 NaN San Francisco NaN \n", + "24 NaN San Francisco NaN \n", + "25 NaN San Francisco NaN \n", + "26 NaN San Francisco NaN \n", + "27 NaN San Francisco NaN \n", + "28 NaN San Francisco NaN \n", + "29 NaN San Francisco NaN \n", + "... ... ... ... 
\n", + "148624 NaN San Francisco NaN \n", + "148625 NaN San Francisco NaN \n", + "148626 NaN San Francisco NaN \n", + "148627 NaN San Francisco NaN \n", + "148628 NaN San Francisco NaN \n", + "148629 NaN San Francisco NaN \n", + "148630 NaN San Francisco NaN \n", + "148631 NaN San Francisco NaN \n", + "148632 NaN San Francisco NaN \n", + "148633 NaN San Francisco NaN \n", + "148634 NaN San Francisco NaN \n", + "148635 NaN San Francisco NaN \n", + "148636 NaN San Francisco NaN \n", + "148637 NaN San Francisco NaN \n", + "148638 NaN San Francisco NaN \n", + "148639 NaN San Francisco NaN \n", + "148640 NaN San Francisco NaN \n", + "148641 NaN San Francisco NaN \n", + "148642 NaN San Francisco NaN \n", + "148643 NaN San Francisco NaN \n", + "148644 NaN San Francisco NaN \n", + "148645 NaN San Francisco NaN \n", + "148646 NaN San Francisco NaN \n", + "148647 NaN San Francisco NaN \n", + "148648 NaN San Francisco NaN \n", + "148649 NaN San Francisco NaN \n", + "148650 NaN San Francisco NaN \n", + "148651 NaN San Francisco NaN \n", + "148652 NaN San Francisco NaN \n", + "148653 NaN San Francisco NaN \n", + "\n", + "[148654 rows x 13 columns]" + ] + }, + "execution_count": 81, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df=pd.read_csv('Salaries.csv')\n", + "df\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display the column names" + ] + }, + { + "cell_type": "code", + "execution_count": 82, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Index(['Id', 'EmployeeName', 'JobTitle', 'BasePay', 'OvertimePay', 'OtherPay',\n", + " 'Benefits', 'TotalPay', 'TotalPayBenefits', 'Year', 'Notes', 'Agency',\n", + " 'Status'],\n", + " dtype='object')" + ] + }, + "execution_count": 82, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.columns\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display the number of rows and cols" + ] + }, 
+ { + "cell_type": "code", + "execution_count": 83, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(148654, 13)" + ] + }, + "execution_count": 83, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.shape\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display the dataframe info (types of data in columns and not null values etc.)" + ] + }, + { + "cell_type": "code", + "execution_count": 84, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + "RangeIndex: 148654 entries, 0 to 148653\n", + "Data columns (total 13 columns):\n", + "Id 148654 non-null int64\n", + "EmployeeName 148654 non-null object\n", + "JobTitle 148654 non-null object\n", + "BasePay 148045 non-null float64\n", + "OvertimePay 148650 non-null float64\n", + "OtherPay 148650 non-null float64\n", + "Benefits 112491 non-null float64\n", + "TotalPay 148654 non-null float64\n", + "TotalPayBenefits 148654 non-null float64\n", + "Year 148654 non-null int64\n", + "Notes 0 non-null float64\n", + "Agency 148654 non-null object\n", + "Status 0 non-null float64\n", + "dtypes: float64(8), int64(2), object(3)\n", + "memory usage: 14.7+ MB\n" + ] + } + ], + "source": [ + "df.info()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display stats of the dataframe like count, mean, std, max, 25% etc....." + ] + }, + { + "cell_type": "code", + "execution_count": 85, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
IdBasePayOvertimePayOtherPayBenefitsTotalPayTotalPayBenefitsYearNotesStatus
count148654.000000148045.000000148650.000000148650.000000112491.000000148654.000000148654.000000148654.0000000.00.0
mean74327.50000066325.4488405066.0598863648.76729725007.89315174768.32197293692.5548112012.522643NaNNaN
std42912.85779542764.63549511454.3805598056.60186615402.21585850517.00527462793.5334831.117538NaNNaN
min1.000000-166.010000-0.010000-7058.590000-33.890000-618.130000-618.1300002011.000000NaNNaN
25%37164.25000033588.2000000.0000000.00000011535.39500036168.99500044065.6500002012.000000NaNNaN
50%74327.50000065007.4500000.000000811.27000028628.62000071426.61000092404.0900002013.000000NaNNaN
75%111490.75000094691.0500004658.1750004236.06500035566.855000105839.135000132876.4500002014.000000NaNNaN
max148654.000000319275.010000245131.880000400184.25000096570.660000567595.430000567595.4300002014.000000NaNNaN
\n", + "
" + ], + "text/plain": [ + " Id BasePay OvertimePay OtherPay \\\n", + "count 148654.000000 148045.000000 148650.000000 148650.000000 \n", + "mean 74327.500000 66325.448840 5066.059886 3648.767297 \n", + "std 42912.857795 42764.635495 11454.380559 8056.601866 \n", + "min 1.000000 -166.010000 -0.010000 -7058.590000 \n", + "25% 37164.250000 33588.200000 0.000000 0.000000 \n", + "50% 74327.500000 65007.450000 0.000000 811.270000 \n", + "75% 111490.750000 94691.050000 4658.175000 4236.065000 \n", + "max 148654.000000 319275.010000 245131.880000 400184.250000 \n", + "\n", + " Benefits TotalPay TotalPayBenefits Year Notes \\\n", + "count 112491.000000 148654.000000 148654.000000 148654.000000 0.0 \n", + "mean 25007.893151 74768.321972 93692.554811 2012.522643 NaN \n", + "std 15402.215858 50517.005274 62793.533483 1.117538 NaN \n", + "min -33.890000 -618.130000 -618.130000 2011.000000 NaN \n", + "25% 11535.395000 36168.995000 44065.650000 2012.000000 NaN \n", + "50% 28628.620000 71426.610000 92404.090000 2013.000000 NaN \n", + "75% 35566.855000 105839.135000 132876.450000 2014.000000 NaN \n", + "max 96570.660000 567595.430000 567595.430000 2014.000000 NaN \n", + "\n", + " Status \n", + "count 0.0 \n", + "mean NaN \n", + "std NaN \n", + "min NaN \n", + "25% NaN \n", + "50% NaN \n", + "75% NaN \n", + "max NaN " + ] + }, + "execution_count": 85, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.describe()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display null values per column" + ] + }, + { + "cell_type": "code", + "execution_count": 86, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Id 0\n", + "EmployeeName 0\n", + "JobTitle 0\n", + "BasePay 609\n", + "OvertimePay 4\n", + "OtherPay 4\n", + "Benefits 36163\n", + "TotalPay 0\n", + "TotalPayBenefits 0\n", + "Year 0\n", + "Notes 148654\n", + "Agency 0\n", + "Status 148654\n", + "dtype: int64" + ] + }, + "execution_count": 86, + "metadata": 
{}, + "output_type": "execute_result" + } + ], + "source": [ + "df.isnull().sum()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "remove columns with all values as NaN" + ] + }, + { + "cell_type": "code", + "execution_count": 87, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " 
\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
IdEmployeeNameJobTitleBasePayOvertimePayOtherPayBenefitsTotalPayTotalPayBenefitsYearAgency
01NATHANIEL FORDGENERAL MANAGER-METROPOLITAN TRANSIT AUTHORITY167411.180.00400184.25NaN567595.43567595.432011San Francisco
12GARY JIMENEZCAPTAIN III (POLICE DEPARTMENT)155966.02245131.88137811.38NaN538909.28538909.282011San Francisco
23ALBERT PARDINICAPTAIN III (POLICE DEPARTMENT)212739.13106088.1816452.60NaN335279.91335279.912011San Francisco
34CHRISTOPHER CHONGWIRE ROPE CABLE MAINTENANCE MECHANIC77916.0056120.71198306.90NaN332343.61332343.612011San Francisco
45PATRICK GARDNERDEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT)134401.609737.00182234.59NaN326373.19326373.192011San Francisco
56DAVID SULLIVANASSISTANT DEPUTY CHIEF II118602.008601.00189082.74NaN316285.74316285.742011San Francisco
67ALSON LEEBATTALION CHIEF, (FIRE DEPARTMENT)92492.0189062.90134426.14NaN315981.05315981.052011San Francisco
78DAVID KUSHNERDEPUTY DIRECTOR OF INVESTMENTS256576.960.0051322.50NaN307899.46307899.462011San Francisco
89MICHAEL MORRISBATTALION CHIEF, (FIRE DEPARTMENT)176932.6486362.6840132.23NaN303427.55303427.552011San Francisco
910JOANNE HAYES-WHITECHIEF OF DEPARTMENT, (FIRE DEPARTMENT)285262.000.0017115.73NaN302377.73302377.732011San Francisco
1011ARTHUR KENNEYASSISTANT CHIEF OF DEPARTMENT, (FIRE DEPARTMENT)194999.3971344.8833149.90NaN299494.17299494.172011San Francisco
1112PATRICIA JACKSONCAPTAIN III (POLICE DEPARTMENT)99722.0087082.62110804.30NaN297608.92297608.922011San Francisco
1213EDWARD HARRINGTONEXECUTIVE CONTRACT EMPLOYEE294580.020.000.00NaN294580.02294580.022011San Francisco
1314JOHN MARTINDEPARTMENT HEAD V271329.030.0021342.59NaN292671.62292671.622011San Francisco
1415DAVID FRANKLINBATTALION CHIEF, (FIRE DEPARTMENT)174872.6474050.3037424.11NaN286347.05286347.052011San Francisco
1516RICHARD CORRIEACOMMANDER III, (POLICE DEPARTMENT)198778.0173478.2013957.65NaN286213.86286213.862011San Francisco
1617AMY HARTDEPARTMENT HEAD V268604.570.0016115.86NaN284720.43284720.432011San Francisco
1718SEBASTIAN WONGCAPTAIN, EMERGENCYCY MEDICAL SERVICES140546.87119397.2618625.08NaN278569.21278569.212011San Francisco
1819MARTY ROSSBATTALION CHIEF, (FIRE DEPARTMENT)168692.6369626.1238115.47NaN276434.22276434.222011San Francisco
1920ELLEN MOFFATTASSISTANT MEDICAL EXAMINER257510.59880.1616159.50NaN274550.25274550.252011San Francisco
2021VENUS AZARASSISTANT MEDICAL EXAMINER257510.480.0016679.79NaN274190.27274190.272011San Francisco
2122JUDY MELINEKASSISTANT MEDICAL EXAMINER257510.44377.2115883.56NaN273771.21273771.212011San Francisco
2223GEORGE GARCIACAPTAIN, FIRE SUPPRESSION140546.8893200.5839955.25NaN273702.71273702.712011San Francisco
2324VICTOR WYRSCHBATTALION CHIEF, (FIRE DEPARTMENT)168692.6377896.1424083.86NaN270672.63270672.632011San Francisco
2425JOSEPH DRISCOLLCAPTAIN, FIRE SUPPRESSION140546.8697868.7731909.28NaN270324.91270324.912011San Francisco
2526GREGORY SUHRCHIEF OF POLICE256470.410.0011522.18NaN267992.59267992.592011San Francisco
2627JOHN HANLEYCAPTAIN, FIRE SUPPRESSION92080.8040008.00133695.76NaN265784.56265784.562011San Francisco
2728RAYMOND GUZMANBATTALION CHIEF, (FIRE DEPARTMENT)168692.5980706.8816063.99NaN265463.46265463.462011San Francisco
2829DENISE SCHMITTDEPUTY CHIEF III (POLICE DEPARTMENT)261717.600.002357.00NaN264074.60264074.602011San Francisco
2930MONICA FIELDSDEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT)246225.600.0015140.54NaN261366.14261366.142011San Francisco
....................................
148624148625Lorraine RosenthalSenior Clerk0.000.0012.890.0012.8912.892014San Francisco
148625148626Renato C GurionRegistered Nurse0.000.006.001.246.007.242014San Francisco
148626148627Paulet GainesAccount Clerk0.000.000.000.000.000.002014San Francisco
148627148628Brett A LundbergGeneral Laborer0.000.000.000.000.000.002014San Francisco
148628148629Mark W McclureGeneral Laborer0.000.000.000.000.000.002014San Francisco
148629148630Elizabeth IniguezTranscriber Typist0.000.000.000.000.000.002014San Francisco
148630148631Randy J KeysCarpenter0.000.000.000.000.000.002014San Francisco
148631148632Andre M JohnsonCommunications Dispatcher 10.000.000.000.000.000.002014San Francisco
148632148633Sharon D Owens-WebsterProtective Services Worker0.000.000.000.000.000.002014San Francisco
148633148634Edward FerdinandGeneral Laborer0.000.000.000.000.000.002014San Francisco
148634148635David M TurnerTransit Car Cleaner0.000.000.000.000.000.002014San Francisco
148635148636James S KibblewhiteGeneral Laborer0.000.000.000.000.000.002014San Francisco
148636148637Andrew J EnziArborist Technician0.000.000.000.000.000.002014San Francisco
148637148638Kadeshra D GreenTransit Fare Inspector0.000.000.000.000.000.002014San Francisco
148638148639Lennard B HutchinsonElectrician0.000.000.000.000.000.002014San Francisco
148639148640Richard A TalbertCustodian0.000.000.000.000.000.002014San Francisco
148640148641Charlene D MccullyParking Control Officer0.000.000.000.000.000.002014San Francisco
148641148642Raphael Marquis GoinsMuseum Guard0.000.000.000.000.000.002014San Francisco
148642148643Dominic C MarquezSign Worker0.000.000.000.000.000.002014San Francisco
148643148644Kim BrewerParking Control Officer0.000.000.000.000.000.002014San Francisco
148644148645Randy D WinnStationary Eng, Sewage Plant0.000.000.000.000.000.002014San Francisco
148645148646Carolyn A WilsonHuman Services Technician0.000.000.000.000.000.002014San Francisco
148646148647Not providedNot providedNaNNaNNaNNaN0.000.002014San Francisco
148647148648Joann AndersonCommunications Dispatcher 20.000.000.000.000.000.002014San Francisco
148648148649Leon WalkerCustodian0.000.000.000.000.000.002014San Francisco
148649148650Roy I TilleryCustodian0.000.000.000.000.000.002014San Francisco
148650148651Not providedNot providedNaNNaNNaNNaN0.000.002014San Francisco
148651148652Not providedNot providedNaNNaNNaNNaN0.000.002014San Francisco
148652148653Not providedNot providedNaNNaNNaNNaN0.000.002014San Francisco
148653148654Joe LopezCounselor, Log Cabin Ranch0.000.00-618.130.00-618.13-618.132014San Francisco
\n", + "

148654 rows × 11 columns

\n", + "
" + ], + "text/plain": [ + " Id EmployeeName \\\n", + "0 1 NATHANIEL FORD \n", + "1 2 GARY JIMENEZ \n", + "2 3 ALBERT PARDINI \n", + "3 4 CHRISTOPHER CHONG \n", + "4 5 PATRICK GARDNER \n", + "5 6 DAVID SULLIVAN \n", + "6 7 ALSON LEE \n", + "7 8 DAVID KUSHNER \n", + "8 9 MICHAEL MORRIS \n", + "9 10 JOANNE HAYES-WHITE \n", + "10 11 ARTHUR KENNEY \n", + "11 12 PATRICIA JACKSON \n", + "12 13 EDWARD HARRINGTON \n", + "13 14 JOHN MARTIN \n", + "14 15 DAVID FRANKLIN \n", + "15 16 RICHARD CORRIEA \n", + "16 17 AMY HART \n", + "17 18 SEBASTIAN WONG \n", + "18 19 MARTY ROSS \n", + "19 20 ELLEN MOFFATT \n", + "20 21 VENUS AZAR \n", + "21 22 JUDY MELINEK \n", + "22 23 GEORGE GARCIA \n", + "23 24 VICTOR WYRSCH \n", + "24 25 JOSEPH DRISCOLL \n", + "25 26 GREGORY SUHR \n", + "26 27 JOHN HANLEY \n", + "27 28 RAYMOND GUZMAN \n", + "28 29 DENISE SCHMITT \n", + "29 30 MONICA FIELDS \n", + "... ... ... \n", + "148624 148625 Lorraine Rosenthal \n", + "148625 148626 Renato C Gurion \n", + "148626 148627 Paulet Gaines \n", + "148627 148628 Brett A Lundberg \n", + "148628 148629 Mark W Mcclure \n", + "148629 148630 Elizabeth Iniguez \n", + "148630 148631 Randy J Keys \n", + "148631 148632 Andre M Johnson \n", + "148632 148633 Sharon D Owens-Webster \n", + "148633 148634 Edward Ferdinand \n", + "148634 148635 David M Turner \n", + "148635 148636 James S Kibblewhite \n", + "148636 148637 Andrew J Enzi \n", + "148637 148638 Kadeshra D Green \n", + "148638 148639 Lennard B Hutchinson \n", + "148639 148640 Richard A Talbert \n", + "148640 148641 Charlene D Mccully \n", + "148641 148642 Raphael Marquis Goins \n", + "148642 148643 Dominic C Marquez \n", + "148643 148644 Kim Brewer \n", + "148644 148645 Randy D Winn \n", + "148645 148646 Carolyn A Wilson \n", + "148646 148647 Not provided \n", + "148647 148648 Joann Anderson \n", + "148648 148649 Leon Walker \n", + "148649 148650 Roy I Tillery \n", + "148650 148651 Not provided \n", + "148651 148652 Not provided \n", + "148652 148653 Not provided 
\n", + "148653 148654 Joe Lopez \n", + "\n", + " JobTitle BasePay \\\n", + "0 GENERAL MANAGER-METROPOLITAN TRANSIT AUTHORITY 167411.18 \n", + "1 CAPTAIN III (POLICE DEPARTMENT) 155966.02 \n", + "2 CAPTAIN III (POLICE DEPARTMENT) 212739.13 \n", + "3 WIRE ROPE CABLE MAINTENANCE MECHANIC 77916.00 \n", + "4 DEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT) 134401.60 \n", + "5 ASSISTANT DEPUTY CHIEF II 118602.00 \n", + "6 BATTALION CHIEF, (FIRE DEPARTMENT) 92492.01 \n", + "7 DEPUTY DIRECTOR OF INVESTMENTS 256576.96 \n", + "8 BATTALION CHIEF, (FIRE DEPARTMENT) 176932.64 \n", + "9 CHIEF OF DEPARTMENT, (FIRE DEPARTMENT) 285262.00 \n", + "10 ASSISTANT CHIEF OF DEPARTMENT, (FIRE DEPARTMENT) 194999.39 \n", + "11 CAPTAIN III (POLICE DEPARTMENT) 99722.00 \n", + "12 EXECUTIVE CONTRACT EMPLOYEE 294580.02 \n", + "13 DEPARTMENT HEAD V 271329.03 \n", + "14 BATTALION CHIEF, (FIRE DEPARTMENT) 174872.64 \n", + "15 COMMANDER III, (POLICE DEPARTMENT) 198778.01 \n", + "16 DEPARTMENT HEAD V 268604.57 \n", + "17 CAPTAIN, EMERGENCYCY MEDICAL SERVICES 140546.87 \n", + "18 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.63 \n", + "19 ASSISTANT MEDICAL EXAMINER 257510.59 \n", + "20 ASSISTANT MEDICAL EXAMINER 257510.48 \n", + "21 ASSISTANT MEDICAL EXAMINER 257510.44 \n", + "22 CAPTAIN, FIRE SUPPRESSION 140546.88 \n", + "23 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.63 \n", + "24 CAPTAIN, FIRE SUPPRESSION 140546.86 \n", + "25 CHIEF OF POLICE 256470.41 \n", + "26 CAPTAIN, FIRE SUPPRESSION 92080.80 \n", + "27 BATTALION CHIEF, (FIRE DEPARTMENT) 168692.59 \n", + "28 DEPUTY CHIEF III (POLICE DEPARTMENT) 261717.60 \n", + "29 DEPUTY CHIEF OF DEPARTMENT,(FIRE DEPARTMENT) 246225.60 \n", + "... ... ... 
\n", + "148624 Senior Clerk 0.00 \n", + "148625 Registered Nurse 0.00 \n", + "148626 Account Clerk 0.00 \n", + "148627 General Laborer 0.00 \n", + "148628 General Laborer 0.00 \n", + "148629 Transcriber Typist 0.00 \n", + "148630 Carpenter 0.00 \n", + "148631 Communications Dispatcher 1 0.00 \n", + "148632 Protective Services Worker 0.00 \n", + "148633 General Laborer 0.00 \n", + "148634 Transit Car Cleaner 0.00 \n", + "148635 General Laborer 0.00 \n", + "148636 Arborist Technician 0.00 \n", + "148637 Transit Fare Inspector 0.00 \n", + "148638 Electrician 0.00 \n", + "148639 Custodian 0.00 \n", + "148640 Parking Control Officer 0.00 \n", + "148641 Museum Guard 0.00 \n", + "148642 Sign Worker 0.00 \n", + "148643 Parking Control Officer 0.00 \n", + "148644 Stationary Eng, Sewage Plant 0.00 \n", + "148645 Human Services Technician 0.00 \n", + "148646 Not provided NaN \n", + "148647 Communications Dispatcher 2 0.00 \n", + "148648 Custodian 0.00 \n", + "148649 Custodian 0.00 \n", + "148650 Not provided NaN \n", + "148651 Not provided NaN \n", + "148652 Not provided NaN \n", + "148653 Counselor, Log Cabin Ranch 0.00 \n", + "\n", + " OvertimePay OtherPay Benefits TotalPay TotalPayBenefits Year \\\n", + "0 0.00 400184.25 NaN 567595.43 567595.43 2011 \n", + "1 245131.88 137811.38 NaN 538909.28 538909.28 2011 \n", + "2 106088.18 16452.60 NaN 335279.91 335279.91 2011 \n", + "3 56120.71 198306.90 NaN 332343.61 332343.61 2011 \n", + "4 9737.00 182234.59 NaN 326373.19 326373.19 2011 \n", + "5 8601.00 189082.74 NaN 316285.74 316285.74 2011 \n", + "6 89062.90 134426.14 NaN 315981.05 315981.05 2011 \n", + "7 0.00 51322.50 NaN 307899.46 307899.46 2011 \n", + "8 86362.68 40132.23 NaN 303427.55 303427.55 2011 \n", + "9 0.00 17115.73 NaN 302377.73 302377.73 2011 \n", + "10 71344.88 33149.90 NaN 299494.17 299494.17 2011 \n", + "11 87082.62 110804.30 NaN 297608.92 297608.92 2011 \n", + "12 0.00 0.00 NaN 294580.02 294580.02 2011 \n", + "13 0.00 21342.59 NaN 292671.62 292671.62 2011 \n", + 
"14 74050.30 37424.11 NaN 286347.05 286347.05 2011 \n", + "15 73478.20 13957.65 NaN 286213.86 286213.86 2011 \n", + "16 0.00 16115.86 NaN 284720.43 284720.43 2011 \n", + "17 119397.26 18625.08 NaN 278569.21 278569.21 2011 \n", + "18 69626.12 38115.47 NaN 276434.22 276434.22 2011 \n", + "19 880.16 16159.50 NaN 274550.25 274550.25 2011 \n", + "20 0.00 16679.79 NaN 274190.27 274190.27 2011 \n", + "21 377.21 15883.56 NaN 273771.21 273771.21 2011 \n", + "22 93200.58 39955.25 NaN 273702.71 273702.71 2011 \n", + "23 77896.14 24083.86 NaN 270672.63 270672.63 2011 \n", + "24 97868.77 31909.28 NaN 270324.91 270324.91 2011 \n", + "25 0.00 11522.18 NaN 267992.59 267992.59 2011 \n", + "26 40008.00 133695.76 NaN 265784.56 265784.56 2011 \n", + "27 80706.88 16063.99 NaN 265463.46 265463.46 2011 \n", + "28 0.00 2357.00 NaN 264074.60 264074.60 2011 \n", + "29 0.00 15140.54 NaN 261366.14 261366.14 2011 \n", + "... ... ... ... ... ... ... \n", + "148624 0.00 12.89 0.00 12.89 12.89 2014 \n", + "148625 0.00 6.00 1.24 6.00 7.24 2014 \n", + "148626 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148627 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148628 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148629 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148630 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148631 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148632 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148633 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148634 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148635 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148636 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148637 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148638 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148639 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148640 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148641 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148642 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148643 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148644 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148645 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148646 NaN NaN NaN 0.00 0.00 2014 \n", + "148647 0.00 0.00 0.00 
0.00 0.00 2014 \n", + "148648 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148649 0.00 0.00 0.00 0.00 0.00 2014 \n", + "148650 NaN NaN NaN 0.00 0.00 2014 \n", + "148651 NaN NaN NaN 0.00 0.00 2014 \n", + "148652 NaN NaN NaN 0.00 0.00 2014 \n", + "148653 0.00 -618.13 0.00 -618.13 -618.13 2014 \n", + "\n", + " Agency \n", + "0 San Francisco \n", + "1 San Francisco \n", + "2 San Francisco \n", + "3 San Francisco \n", + "4 San Francisco \n", + "5 San Francisco \n", + "6 San Francisco \n", + "7 San Francisco \n", + "8 San Francisco \n", + "9 San Francisco \n", + "10 San Francisco \n", + "11 San Francisco \n", + "12 San Francisco \n", + "13 San Francisco \n", + "14 San Francisco \n", + "15 San Francisco \n", + "16 San Francisco \n", + "17 San Francisco \n", + "18 San Francisco \n", + "19 San Francisco \n", + "20 San Francisco \n", + "21 San Francisco \n", + "22 San Francisco \n", + "23 San Francisco \n", + "24 San Francisco \n", + "25 San Francisco \n", + "26 San Francisco \n", + "27 San Francisco \n", + "28 San Francisco \n", + "29 San Francisco \n", + "... ... 
\n", + "148624 San Francisco \n", + "148625 San Francisco \n", + "148626 San Francisco \n", + "148627 San Francisco \n", + "148628 San Francisco \n", + "148629 San Francisco \n", + "148630 San Francisco \n", + "148631 San Francisco \n", + "148632 San Francisco \n", + "148633 San Francisco \n", + "148634 San Francisco \n", + "148635 San Francisco \n", + "148636 San Francisco \n", + "148637 San Francisco \n", + "148638 San Francisco \n", + "148639 San Francisco \n", + "148640 San Francisco \n", + "148641 San Francisco \n", + "148642 San Francisco \n", + "148643 San Francisco \n", + "148644 San Francisco \n", + "148645 San Francisco \n", + "148646 San Francisco \n", + "148647 San Francisco \n", + "148648 San Francisco \n", + "148649 San Francisco \n", + "148650 San Francisco \n", + "148651 San Francisco \n", + "148652 San Francisco \n", + "148653 San Francisco \n", + "\n", + "[148654 rows x 11 columns]" + ] + }, + "execution_count": 87, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dropna(how='all',axis=1)" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "display number of unique values in each column" + ] + }, + { + "cell_type": "code", + "execution_count": 88, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Id 148654\n", + "EmployeeName 110811\n", + "JobTitle 2159\n", + "BasePay 109489\n", + "OvertimePay 65998\n", + "OtherPay 83225\n", + "Benefits 98465\n", + "TotalPay 138486\n", + "TotalPayBenefits 142098\n", + "Year 4\n", + "Notes 0\n", + "Agency 1\n", + "Status 0\n", + "dtype: int64" + ] + }, + "execution_count": 88, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.nunique()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "mean of total pay of all people based on year" + ] + }, + { + "cell_type": "code", + "execution_count": 89, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "74768.32197169267" + ] + 
}, + "execution_count": 89, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.TotalPay.mean()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "how many people have 0 overtime pay" + ] + }, + { + "cell_type": "code", + "execution_count": 90, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "77321" + ] + }, + "execution_count": 90, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.OvertimePay.value_counts()[0]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "max, min, mean, median and other stats of TotalPay of people having 0 OvertimePay" + ] + }, + { + "cell_type": "code", + "execution_count": 91, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "count 77321.000000\n", + "mean 60229.348901\n", + "std 49307.912350\n", + "min -618.130000\n", + "25% 13290.450000\n", + "50% 58158.590000\n", + "75% 91115.090000\n", + "max 567595.430000\n", + "Name: TotalPay, dtype: float64" + ] + }, + "execution_count": 91, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df1=df[(df['OvertimePay']==0)]\n", + "df1[\"TotalPay\"].describe()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "find Id of that person with max TotalPay you got in previous question" + ] + }, + { + "cell_type": "code", + "execution_count": 92, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1" + ] + }, + "execution_count": 92, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df1[(df1['TotalPay']==df1['TotalPay'].max())].iloc[0,0]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "name of employee with total pay benefits = 87619.78" + ] + }, + { + "cell_type": "code", + "execution_count": 93, + "metadata": {}, + "outputs": [ + 
{ + "data": { + "text/plain": [ + "'REBECCA CHIU'" + ] + }, + "execution_count": 93, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[(df['TotalPay']==87619.78)].iloc[0,1]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "how many people have BasePay > 150000 and OvertimePay > 100000" + ] + }, + { + "cell_type": "code", + "execution_count": 94, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "12" + ] + }, + "execution_count": 94, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df[(df['BasePay']>150000) & (df[\"OvertimePay\"]>100000)].shape[0]" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "which job title generally has highest average TotalPayBenefits" + ] + }, + { + "cell_type": "code", + "execution_count": 95, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "Index(['Chief Investment Officer'], dtype='object', name='JobTitle')" + ] + }, + "execution_count": 95, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df3=df.groupby(\"JobTitle\").mean()\n", + "df3[(df3['TotalPayBenefits']==df3['TotalPayBenefits'].max())].index" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "How many employees are POLICE" + ] + }, + { + "cell_type": "code", + "execution_count": 100, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "2512" + ] + }, + "execution_count": 100, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "b=df[\"JobTitle\"]\n", + "a=b.str.contains(pat=\"POLICE\")\n", + "sum=0\n", + "for i in range(len(b)):\n", + " if a[i]==True:\n", + " sum=sum+1\n", + "sum" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + 
"execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.7.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +}