import pandas as pd
import matplotlib.pyplot as plt

# Load the HR dataset; the bare `df` renders the frame as notebook output.
df = pd.read_csv("HRDataset_v14.csv")
df

# Report the table's dimensions.
n_rows, n_cols = df.shape
print("The data has", n_rows, "rows and", n_cols, "columns.")

The data has 311 rows and 36 columns.

# List every column name available in the dataset.
print("Below are the columns of the data.")
df.columns

Below are the columns of the data.

Index(['Employee_Name', 'EmpID', 'MarriedID', 'MaritalStatusID', 'GenderID',
       'EmpStatusID', 'DeptID', 'PerfScoreID', 'FromDiversityJobFairID',
       'Salary', 'Termd', 'PositionID', 'Position', 'State', 'Zip', 'DOB',
       'Sex', 'MaritalDesc', 'CitizenDesc', 'HispanicLatino', 'RaceDesc',
       'DateofHire', 'DateofTermination', 'TermReason', 'EmploymentStatus',
       'Department', 'ManagerName', 'ManagerID', 'RecruitmentSource',
       'PerformanceScore', 'EngagementSurvey', 'EmpSatisfaction',
       'SpecialProjectsCount', 'LastPerformanceReview_Date', 'DaysLateLast30',
       'Absences'],
      dtype='object')

# Count missing values per column and keep only the columns that have any.
missing_per_column = df.isnull().sum()
missing_per_column[missing_per_column > 0]

DateofTermination    207
ManagerID              8
dtype: int64

# Inspect the rows whose ManagerID is missing.
missing_manager_id = df['ManagerID'].isnull()
df[missing_manager_id]

# Preview the identifying columns for Webster Butler's rows.
reports_to_butler = df['ManagerName'] == 'Webster Butler'
df.loc[
    reports_to_butler,
    ['Employee_Name', 'EmpID', 'ManagerName', 'ManagerID']
].head()

# Take the ID from the first Webster Butler row that has one and write it
# into the Webster Butler rows where it is missing.
butler_manager_id = df.loc[
    reports_to_butler & ~missing_manager_id, 'ManagerID'
].iloc[0]
df.loc[reports_to_butler & missing_manager_id, 'ManagerID'] = butler_manager_id

# Re-count missing values per column after the ManagerID fill.
missing_per_column = df.isnull().sum()
missing_per_column[missing_per_column > 0]

DateofTermination    207
dtype: int64

# Webster Butler's rows, to inspect their ManagerID values.
butler_rows = df['ManagerName'].eq('Webster Butler')
df.loc[
    butler_rows,
    ['Employee_Name', 'EmpID', 'ManagerName', 'ManagerID']
].head()

# First rows of the three termination-related columns.
termination_cols = ['Termd', 'TermReason', 'EmploymentStatus']
df[termination_cols].head()

# The same columns, restricted to rows flagged Termd == 1.
df.loc[df['Termd'].eq(1), termination_cols].head()

# Work on an independent copy of the rows flagged as terminated.
terminated = df.loc[df['Termd'].eq(1)].copy()

# Count of terminated employees per employment status, as a one-column frame.
status_counts = terminated['EmploymentStatus'].value_counts()
summary = status_counts.to_frame(name='count')

# Share of all terminations that each status represents.
summary['proportion'] = summary['count'].div(summary['count'].sum())
summary

# Horizontal bars of termination counts, smallest at the bottom.
ordered_counts = summary['count'].sort_values()
total = summary['count'].sum()
ax = ordered_counts.plot.barh()

# Label each bar with its share of all terminations.
for bar_pos, n_exits in enumerate(ordered_counts):
    pct = n_exits / total * 100
    ax.text(n_exits, bar_pos, f' {pct:.1f}%', va='center')

ax.set_xlabel('Number of Terminations')
ax.set_ylabel('')

Text(0, 0.5, '')

# Count terminated employees for every (reason, status) pair; pairs that
# never occur are shown as 0.
terminated_rows = df.loc[df['Termd'].eq(1)]
termination_table = pd.pivot_table(
    terminated_rows,
    index='TermReason',
    columns='EmploymentStatus',
    values='Termd',
    aggfunc='count',
    fill_value=0,
)

# Add a per-reason total and move it to the first column.
termination_table['Total'] = termination_table.sum(axis=1)
cols = ['Total', *termination_table.columns.drop('Total')]
termination_table = termination_table.loc[:, cols]
termination_table

# Each cluster lists the raw TermReason values that belong to it.
reasons_by_cluster = {
    "Career Growth & Mobility": [
        "Another position",
        "career change",
        "relocation out of area",
    ],
    "Compensation & Benefits": [
        "more money",
    ],
    "Work–Life Balance": [
        "hours",
        "unhappy",
    ],
    "Performance & Conduct": [
        "performance",
        "attendance",
        "no-call, no-show",
        "gross misconduct",
        "Fatal attraction",
        "Learned that he is a gangster",
    ],
    "Personal / Life Events": [
        "medical issues",
        "military",
        "maternity leave - did not return",
    ],
    "Education & Retirement": [
        "return to school",
        "retiring",
    ],
}

# Flatten to a reason -> cluster lookup.
termreason_cluster_map = {
    reason: cluster
    for cluster, reasons in reasons_by_cluster.items()
    for reason in reasons
}

# Reasons that are not in the lookup become NaN in the new column.
df["TermReasonCluster"] = df["TermReason"].map(termreason_cluster_map)

# Count terminated employees per cluster and employment status.
cluster_counts = (
    df[df["Termd"] == 1]
    .groupby(["TermReasonCluster", "EmploymentStatus"])
    .size()
    .unstack(fill_value=0)
)
clustered_table = cluster_counts.sort_values(
    by=["Voluntarily Terminated", "Terminated for Cause"],
    ascending=False,
)

# Add a per-cluster total and move it to the first column.
clustered_table["Total"] = clustered_table.sum(axis=1)
status_cols = [c for c in clustered_table.columns if c != "Total"]
cols = ["Total"] + status_cols
clustered_table = clustered_table[cols]
clustered_table

# Pie chart of each cluster's share of the "Total" termination counts.
fig, ax = plt.subplots(figsize=(7, 7))

ax.pie(
    clustered_table["Total"],
    labels=clustered_table.index,
    autopct="%1.1f%%",
    startangle=90,
)

ax.set_title("Distribution of Termination Reasons (Clustered)")
fig.tight_layout()
plt.show()

# Stacked bars of termination counts per cluster, split by employment status.
# "Total" is the row sum of the status columns, so it is left out here:
# stacking it on top of its own components would double every bar's height.
status_counts = clustered_table.drop(columns="Total", errors="ignore")
status_counts.plot(
    kind="bar",
    stacked=True,
    figsize=(10, 6)
)

plt.title("Termination Reasons by Cluster and Employment Status")
plt.xlabel("Termination Reason Cluster")
plt.ylabel("Number of Employees")
plt.xticks(rotation=45, ha="right")
plt.legend(title="Employment Status")
plt.tight_layout()
plt.show()

# Number of employees in each department.
df["Department"].value_counts()

Production              209
IT/IS                    50
Sales                    31
Software Engineering     11
Admin Offices             9
Executive Office          1
Name: Department, dtype: int64

# Headcount per department (all employees).
dept_headcount = (
    df.groupby("Department")
      .size()
      .rename("Total Employees")
)

# Terminated employees (Termd == 1) per department.
dept_terminations = (
    df[df["Termd"] == 1]
    .groupby("Department")
    .size()
    .rename("Terminations")
)

# A department with no terminations is absent from dept_terminations, so the
# concat leaves NaN there; replace it with 0.
dept_attrition = (
    pd.concat([dept_headcount, dept_terminations], axis=1)
    .fillna(0)
)

# The NaN fill leaves the counts as floats; cast back to whole numbers,
# matching how the manager-level table treats its "Terminations" column.
dept_attrition["Terminations"] = dept_attrition["Terminations"].astype(int)

# Fraction of each department's employees that were terminated.
dept_attrition["AttritionRate"] = (
    dept_attrition["Terminations"] / dept_attrition["Total Employees"]
)
dept_attrition = dept_attrition.sort_values(
    by="AttritionRate",
    ascending=False
)

dept_attrition

# AttritionRate is stored as a fraction (terminations / headcount); scale it
# to percent so the plotted values agree with the "(%)" axis label.
(dept_attrition["AttritionRate"] * 100).plot(
    kind="bar",
    figsize=(10, 6)
)

plt.title("Attrition Rate by Department")
plt.xlabel("Department")
plt.ylabel("Attrition Rate (%)")
plt.xticks(rotation=45, ha="right")
plt.tight_layout()
plt.show()

# Work on an independent copy of the rows flagged as terminated.
terminated = df.loc[df['Termd'].eq(1)].copy()

# Terminations per department, one column per employment status.
dept_status_sizes = terminated.groupby(['Department', 'EmploymentStatus']).size()
dept_split = dept_status_sizes.unstack(fill_value=0)

# Add a per-department total and move it to the first column.
dept_split["Total"] = dept_split.sum(axis=1)
cols = ["Total", *dept_split.columns.drop("Total")]
dept_split = dept_split.loc[:, cols]
dept_split

# Each status column as a share of the department's total terminations.
status_only = dept_split.drop(columns="Total")
dept_rate = status_only.div(dept_split["Total"], axis="index")
dept_rate

# Order departments by their for-cause share, highest first.
dept_prop_sorted = dept_rate.sort_values(
    by="Terminated for Cause", ascending=False
)

fig, ax = plt.subplots(figsize=(9, 5))

voluntary_share = dept_prop_sorted["Voluntarily Terminated"]
for_cause_share = dept_prop_sorted["Terminated for Cause"]

# Draw the voluntary share first, then start the for-cause bar where it ends.
ax.barh(dept_prop_sorted.index, voluntary_share)
ax.barh(dept_prop_sorted.index, for_cause_share, left=voluntary_share)

ax.set_xlabel("Share of Terminations")
ax.set_title("Voluntary vs Involuntary Termination Share by Department")
ax.set_xlim(0, 1)
ax.legend(["Voluntarily Terminated", "Terminated for Cause"])

# Force white background (important for reports)
ax.set_facecolor("white")
fig.set_facecolor("white")

fig.tight_layout()
plt.show()

# Number of employees listed under each manager name.
df["ManagerName"].value_counts()

Michael Albert        22
Elijiah Gray          22
Kissy Sullivan        22
Brannon Miller        22
Kelley Spirea         22
Ketsia Liebig         21
Webster Butler        21
David Stanley         21
Amy Dunn              21
Janet King            19
Simon Roup            17
Peter Monroe          14
John Smith            14
Lynn Daneault         13
Alex Sweetwater        9
Brian Champaigne       8
Jennifer Zamora        7
Brandon R. LeBlanc     7
Eric Dougall           4
Debra Houlihan         3
Board of Directors     2
Name: ManagerName, dtype: int64

# Number of employees listed under each ManagerID value.
df["ManagerID"].value_counts()

18.0    22
20.0    22
16.0    22
12.0    22
14.0    21
39.0    21
11.0    21
19.0    21
22.0    21
2.0     19
4.0     17
7.0     14
17.0    14
21.0    13
10.0     9
13.0     8
5.0      7
1.0      6
6.0      4
15.0     3
9.0      2
3.0      1
30.0     1
Name: ManagerID, dtype: int64

# Number of employees listed under each manager.
manager_team_size = df.groupby("ManagerName").size().rename("Team Size")

# Number of terminated employees (Termd == 1) listed under each manager.
manager_terminations = (
    df.loc[df["Termd"].eq(1)]
    .groupby("ManagerName")
    .size()
    .rename("Terminations")
)

# Managers with no terminations get NaN from the concat; fill with 0, restore
# integer counts, then compute the terminated fraction of each team.
manager_attrition = (
    pd.concat([manager_team_size, manager_terminations], axis=1)
    .fillna(0)
    .astype({"Terminations": int})
    .assign(**{"Attrition Rate": lambda t: t["Terminations"] / t["Team Size"]})
)

# Smallest team size kept in the ranked table below.
MIN_TEAM_SIZE = 1

large_enough = manager_attrition["Team Size"] >= MIN_TEAM_SIZE
manager_attrition_filtered = (
    manager_attrition.loc[large_enough]
    .sort_values("Attrition Rate", ascending=False)
)

manager_attrition_filtered

# "Attrition Rate" is stored as a fraction (terminations / team size); scale
# it to percent so the plotted values agree with the "(%)" axis label.
(manager_attrition_filtered["Attrition Rate"].sort_values() * 100).plot(
    kind="barh",
    figsize=(10, 6)
)

plt.title("Manager-Level Attrition Rate")
plt.xlabel("Attrition Rate (%)")
plt.ylabel("Manager Name")
plt.tight_layout()
plt.show()

# Work on an independent copy of the rows flagged as terminated.
terminated = df.loc[df['Termd'].eq(1)].copy()

# Terminations per manager, one column per employment status.
manager_status_sizes = terminated.groupby(['ManagerName', 'EmploymentStatus']).size()
manager_split = manager_status_sizes.unstack(fill_value=0)

# Keep managers with at least one termination.
exits_per_manager = manager_split.sum(axis=1)
manager_split = manager_split.loc[exits_per_manager >= 1]

# Each status as a share of the manager's terminations, most voluntary first.
manager_rate = manager_split.div(manager_split.sum(axis=1), axis=0)
manager_rate.sort_values(by='Voluntarily Terminated', ascending=False)

# Number of employees per PerfScoreID value.
df["PerfScoreID"].value_counts()

3    243
4     37
2     18
1     13
Name: PerfScoreID, dtype: int64

# Number of employees per PerformanceScore label.
df["PerformanceScore"].value_counts()

Fully Meets          243
Exceeds               37
Needs Improvement     18
PIP                   13
Name: PerformanceScore, dtype: int64

# Distinct PerformanceScore labels per PerfScoreID; a value above 1 means
# the same ID appears with more than one label.
df.groupby('PerfScoreID')['PerformanceScore'].nunique()

PerfScoreID
1    2
2    1
3    2
4    1
Name: PerformanceScore, dtype: int64

# Distinct PerfScoreID values per PerformanceScore label; a value above 1
# means the same label appears with more than one ID.
df.groupby('PerformanceScore')['PerfScoreID'].nunique()

PerformanceScore
Exceeds              1
Fully Meets          2
Needs Improvement    1
PIP                  2
Name: PerfScoreID, dtype: int64

# PerfScoreID values that appear with more than one PerformanceScore label.
problem_ids = (
    df.groupby('PerfScoreID')['PerformanceScore']
      .nunique()
      .loc[lambda x: x > 1]
      .index
)

# For those IDs, count rows per (ID, label), with the most common label first
# within each ID. The filter uses problem_ids rather than a hard-coded list so
# the breakdown always covers exactly the IDs found to be inconsistent.
(
    df[df['PerfScoreID'].isin(problem_ids)]
    .groupby(['PerfScoreID', 'PerformanceScore'])
    .size()
    .reset_index(name='count')
    .sort_values(['PerfScoreID', 'count'], ascending=[True, False])
)

# Rows with PerfScoreID 1 that carry the label 'Fully Meets' are relabelled 'PIP'.
id1_labelled_fully_meets = (
    df['PerfScoreID'].eq(1) & df['PerformanceScore'].eq('Fully Meets')
)
df.loc[id1_labelled_fully_meets, 'PerformanceScore'] = 'PIP'

# Rows with PerfScoreID 3 that carry the label 'PIP' are relabelled 'Fully Meets'.
id3_labelled_pip = df['PerfScoreID'].eq(3) & df['PerformanceScore'].eq('PIP')
df.loc[id3_labelled_pip, 'PerformanceScore'] = 'Fully Meets'

# Re-check the number of distinct PerformanceScore labels per PerfScoreID.
df.groupby('PerfScoreID')['PerformanceScore'].nunique()

PerfScoreID
1    1
2    1
3    1
4    1
Name: PerformanceScore, dtype: int64

# Employees and terminations for each (PerfScoreID, PerformanceScore) pair.
perf_counts = df.groupby(['PerfScoreID', 'PerformanceScore']).agg(
    total_employees=('EmpID', 'count'),
    terminations=('Termd', 'sum'),
)
perf_attrition = perf_counts.reset_index()

# Fraction of each group's employees that were terminated.
perf_attrition['attrition_rate'] = perf_attrition['terminations'].div(
    perf_attrition['total_employees']
)

# Order rows by PerfScoreID.
perf_attrition = perf_attrition.sort_values('PerfScoreID')
perf_attrition

# Line chart of attrition rate across performance labels, in table order.
fig, ax = plt.subplots(figsize=(8, 5))

ax.plot(
    perf_attrition['PerformanceScore'],
    perf_attrition['attrition_rate'],
    marker='o',
)

ax.set_xlabel('Performance Score')
ax.set_ylabel('Attrition Rate')
ax.set_title('Attrition Rate by Performance Level')

plt.show()

# Same rates as horizontal bars, ordered by ascending attrition rate.
perf_attrition_sorted = perf_attrition.sort_values('attrition_rate')

fig, ax = plt.subplots(figsize=(10, 6))

ax.barh(
    perf_attrition_sorted['PerformanceScore'],
    perf_attrition_sorted['attrition_rate'],
)

ax.set_xlabel('Attrition Rate')
ax.set_ylabel('Performance Score')
ax.set_title('Attrition Rate by Performance Level')

fig.tight_layout()
plt.show()

# Employee counts per performance label and employment status.
exit_by_perf = pd.crosstab(
    df['PerformanceScore'],
    df['EmploymentStatus'],
    values=df['EmpID'],
    aggfunc='count'
)
exit_by_perf

# Combinations with no employees come back as NaN; show them as 0, then put
# the rows in the same order as perf_attrition.
exit_by_perf = exit_by_perf.fillna(0)
exit_by_perf = exit_by_perf.loc[perf_attrition['PerformanceScore']]

# The chart is titled and labelled as exits, so the "Active" column (people
# who have not left) is excluded from the bars.
exit_by_perf.drop(columns='Active', errors='ignore').plot(
    kind='bar',
    figsize=(10, 6)
)

plt.xlabel('Performance Score')
plt.ylabel('Number of Exits')
plt.title('Exit Type by Performance Level')

plt.xticks(rotation=0)
plt.tight_layout()
plt.show()

# Share of each exit type within every performance label. Only rows flagged
# as terminated (Termd == 1) are used, so each bar is a proportion of exits,
# as the axis label says, rather than a proportion of all employees.
exited = df[df['Termd'] == 1]
exit_by_perf_prop = pd.crosstab(
    exited['PerformanceScore'],
    exited['EmploymentStatus'],
    normalize='index'
)

exit_by_perf_prop.plot(
    kind='bar',
    stacked=True,
    figsize=(10, 6)
)

plt.ylabel('Proportion of Exits')
plt.title('Exit Type Distribution by Performance Level')
plt.show()

# Number of employees per recruitment source.
df["RecruitmentSource"].value_counts()

Indeed                     87
LinkedIn                   76
Google Search              49
Employee Referral          31
Diversity Job Fair         29
CareerBuilder              23
Website                    13
Other                       2
On-line Web application     1
Name: RecruitmentSource, dtype: int64

# Occurrences of each employee name; a count above 1 would mean a repeated name.
df["Employee_Name"].value_counts()

Ndzi, Colombui        1
Bachiochi, Linda      1
Leach, Dallas         1
Voldemort, Lord       1
Hitchcock, Alfred     1
                     ..
Winthrop, Jordan      1
Clayton, Rick         1
Forrest, Alex         1
Lecter, Hannibal      1
Houlihan, Debra       1
Name: Employee_Name, Length: 311, dtype: int64

# Occurrences of each EmpID; a count above 1 would mean a repeated ID.
df["EmpID"].value_counts()

10239    1
10034    1
10027    1
10028    1
10029    1
        ..
10136    1
10137    1
10138    1
10139    1
10240    1
Name: EmpID, Length: 311, dtype: int64

# Hires and terminations per recruitment source.
hires_by_source = df.groupby('RecruitmentSource').agg(
    total_hires=('EmpID', 'count'),
    terminations=('Termd', 'sum'),
)
recruitment_attrition = hires_by_source.reset_index()

# Fraction of each source's hires that were terminated.
recruitment_attrition['Attrition Rate'] = recruitment_attrition['terminations'].div(
    recruitment_attrition['total_hires']
)

# Keep sources with at least 10 hires, highest attrition rate first.
has_enough_hires = recruitment_attrition['total_hires'] >= 10
recruitment_attrition = (
    recruitment_attrition.loc[has_enough_hires]
    .sort_values(by='Attrition Rate', ascending=False)
)
recruitment_attrition

# Horizontal bars of attrition rate per recruitment source, in table order.
fig, ax = plt.subplots(figsize=(10, 6))
ax.barh(
    recruitment_attrition['RecruitmentSource'],
    recruitment_attrition['Attrition Rate'],
)

ax.set_xlabel('Attrition Rate')
ax.set_ylabel('Recruitment Source')
ax.set_title('Attrition Rate by Recruitment Source')

plt.show()

# Employee counts per recruitment source and employment status.
source_status_counts = pd.crosstab(
    df['RecruitmentSource'],
    df['EmploymentStatus'],
    values=df['EmpID'],
    aggfunc='count',
)

# Empty combinations come back as NaN; show them as integer zeros.
recruitment_crosstab = source_status_counts.fillna(0).astype(int)

recruitment_crosstab

# Share of each exit type within every recruitment source. Only rows flagged
# as terminated (Termd == 1) are used, so the bars describe how people left,
# as the title says, rather than the status mix of all employees.
exited = df[df['Termd'] == 1]
exit_type = pd.crosstab(
    exited['RecruitmentSource'],
    exited['EmploymentStatus'],
    normalize='index'
)

exit_type.plot(
    kind='bar',
    stacked=True,
    figsize=(10, 6)
)

plt.ylabel('Proportion')
plt.title('Exit Type Distribution by Recruitment Source')
plt.show()

# Number of employees listed under each manager, with their average salary.
df.groupby('ManagerName').agg(
    EmpID=('EmpID', 'count'),
    Salary=('Salary', 'mean'),
)

# Average salary for each combination of performance score and engagement survey value.
salary_by_perf_and_engagement = df.groupby(["PerformanceScore", "EngagementSurvey"])["Salary"]
salary_by_perf_and_engagement.mean()

PerformanceScore  EngagementSurvey
Exceeds           3.60                 63353.0
                  3.70                170500.0
                  3.90                 57815.0
                  4.00                 52984.0
                  4.10                 63777.5
                                        ...   
PIP               2.33                 52674.0
                  2.40                 64021.0
                  3.00                 60515.0
                  3.20                 48513.0
                  4.30                 56991.0
Name: Salary, Length: 144, dtype: float64

EmploymentStatus	Terminated for Cause	Voluntarily Terminated
Department
Admin Offices	0.500000	0.500000
IT/IS	0.400000	0.600000
Production	0.096386	0.903614
Sales	0.400000	0.600000
Software Engineering	0.250000	0.750000

EmploymentStatus	Terminated for Cause	Voluntarily Terminated
ManagerName
Webster Butler	0.000000	1.000000
Peter Monroe	0.000000	1.000000
Brannon Miller	0.000000	1.000000
David Stanley	0.000000	1.000000
Debra Houlihan	0.000000	1.000000
Jennifer Zamora	0.000000	1.000000
Amy Dunn	0.000000	1.000000
Michael Albert	0.111111	0.888889
Elijiah Gray	0.125000	0.875000
Kissy Sullivan	0.166667	0.833333
Janet King	0.166667	0.833333
Ketsia Liebig	0.200000	0.800000
Alex Sweetwater	0.333333	0.666667
Kelley Spirea	0.333333	0.666667
John Smith	0.333333	0.666667
Brandon R. LeBlanc	0.500000	0.500000
Simon Roup	0.500000	0.500000
Lynn Daneault	1.000000	0.000000

Employee Attrition Analysis: Identifying Organizational and Managerial Drivers of Turnover¶

01 Data Preparation¶

Importing the Libraries and the Dataset¶

Handling Missing Data¶

02 Attrition Analysis¶

Analysis 1 — Common Reasons for Employee Termination¶

Analysis 2 — Department-Level Attrition Patterns¶

Analysis 3 — Attrition Patterns by Manager¶

Analysis 4 — Attrition Patterns by Performance Score¶

Analysis 5 — Attrition Patterns by Recruitment Source¶

Other Analyses¶

03 Recommendations and Improvements¶

Recommendations for the Human Resources Team¶

Improvements for the Project¶

	Employee_Name	EmpID	MarriedID	MaritalStatusID	GenderID	EmpStatusID	DeptID	PerfScoreID	FromDiversityJobFairID	Salary	...	ManagerName	ManagerID	RecruitmentSource	PerformanceScore	EngagementSurvey	EmpSatisfaction	SpecialProjectsCount	LastPerformanceReview_Date	DaysLateLast30	Absences
0	Adinolfi, Wilson K	10026	0	0	1	1	5	4	0	62506	...	Michael Albert	22.0	LinkedIn	Exceeds	4.60	5	0	1/17/2019	0	1
1	Ait Sidi, Karthikeyan	10084	1	1	1	5	3	3	0	104437	...	Simon Roup	4.0	Indeed	Fully Meets	4.96	3	6	2/24/2016	0	17
2	Akinkuolie, Sarah	10196	1	1	0	5	5	3	0	64955	...	Kissy Sullivan	20.0	LinkedIn	Fully Meets	3.02	3	0	5/15/2012	0	3
3	Alagbe,Trina	10088	1	1	0	1	5	3	0	64991	...	Elijiah Gray	16.0	Indeed	Fully Meets	4.84	5	0	1/3/2019	0	15
4	Anderson, Carol	10069	0	2	0	5	5	3	0	50825	...	Webster Butler	39.0	Google Search	Fully Meets	5.00	4	0	2/1/2016	0	2
...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...	...
306	Woodson, Jason	10135	0	0	1	1	5	3	0	65893	...	Kissy Sullivan	20.0	LinkedIn	Fully Meets	4.07	4	0	2/28/2019	0	13
307	Ybarra, Catherine	10301	0	0	0	5	5	1	0	48513	...	Brannon Miller	12.0	Google Search	PIP	3.20	2	0	9/2/2015	5	4
308	Zamora, Jennifer	10010	0	0	0	1	3	4	0	220450	...	Janet King	2.0	Employee Referral	Exceeds	4.60	5	6	2/21/2019	0	16
309	Zhou, Julia	10043	0	0	0	1	3	3	0	89292	...	Simon Roup	4.0	Employee Referral	Fully Meets	5.00	3	5	2/1/2019	0	11
310	Zima, Colleen	10271	0	4	0	1	5	3	0	45046	...	David Stanley	14.0	LinkedIn	Fully Meets	4.50	5	0	1/30/2019	0	2

	Employee_Name	EmpID	MarriedID	MaritalStatusID	GenderID	EmpStatusID	DeptID	PerfScoreID	Salary	...	ManagerName	ManagerID	RecruitmentSource	PerformanceScore	EngagementSurvey	EmpSatisfaction	LastPerformanceReview_Date	Absences
19	Becker, Scott	10277	0	0	1	3	5	3	53250	...	Webster Butler	NaN	LinkedIn	Fully Meets	4.20	4	1/11/2019	13
30	Buccheri, Joseph	10184	0	0	1	1	5	3	65288	...	Webster Butler	NaN	Google Search	Fully Meets	3.19	3	2/1/2019	9
44	Chang, Donovan E	10154	0	0	1	1	5	3	60380	...	Webster Butler	NaN	LinkedIn	Fully Meets	3.80	5	1/14/2019	4
88	Fancett, Nicole	10136	0	0	0	1	5	3	65902	...	Webster Butler	NaN	LinkedIn	Fully Meets	4.00	4	1/7/2019	7
135	Hutter, Rosalie	10214	0	3	0	2	5	3	64995	...	Webster Butler	NaN	Indeed	Fully Meets	4.50	3	2/14/2019	6
177	Manchester, Robyn	10077	1	1	0	2	5	3	62385	...	Webster Butler	NaN	LinkedIn	Fully Meets	5.00	3	1/21/2019	4
232	Rivera, Haley	10011	1	1	0	1	5	4	46738	...	Webster Butler	NaN	Google Search	Exceeds	4.36	5	2/11/2019	16
251	Sewkumar, Nori	10071	0	0	0	3	5	3	50923	...	Webster Butler	NaN	Google Search	Fully Meets	5.00	5	2/6/2019	14

	Termd	TermReason	EmploymentStatus
0	0	N/A-StillEmployed	Active
1	1	career change	Voluntarily Terminated
2	1	hours	Voluntarily Terminated
3	0	N/A-StillEmployed	Active
4	1	return to school	Voluntarily Terminated

	count	proportion
Voluntarily Terminated	88	0.846154
Terminated for Cause	16	0.153846

EmploymentStatus	Total	Terminated for Cause	Voluntarily Terminated
TermReason
Another position	20	0	20
Fatal attraction	1	1	0
Learned that he is a gangster	1	1	0
attendance	7	6	1
career change	9	0	9
gross misconduct	1	1	0
hours	8	0	8
maternity leave - did not return	3	0	3
medical issues	3	0	3
military	4	0	4
more money	11	0	11
no-call, no-show	4	4	0
performance	4	3	1
relocation out of area	5	0	5
retiring	4	0	4
return to school	5	0	5
unhappy	14	0	14

EmploymentStatus	Total	Terminated for Cause	Voluntarily Terminated
TermReasonCluster
Career Growth & Mobility	34	0	34
Work–Life Balance	22	0	22
Compensation & Benefits	11	0	11
Personal / Life Events	10	0	10
Education & Retirement	9	0	9
Performance & Conduct	18	16	2

	Total Employees	Terminations	AttritionRate
Production	209	83.0	0.397129
Software Engineering	11	4.0	0.363636
Admin Offices	9	2.0	0.222222
IT/IS	50	10.0	0.200000
Sales	31	5.0	0.161290
Executive Office	1	0.0	0.000000

	Team Size	Terminations	Attrition Rate
Webster Butler	21	13	0.619048
Amy Dunn	21	13	0.619048
Kissy Sullivan	22	12	0.545455
Simon Roup	17	8	0.470588
Michael Albert	22	9	0.409091
Elijiah Gray	22	8	0.363636
Debra Houlihan	3	1	0.333333
Alex Sweetwater	9	3	0.333333
Janet King	19	6	0.315789
David Stanley	21	6	0.285714
Brandon R. LeBlanc	7	2	0.285714
Kelley Spirea	22	6	0.272727
Brannon Miller	22	6	0.272727
Ketsia Liebig	21	5	0.238095
John Smith	14	3	0.214286
Jennifer Zamora	7	1	0.142857
Lynn Daneault	13	1	0.076923
Peter Monroe	14	1	0.071429
Eric Dougall	4	0	0.000000
Brian Champaigne	8	0	0.000000
Board of Directors	2	0	0.000000

	PerfScoreID	PerformanceScore	total_employees	terminations	attrition_rate
0	1	PIP	13	4	0.307692
1	2	Needs Improvement	18	10	0.555556
2	3	Fully Meets	243	82	0.337449
3	4	Exceeds	37	8	0.216216

EmploymentStatus	Active	Terminated for Cause	Voluntarily Terminated
PerformanceScore
Exceeds	29	1	7
Fully Meets	161	9	73
Needs Improvement	8	5	5
PIP	9	1	3

	RecruitmentSource	total_hires	terminations	Attrition Rate
3	Google Search	49	30	0.612245
1	Diversity Job Fair	29	16	0.551724
0	CareerBuilder	23	11	0.478261
4	Indeed	87	21	0.241379
5	LinkedIn	76	18	0.236842
2	Employee Referral	31	5	0.161290
8	Website	13	1	0.076923

	EmpID	Salary
ManagerName
Alex Sweetwater	9	98203.222222
Amy Dunn	21	57881.857143
Board of Directors	2	174675.500000
Brandon R. LeBlanc	7	64818.571429
Brannon Miller	22	60095.454545
Brian Champaigne	8	98319.750000
David Stanley	21	56938.571429
Debra Houlihan	3	69240.000000
Elijiah Gray	22	60635.954545
Eric Dougall	4	63188.750000
Janet King	19	94814.842105
Jennifer Zamora	7	136061.142857
John Smith	14	65350.428571
Kelley Spirea	22	58912.181818
Ketsia Liebig	21	56936.666667
Kissy Sullivan	22	57183.818182
Lynn Daneault	13	64482.538462
Michael Albert	22	58343.636364
Peter Monroe	14	73578.500000
Simon Roup	17	99331.411765
Webster Butler	21	57381.238095