Professional Documents
Culture Documents
Satya772244@gmail Compdf
Satya772244@gmail Compdf
ipynb - Colaboratory
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
# Load the employee-attrition dataset directly from the YBI Foundation
# GitHub repository into a DataFrame.
# NOTE(review): the original line was cut off after "EmployeeAttrition";
# the ".csv" file name is a reconstruction — confirm against the repository.
attrition = pd.read_csv(
    'https://github.com/ybifoundation/Dataset/raw/main/EmployeeAttrition.csv'
)
# Preview the first rows to check that the load worked.
attrition.head()
1 49 No Travel_Frequently 279 Research & Development 8
2 37 Yes Travel_Rarely 1373 Research & Development 2
3 33 No Travel_Frequently 1392 Research & Development 3
4 27 No Travel_Rarely 591 Research & Development 2
5 rows × 35 columns
# Print a concise summary of the DataFrame.
attrition.info()
<class 'pandas.core.frame.DataFrame'>
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 1/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
# Summary statistics for the numeric columns (26 of them, per the output).
attrition.describe()
8 rows × 26 columns
# Count missing values per column; every column listed in the output reports 0.
attrition.isna().sum()
Age 0
Attrition 0
BusinessTravel 0
DailyRate 0
Department 0
DistanceFromHome 0
Education 0
EducationField 0
EmployeeCount 0
EmployeeNumber 0
EnvironmentSatisfaction 0
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 2/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
Gender 0
HourlyRate 0
JobInvolvement 0
JobLevel 0
JobRole 0
JobSatisfaction 0
MaritalStatus 0
MonthlyIncome 0
MonthlyRate 0
NumCompaniesWorked 0
Over18 0
OverTime 0
PercentSalaryHike 0
PerformanceRating 0
RelationshipSatisfaction 0
StandardHours 0
StockOptionLevel 0
TotalWorkingYears 0
TrainingTimesLastYear 0
WorkLifeBalance 0
YearsAtCompany 0
YearsInCurrentRole 0
YearsSinceLastPromotion 0
YearsWithCurrManager 0
dtype: int64
# Number of distinct values per column. In the output, EmployeeCount, Over18
# and StandardHours each have a single distinct value, and EmployeeNumber has
# 1470 distinct values.
attrition.nunique()
Age 43
Attrition 2
BusinessTravel 3
DailyRate 886
Department 3
DistanceFromHome 29
Education 5
EducationField 6
EmployeeCount 1
EmployeeNumber 1470
EnvironmentSatisfaction 4
Gender 2
HourlyRate 71
JobInvolvement 4
JobLevel 5
JobRole 9
JobSatisfaction 4
MaritalStatus 3
MonthlyIncome 1349
MonthlyRate 1427
NumCompaniesWorked 10
Over18 1
OverTime 2
PercentSalaryHike 15
PerformanceRating 2
RelationshipSatisfaction 4
StandardHours 1
StockOptionLevel 4
TotalWorkingYears 40
TrainingTimesLastYear 7
WorkLifeBalance 4
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 3/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
YearsAtCompany 37
YearsInCurrentRole 19
YearsSinceLastPromotion 16
YearsWithCurrManager 18
dtype: int64
# Plot pairwise relationships between the DataFrame's numeric columns.
# NOTE(review): describe() reports 26 numeric columns, so this is a large
# grid of subplots and may be slow to render.
sns.pairplot(attrition)
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 4/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
<seaborn.axisgrid.PairGrid at 0x7f96303e11d0>
# List the column names, used to write out the feature list by hand.
attrition.columns
'YearsWithCurrManager'],
dtype='object')
# Target: the 'Attrition' label column.
y = attrition.loc[:, 'Attrition']

# Features: 26 columns selected by name.
# NOTE(review): per the nunique() output, EmployeeCount and StandardHours have
# a single distinct value and EmployeeNumber has 1470 distinct values (looks
# like a row identifier) — confirm these are wanted as model inputs.
X = attrition.loc[:, [
    'Age',
    'DailyRate',
    'DistanceFromHome',
    'Education',
    'EmployeeCount',
    'EmployeeNumber',
    'EnvironmentSatisfaction',
    'HourlyRate',
    'JobInvolvement',
    'JobLevel',
    'JobSatisfaction',
    'MonthlyIncome',
    'MonthlyRate',
    'NumCompaniesWorked',
    'PercentSalaryHike',
    'PerformanceRating',
    'RelationshipSatisfaction',
    'StandardHours',
    'StockOptionLevel',
    'TotalWorkingYears',
    'TrainingTimesLastYear',
    'WorkLifeBalance',
    'YearsAtCompany',
    'YearsInCurrentRole',
    'YearsSinceLastPromotion',
    'YearsWithCurrManager',
]]
from sklearn.model_selection import train_test_split
# Split features and target into train and test parts; the fixed seed makes
# the split repeatable.
# NOTE(review): train_size=0.30 trains on 30% of the rows and evaluates on the
# remaining 70% (the confusion matrix further down totals 1029 test rows) —
# confirm this is intended rather than test_size=0.30.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    train_size=0.30,
    random_state=2529,
)
# Show the shapes of the four parts as a sanity check.
tuple(part.shape for part in (X_train, X_test, y_train, y_test))
from sklearn.ensemble import RandomForestClassifier
# Random forest classifier with default hyper-parameters.
# The forest is seeded with the same value as the train/test split: without a
# random_state each fit builds different trees, so the accuracy and confusion
# matrix reported afterwards could not be reproduced.
model = RandomForestClassifier(random_state=2529)
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 5/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
# Fit the classifier on the training part of the split.
model.fit(X_train,y_train)
RandomForestClassifier()
# Predict the attrition label for every row of the held-out test part.
y_pred=model.predict(X_test)
from sklearn.metrics import accuracy_score,confusion_matrix,classification_report
# Fraction of test rows predicted correctly.
# NOTE(review): going by the confusion matrix below, 861 of the 1029 test rows
# fall in the first class, so always predicting that class would already score
# about 0.837 — accuracy alone says little here.
accuracy_score(y_test,y_pred)
0.8435374149659864
# Confusion matrix: rows are the true labels, columns the predicted labels.
# Presumably the label order is 'No', 'Yes' (sorted) — confirm.
confusion_matrix(y_test,y_pred)
array([[856, 5],
[156, 12]])
# Print per-class precision, recall and F1 for the test predictions.
print(classification_report(y_test,y_pred))
# Draw one random row from the full dataset to use as a demo input.
# No seed is passed, so a different row is picked on each run.
sample=attrition.sample()
sample
72 31 No Travel_Rarely 1082 Research & Development 1
1 rows × 35 columns
# Keep exactly the columns the model was trained on, in the same order.
# X.columns is read directly: going through X.describe() computes summary
# statistics only to obtain the column names, and it would silently drop any
# non-numeric feature column, leaving X_new out of step with X.
X_new = sample.loc[:, X.columns]
X_new
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 6/7
8/29/22, 11:07 PM Untitled7.ipynb - Colaboratory
72 31 1082 1 4 1 95
# Predict the attrition label for the sampled row.
# NOTE(review): the row was sampled from the full dataset, so it may be one
# the model was trained on.
model.predict(X_new)
1 rows × 26 columns
array(['No'], dtype=object)
https://colab.research.google.com/drive/1u09TB-hT0mvGYRTydvGBKX65XQRWRCEc#scrollTo=ecTMjB3IrXKD&printMode=true 7/7