# Professional Documents
# Culture Documents
# 1. Key Drivers:
# 2. CODE RULES:
# Load the Scalene data set and convert its categorical columns to factors.

# Show the working directory; the relative CSV path below resolves against it.
getwd()
scalene.df <- read.csv("Dataset_of_Scalene.csv", header = TRUE)
str(scalene.df)

# Columns that are converted with as.factor() before modelling.
factor_cols <- c(
  "DOJ.Extended",
  "Offered.band",
  "Joining.Bonus",
  "Candidate.relocate.actual",
  "Gender",
  "Candidate.Source",
  "LOB",
  "Location",
  "Status"
)
scalene.df[factor_cols] <- lapply(scalene.df[factor_cols], as.factor)
# Split scalene.df 70/30 into training and test partitions, then fit a
# logistic regression of Status on all other columns using the training rows.
library(caTools)
set.seed(1)  # fixed seed so the random split is reproducible
# sample.split() returns a logical vector: TRUE marks a training row.
split_indices <- sample.split(scalene.df$Status, SplitRatio = 0.7)
train <- scalene.df[split_indices, ]
# The mask is logical, so the hold-out rows must be selected with `!`.
# Unary minus would coerce it to 0/-1 and merely drop the first row,
# leaving the "test" set overlapping the training set.
test <- scalene.df[!split_indices, ]
# Fit on `train` only so that `test` remains unseen by the model.
training_logit <- glm(
  Status ~ .,
  data = train,
  family = binomial(link = "logit")
)
summary(training_logit)
# Classification tree for Status: grow a tree on `train`, prune it, plot it,
# and compare predicted classes with the observed Status on both partitions.
library(rpart)
library(rpart.plot)  # provides prp()
library(caret)       # provides confusionMatrix()

# cp = 0 lets the tree grow without a complexity penalty; xval = 10 requests
# 10 cross-validations, whose results appear in the printcp() table.
r.ctrl <- rpart.control(minsplit = 50, minbucket = 10, cp = 0, xval = 10)
## calling the rpart function to build the tree
m1 <- rpart(Status ~ ., data = train, control = r.ctrl, method = "class")
printcp(m1)

# NOTE(review): the cp threshold is hard-coded, presumably read off the
# printcp() table above -- re-check it if the data, seed or split changes.
ptree <- prune(m1, cp = 0.00677966)
prp(ptree, type = 5)

# Predicted class labels from the pruned tree for each partition.
test$predict.class <- predict(ptree, test, type = "class")
train$predict.class <- predict(ptree, train, type = "class")

# Confusion matrices: predictions first, observed Status second.
conf <- confusionMatrix(test$predict.class, test$Status)
conf
confusin_training <- confusionMatrix(train$predict.class, train$Status)
confusin_training
# CONFUSION MATRIX:
# 3. INTERPRETATIONS: