# 01 Pima End To End Script
library(mlr)
# Read the training and test data sets from the working directory.
train <- read.csv(file = "01_pima.csv")
test <- read.csv(file = "01_pimaTest.csv")

# Per-column overview (mlr) of both data frames, taken before any recoding.
summarizeColumns(obj = train)
summarizeColumns(obj = test)

# Recode the response column `Y` as a factor in both data frames.
train$Y <- as.factor(x = train$Y)
test$Y <- as.factor(x = test$Y)

# Base R summaries of both data frames after the recoding.
summary(object = train)
summary(object = test)
###
## Essential step in the mlr package: wrap each data frame in a task so that
## the response variable is identified correctly.
## `Y` is the response column (converted to a factor above).
trainTask <- makeClassifTask(data = train, target = "Y")
testTask <- makeClassifTask(data = test, target = "Y")

## SOP
## 1. Make Learner
## 2. Train Learner with Task
## 3. Predict

## Method 1: Naive Bayes
nb.learner <- makeLearner("classif.naiveBayes")
nb.model <- train(nb.learner, trainTask)
nb.predict <- predict(nb.model, testTask)
calculateConfusionMatrix(nb.predict)

## Method 2: QDA
qda.learner <- makeLearner("classif.qda", predict.type = "response")
qda.model <- train(qda.learner, trainTask)
qda.predict <- predict(qda.model, testTask)
calculateConfusionMatrix(qda.predict)

## Method 3: Logistic Regression
logistic.learner <- makeLearner("classif.logreg", predict.type = "response")
logistic.model <- train(logistic.learner, trainTask)
logistic.predict <- predict(logistic.model, testTask)
calculateConfusionMatrix(logistic.predict)
## Method 4: CART
## Assumes `trainTask` and `testTask` (mlr classification tasks) already exist
## at this point in the script.
cart.learner <- makeLearner("classif.rpart", predict.type = "response")
cart.model <- train(cart.learner, trainTask)

## Something Extra
## Extract the underlying fitted model from the mlr wrapper, in case you need
## to plot the tree.
cartModel <- getLearnerModel(cart.model)
library(rpart.plot) # provides prp() for plotting the tree
prp(cartModel, extra = 2, roundint = FALSE)

# Make predictions on the test task and tabulate them.
cart.predict <- predict(cart.model, testTask)
calculateConfusionMatrix(cart.predict)
## Method 5: Random Forest
## Assumes `trainTask` and `testTask` (mlr classification tasks) already exist
## at this point in the script.
rf.learner <- makeLearner("classif.randomForest", predict.type = "response")
rf.model <- train(rf.learner, trainTask)
rf.predict <- predict(rf.model, testTask)
calculateConfusionMatrix(rf.predict)
## Method 6: SVM
## Assumes `trainTask` and `testTask` (mlr classification tasks) already exist
## at this point in the script.
ksvm.learner <- makeLearner("classif.ksvm", predict.type = "response")
ksvm.model <- train(ksvm.learner, trainTask)
ksvm.predict <- predict(ksvm.model, testTask)
calculateConfusionMatrix(ksvm.predict)
# Method 7: GBM
# Build the gbm learner; `distribution` is forwarded to the learner as a
# hyperparameter through makeLearner()'s `...`.
gbm.learner <- makeLearner(
  "classif.gbm",
  predict.type = "response",
  distribution = "bernoulli"
)

# Fit on the training task, then score the test task.
gbm.model <- train(gbm.learner, trainTask)
gbm.predict <- predict(gbm.model, testTask)

# Confusion matrix of the test-set predictions.
calculateConfusionMatrix(gbm.predict)
# Method 8: XGB
# Assumes `trainTask` and `testTask` (mlr classification tasks) already exist
# at this point in the script.
# NOTE(review): xgboost presumably needs all-numeric features -- confirm that
# the Pima columns satisfy this, and tune hyperparameters such as `nrounds`.
xgb.learner <- makeLearner("classif.xgboost", predict.type = "response")
xgb.model <- train(xgb.learner, trainTask)
xgb.predict <- predict(xgb.model, testTask)
calculateConfusionMatrix(xgb.predict)
# Method 9: knn
# Build the k-nearest-neighbour learner with class-label predictions.
knn.learner <- makeLearner("classif.knn", predict.type = "response")

# Fit on the training task, then score the test task.
knn.model <- train(knn.learner, trainTask)
knn.predict <- predict(knn.model, testTask)

# Confusion matrix of the test-set predictions.
calculateConfusionMatrix(knn.predict)