Professional Documents
Culture Documents
Association R: Appendix
Association R: Appendix
Association R
Clustering R
#*****************Clustering******************************
#import needed packages
library(dplyr)
library(FactoMineR)
library(ggplot2)
library(funModeling)
library(psych)
# Import the Kaggle mall-customers data ----
# NOTE(review): the path is absolute and machine-specific; point it at your own
# copy of Mall_Customers.csv before running this on another machine.
cluster <- read.csv(
  "C:/Users/khouloud.bennour/Desktop/R code/Mall_Customers.csv",
  sep = ","
)
# View() opens a spreadsheet-style viewer, which is only meaningful in an
# interactive session; skip it when the script is run in batch mode.
if (interactive()) {
  View(cluster)
}

# Data cleaning ----
str(cluster)
# Convert gender to a factor
cluster$Gender <- as.factor(cluster$Gender)
# Count missing values per column
colSums(is.na(cluster))
summary(cluster)

# Standardisation ----
# Centre and scale columns 4 and 5 so both contribute equally to distances.
# NOTE(review): presumably annual income and spending score -- confirm against
# the str() output above; selecting by position breaks if column order changes.
scaled <- scale(cluster[, c(4, 5)])
Classification R
#Import needed libraries
library(ggplot2)
library(gridExtra)
library(psych)
library(dplyr)
library(FactoMineR)
library(ggplot2)
library(funModeling)
library(caret)
library(rpart)
library(rpart.plot)
library("caret")
# Hold-out set ----
# Built first because every confusion matrix below reads `test`.
# NOTE(review): `data`, `train` and `train_ind` are not defined in this
# section -- presumably created earlier in the script; verify.
test <- data[-train_ind, ]

# Logistic regression ----
logit <- glm(Grade ~ ., data = train, family = "binomial")
summary(logit)
# Prediction: type = "response" returns fitted probabilities, which the
# confusion matrix below thresholds at 0.5.
predicted <- predict(logit, newdata = test, type = "response")
# Confusion matrix (predictions first, reference second)
confusionMatrix(
  as.factor(as.numeric(predicted > 0.5)),
  as.factor(test$Grade)
)

# KNN ----
model_knn <- train(Grade ~ ., data = train, method = "knn")
# Prediction
predicted <- predict(model_knn, test)
# Confusion matrix
confusionMatrix(predicted, test$Grade)

# Decision tree ----
# NOTE(review): the original section contained no model fit or prediction, so
# it re-scored the KNN predictions. A classification tree on the same formula
# is assumed to be what was intended -- confirm.
model_tree <- rpart(Grade ~ ., data = train, method = "class")
# Prediction: type = "class" returns predicted labels rather than probabilities
predicted <- predict(model_tree, test, type = "class")
# Confusion matrix (predictions first, reference second, as for KNN above)
confusionMatrix(predicted, test$Grade)