Professional Documents
Culture Documents
A008 - KNN.R: # Load The Dataset
A008 - KNN.R: # Load The Dataset
A008 - KNN.R: # Load The Dataset
R
2024-04-09
# Load the dataset
data = read.csv("C:/Users/Bhushan Sapkar/Downloads/Breast Cancer
Wisconsin.csv")
## [1] 569 32
# Evaluate performance
train_accuracy = sum(knn(train_set[, -c(1, 2)], train_set[, -c(1, 2)], cl =
train_set$Diagnosis, k = k) == train_set$Diagnosis) / nrow(train_set)
test_accuracy = sum(knn_model == test_set$Diagnosis) / nrow(test_set)
## V3 V4 V5
## Min. : 43.79 Min. : 143.5 Min. :0.05263
## 1st Qu.: 75.17 1st Qu.: 420.3 1st Qu.:0.08637
## Median : 86.24 Median : 551.1 Median :0.09587
## Mean : 91.97 Mean : 654.9 Mean :0.09636
## 3rd Qu.:104.10 3rd Qu.: 782.7 3rd Qu.:0.10530
## Max. :188.50 Max. :2501.0 Max. :0.16340
# Evaluate performance
train_accuracy1 = sum(knn(train_set1[, -c(1, 2)], train_set1[, -c(1, 2)], cl
= train_set1$Diagnosis, k = k) == train_set1$Diagnosis) / nrow(train_set1)
test_accuracy1 = sum(knn_model1 == test_set1$Diagnosis) / nrow(test_set1)
# Evaluate performance
train_accuracy2 = sum(knn(train_set2, train_set2, cl = train_set1$Diagnosis,
k = k) == train_set1$Diagnosis) / nrow(train_set2)
test_accuracy2 = sum(knn_model2 == test_set1$Diagnosis) / nrow(test_set2)