# Professional Documents
# Culture Documents
# R Code Cars Data
# R Code Cars Data
# Install Spark for local use. Presumably this is sparklyr's spark_install();
# NOTE(review): no library() call is visible in this excerpt — confirm that
# sparklyr is attached before this line runs.
spark_install()
# Scatter plot
# Bring `mtcars_spark` into a local data frame with collect(), then plot
# miles-per-gallon (y) against horsepower (x), one point per row.
# NOTE(review): `mtcars_spark` is not created in this excerpt — confirm it is
# defined before this point.
mtcars_spark %>%
  collect() %>%
  ggplot(aes(x = hp, y = mpg)) +
  geom_point() +
  labs(
    title = "Horsepower vs. MPG",
    x = "Horsepower",
    y = "MPG"
  )
# Model summary
# Calls summary() on `linear_model`.
# NOTE(review): `linear_model` is not assigned anywhere in this excerpt — the
# model-fitting step appears to be missing; confirm it is defined before this
# line.
summary(linear_model)
# K-means clustering model ----
# Fit k-means on `mtcars_spark` using the `hp` and `wt` columns as features.
# `k` (the number of clusters) is kept as a top-level variable so later code
# can refer to it.
k <- 3
kmeans_model <- ml_kmeans(
  mtcars_spark,
  k = k,
  features = c("hp", "wt")
)
# Visualization of clusters
# Bring `clustered_data` into a local data frame with collect(), then plot
# weight (y) against horsepower (x), colouring each point by its `cluster`
# column.
# NOTE(review): `clustered_data` and its `cluster` column are not created in
# this excerpt — confirm they are defined before this point. If `cluster` is
# numeric, ggplot2 will draw a continuous colour scale; presumably a discrete
# one (e.g. factor(cluster)) is intended — verify.
clustered_data %>%
  collect() %>%
  ggplot(aes(x = hp, y = wt, color = cluster)) +
  geom_point() +
  labs(
    # Build the title from `k` so it stays in sync with the cluster count
    # instead of repeating the literal 3.
    title = paste0("K-Means Clustering (k=", k, ")"),
    x = "Horsepower",
    y = "Weight"
  )