Klasterisasi Menggunakan Python

You might also like

Download as docx, pdf, or txt
Download as docx, pdf, or txt
You are on page 1 of 2

Library

#import Library
import matplotlib.pyplot as plt
#library import file
import pandas as pd

#library data numerik


import numpy as np

#library klaster
from sklearn.cluster import KMeans
from sklearn.preprocessing import MinMaxScaler

Import data

# Load the student data set; the file is parsed with ';' as the field
# separator, using pandas' pure-Python parsing engine.
dfmhs = pd.read_csv(
    'claster.csv',
    sep=';',
    engine='python',
)

# Descriptive statistics of the loaded columns.
dfmhs.describe()

# Inspect the characteristics of the data (columns, dtypes, non-null counts).
dfmhs.info()

# Visualise the data: one point per row, with the 'UTS' column on the
# horizontal axis and the 'UAS' column on the vertical axis.
plt.scatter(x=dfmhs['UTS'], y=dfmhs['UAS'])
plt.xlabel("UTS")
plt.ylabel("UAS")
plt.title("Grafik nilai mahasiswa")

# Training data: the 'UTS' and 'UAS' columns as a 2-D array, rescaled
# column-wise by MinMaxScaler. Scaling matters here because it affects the
# distance computation used later on.
# (MinMaxScaler is also imported at the top of the file; the import is
# repeated here so this step can be run on its own.)
from sklearn.preprocessing import MinMaxScaler
scaler = MinMaxScaler()
x_train = scaler.fit_transform(dfmhs[['UTS', 'UAS']].values)

# Show the scaled training matrix.
x_train
# Configure the clustering model (two clusters).
# (KMeans is also imported at the top of the file; the import is repeated
# here so this step can be run on its own.)
from sklearn.cluster import KMeans
# random_state pins the centroid initialisation so that repeated runs give
# the same cluster labels and centroids. n_init is spelled out because its
# default differs between scikit-learn releases (10 in older versions,
# 'auto' in newer ones).
kmean = KMeans(n_clusters=2, n_init=10, random_state=42)
kmean

# Clustering: fit the model on x_train and get one cluster label per row.
y_cluster = kmean.fit_predict(x_train)

y_cluster

# Add the cluster label to the data frame as a new column.
dfmhs['klaster'] = y_cluster

dfmhs

# Inspect the centroids. They are expressed in the same feature space as
# x_train (the scaled values), not in the original score units.
kmean.cluster_centers_

You might also like