답 → 3번, k-means clustering은 k값을 지정해줘야 작동하는 알고리즘이기 때문이다.
import pandas as pd
data = pd.read_csv('C:/Users/bbiga/OneDrive/바탕 화면/학교생활/대학교1(세종대)/2학년/SAI/CustomerDataSet.csv')
data.head()
from sklearn.preprocessing import MinMaxScaler
mms = MinMaxScaler()
mms.fit(data)
data_scaled = mms.transform(data)
import matplotlib.pyplot as plt
from sklearn.cluster import KMeans
fig, ax = plt.subplots(3, 2, figsize = (10,15))
col = 0
row = 0
for i in range(1,7) :
km = KMeans(n_clusters = i, random_state = 42)
km.fit(data_scaled[:, 1:3])
label = km.labels_
ax[col][row].scatter(data_scaled[:,1], data_scaled[:,2], c = label)
ax[col][row].set_xlabel('ItemBought')
ax[col][row].set_ylabel('ItmesReturned')
ax[col][row].set_title('K value = %d' %i)
row += 1
if(row >= 2) :
row = 0
col += 1
plt.savefig('KMeans 클러스터링.png')
plt.show()
