Kmeans
Kmeans
January 2, 2025
1
[2]: from sklearn.preprocessing import StandardScaler
scaler = StandardScaler()
scaled_df = scaler.fit_transform(df[["age", "income"]])
scaled_df[0:5]
2
[5]: clusters = KMeans(3)
clusters.fit(scaled_df)
df["new_clusterid"] = clusters.labels_
df.groupby("new_clusterid")[['age', 'income']].agg(["mean", 'std']).
↪reset_index() # Changed tuple to list
3
[ ]: