# jrtechs / PerryXDeng-wheatyeeters
# Mirror of https://github.com/PerryXDeng/wheatyeeters.git

import pandas as pd
import sklearn.cluster as cluster
from matplotlib import pyplot as plt

def find_kmeans(mat, k, first, second):
    """Cluster the rows of *mat* with k-means and show a scatter plot.

    The model is fitted on every column of ``mat``; only the first two
    columns are drawn, with each point coloured by its assigned cluster.

    Args:
        mat: 2-D array indexable as ``mat[:, 0]`` and ``mat[:, 1]``
            (the caller in this file passes ``DataFrame.values``).
        k: Number of clusters, forwarded to ``KMeans(n_clusters=k)``.
        first: Name of the metric in column 0, used in the x-axis label.
        second: Name of the metric in column 1, used in the y-axis label.

    Returns:
        None. The figure is displayed via ``plt.show()``.
    """
    km = cluster.KMeans(n_clusters=k)
    km.fit(mat)

    # Scatter the two metrics against each other, coloured by cluster label.
    plt.figure(figsize=(6, 6))
    plt.xlabel('Metric: ' + first)
    plt.ylabel('Metric: ' + second)
    plt.scatter(mat[:, 0], mat[:, 1], c=km.labels_, cmap='rainbow')
    plt.show()

# Read the normalized wellness/menstruation time series (path is relative
# to the directory this script is run from).
df = pd.read_csv('../data_preparation/cleaned/time_series_normalized_wellness_menstruation.csv')

# Keep only the two metrics to cluster on; their order fixes the plot axes
# (first column -> x, second column -> y).
df = df[["normFatigue", "normSleepQuality"]]

# Arguments: values, number of clusters, then the two axis labels.
find_kmeans(df.values, 2, "normFatigue", "normSleepQuality")