# Reference: https://datahexa.com/kmeans-clustering-with-wine-dataset/

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn import cluster, preprocessing, datasets

from sklearn.cluster import KMeans

# Load the wine dataset bundled with scikit-learn.
wine = datasets.load_wine()

# Feature matrix, used unscaled as the clustering input below.
X = wine.data

X.shape
# Notebook output: (178, 13)

# Class index of every sample.
y = wine.target

y.shape
# Notebook output: (178,)

wine.target_names
# Notebook output: array(['class_0', 'class_1', 'class_2'], dtype='<U7')

# Ten clusters are requested even though the dataset has three target classes.
# No random_state is passed, so cluster assignments can differ between runs.
model = KMeans(n_clusters=10)

# Fit k-means on the features and obtain one cluster index per sample.
labels = model.fit_predict(X)

df = pd.DataFrame({'labels': labels})
type(df)
# Notebook output: pandas.core.frame.DataFrame

def species_label(theta):
    """Translate a class index into its name from ``wine.target_names``.

    Only the indices 0, 1 and 2 are handled; any other value gives ``None``.
    """
    for class_index in (0, 1, 2):
        if theta == class_index:
            return wine.target_names[class_index]
    return None

# Attach the true class name of every sample next to its cluster label.
df['species'] = [species_label(theta) for theta in wine.target]

# Contingency table: rows are k-means cluster labels, columns are true classes.
pd.crosstab(df['labels'], df['species'])
# Notebook output captured from one run:
#
# species  class_0  class_1  class_2
# labels
# 0              5        5        6
# 1              8        0        0
# 2              0       15       14
# 3              0       17        0
# 4             18        1        0
# 5              6        0        0
# 6              1       12       18
# 7              7        3        5
# 8              0       18        5
# 9             14        0        0