Я попытался написать алгоритм K-средних и получил эту ошибку в строке: points = np.array ([x[j] for j in range (len (x)) if cluster [j] == i])
кто-нибудь может помочь?
from copy import deepcopy
def euclidean_distance (a, b, ax = 1):
return np.linalg.norm (a - b , axis = ax)
c_prev = np.zeros (c.shape)
clusters = np.zeros (len(x))
distance_differences = euclidean_distance (c, c_prev)
while distance_differences.any () != 0:
for i in range (len(x)):
distances = euclidean_distance (x[i], c)
cluster = np.argmin (distances)
clusters [i] = cluster
c_prev = deepcopy (c)
for i in range (k):
points = [x[j] for j in range (len(x)) if clusters [j] == i]
if len(points) != 0:
c[i] = np.mean (points, axis = 0)
distance_differences = euclidean_distance (c, c_prev)
colors = ['b', 'r', 'y', 'g', 'c', 'm']
for i in range (k):
points = np.array ([x[j] for j in range (len (x)) if cluster [j] == i])
if len(points) > 0:
plt.scatter (points [:, 0], points [:, 1], s= 10, c = colors [i])
else:
print ('Please regenerate your centeroids again')
plt.scatter (points [:, 0], points [:, 1], s= 10, c = colors [i])
plt.scatter(c[:, 0], c[:, 1], marker = '*', s =100, c ='k')
plt.show();