Skip to content

Commit

Permalink
fixed mistake with distance to cluster
Browse files Browse the repository at this point in the history
Remove momoization of clusters
  • Loading branch information
MarcosTirador committed Dec 22, 2022
1 parent a47b518 commit ed7e868
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions src/models/kmeans_based_model.py
Original file line number Diff line number Diff line change
Expand Up @@ -59,7 +59,7 @@ def search(self, query: str):

query_vector = self.GetQueryVector(query)

query_distances = self.kmeans.transform(query_vector)
query_distances = self.kmeans.transform([query_vector])[0]
best_clusters = []
for i in range(self.noClusters):
best_clusters.append((query_distances[i], i))
Expand Down Expand Up @@ -204,6 +204,7 @@ def Getkmeans(self, k, sparse_matrix):
json = f'{self.__class__.__name__}/{dataset}/Kmeans_object'

s = ddb.at(json)
kmeans = KMeans(n_clusters=k, n_init= 10, init="k-means++").fit(sparse_matrix)
if not s.exists():
kmeans = KMeans(n_clusters=k, n_init= 10, init="k-means++").fit(sparse_matrix)
kmeans2 = OurKmeans(kmeans.cluster_centers_, kmeans.labels_)
Expand All @@ -217,7 +218,7 @@ def Getkmeans(self, k, sparse_matrix):
data = s.read()
kmeans2 = OurKmeans(data['cluster_centers_'], data['labels_'])

return kmeans2
return kmeans

def ElbowMethod(sparse_matrix, min, max):
k = min
Expand Down

0 comments on commit ed7e868

Please sign in to comment.