Skip to content

Commit 1c6a6e5

Browse files
committed
gpu umap
1 parent 0bcdb43 commit 1c6a6e5

File tree

1 file changed

+5
-3
lines changed

1 file changed

+5
-3
lines changed

top2vec/Top2Vec.py

+5 -3
Original file line number | Diff line number | Diff line change
@@ -1276,10 +1276,12 @@ def compute_topics(self, umap_args=None, hdbscan_args=None, topic_merge_delta=0.
12761276
'n_components': 5,
12771277
'metric': 'cosine'}
12781278

1279-
if gpu_umap:
1280-
pass
1279+
if gpu_umap and _HAVE_CUMAP:
1280+
umap_model = cuUMAP(**umap_args).fit(self.document_vectors)
1281+
umap_embedding = umap_model.transform(self.document_vectors)
12811282
else:
12821283
umap_model = umap.UMAP(**umap_args).fit(self.document_vectors)
1284+
umap_embedding = umap_model.embedding_
12831285

12841286
# find dense areas of document vectors
12851287
logger.info('Finding dense areas of documents')
@@ -1289,7 +1291,7 @@ def compute_topics(self, umap_args=None, hdbscan_args=None, topic_merge_delta=0.
12891291
'metric': 'euclidean',
12901292
'cluster_selection_method': 'eom'}
12911293

1292-
cluster = hdbscan.HDBSCAN(**hdbscan_args).fit(umap_model.embedding_)
1294+
cluster = hdbscan.HDBSCAN(**hdbscan_args).fit(umap_embedding)
12931295

12941296
# calculate topic vectors from dense areas of documents
12951297
logger.info('Finding topics')

0 commit comments

Comments (0)