>>> from techminer2.tech_mining.svd.tfidf_matrix.kmeans import cluster_centers
>>> cluster_centers(
... #
... # PARAMS:
... field="nlp_phrases",
... #
... # TF PARAMS:
... is_binary=True,
... cooc_within=1,
... #
... # TF-IDF PARAMS:
... norm=None,
... use_idf=False,
... smooth_idf=False,
... sublinear_tf=False,
... #
... # ITEM PARAMS:
... top_n=20,
... occ_range=(None, None),
... gc_range=(None, None),
... custom_items=None,
... #
... # SVD PARAMS:
... n_components=5,
... algorithm_svd="randomized",
... n_iter=5,
... n_oversamples=10,
... power_iteration_normalizer="auto",
... random_state=0,
... tol=0.0,
... #
... # KMEANS PARAMS:
... n_clusters=6,
... init="k-means++",
... n_init=10,
... max_iter=300,
... kmeans_tol=0.0001,
... algorithm_kmeans="auto",
... #
... # DATABASE PARAMS:
... root_dir="example/",
... database="main",
... year_filter=(None, None),
... cited_by_filter=(None, None),
... )
           DIM_0     DIM_1     DIM_2     DIM_3     DIM_4
LABELS                                                  
CL_0    1.923172 -0.248246 -0.185237  0.388381 -0.678765
CL_1    1.999181  1.313913  0.516360 -0.146503  0.186634
CL_2    1.957021 -1.108232  0.089587  0.307670  1.527393
CL_3    2.132002  1.243576 -1.446699 -0.095713  0.644459
CL_4    5.637435 -1.177566 -0.626955 -0.713120  0.625639
CL_5    3.559041 -1.037701  2.320191 -0.835742 -0.441154