>>> from techminer2.tech_mining.pca.tfidf_matrix.kmeans import communities
>>> communities(
... #
... # PARAMS:
... field="author_keywords",
... #
... # TF PARAMS:
... is_binary=True,
... cooc_within=1,
... #
... # TF-IDF PARAMS:
... norm=None,
... use_idf=False,
... smooth_idf=False,
... sublinear_tf=False,
... #
... # ITEM PARAMS:
... top_n=20,
... occ_range=(None, None),
... gc_range=(None, None),
... custom_items=None,
... #
... # PCA PARAMS:
... n_components=5,
... whiten=False,
... svd_solver="auto",
... pca_tol=0.0,
... iterated_power="auto",
... n_oversamples=10,
... power_iteration_normalizer="auto",
... random_state=0,
... #
... # KMEANS PARAMS:
... n_clusters=6,
... init="k-means++",
... n_init=10,
... max_iter=300,
... kmeans_tol=0.0001,
... algorithm="auto",
... #
... # DATABASE PARAMS:
... root_dir="example/",
... database="main",
... year_filter=(None, None),
... cited_by_filter=(None, None),
... ).head()
CL_0 ... CL_5
0 FINANCIAL_INCLUSION 03:0590 ... FINTECH 31:5168
1 CASE_STUDIES 03:0442 ...
2 BLOCKCHAIN 03:0369 ...
3 CROWDFUNDING 03:0335 ...
4 MOBILE_PAYMENT 03:0309 ...
[5 rows x 6 columns]